chrisjay committed on
Commit
2d532b9
1 Parent(s): 74bf3d4

updated article.

Browse files
Files changed (2) hide show
  1. app.py +6 -4
  2. article.py +10 -1
app.py CHANGED
@@ -55,6 +55,8 @@ def save_record(language,text,record,number,age,gender,accent,number_history,cur
55
  speaker_metadata['gender'] = gender if gender!=GENDER[0] else ''
56
  speaker_metadata['age'] = age if age !='' else ''
57
  speaker_metadata['accent'] = accent if accent!='' else ''
 
 
58
  if not done_recording:
59
  if language!=None and language!='Choose language' and record is not None and number is not None:
60
  language = language.lower()
@@ -131,7 +133,7 @@ def save_record(language,text,record,number,age,gender,accent,number_history,cur
131
  output_string = "<div class='finished'>"+output+"</div>"
132
  next_number = 0 # the default number
133
  next_number_image = f'number/best.gif'
134
- return output_string,next_number_image,number_history,next_number,done_recording
135
 
136
  def display_records():
137
  repo.git_pull()
@@ -182,15 +184,15 @@ This is a platform to contribute to your African language by recording your voic
182
  markdown="""
183
  # 🌍 African Digits Recording Sprint
184
 
185
- > This is an event to record numbers (0-9) in your African language.
186
 
187
  1. Choose your African language
188
  2. Fill in the speaker metadata (age, gender, accent). This is optional but important to build better speech models.
189
  3. You will see the image of a number __(this is the number you will record)__.
190
- 4. Fill in the word of that **number** (optional)
191
  5. Click record and say the number in your African language.
192
  6. Click ‘Submit’. It will save your record and go to the next number.
193
- 7. Repeat 1-7
194
  8. Leave a ❤ in the Space, if you found it fun.
195
  """
196
 
55
  speaker_metadata['gender'] = gender if gender!=GENDER[0] else ''
56
  speaker_metadata['age'] = age if age !='' else ''
57
  speaker_metadata['accent'] = accent if accent!='' else ''
58
+
59
+
60
  if not done_recording:
61
  if language!=None and language!='Choose language' and record is not None and number is not None:
62
  language = language.lower()
133
  output_string = "<div class='finished'>"+output+"</div>"
134
  next_number = 0 # the default number
135
  next_number_image = f'number/best.gif'
136
+ return output_string,next_number_image,number_history,next_number,done_recording,default_record
137
 
138
  def display_records():
139
  repo.git_pull()
184
  markdown="""
185
  # 🌍 African Digits Recording Sprint
186
 
187
+ > Record numbers 0-9 in your African language.
188
 
189
  1. Choose your African language
190
  2. Fill in the speaker metadata (age, gender, accent). This is optional but important to build better speech models.
191
  3. You will see the image of a number __(this is the number you will record)__.
192
+ 4. Fill in the word of that number (optional)
193
  5. Click record and say the number in your African language.
194
  6. Click ‘Submit’. It will save your record and go to the next number.
195
+ 7. Repeat 4-7
196
  8. Leave a ❤ in the Space, if you found it fun.
197
  """
198
 
article.py CHANGED
@@ -7,12 +7,21 @@ Existing speech recognition services are not available in many African languages
7
 
8
  This dataset will boost speech technologies (like speech-to-text, text-to-speech, speech translation, and modeling) for African languages, which hitherto had little or no public dataset.
9
 
10
- **Note:** This is a continuous effort. the sprint is just to kick-start the event.
11
 
12
  **Benefits of such a dataset**
13
  - Useful dataset to introduce people to audio-related Machine Learning. It can be used as a simple training and/or evaluation dataset for speech processing tasks.
14
 
 
 
 
 
 
 
 
 
15
  **Contact**
 
16
  In case of questions, issues or anything contact Chris Emezue at:
17
  - chris@huggingface.co
18
 
7
 
8
  This dataset will boost speech technologies (like speech-to-text, text-to-speech, speech translation, and modeling) for African languages, which hitherto had little or no public dataset.
9
 
10
+ **Note:** This is a continuous effort. This sprint is just to kick-start the event.
11
 
12
  **Benefits of such a dataset**
13
  - Useful dataset to introduce people to audio-related Machine Learning. It can be used as a simple training and/or evaluation dataset for speech processing tasks.
14
 
15
+ **About the dataset**
16
+
17
+ The data (metadata, text, and audio recording) are uploaded to [a public Hugging Face dataset](https://huggingface.co/datasets/chrisjay/crowd-speech-africa).
18
+
19
+ We do not collect your name, address or other sensitive information.
20
+
21
+ If for some reason you want to remove your entry, please reach out by email.
22
+
23
  **Contact**
24
+
25
  In case of questions, issues or anything contact Chris Emezue at:
26
  - chris@huggingface.co
27