Spaces:
Build error
Build error
updated article.
Browse files- app.py +6 -4
- article.py +10 -1
app.py
CHANGED
@@ -55,6 +55,8 @@ def save_record(language,text,record,number,age,gender,accent,number_history,cur
|
|
55 |
speaker_metadata['gender'] = gender if gender!=GENDER[0] else ''
|
56 |
speaker_metadata['age'] = age if age !='' else ''
|
57 |
speaker_metadata['accent'] = accent if accent!='' else ''
|
|
|
|
|
58 |
if not done_recording:
|
59 |
if language!=None and language!='Choose language' and record is not None and number is not None:
|
60 |
language = language.lower()
|
@@ -131,7 +133,7 @@ def save_record(language,text,record,number,age,gender,accent,number_history,cur
|
|
131 |
output_string = "<div class='finished'>"+output+"</div>"
|
132 |
next_number = 0 # the default number
|
133 |
next_number_image = f'number/best.gif'
|
134 |
-
return output_string,next_number_image,number_history,next_number,done_recording
|
135 |
|
136 |
def display_records():
|
137 |
repo.git_pull()
|
@@ -182,15 +184,15 @@ This is a platform to contribute to your African language by recording your voic
|
|
182 |
markdown="""
|
183 |
# 🌍 African Digits Recording Sprint
|
184 |
|
185 |
-
>
|
186 |
|
187 |
1. Choose your African language
|
188 |
2. Fill in the speaker metadata (age, gender, accent). This is optional but important to build better speech models.
|
189 |
3. You will see the image of a number __(this is the number you will record)__.
|
190 |
-
4. Fill in the word of that
|
191 |
5. Click record and say the number in your African language.
|
192 |
6. Click ‘Submit’. It will save your record and go to the next number.
|
193 |
-
7. Repeat
|
194 |
8. Leave a ❤ in the Space, if you found it fun.
|
195 |
"""
|
196 |
|
|
|
55 |
speaker_metadata['gender'] = gender if gender!=GENDER[0] else ''
|
56 |
speaker_metadata['age'] = age if age !='' else ''
|
57 |
speaker_metadata['accent'] = accent if accent!='' else ''
|
58 |
+
|
59 |
+
|
60 |
if not done_recording:
|
61 |
if language!=None and language!='Choose language' and record is not None and number is not None:
|
62 |
language = language.lower()
|
|
|
133 |
output_string = "<div class='finished'>"+output+"</div>"
|
134 |
next_number = 0 # the default number
|
135 |
next_number_image = f'number/best.gif'
|
136 |
+
return output_string,next_number_image,number_history,next_number,done_recording,default_record
|
137 |
|
138 |
def display_records():
|
139 |
repo.git_pull()
|
|
|
184 |
markdown="""
|
185 |
# 🌍 African Digits Recording Sprint
|
186 |
|
187 |
+
> Record numbers 0-9 in your African language.
|
188 |
|
189 |
1. Choose your African language
|
190 |
2. Fill in the speaker metadata (age, gender, accent). This is optional but important to build better speech models.
|
191 |
3. You will see the image of a number __(this is the number you will record)__.
|
192 |
+
4. Fill in the word of that number (optional)
|
193 |
5. Click record and say the number in your African language.
|
194 |
6. Click ‘Submit’. It will save your record and go to the next number.
|
195 |
+
7. Repeat steps 3-6 for each remaining number.
|
196 |
8. Leave a ❤ in the Space, if you found it fun.
|
197 |
"""
|
198 |
|
article.py
CHANGED
@@ -7,12 +7,21 @@ Existing speech recognition services are not available in many African languages
|
|
7 |
|
8 |
This dataset will boost speech technologies (like speech-to-text, text-to-speech, speech translation, and modeling) for African languages, which hitherto had little or no public dataset.
|
9 |
|
10 |
-
**Note:** This is a continuous effort.
|
11 |
|
12 |
**Benefits of such a dataset**
|
13 |
- Useful dataset to introduce people to audio-related Machine Learning. It can be used as a simple training and/or evaluation dataset for speech processing tasks.
|
14 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
15 |
**Contact**
|
|
|
16 |
In case of questions, issues or anything contact Chris Emezue at:
|
17 | |
18 |
|
|
|
7 |
|
8 |
This dataset will boost speech technologies (like speech-to-text, text-to-speech, speech translation, and modeling) for African languages, which hitherto had little or no public dataset.
|
9 |
|
10 |
+
**Note:** This is a continuous effort. This sprint is just to kick-start the event.
|
11 |
|
12 |
**Benefits of such a dataset**
|
13 |
- Useful dataset to introduce people to audio-related Machine Learning. It can be used as a simple training and/or evaluation dataset for speech processing tasks.
|
14 |
|
15 |
+
**About the dataset**
|
16 |
+
|
17 |
+
The data (metadata, text, and audio recordings) are uploaded to [a public Hugging Face dataset](https://huggingface.co/datasets/chrisjay/crowd-speech-africa).
|
18 |
+
|
19 |
+
We do not collect your name, address or other sensitive information.
|
20 |
+
|
21 |
+
If for some reason you want to remove your entry, please reach out by email.
|
22 |
+
|
23 |
**Contact**
|
24 |
+
|
25 |
In case of questions, issues or anything contact Chris Emezue at:
|
26 | |
27 |
|