Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -16,6 +16,7 @@ import librosa
|
|
16 |
import numpy as np
|
17 |
import evaluate
|
18 |
import tempfile
|
|
|
19 |
|
20 |
st.title("📊 Évaluation WER d'un modèle Whisper")
|
21 |
st.markdown("Ce Space permet d'évaluer la performance WER d'un modèle Whisper sur un dataset audio.")
|
@@ -42,7 +43,7 @@ if start_eval:
|
|
42 |
# 🔹 Télécharger dataset
|
43 |
with st.spinner("Chargement du dataset..."):
|
44 |
try:
|
45 |
-
dataset = load_dataset(dataset_link, data_files="metadata.csv", split="train", token=hf_token)
|
46 |
except Exception as e:
|
47 |
st.error(f"Erreur lors du chargement du dataset : {e}")
|
48 |
st.stop()
|
@@ -63,13 +64,17 @@ if start_eval:
|
|
63 |
|
64 |
results = []
|
65 |
|
|
|
|
|
|
|
66 |
for example in dataset:
|
67 |
try:
|
68 |
-
audio_path = example["file_name"] # full path or relative path in AudioFolder
|
|
|
69 |
reference = example["text"]
|
70 |
|
71 |
-
st.write(example)
|
72 |
-
st.write("Exemple brut :", dataset[0])
|
73 |
|
74 |
# Load audio (we assume dataset is structured with 'file_name')
|
75 |
waveform, _ = librosa.load(audio_path, sr=16000)
|
|
|
16 |
import numpy as np
|
17 |
import evaluate
|
18 |
import tempfile
|
19 |
+
from huggingface_hub import hf_hub_download
|
20 |
|
21 |
st.title("📊 Évaluation WER d'un modèle Whisper")
|
22 |
st.markdown("Ce Space permet d'évaluer la performance WER d'un modèle Whisper sur un dataset audio.")
|
|
|
43 |
# 🔹 Télécharger dataset
|
44 |
with st.spinner("Chargement du dataset..."):
|
45 |
try:
|
46 |
+
dataset = load_dataset(dataset_link, data_files="metadata.csv", data_dir=".", split="train", token=hf_token)
|
47 |
except Exception as e:
|
48 |
st.error(f"Erreur lors du chargement du dataset : {e}")
|
49 |
st.stop()
|
|
|
64 |
|
65 |
results = []
|
66 |
|
67 |
+
# Téléchargement explicite du dossier audio (chemin local vers chaque fichier)
|
68 |
+
# hf_hub_download() fetches ONE file and requires a `filename` argument, so the
# previous call raised TypeError. The loop below joins this path with each
# example's "file_name", which needs a local copy of the whole dataset repo:
# snapshot_download() downloads the repo and returns that folder path.
from huggingface_hub import snapshot_download  # local import: only used here
repo_local_path = snapshot_download(repo_id=dataset_link, repo_type="dataset", token=hf_token)
|
69 |
+
|
70 |
for example in dataset:
|
71 |
try:
|
72 |
+
#audio_path = example["file_name"] # full path or relative path in AudioFolder
|
73 |
+
audio_path = os.path.join(repo_local_path, example["file_name"])
|
74 |
reference = example["text"]
|
75 |
|
76 |
+
#st.write(example)
|
77 |
+
#st.write("Exemple brut :", dataset[0])
|
78 |
|
79 |
# Load audio (we assume dataset is structured with 'file_name')
|
80 |
waveform, _ = librosa.load(audio_path, sr=16000)
|