davidpomerenke committed on
Commit
adc94d7
·
verified ·
1 Parent(s): a61d2b3

Upload from GitHub Actions: Ugly fix for CI errors

Browse files
Files changed (2) hide show
  1. evals/main.py +1 -1
  2. evals/tasks.py +6 -8
evals/main.py CHANGED
@@ -20,7 +20,7 @@ async def evaluate():
20
  print("running evaluations")
21
  old_results = pd.read_json("results.json")
22
  results = [
23
- task(task, model, lang, i)
24
  for task_name, task in tasks.items()
25
  for i in range(n_sentences)
26
  for lang in languages.iloc[:n_languages].itertuples()
 
20
  print("running evaluations")
21
  old_results = pd.read_json("results.json")
22
  results = [
23
+ task(task, model, lang._asdict() if hasattr(lang, "_asdict") else dict(lang), i)
24
  for task_name, task in tasks.items()
25
  for i in range(n_sentences)
26
  for lang in languages.iloc[:n_languages].itertuples()
evals/tasks.py CHANGED
@@ -6,11 +6,9 @@ import pandas as pd
6
  import sentencepiece as spm
7
  from datasets_.flores import flores_sentences
8
  from datasets_.mmlu import load_mmlu
9
- from joblib.memory import Memory
10
  from languages import languages, script_name
11
  from models import complete, transcribe
12
 
13
- cache = Memory(location=".cache", verbose=0).cache
14
  bleu = evaluate.load("bleu")
15
  chrf = evaluate.load("chrf")
16
  wer = evaluate.load("wer")
@@ -282,10 +280,10 @@ async def transcribe_and_evaluate(model, language_bcp_47, nr):
282
 
283
 
284
  tasks = {
285
- "translation_from": cache(partial(translate_and_evaluate, mode="from")),
286
- "translation_to": cache(partial(translate_and_evaluate, mode="to")),
287
- # "classification": cache(classify_and_evaluate),
288
- # "mlm": cache(mlm_and_evaluate),
289
- "mmlu": cache(mmlu_and_evaluate),
290
- # "asr": cache(transcribe_and_evaluate),
291
  }
 
6
  import sentencepiece as spm
7
  from datasets_.flores import flores_sentences
8
  from datasets_.mmlu import load_mmlu
 
9
  from languages import languages, script_name
10
  from models import complete, transcribe
11
 
 
12
  bleu = evaluate.load("bleu")
13
  chrf = evaluate.load("chrf")
14
  wer = evaluate.load("wer")
 
280
 
281
 
282
  tasks = {
283
+ "translation_from": partial(translate_and_evaluate, mode="from"),
284
+ "translation_to": partial(translate_and_evaluate, mode="to"),
285
+ # "classification": classify_and_evaluate,
286
+ # "mlm": mlm_and_evaluate,
287
+ "mmlu": mmlu_and_evaluate,
288
+ # "asr": transcribe_and_evaluate,
289
  }