DeepLearning101 committed on
Commit
5887026
·
verified ·
1 Parent(s): b9c5636

Update app.py

Browse files

Caching examples at: '/home/user/app/gradio_cached_examples/15'
Caching example 1/5
Traceback (most recent call last):
File "/home/user/app/app.py", line 50, in <module>
gr.Interface(
File "/usr/local/lib/python3.10/site-packages/gradio/interface.py", line 515, in __init__
self.render_examples()
File "/usr/local/lib/python3.10/site-packages/gradio/interface.py", line 861, in render_examples
self.examples_handler = Examples(
File "/usr/local/lib/python3.10/site-packages/gradio/helpers.py", line 74, in create_examples
examples_obj.create()
File "/usr/local/lib/python3.10/site-packages/gradio/helpers.py", line 314, in create
self._start_caching()
File "/usr/local/lib/python3.10/site-packages/gradio/helpers.py", line 365, in _start_caching
client_utils.synchronize_async(self.cache)
File "/usr/local/lib/python3.10/site-packages/gradio_client/utils.py", line 858, in synchronize_async
return fsspec.asyn.sync(fsspec.asyn.get_loop(), func, *args, **kwargs) # type: ignore
File "/usr/local/lib/python3.10/site-packages/fsspec/asyn.py", line 103, in sync
raise return_result
File "/usr/local/lib/python3.10/site-packages/fsspec/asyn.py", line 56, in _runner
result[0] = await coro
File "/usr/local/lib/python3.10/site-packages/gradio/helpers.py", line 486, in cache
prediction = await Context.root_block.process_api(
File "/usr/local/lib/python3.10/site-packages/gradio/blocks.py", line 1847, in process_api
result = await self.call_function(
File "/usr/local/lib/python3.10/site-packages/gradio/blocks.py", line 1433, in call_function
prediction = await anyio.to_thread.run_sync(
File "/usr/local/lib/python3.10/site-packages/anyio/to_thread.py", line 56, in run_sync
return await get_async_backend().run_sync_in_worker_thread(
File "/usr/local/lib/python3.10/site-packages/anyio/_backends/_asyncio.py", line 2144, in run_sync_in_worker_thread
return await future
File "/usr/local/lib/python3.10/site-packages/anyio/_backends/_asyncio.py", line 851, in run
result = context.run(func, *args)
File "/usr/local/lib/python3.10/site-packages/gradio/utils.py", line 788, in wrapper
response = f(*args, **kwargs)
File "/home/user/app/app.py", line 21, in ai_text
corrected_text, details = get_errors(text)
File "/home/user/app/app.py", line 30, in get_errors
corrected_text = tokenizer.decode(torch.argmax(outputs.logits[0], dim=-1), skip_special_tokens=True).replace(' ', '')
NameError: name 'outputs' is not defined

錯誤是因為在get_errors函數中引用了未定義的變數outputs。這個變數在ai_text函數中定義,但並沒有傳遞到get_errors函數中。為了解決這個問題,您需要將outputs作為參數傳遞到get_errors函數中,或在get_errors函數內部重新計算它。本次提交採用了前者:將get_errors的簽名改為get_errors(text, outputs),並由ai_text在呼叫時傳入模型輸出。

Files changed (1) hide show
  1. app.py +9 -10
app.py CHANGED
@@ -11,25 +11,24 @@ model_name_or_path = "DeepLearning101/Corrector101zhTW"
11
  try:
12
  tokenizer = BertTokenizer.from_pretrained(model_name_or_path)
13
  model = BertForMaskedLM.from_pretrained(model_name_or_path)
 
14
  except Exception as e:
15
  print(f"加載模型或分詞器失敗,錯誤信息:{e}")
16
  exit(1)
17
 
18
  def ai_text(text):
 
19
  with torch.no_grad():
20
- outputs = model(**tokenizer([text], padding=True, return_tensors='pt'))
21
- corrected_text, details = get_errors(text)
 
22
  return corrected_text + ' ' + str(details)
23
 
24
- def to_highlight(corrected_sent, errs):
25
- output = [{"entity": "糾錯", "word": err[1], "start": err[2], "end": err[3]} for err in errs]
26
- return {"text": corrected_sent, "entities": output}
27
-
28
- def get_errors(text):
29
  sub_details = []
30
  corrected_text = tokenizer.decode(torch.argmax(outputs.logits[0], dim=-1), skip_special_tokens=True).replace(' ', '')
31
  for i, ori_char in enumerate(text):
32
- # 略過特定字符
33
  if ori_char in [' ', '“', '”', '‘', '’', '琊', '\n', '…', '—', '擤']:
34
  continue
35
  if i >= len(corrected_text):
@@ -52,8 +51,8 @@ if __name__ == '__main__':
52
  inputs=gr.Textbox(lines=2, label="欲校正的文字"),
53
  outputs=gr.Textbox(lines=2, label="修正後的文字"),
54
  title="客服ASR文本AI糾錯系統",
55
- description="""<a href="https://www.twman.org" target='_blank'>TonTon Huang Ph.D. @ 2024/04 </a><br>
56
  輸入ASR文本,糾正同音字/詞錯誤<br>
57
  Masked Language Model (MLM) as correction BERT""",
58
  examples=examples
59
- ).launch()
 
11
  try:
12
  tokenizer = BertTokenizer.from_pretrained(model_name_or_path)
13
  model = BertForMaskedLM.from_pretrained(model_name_or_path)
14
+ model.eval() # 將模型設置為評估模式
15
  except Exception as e:
16
  print(f"加載模型或分詞器失敗,錯誤信息:{e}")
17
  exit(1)
18
 
19
  def ai_text(text):
20
+ """處理輸入文本並返回修正後的文本及錯誤細節"""
21
  with torch.no_grad():
22
+ inputs = tokenizer(text, return_tensors="pt", padding=True)
23
+ outputs = model(**inputs)
24
+ corrected_text, details = get_errors(text, outputs)
25
  return corrected_text + ' ' + str(details)
26
 
27
+ def get_errors(text, outputs):
28
+ """識別原始文本和模型輸出之間的差異"""
 
 
 
29
  sub_details = []
30
  corrected_text = tokenizer.decode(torch.argmax(outputs.logits[0], dim=-1), skip_special_tokens=True).replace(' ', '')
31
  for i, ori_char in enumerate(text):
 
32
  if ori_char in [' ', '“', '”', '‘', '’', '琊', '\n', '…', '—', '擤']:
33
  continue
34
  if i >= len(corrected_text):
 
51
  inputs=gr.Textbox(lines=2, label="欲校正的文字"),
52
  outputs=gr.Textbox(lines=2, label="修正後的文字"),
53
  title="客服ASR文本AI糾錯系統",
54
+ description="""<a href='https://www.twman.org' target='_blank'>TonTon Huang Ph.D. @ 2024/04 </a><br>
55
  輸入ASR文本,糾正同音字/詞錯誤<br>
56
  Masked Language Model (MLM) as correction BERT""",
57
  examples=examples
58
+ ).launch()