Spaces:

hHoai
/

vietnam_correction

Runtime error

hHoai committed on 29 days ago

Commit

c16f5b4

verified ·

1 Parent(s): 7e366f8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,31 +1,35 @@
 import gradio as gr
-import requests
 import time
-def spellcheck(text):
-    url = "https://spellcheck.vcntt.tech/spellcheck"
-    data = {"text": text}
     start_time = time.time()
-    response = requests.post(url, json=data)
     end_time = time.time()
-    if response.status_code != 200:
-        return "Lỗi kết nối API", text, "", "", ""
-    result = response.json()
-    corrected_text = result.get("corrected_text", text)
     processing_time = f"{end_time - start_time:.4f} giây"
-    if not result.get("has_errors", False):
         return "Không có lỗi chính tả", corrected_text, "", "", processing_time
-    errors = result.get("errors", [])
-    error_words = "\n".join([e['word'] for e in errors])
-    suggestions = "\n".join([', '.join(e['suggestions']) if e['suggestions'] else 'Xóa bỏ' for e in errors])
-    return "Có lỗi chính tả", corrected_text, error_words, suggestions, processing_time
 with gr.Blocks() as demo:
     gr.Markdown("# Demo Kiểm tra lỗi chính tả tiếng Việt")

 import gradio as gr
 import time
+from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
+import torch
+# Load mô hình
+model_checkpoint = "hHoai/bartPHO_final"
+tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
+model = AutoModelForSeq2SeqLM.from_pretrained(model_checkpoint)
+def spellcheck(text):
     start_time = time.time()
+    # Mã hóa đầu vào
+    inputs = tokenizer(text, return_tensors="pt", padding=True, truncation=True)
+    # Sinh văn bản đã sửa lỗi
+    with torch.no_grad():
+        outputs = model.generate(**inputs)
+    corrected_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
     end_time = time.time()
     processing_time = f"{end_time - start_time:.4f} giây"
+    # Giả lập phát hiện lỗi chính tả (có thể thay bằng logic so sánh input-output)
+    has_errors = text.strip() != corrected_text.strip()
+    if not has_errors:
         return "Không có lỗi chính tả", corrected_text, "", "", processing_time
+    # Hiện tại chưa có logic tách từ sai và gợi ý, cần thêm post-processing nếu cần
+    return "Có lỗi chính tả", corrected_text, "Đang cập nhật", "Đang cập nhật", processing_time
 with gr.Blocks() as demo:
     gr.Markdown("# Demo Kiểm tra lỗi chính tả tiếng Việt")