Spaces:

Diezu
/

Correct_spelling_mistakes_app

Sleeping

App Files Files Community

Diezu committed on Jan 16

Commit

ce1c0a8

verified ·

1 Parent(s): fb3b727

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -29

app.py CHANGED Viewed

@@ -13,19 +13,14 @@ def load_model():
 # Return the words of `text` whose predicted class is 1.
 # The text is split on whitespace; each word is tokenized and run through
 # the model on its own, and flagged words are collected in input order.
 def detect_errors(text, tokenizer, model):
     errors = []
     words = text.split()
     for word in words:
         inputs = tokenizer(word, return_tensors="pt", padding=True, truncation=True)
         # Inference only: no gradient tracking is needed.
         with torch.no_grad():
             outputs = model(**inputs)
-        # Process the output to detect errors (assumes class "1" means a misspelled word)
         probabilities = torch.softmax(outputs.logits, dim=-1)
         predicted_class = torch.argmax(probabilities, dim=-1).item()
         if predicted_class == 1:  # the word is misspelled
             errors.append(word)
     return errors
 # Streamlit App
@@ -34,28 +29,25 @@ st.title("Công cụ phát hiện lỗi chính tả")
 # Load the model
 tokenizer, model = load_model()
-# Create a horizontal layout with custom column ratios
-col1, col2 = st.columns([3, 2])  # Column 1 is wider than column 2
-# Column 1: text input
-with col1:
-    st.header("Nhập văn bản")
-    input_text = st.text_area("Nhập văn bản của bạn tại đây:", height=300)  # Increase the height of the input area
-# Column 2: display the results
-with col2:
-    st.header("Kết quả phát hiện lỗi")
-    if st.button("Phát hiện lỗi", use_container_width=True):  # The button sits inside the column
-        if input_text.strip():
-            # Detect errors
-            errors = detect_errors(input_text, tokenizer, model)
-            if errors:
-                st.write("**Các từ phát hiện lỗi:**")
-                st.markdown(
-                    f"<div style='font-size: 18px; line-height: 1.8;'>{', '.join(f'<b>{word}</b>' for word in errors)}</div>",
-                    unsafe_allow_html=True,
-                )
-            else:
-                st.success("Không phát hiện lỗi nào trong văn bản.")
         else:
-            st.warning("Vui lòng nhập văn bản để kiểm tra.")

 def detect_errors(text, tokenizer, model):
     """Collect the words of ``text`` whose predicted class is 1 (misspelled).

     ``text`` is split on whitespace. Each word is tokenized on its own and
     passed through ``model`` with gradient tracking disabled; the class with
     the highest softmax probability is taken as the prediction.

     Returns the flagged words as a list, in their original order
     (duplicates are kept).
     """

     def _predicted_label(token):
         # One forward pass per word; ``.item()`` expects a single prediction.
         encoded = tokenizer(token, return_tensors="pt", padding=True, truncation=True)
         with torch.no_grad():
             logits = model(**encoded).logits
         scores = torch.softmax(logits, dim=-1)
         return torch.argmax(scores, dim=-1).item()

     # Label 1 marks a misspelled word.
     return [token for token in text.split() if _predicted_label(token) == 1]
 # Streamlit App
 # Load the model
 tokenizer, model = load_model()
+# Build a Google Translate-style interface
+input_text = st.text_area(
+    "Nhập văn bản:",
+    height=300,
+    max_chars=5000,
+    placeholder="Nhập văn bản của bạn ở đây..."
+)
+if st.button("Phát hiện lỗi"):
+    if input_text.strip():
+        errors = detect_errors(input_text, tokenizer, model)
+        if errors:
+            st.text_area(
+                "Kết quả phát hiện lỗi:",
+                value=", ".join(errors),
+                height=300,
+                disabled=True,
+            )
         else:
+            st.success("Không phát hiện lỗi nào trong văn bản.")
+    else:
+        st.warning("Vui lòng nhập văn bản để kiểm tra.")