Spaces:

350016z
/

TranslationError_Gradio

Sleeping

App Files Files Community

350016z committed on Feb 14

Commit

77fceba

verified ·

1 Parent(s): 06d8d2d

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -20

app.py CHANGED Viewed

@@ -69,7 +69,6 @@ data = pd.read_csv(data_path, dtype={"id": "Int64"}) # 確保 id 為標準 Pytho
 current_index = 0
 current_errors = []
-current_others = []
 annotations_file = DATASET_DIR / f"test-{uuid4()}.json"
 # ---------------------------------------------------------------------------------------------------------------------
@@ -96,9 +95,6 @@ def save_to_json(entry: dict, json_file: Path):
 def save_current(source, target, rater_selector, error_span, category, subcategory, severity, other):
     global current_index, data, current_errors
-    if category == "No-error":
-        return "", "無錯誤，不需要保存錯誤區間。"
     system = data.loc[current_index, "system"]
     lp = data.loc[current_index, "lp"]
@@ -106,10 +102,10 @@ def save_current(source, target, rater_selector, error_span, category, subcatego
     id = int(data.loc[current_index, "id"])
     reference = data.loc[current_index, "reference"]
-    if category != "Non-translation":
-        category_value = f"{category}/{subcategory}"
-    else:
-        category_value = category
     if error_span and error_span in target:
         start = target.find(error_span)
@@ -123,11 +119,7 @@ def save_current(source, target, rater_selector, error_span, category, subcatego
         "severity": severity.lower(),
         "start": start,
         "end": end
-    })
-    current_others.append({
         "category": category_value,
-        "others": other if other else "",
     })
     # [error_span, status]
@@ -135,7 +127,7 @@ def save_current(source, target, rater_selector, error_span, category, subcatego
 def save_and_next(source, target, score, rater_selector):
-    global current_index, data, annotations_file, current_errors, current_others
     system = data.loc[current_index, "system"]
     lp = data.loc[current_index, "lp"]
@@ -152,15 +144,13 @@ def save_and_next(source, target, score, rater_selector):
         "src": source,
         "mt": target,
         "ref": reference,
-        "sentence_score": score,
-        "errors": current_errors,
-        "others": current_others,
     }
     save_to_json(annotations_entry, annotations_file)
     # 清空當前錯誤緩存
     current_errors = []
-    current_others = []
     current_index += 1
     if current_index >= len(data):
@@ -195,16 +185,29 @@ def update_index_selection(selected_index):
     return get_current_text() + (str(selected_index), f"已跳轉至 id: {selected_index}")
 categories = {
-    "No-error": [],
     "Accuracy": ["Mistranslation", "Addition", "Omission", "Other"],
     "Fluency": ["Grammar", "Spelling", "Punctuation", "Inconsistency", "Register", "Other"],
     "Terminology": ["Inappropriate", "Inconsistent", "Other"],
     "Style": ["Awkward", "Other"],
     "Locale": ["Currency format", "Time format", "Name format", "Date format", "Address format", "Other"],
-    "Non-translation": []
 }
 rater = ['rater1', 'rater2','rater3', 'rater4', 'rater5', 'rater6', 'rater7']
 DEMO_EXPLANATION = """
 ## 翻譯標記工具
 ### 使用規則 [更多細節](https://huggingface.co/spaces/350016z/TranslationError_Gradio/blob/main/README.md)
@@ -221,9 +224,19 @@ DEMO_EXPLANATION = """
         - 33：保留部分原文意思，但有明顯遺漏，敘述難以理解，文法可能很差。
         - 66：保留大部分原文意思，有一些文法錯誤或輕微不一致。
         - 100：原文意思和文法完全正確。
 """
-with gr.Blocks() as demo:
     gr.Markdown(DEMO_EXPLANATION)
     with gr.Tab("標記工具"):
@@ -241,6 +254,9 @@ with gr.Blocks() as demo:
         with gr.Row(variant='panel', equal_height=True):
             with gr.Column(scale=1):
                 error_span = gr.Textbox(label="錯誤區間 (💡可以直接複製「翻譯文本」欄位，並在此貼上)", lines=6, placeholder="請輸入翻譯中文本的錯誤區間 (如無錯誤則不需)")
             with gr.Column(scale=1):
                 with gr.Row(equal_height=True):
                     category = gr.Dropdown(label="錯誤類別", choices=list(categories.keys()), value="No-error")
@@ -269,6 +285,10 @@ with gr.Blocks() as demo:
         file_selector.change(update_file_selection, inputs=[file_selector], outputs=[source, target, error_span, index_selector, current_index_display, status])
         index_selector.change(update_index_selection, inputs=[index_selector], outputs=[source, target, current_index_display, status])
         category.change(update_subcategories, inputs=[category], outputs=[subcategory])
         save_current_button.click(save_current, inputs=[source, target, rater_selector, error_span, category, subcategory, severity, other], outputs=[error_span, status])
         save_next_button.click(save_and_next, inputs=[source, target, score, rater_selector], outputs=[source, target, error_span, current_index_display, status])

 current_index = 0
 current_errors = []
 annotations_file = DATASET_DIR / f"test-{uuid4()}.json"
 # ---------------------------------------------------------------------------------------------------------------------
 def save_current(source, target, rater_selector, error_span, category, subcategory, severity, other):
     global current_index, data, current_errors
     system = data.loc[current_index, "system"]
     lp = data.loc[current_index, "lp"]
     id = int(data.loc[current_index, "id"])
     reference = data.loc[current_index, "reference"]
+    if subcategory:
+        category_value = f"{category}/{subcategory}"
+    else if other:
+        category_value = f"{category}/{other}"
     if error_span and error_span in target:
         start = target.find(error_span)
         "severity": severity.lower(),
         "start": start,
         "end": end
         "category": category_value,
     })
     # [error_span, status]
 def save_and_next(source, target, score, rater_selector):
+    global current_index, data, annotations_file, current_errors
     system = data.loc[current_index, "system"]
     lp = data.loc[current_index, "lp"]
         "src": source,
         "mt": target,
         "ref": reference,
+        "esa_score": score,
+        "esa_spans": current_errors,
     }
     save_to_json(annotations_entry, annotations_file)
     # 清空當前錯誤緩存
     current_errors = []
     current_index += 1
     if current_index >= len(data):
     return get_current_text() + (str(selected_index), f"已跳轉至 id: {selected_index}")
 # Error taxonomy: maps each top-level error category to its list of
 # subcategories. The keys of this dict are used as the choices of the
 # category dropdown.
 # NOTE(review): the category dropdown is created with value="No-error",
 # which is not a key of this dict — confirm the intended default value.
 categories = {
     "Accuracy": ["Mistranslation", "Addition", "Omission", "Other"],
     "Fluency": ["Grammar", "Spelling", "Punctuation", "Inconsistency", "Register", "Other"],
     "Terminology": ["Inappropriate", "Inconsistent", "Other"],
     "Style": ["Awkward", "Other"],
     "Locale": ["Currency format", "Time format", "Name format", "Date format", "Address format", "Other"],
 }
 # Severity labels for an error span; where they are consumed is not visible
 # in this excerpt (presumably the severity input widget — TODO confirm).
+severity_choices = ["Minor", "Major"]
 # Rater identifiers; presumably the options offered by rater_selector —
 # TODO confirm against the widget definition.
 rater = ['rater1', 'rater2','rater3', 'rater4', 'rater5', 'rater6', 'rater7']
+def mark_as_correct():
     # Click handler for correct_button. It records nothing: it only returns
     # an empty string and a confirmation message, which the click wiring
     # sends to the error_span and status outputs respectively.
+    return "", "標註為完全正確，無錯誤！"
+def mark_as_too_many_errors():
     # Click handler for too_many_errors_button. Appends one placeholder entry
     # to the module-level current_errors list: empty text, a zero-length span
     # (start == end == 0), severity "major" and category "Non-translation".
     # Returns an empty string and a confirmation message, which the click
     # wiring sends to the error_span and status outputs respectively.
     # NOTE(review): nothing here guards against repeated clicks, so each
     # click appends another identical entry — confirm this is acceptable.
+    global current_errors
+    current_errors.append({
+        "text": "",
+        "severity": "major",
+        "start": 0,
+        "end": 0,
+        "category": "Non-translation"
+    })
+    return "", "已標註為過多錯誤！"
 DEMO_EXPLANATION = """
 ## 翻譯標記工具
 ### 使用規則 [更多細節](https://huggingface.co/spaces/350016z/TranslationError_Gradio/blob/main/README.md)
         - 33：保留部分原文意思，但有明顯遺漏，敘述難以理解，文法可能很差。
         - 66：保留大部分原文意思，有一些文法錯誤或輕微不一致。
         - 100：原文意思和文法完全正確。
+        (即使選擇 **No-error(沒有錯誤)**，分數也不一定需要評100分)
 """
+with gr.Blocks(css="""
+    #correct_button {
+        background-color: #4CAF50;
+        color: white;
+    }
+    #too_many_errors_button {
+        background-color: #f44336;
+        color: white;
+    }
+""") as demo:
     gr.Markdown(DEMO_EXPLANATION)
     with gr.Tab("標記工具"):
         with gr.Row(variant='panel', equal_height=True):
             with gr.Column(scale=1):
                 error_span = gr.Textbox(label="錯誤區間 (💡可以直接複製「翻譯文本」欄位，並在此貼上)", lines=6, placeholder="請輸入翻譯中文本的錯誤區間 (如無錯誤則不需)")
+            with gr.Column(scale=1):
+                correct_button = gr.Button("✔ 完全正確", elem_id="correct_button")
+                too_many_errors_button = gr.Button("✖ 過多錯誤", elem_id="too_many_errors_button")
             with gr.Column(scale=1):
                 with gr.Row(equal_height=True):
                     category = gr.Dropdown(label="錯誤類別", choices=list(categories.keys()), value="No-error")
         file_selector.change(update_file_selection, inputs=[file_selector], outputs=[source, target, error_span, index_selector, current_index_display, status])
         index_selector.change(update_index_selection, inputs=[index_selector], outputs=[source, target, current_index_display, status])
         category.change(update_subcategories, inputs=[category], outputs=[subcategory])
+        correct_button.click(mark_as_correct, outputs=[error_span, status])
+        too_many_errors_button.click(mark_as_too_many_errors, outputs=[error_span, status])
         save_current_button.click(save_current, inputs=[source, target, rater_selector, error_span, category, subcategory, severity, other], outputs=[error_span, status])
         save_next_button.click(save_and_next, inputs=[source, target, score, rater_selector], outputs=[source, target, error_span, current_index_display, status])