Spaces:
Running
Running
File size: 2,387 Bytes
a578005 80f304b a578005 49e4d23 a578005 88424d7 a578005 80f304b 00b5c9c 4c36da8 a578005 2f36d79 a578005 80f304b a578005 b610e6b 49e4d23 a578005 88424d7 a578005 88424d7 80f304b a578005 88424d7 00b5c9c 80f304b 9ad151d 88424d7 80f304b 88424d7 80f304b 88424d7 80f304b 88424d7 4c36da8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 |
import pandas as pd
import streamlit as st
import re
import os
# --- Page setup -------------------------------------------------------------
# Page configuration and the centered heading for the dataset checker.
st.set_page_config(page_icon='🍃', page_title='MRC for Legal Document Dataset checker', layout='wide', initial_sidebar_state="collapsed")
st.markdown("<h2 style='text-align: center;'>Investigation Legal Dataset checker for Machine Reading Comprehension</h2>", unsafe_allow_html=True)

# The CSV is re-read on every script run; the code below reads the
# 'context', 'question' and 'answer' columns from it.
df = pd.read_csv(filepath_or_buffer='./Legal_AbstractiveA.csv')

# `idx` is the zero-based row of the sample currently shown. It lives in
# session state so it survives the reruns triggered by widget interaction.
if 'idx' not in st.session_state:
    st.session_state.idx = 0
# Clamp the stored index into the valid row range. Without this, a stale or
# overshot index (e.g. the CSV has fewer rows than on a previous run) makes
# the row lookups further down raise on every rerun. For an empty dataset
# the index settles at 0.
st.session_state.idx = max(0, min(st.session_state.idx, len(df) - 1))

st.markdown(f"<h4 style='text-align: center;'>Sample {st.session_state.idx + 1}/{len(df)}</h4>", unsafe_allow_html=True)

root_folder = './'
# Get the list of directories and files in the root folder.
# NOTE(review): `contents` is never rendered or otherwise used in the visible
# code; this looks like a debugging leftover — confirm before removing.
contents = os.listdir(root_folder)
# Show the heading.
st.title("Danh sách thư mục và tập tin trong thư mục gốc")

# Ten equal-width columns; only the first three hold buttons in the code
# visible here, the rest act as spacing to keep the buttons narrow.
col_1, col_2, col_3, col_4, col_5, col_6, col_7, col_8, col_9, col_10 = st.columns([1] * 10)
btn_previous = col_1.button(label=':arrow_backward: Previous sample', use_container_width=True)
btn_next = col_2.button(label='Next sample :arrow_forward:', use_container_width=True)
btn_save = col_3.button(label=':heavy_check_mark: Save change', use_container_width=True)
# --- Sample editor ----------------------------------------------------------
# Show the current sample in three editable text areas and, below them, the
# context with every occurrence of the answer highlighted.
if len(df) != 0:
    txt_context = st.text_area(height=300, label='Your context:', value=df['context'][st.session_state.idx])
    txt_question = st.text_area(height=100, label='Your question:', value=df['question'][st.session_state.idx])
    txt_answer = st.text_area(height=100, label='Your answer:', value=df['answer'][st.session_state.idx])

    # Skip highlighting when either field is blank: an empty pattern would
    # match between every character of the context.
    if txt_answer.strip() and txt_context.strip():
        # Use a callable replacement rather than a replacement string.
        # A replacement string has its backslashes interpreted by `re.sub`
        # (group references / escapes), so an answer containing a backslash
        # would raise or produce wrong output. Wrapping `match.group(0)` also
        # keeps the context's own casing instead of overwriting it with the
        # answer's casing under IGNORECASE.
        highlighted_context = re.sub(
            re.escape(txt_answer),
            lambda match: "<mark>" + match.group(0) + "</mark>",
            txt_context,
            flags=re.IGNORECASE,
        )
        # NOTE(review): the context is rendered with raw HTML enabled, so any
        # markup stored in the CSV is interpreted by the browser.
        st.markdown(highlighted_context, unsafe_allow_html=True)
# --- Navigation -------------------------------------------------------------
# Move to the neighbouring sample and rerun the script so the page is redrawn
# for the new index. At either end of the dataset the click is ignored.
if btn_previous and st.session_state.idx > 0:
    st.session_state.idx -= 1
    st.rerun()

# Strictly less than the last valid row: with `<=` the index could advance
# from the last row to len(df), which is out of range for the row lookups.
if btn_next and st.session_state.idx < len(df) - 1:
    st.session_state.idx += 1
    st.rerun()
# --- Save -------------------------------------------------------------------
# Write the edited text areas back into the current row and persist the whole
# dataset to the CSV it was loaded from. The text-area values only exist when
# the dataset is non-empty, hence the extra guard.
if btn_save and len(df) != 0:
    current_row = st.session_state.idx
    # Single `.loc` assignment instead of chained `df[col][row] = ...`:
    # chained assignment may write to a temporary object (and never updates
    # the frame under pandas Copy-on-Write), silently dropping the edit.
    df.loc[current_row, 'context'] = txt_context
    df.loc[current_row, 'question'] = txt_question
    df.loc[current_row, 'answer'] = txt_answer
    # The row index is not written, so the file keeps its original columns.
    df.to_csv(path_or_buf='./Legal_AbstractiveA.csv', index=False)