Spaces:
Sleeping
Sleeping
File size: 2,313 Bytes
a578005 80f304b a578005 88424d7 a578005 80f304b 00b5c9c 4c36da8 a578005 2f36d79 a578005 80f304b a578005 88424d7 a578005 88424d7 80f304b a578005 88424d7 00b5c9c 80f304b 9ad151d 88424d7 80f304b 88424d7 80f304b 88424d7 80f304b 080d2e8 4c36da8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 |
import pandas as pd
import streamlit as st
import re
st.set_page_config(page_icon='🍃', page_title='MRC for Legal Document Dataset checker', layout='wide', initial_sidebar_state="collapsed")
st.markdown("<h2 style='text-align: center;'>Investigation Legal Dataset checker for Machine Reading Comprehension</h2>", unsafe_allow_html=True)
df = pd.read_csv(filepath_or_buffer='./Legal_AbstractiveA.csv')
if 'idx' not in st.session_state:
st.session_state.idx = 0
st.markdown(f"<h4 style='text-align: center;'>Sample {st.session_state.idx + 1}/{len(df)}</h4>", unsafe_allow_html=True)
col_1, col_2, col_3, col_4, col_5, col_6, col_7, col_8, col_9, col_10 = st.columns([1, 1, 1, 1, 1, 1, 1, 1, 1, 1])
btn_previous = col_1.button(label=':arrow_backward: Previous sample', use_container_width=True)
btn_next = col_2.button(label='Next sample :arrow_forward:', use_container_width=True)
btn_save = col_3.button(label=':heavy_check_mark: Save change', use_container_width=True)
if len(df) != 0:
txt_context = st.text_area(height=300, label='Your context:', value=df['context'][st.session_state.idx])
txt_question = st.text_area(height=100, label='Your question:', value=df['question'][st.session_state.idx])
txt_answer = st.text_area(height=100, label='Your answer:', value=df['answer'][st.session_state.idx])
if txt_answer.strip() and txt_context.strip():
highlighted_context = re.sub(re.escape(txt_answer), "<mark>" + txt_answer + "</mark>", txt_context, flags=re.IGNORECASE)
st.markdown(highlighted_context, unsafe_allow_html=True)
if btn_previous:
if st.session_state.idx > 0:
st.session_state.idx -= 1
st.rerun()
else:
pass
if btn_next:
if st.session_state.idx <= (len(df) - 1):
st.session_state.idx += 1
st.rerun()
else:
pass
if btn_save:
df['context'][st.session_state.idx] = txt_context
df['question'][st.session_state.idx] = txt_question
df['answer'][st.session_state.idx] = txt_answer
btn_download = col_4.download_button(data=df, label=':arrow_down_small: Download file', use_container_width=True, file_name="checked.csv", mime="text/csv")
df.to_csv(path_or_buf='./Legal_AbstractiveA.csv', index=None) |