File size: 4,545 Bytes
491e087
 
ac7f046
344f958
491e087
5344f77
491e087
344f958
491e087
 
 
 
 
 
 
 
 
ae325aa
491e087
 
 
2704216
 
 
491e087
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5344f77
2704216
 
 
 
 
 
 
 
 
 
 
 
 
 
491e087
 
8196f31
 
491e087
 
8196f31
491e087
 
8196f31
491e087
 
8196f31
491e087
5344f77
8196f31
 
 
a887cae
5344f77
8196f31
 
491e087
344f958
 
491e087
2704216
344f958
a887cae
2704216
 
 
ac7f046
344f958
2704216
 
 
 
344f958
2704216
344f958
2704216
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
import streamlit as st
import pandas as pd
from plms.language_model import TransformersQG
import time
import os
import numpy as np

# Page-level configuration. Streamlit documents that set_page_config must be
# the first Streamlit command executed on a page, so keep it at the top.
st.set_page_config(page_icon='🧪', page_title='ViQAG for Vietnamese Education', layout='centered', initial_sidebar_state="collapsed")

# Inject the project stylesheet. The encoding is given explicitly so decoding
# the file does not depend on the platform's default locale encoding.
with open(r"./static/styles.css", encoding="utf-8") as f:
    st.markdown(f"<style>{f.read()}</style>", unsafe_allow_html=True)

# Logo and title banner rendered as raw HTML.
st.markdown("""
    <div class=logo_area>
        <img src="./app/static/AlphaEdu_logo_trans.png"/>
    </div>
    """, unsafe_allow_html=True)
st.markdown("<h3 style='text-align: center;'>AlphaEdu</h3>", unsafe_allow_html=True)

# =====================================================================================================

# 'output' holds the most recently generated QA text; initialise it once so
# later reads of st.session_state.output never hit a missing key.
if 'output' not in st.session_state:
    st.session_state.output = ''

def file_selector(folder_path=r'./Resources/'):
    """Return the names of the selectable resource files in *folder_path*.

    Only visible regular files are returned, in sorted order. Sub-directories
    and dotfiles (for example ``.DS_Store``) are skipped because every
    returned name is later handed to a CSV reader, and ``os.listdir`` gives
    no ordering guarantee of its own.

    Args:
        folder_path: Directory to scan.

    Returns:
        A sorted list of file names (not full paths).

    Raises:
        OSError: If *folder_path* cannot be listed.
    """
    return sorted(
        name
        for name in os.listdir(folder_path)
        if not name.startswith('.')
        and os.path.isfile(os.path.join(folder_path, name))
    )
# Names found in the default resources folder; used as the subject options below.
filenames = file_selector()

def load_grades(file_name, folder_path=r'./Resources/'):
    """Read one resource CSV and list the distinct grades it contains.

    Args:
        file_name: Name of the CSV file inside *folder_path*.
        folder_path: Directory holding the resource files. A trailing
            separator is optional.

    Returns:
        A tuple ``(list_grades, df)``: the unique values of the ``grade``
        column in first-seen order, and the full DataFrame that was read.

    Raises:
        FileNotFoundError: If the file does not exist.
        KeyError: If the CSV has no ``grade`` column.
    """
    # os.path.join inserts the separator only when it is missing, so both
    # './Resources/' and './Resources' resolve to the same file.
    file_path = os.path.join(folder_path, file_name)
    df = pd.read_csv(file_path)
    list_grades = df['grade'].drop_duplicates().values
    return list_grades, df

def load_chapters(df, grade_name):
    """List the distinct chapters recorded for one grade.

    Args:
        df: DataFrame with at least ``grade`` and ``chapter`` columns.
        grade_name: Grade value to match exactly.

    Returns:
        A tuple ``(list_chapters, df)``: the unique chapter values for the
        grade in first-seen order, and the same, unfiltered *df* passed in.
    """
    in_grade = df['grade'] == grade_name
    chapters = df.loc[in_grade, 'chapter'].drop_duplicates().values
    # The input frame is handed back untouched, not the filtered view.
    return chapters, df

def load_lessons(df, grade_name, chapter_name):
    """List the distinct lessons of one chapter within one grade.

    Args:
        df: DataFrame with ``grade``, ``chapter`` and ``lesson`` columns.
        grade_name: Grade value to match exactly.
        chapter_name: Chapter value to match exactly.

    Returns:
        An array of unique lesson values in first-seen order.
    """
    selector = (df['grade'] == grade_name) & (df['chapter'] == chapter_name)
    lessons = df.loc[selector, 'lesson']
    return lessons.drop_duplicates().values

def load_context(df, grade_name, chapter_name, lesson_name):
    """Collect the context paragraphs stored for one lesson.

    Args:
        df: DataFrame with ``grade``, ``chapter``, ``lesson`` and ``context``
            columns.
        grade_name: Grade value to match exactly.
        chapter_name: Chapter value to match exactly.
        lesson_name: Lesson value to match exactly.

    Returns:
        A tuple ``(count, paragraphs)``: the number of matching rows and an
        array of their ``context`` values in row order (duplicates kept).
    """
    matches = (
        (df['grade'] == grade_name)
        & (df['chapter'] == chapter_name)
        & (df['lesson'] == lesson_name)
    )
    paragraphs = df.loc[matches, 'context'].values
    return len(paragraphs), paragraphs

def generateQA(context, model_path = 'shnl/vit5-vinewsqa-qg-ae'):
    """Generate question/answer pairs for *context* and format them as text.

    A ``TransformersQG`` model is built from *model_path* on every call and
    its ``generate_qa`` result is iterated as ``(question, answer)`` pairs.
    Exact duplicate pairs are dropped, keeping the first occurrence.

    Args:
        context: Passage passed to the model's ``generate_qa``.
        model_path: Model identifier forwarded to ``TransformersQG``.

    Returns:
        One string in which each pair is rendered as
        ``'question: <q> \\nanswer: <a>'`` and followed by a blank line.
    """
    qg_model = TransformersQG(model=model_path, max_length=512)
    seen_pairs = set()
    chunks = []
    for question, answer in qg_model.generate_qa(context):
        pair = (question, answer)
        if pair in seen_pairs:
            continue
        seen_pairs.add(pair)
        chunks.append(f'question: {question} \nanswer: {answer} [SEP] ')
    # Swap each ' [SEP] ' marker for a blank line between (and after) pairs.
    return '\n\n'.join(''.join(chunks).split(' [SEP] '))
    
# =====================================================================================================

def _questions_only(qa_text):
    """Return *qa_text* with every answer removed.

    *qa_text* is expected in the layout produced by ``generateQA``: entries
    separated by a blank line, each of the form
    ``'question: <q> \\nanswer: <a>'``. Fragments that do not start with
    ``'question: '`` (such as the trailing empty entry) are skipped.
    """
    prefix = 'question: '
    questions = []
    for entry in qa_text.split('\n\n'):
        if not entry.startswith(prefix):
            continue
        # Everything from the answer line onwards is dropped.
        question = entry.partition('\nanswer: ')[0][len(prefix):].strip()
        if question:
            questions.append(question)
    return '\n\n'.join(questions)


# --- Sidebar: drill down subject -> grade -> chapter -> lesson -> paragraph.
col_1, col_2 = st.sidebar.columns(spec=[1, 1])
subject = col_1.selectbox(label='Select your subject:', options=filenames, label_visibility='visible')

list_grades, df = load_grades(file_name=subject)
grade = col_2.selectbox(label='Select your grade:', options=list_grades, label_visibility='visible')

list_chapters, df = load_chapters(df=df, grade_name=grade)
chapter = st.sidebar.selectbox(label='Select your chapter:', options=list_chapters, label_visibility='visible')

lesson_names = load_lessons(df=df, grade_name=grade, chapter_name=chapter)
lesson = st.sidebar.selectbox(label='Lesson:', options=lesson_names, label_visibility='visible')

total_paragraph, context_values = load_context(df=df, grade_name=grade, chapter_name=chapter, lesson_name=lesson)

col_12, col_22 = st.sidebar.columns(spec=[4, 6])
# Paragraphs are presented 1-based to the user and converted back on lookup.
paragraph_idx = col_12.selectbox(label='Paragraph:', options=list(np.arange(1, total_paragraph + 1)), label_visibility='visible')

# With no matching paragraph the selectbox yields None; stop here rather
# than failing on `None - 1` below.
if paragraph_idx is None:
    st.warning('No paragraph is available for the current selection.')
    st.stop()

paragraph = st.text_area(label='Paragraph content', label_visibility='visible', height=200, value=context_values[paragraph_idx - 1])

col_22.selectbox(label='QAG model:', options=['ViT5-ViNewsQA'], label_visibility='visible')
btn_show_answer = st.sidebar.toggle(label='Show answers', disabled=False)

# Five equal columns are used only to centre the button in the middle one.
col_14, col_24, col_34, col_44, col_54 = st.columns(spec=[1, 1, 1, 1, 1])
btn_generate = col_34.button(label='Generate', use_container_width=True)

if btn_generate:
    with st.spinner(text='Generating QA pairs from the selected paragraph. Please wait ...'):
        # Kept in session state so the result survives reruns, e.g. when
        # the "Show answers" toggle is flipped.
        st.session_state.output = generateQA(context=paragraph)

# --- Result area: shown only once something has been generated.
if st.session_state.output != '':
    st.markdown("<h8 style='text-align: left; font-weight: normal'>Generated QA pairs:</h8>", unsafe_allow_html=True)
    if btn_show_answer:
        shown_text = st.session_state.output
    else:
        # Hide the answers: keep only the question of each pair.
        shown_text = _questions_only(st.session_state.output)
    st.code(body=shown_text, language='latex')