Spaces:
Sleeping
Sleeping
elibrowne
commited on
Commit
·
22f31fd
1
Parent(s):
2787b29
Structure outline, new toggle functionality
Browse files- app.py +38 -10
- structure.js +35 -0
app.py
CHANGED
@@ -59,6 +59,7 @@ generation = "The strongest argument for the constitutionality of the act is tha
|
|
59 |
gold_passage = "Unlike its original jurisdiction, the appellate jurisdiction of the Supreme Court is subject to “exceptions and regulations” prescribed by Congress, and the jurisdiction of the inferior federal courts is subject to congressional prescription. Additionally, Congress has power to regulate modes and practices of proceeding on the part of the inferior federal courts. Whether there are limitations to the exercise of these congressional powers, and what the limitations may be, are matters that have vexed scholarly and judicial interpretation over the years, inasmuch as congressional displeasure with judicial decisions has sometimes led to successful efforts to “curb” the courts and more frequently to proposed but unsuccessful curbs."
|
60 |
gold_passage_generation = "The strongest argument for the constitutionality of the Congressional act is that Congress has the constitutional authority to regulate federal court jurisdiction and procedures. This includes setting limits on judicial orders. By restricting desegregation plans to only require transportation to the nearest or next nearest school, Congress is exercising its power to define and control how federal courts address such issues, ensuring judicial actions align with legislative priorities and practical concerns."
|
61 |
step = 0
|
|
|
62 |
|
63 |
sample_dict = {
|
64 |
"question": question_text,
|
@@ -77,7 +78,6 @@ theme = gr.themes.Soft(
|
|
77 |
primary_hue="sky",
|
78 |
secondary_hue="sky",
|
79 |
neutral_hue="slate",
|
80 |
-
spacing_size="lg",
|
81 |
font=[gr.themes.GoogleFont('Inter'), 'ui-sans-serif', 'system-ui', 'sans-serif'],
|
82 |
)
|
83 |
|
@@ -87,7 +87,7 @@ user_id = "NO_ID"
|
|
87 |
|
88 |
with gr.Blocks(theme = theme) as user_eval:
|
89 |
# Title text introducing study
|
90 |
-
forward_btn = gr.Textbox("unchanged", visible = False, elem_id = "togglebutton")
|
91 |
gr.HTML("""
|
92 |
<h1> Legal Retriever Evaluation Study </h1>
|
93 |
<p> Score the passages based on the question and provided answer choices. Detailed instructions are found <a href="https://docs.google.com/document/d/1ReODJ0hlXz_M3kE2UG1cwSRVoyDLQo88OvG71Gt8lUQ/edit?usp=sharing" target="_blank">here</a>. </p>
|
@@ -138,6 +138,7 @@ with gr.Blocks(theme = theme) as user_eval:
|
|
138 |
|
139 |
def next_p(eval_1, eval_2, eval_3):
|
140 |
global step
|
|
|
141 |
step += 1
|
142 |
print(eval_1 + eval_2 + eval_3)
|
143 |
if step == len(passage_texts):
|
@@ -162,17 +163,25 @@ with gr.Blocks(theme = theme) as user_eval:
|
|
162 |
|
163 |
def next_g(eval_helps, eval_satisfied):
|
164 |
global step
|
|
|
165 |
step += 1
|
166 |
print(eval_helps + eval_satisfied)
|
167 |
if step == 11:
|
168 |
-
# Step 11: guaranteed
|
169 |
return {
|
170 |
selection: gr.HTML("""
|
171 |
<h2> Autogenerated Response </h2> <br />
|
172 |
""" + generation)
|
173 |
}
|
174 |
# Steps 12 and 13 are gold passage + gold passage generation IF it is applicable
|
175 |
-
if step > 11 and not sample_dict["top10_contains_gold_passage"]:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
176 |
if step == 12:
|
177 |
return {
|
178 |
selection: gr.HTML("""
|
@@ -189,12 +198,19 @@ with gr.Blocks(theme = theme) as user_eval:
|
|
189 |
}
|
190 |
else:
|
191 |
return {
|
192 |
-
selection: gr.Markdown("
|
193 |
forward_btn: gr.Textbox("changed")
|
194 |
}
|
195 |
else:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
196 |
return {
|
197 |
-
selection: gr.Markdown("
|
198 |
forward_btn: gr.Textbox("changed")
|
199 |
}
|
200 |
|
@@ -224,17 +240,29 @@ with gr.Blocks(theme = theme) as user_eval:
|
|
224 |
d.click(fn = answer, outputs = [question, evals])
|
225 |
|
226 |
def toggle():
|
227 |
-
|
228 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
229 |
return {
|
230 |
scores_p: gr.Column(visible = True),
|
231 |
scores_g: gr.Column(visible = False),
|
232 |
evals: gr.Row(visible = False),
|
233 |
question: gr.Row(visible = True),
|
234 |
-
forward_btn: gr.HTML("unchanged")
|
235 |
}
|
236 |
|
237 |
-
forward_btn.change(fn = toggle, inputs = None, outputs = [scores_p, scores_g, evals, question
|
238 |
|
239 |
with gr.Row() as login:
|
240 |
with gr.Column():
|
|
|
59 |
gold_passage = "Unlike its original jurisdiction, the appellate jurisdiction of the Supreme Court is subject to “exceptions and regulations” prescribed by Congress, and the jurisdiction of the inferior federal courts is subject to congressional prescription. Additionally, Congress has power to regulate modes and practices of proceeding on the part of the inferior federal courts. Whether there are limitations to the exercise of these congressional powers, and what the limitations may be, are matters that have vexed scholarly and judicial interpretation over the years, inasmuch as congressional displeasure with judicial decisions has sometimes led to successful efforts to “curb” the courts and more frequently to proposed but unsuccessful curbs."
|
60 |
gold_passage_generation = "The strongest argument for the constitutionality of the Congressional act is that Congress has the constitutional authority to regulate federal court jurisdiction and procedures. This includes setting limits on judicial orders. By restricting desegregation plans to only require transportation to the nearest or next nearest school, Congress is exercising its power to define and control how federal courts address such issues, ensuring judicial actions align with legislative priorities and practical concerns."
|
61 |
step = 0
|
62 |
+
mode = 0
|
63 |
|
64 |
sample_dict = {
|
65 |
"question": question_text,
|
|
|
78 |
primary_hue="sky",
|
79 |
secondary_hue="sky",
|
80 |
neutral_hue="slate",
|
|
|
81 |
font=[gr.themes.GoogleFont('Inter'), 'ui-sans-serif', 'system-ui', 'sans-serif'],
|
82 |
)
|
83 |
|
|
|
87 |
|
88 |
with gr.Blocks(theme = theme) as user_eval:
|
89 |
# Title text introducing study
|
90 |
+
forward_btn = gr.Textbox("unchanged", visible = False, elem_id = "togglebutton") # used for toggling windows
|
91 |
gr.HTML("""
|
92 |
<h1> Legal Retriever Evaluation Study </h1>
|
93 |
<p> Score the passages based on the question and provided answer choices. Detailed instructions are found <a href="https://docs.google.com/document/d/1ReODJ0hlXz_M3kE2UG1cwSRVoyDLQo88OvG71Gt8lUQ/edit?usp=sharing" target="_blank">here</a>. </p>
|
|
|
138 |
|
139 |
def next_p(eval_1, eval_2, eval_3):
|
140 |
global step
|
141 |
+
global mode
|
142 |
step += 1
|
143 |
print(eval_1 + eval_2 + eval_3)
|
144 |
if step == len(passage_texts):
|
|
|
163 |
|
164 |
def next_g(eval_helps, eval_satisfied):
|
165 |
global step
|
166 |
+
global mode
|
167 |
step += 1
|
168 |
print(eval_helps + eval_satisfied)
|
169 |
if step == 11:
|
170 |
+
# Step 11: guaranteed to be generation
|
171 |
return {
|
172 |
selection: gr.HTML("""
|
173 |
<h2> Autogenerated Response </h2> <br />
|
174 |
""" + generation)
|
175 |
}
|
176 |
# Steps 12 and 13 are gold passage + gold passage generation IF it is applicable
|
177 |
+
if step > 11 and not sample_dict["top10_contains_gold_passage"]:
|
178 |
+
# When mode is 0 -> reset with mode = 1
|
179 |
+
if mode == 0:
|
180 |
+
return {
|
181 |
+
selection: gr.HTML("<p> Loading second set... </p>") ,
|
182 |
+
forward_btn: gr.Textbox("load new data")
|
183 |
+
}
|
184 |
+
# When mode is 1 -> display GP and GP generation, then switch
|
185 |
if step == 12:
|
186 |
return {
|
187 |
selection: gr.HTML("""
|
|
|
198 |
}
|
199 |
else:
|
200 |
return {
|
201 |
+
selection: gr.Markdown("Advancing to the next question..."),
|
202 |
forward_btn: gr.Textbox("changed")
|
203 |
}
|
204 |
else:
|
205 |
+
# When mode is 0 -> reset with mode = 1
|
206 |
+
if mode == 0:
|
207 |
+
return {
|
208 |
+
selection: gr.HTML("<p> Loading second set... </p>") ,
|
209 |
+
forward_btn: gr.Textbox("load new data")
|
210 |
+
}
|
211 |
+
# When mode is 1 -> change question
|
212 |
return {
|
213 |
+
selection: gr.Markdown("Advancing to the next question..."),
|
214 |
forward_btn: gr.Textbox("changed")
|
215 |
}
|
216 |
|
|
|
240 |
d.click(fn = answer, outputs = [question, evals])
|
241 |
|
242 |
def toggle():
|
243 |
+
global step
|
244 |
+
global mode
|
245 |
+
step = 0
|
246 |
+
if mode == 0:
|
247 |
+
mode = 1 # update mode to 1, will restart with same Q, next set of Ps
|
248 |
+
print("Next set of passages for same question")
|
249 |
+
return {
|
250 |
+
scores_p: gr.Column(visible = True),
|
251 |
+
scores_g: gr.Column(visible = False),
|
252 |
+
evals: gr.Row(visible = True),
|
253 |
+
question: gr.Row(visible = False),
|
254 |
+
}
|
255 |
+
else:
|
256 |
+
mode = 0 # reset mode to 0, will restart with new Q, first set of Ps
|
257 |
+
print("New question")
|
258 |
return {
|
259 |
scores_p: gr.Column(visible = True),
|
260 |
scores_g: gr.Column(visible = False),
|
261 |
evals: gr.Row(visible = False),
|
262 |
question: gr.Row(visible = True),
|
|
|
263 |
}
|
264 |
|
265 |
+
forward_btn.change(fn = toggle, inputs = None, outputs = [scores_p, scores_g, evals, question])
|
266 |
|
267 |
with gr.Row() as login:
|
268 |
with gr.Column():
|
structure.js
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
// This is how a question will be formatted in JSON. These will be in a dictionary
|
2 |
+
// formatted as {question ID:question data}.
|
3 |
+
var sample_question = {
|
4 |
+
"question": "What is the best explanation for this law?",
|
5 |
+
"answers": ["Option A", "Option B", "Option C", "Option D"],
|
6 |
+
"correct_answer_index": 0,
|
7 |
+
"top10_e5": ["Passage 1 from E5", "Passage 2 from E5", "Passage 3..."],
|
8 |
+
"generation_e5": "This generation is based on the E5 passages.",
|
9 |
+
"top10_colbert": ["Passage 1 from ColBERT", "Passage 2 from Colbert", "..."],
|
10 |
+
"generation_colbert": "This generation is based on the ColBERT passages.",
|
11 |
+
"top10_contains_gold_passage": false, // in either case
|
12 |
+
"gold_passage": "This is the gold passage.",
|
13 |
+
"gold_passage_generation": "This generation answers the question with the gold passage."
|
14 |
+
}
|
15 |
+
|
16 |
+
// Each user response will take this form. A list of these objects will be uploaded.
|
17 |
+
var user_response = {
|
18 |
+
"user_id": "[email protected]", // track who the respondent is
|
19 |
+
"question_id": "ID ###", // track which question they are responding to
|
20 |
+
"e5_scores": [[1, 2.5, 1.5, 3.5], [0, 1, 4, 1.5]], // [is a law, relevance, quality, helpfulness]
|
21 |
+
"colbert_scores": [[1, 3, 3, 3], [1, 5, 4, 5]], // same format as above
|
22 |
+
}
|
23 |
+
|
24 |
+
// One JSON file for each user -> check if the file exists, download if it does; otherwise, create.
|
25 |
+
var user_data = {
|
26 |
+
"user_id": "[email protected]",
|
27 |
+
"order": ["question ID 1", "question ID 2", "...", "question ID 15"], // randomized and different for each user
|
28 |
+
"modes": [["e5", "colbert"], ["colbert", "e5"], ["colbert", "e5"], "..."], // randomized and different for each user
|
29 |
+
"current": 3, // index in "order" that the user has not yet completed (starts at 0) -> this user would log in at 3
|
30 |
+
"responses": [user_response, user_response] // list of user responses in the same order
|
31 |
+
}
|
32 |
+
// When the file exists, download it and make a LOCAL copy. Modify the local copy (e.g. increasing order
|
33 |
+
// and adding responses), and after each question, rewrite the original JSON object with the new data.
|
34 |
+
// To avoid losing data in the case of a bad overwrite, each individual user_response should also be added to
|
35 |
+
// the commit scheduler.
|