elibrowne commited on
Commit
22f31fd
·
1 Parent(s): 2787b29

Structure outline, new toggle functionality

Browse files
Files changed (2) hide show
  1. app.py +38 -10
  2. structure.js +35 -0
app.py CHANGED
@@ -59,6 +59,7 @@ generation = "The strongest argument for the constitutionality of the act is tha
59
  gold_passage = "Unlike its original jurisdiction, the appellate jurisdiction of the Supreme Court is subject to “exceptions and regulations” prescribed by Congress, and the jurisdiction of the inferior federal courts is subject to congressional prescription. Additionally, Congress has power to regulate modes and practices of proceeding on the part of the inferior federal courts. Whether there are limitations to the exercise of these congressional powers, and what the limitations may be, are matters that have vexed scholarly and judicial interpretation over the years, inasmuch as congressional displeasure with judicial decisions has sometimes led to successful efforts to “curb” the courts and more frequently to proposed but unsuccessful curbs."
60
  gold_passage_generation = "The strongest argument for the constitutionality of the Congressional act is that Congress has the constitutional authority to regulate federal court jurisdiction and procedures. This includes setting limits on judicial orders. By restricting desegregation plans to only require transportation to the nearest or next nearest school, Congress is exercising its power to define and control how federal courts address such issues, ensuring judicial actions align with legislative priorities and practical concerns."
61
  step = 0
 
62
 
63
  sample_dict = {
64
  "question": question_text,
@@ -77,7 +78,6 @@ theme = gr.themes.Soft(
77
  primary_hue="sky",
78
  secondary_hue="sky",
79
  neutral_hue="slate",
80
- spacing_size="lg",
81
  font=[gr.themes.GoogleFont('Inter'), 'ui-sans-serif', 'system-ui', 'sans-serif'],
82
  )
83
 
@@ -87,7 +87,7 @@ user_id = "NO_ID"
87
 
88
  with gr.Blocks(theme = theme) as user_eval:
89
  # Title text introducing study
90
- forward_btn = gr.Textbox("unchanged", visible = False, elem_id = "togglebutton")
91
  gr.HTML("""
92
  <h1> Legal Retriever Evaluation Study </h1>
93
  <p> Score the passages based on the question and provided answer choices. Detailed instructions are found <a href="https://docs.google.com/document/d/1ReODJ0hlXz_M3kE2UG1cwSRVoyDLQo88OvG71Gt8lUQ/edit?usp=sharing" target="_blank">here</a>. </p>
@@ -138,6 +138,7 @@ with gr.Blocks(theme = theme) as user_eval:
138
 
139
  def next_p(eval_1, eval_2, eval_3):
140
  global step
 
141
  step += 1
142
  print(eval_1 + eval_2 + eval_3)
143
  if step == len(passage_texts):
@@ -162,17 +163,25 @@ with gr.Blocks(theme = theme) as user_eval:
162
 
163
  def next_g(eval_helps, eval_satisfied):
164
  global step
 
165
  step += 1
166
  print(eval_helps + eval_satisfied)
167
  if step == 11:
168
- # Step 11: guaranteed summary
169
  return {
170
  selection: gr.HTML("""
171
  <h2> Autogenerated Response </h2> <br />
172
  """ + generation)
173
  }
174
  # Steps 12 and 13 are gold passage + gold passage generation IF it is applicable
175
- if step > 11 and not sample_dict["top10_contains_gold_passage"]:
 
 
 
 
 
 
 
176
  if step == 12:
177
  return {
178
  selection: gr.HTML("""
@@ -189,12 +198,19 @@ with gr.Blocks(theme = theme) as user_eval:
189
  }
190
  else:
191
  return {
192
- selection: gr.Markdown("Click the button to advance to the next question."),
193
  forward_btn: gr.Textbox("changed")
194
  }
195
  else:
 
 
 
 
 
 
 
196
  return {
197
- selection: gr.Markdown("Click the button to advance to the next question."),
198
  forward_btn: gr.Textbox("changed")
199
  }
200
 
@@ -224,17 +240,29 @@ with gr.Blocks(theme = theme) as user_eval:
224
  d.click(fn = answer, outputs = [question, evals])
225
 
226
  def toggle():
227
- global step
228
- step = 0
 
 
 
 
 
 
 
 
 
 
 
 
 
229
  return {
230
  scores_p: gr.Column(visible = True),
231
  scores_g: gr.Column(visible = False),
232
  evals: gr.Row(visible = False),
233
  question: gr.Row(visible = True),
234
- forward_btn: gr.HTML("unchanged")
235
  }
236
 
237
- forward_btn.change(fn = toggle, inputs = None, outputs = [scores_p, scores_g, evals, question, forward_btn])
238
 
239
  with gr.Row() as login:
240
  with gr.Column():
 
59
  gold_passage = "Unlike its original jurisdiction, the appellate jurisdiction of the Supreme Court is subject to “exceptions and regulations” prescribed by Congress, and the jurisdiction of the inferior federal courts is subject to congressional prescription. Additionally, Congress has power to regulate modes and practices of proceeding on the part of the inferior federal courts. Whether there are limitations to the exercise of these congressional powers, and what the limitations may be, are matters that have vexed scholarly and judicial interpretation over the years, inasmuch as congressional displeasure with judicial decisions has sometimes led to successful efforts to “curb” the courts and more frequently to proposed but unsuccessful curbs."
60
  gold_passage_generation = "The strongest argument for the constitutionality of the Congressional act is that Congress has the constitutional authority to regulate federal court jurisdiction and procedures. This includes setting limits on judicial orders. By restricting desegregation plans to only require transportation to the nearest or next nearest school, Congress is exercising its power to define and control how federal courts address such issues, ensuring judicial actions align with legislative priorities and practical concerns."
61
  step = 0
62
+ mode = 0
63
 
64
  sample_dict = {
65
  "question": question_text,
 
78
  primary_hue="sky",
79
  secondary_hue="sky",
80
  neutral_hue="slate",
 
81
  font=[gr.themes.GoogleFont('Inter'), 'ui-sans-serif', 'system-ui', 'sans-serif'],
82
  )
83
 
 
87
 
88
  with gr.Blocks(theme = theme) as user_eval:
89
  # Title text introducing study
90
+ forward_btn = gr.Textbox("unchanged", visible = False, elem_id = "togglebutton") # used for toggling windows
91
  gr.HTML("""
92
  <h1> Legal Retriever Evaluation Study </h1>
93
  <p> Score the passages based on the question and provided answer choices. Detailed instructions are found <a href="https://docs.google.com/document/d/1ReODJ0hlXz_M3kE2UG1cwSRVoyDLQo88OvG71Gt8lUQ/edit?usp=sharing" target="_blank">here</a>. </p>
 
138
 
139
  def next_p(eval_1, eval_2, eval_3):
140
  global step
141
+ global mode
142
  step += 1
143
  print(eval_1 + eval_2 + eval_3)
144
  if step == len(passage_texts):
 
163
 
164
  def next_g(eval_helps, eval_satisfied):
165
  global step
166
+ global mode
167
  step += 1
168
  print(eval_helps + eval_satisfied)
169
  if step == 11:
170
+ # Step 11: guaranteed to be generation
171
  return {
172
  selection: gr.HTML("""
173
  <h2> Autogenerated Response </h2> <br />
174
  """ + generation)
175
  }
176
  # Steps 12 and 13 are gold passage + gold passage generation IF it is applicable
177
+ if step > 11 and not sample_dict["top10_contains_gold_passage"]:
178
+ # When mode is 0 -> reset with mode = 1
179
+ if mode == 0:
180
+ return {
181
+ selection: gr.HTML("<p> Loading second set... </p>") ,
182
+ forward_btn: gr.Textbox("load new data")
183
+ }
184
+ # When mode is 1 -> display GP and GP generation, then switch
185
  if step == 12:
186
  return {
187
  selection: gr.HTML("""
 
198
  }
199
  else:
200
  return {
201
+ selection: gr.Markdown("Advancing to the next question..."),
202
  forward_btn: gr.Textbox("changed")
203
  }
204
  else:
205
+ # When mode is 0 -> reset with mode = 1
206
+ if mode == 0:
207
+ return {
208
+ selection: gr.HTML("<p> Loading second set... </p>") ,
209
+ forward_btn: gr.Textbox("load new data")
210
+ }
211
+ # When mode is 1 -> change question
212
  return {
213
+ selection: gr.Markdown("Advancing to the next question..."),
214
  forward_btn: gr.Textbox("changed")
215
  }
216
 
 
240
  d.click(fn = answer, outputs = [question, evals])
241
 
242
  def toggle():
243
+ global step
244
+ global mode
245
+ step = 0
246
+ if mode == 0:
247
+ mode = 1 # update mode to 1, will restart with same Q, next set of Ps
248
+ print("Next set of passages for same question")
249
+ return {
250
+ scores_p: gr.Column(visible = True),
251
+ scores_g: gr.Column(visible = False),
252
+ evals: gr.Row(visible = True),
253
+ question: gr.Row(visible = False),
254
+ }
255
+ else:
256
+ mode = 0 # reset mode to 0, will restart with new Q, first set of Ps
257
+ print("New question")
258
  return {
259
  scores_p: gr.Column(visible = True),
260
  scores_g: gr.Column(visible = False),
261
  evals: gr.Row(visible = False),
262
  question: gr.Row(visible = True),
 
263
  }
264
 
265
+ forward_btn.change(fn = toggle, inputs = None, outputs = [scores_p, scores_g, evals, question])
266
 
267
  with gr.Row() as login:
268
  with gr.Column():
structure.js ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // This is how a question will be formatted in JSON. These will be in a dictionary
2
+ // formatted as {question ID:question data}.
3
+ var sample_question = {
4
+ "question": "What is the best explanation for this law?",
5
+ "answers": ["Option A", "Option B", "Option C", "Option D"],
6
+ "correct_answer_index": 0,
7
+ "top10_e5": ["Passage 1 from E5", "Passage 2 from E5", "Passage 3..."],
8
+ "generation_e5": "This generation is based on the E5 passages.",
9
+ "top10_colbert": ["Passage 1 from ColBERT", "Passage 2 from Colbert", "..."],
10
+ "generation_colbert": "This generation is based on the ColBERT passages.",
11
+ "top10_contains_gold_passage": false, // in either case
12
+ "gold_passage": "This is the gold passage.",
13
+ "gold_passage_generation": "This generation answers the question with the gold passage."
14
+ }
15
+
16
+ // Each user response will take this form. A list of these objects will be uploaded.
17
+ var user_response = {
18
+ "user_id": "[email protected]", // track who the respondent is
19
+ "question_id": "ID ###", // track which question they are responding to
20
+ "e5_scores": [[1, 2.5, 1.5, 3.5], [0, 1, 4, 1.5]], // [is a law, relevance, quality, helpfulness]
21
+ "colbert_scores": [[1, 3, 3, 3], [1, 5, 4, 5]], // same format as above
22
+ }
23
+
24
+ // One JSON file for each user -> check if the file exists, download if it does; otherwise, create.
25
+ var user_data = {
26
+ "user_id": "[email protected]",
27
+ "order": ["question ID 1", "question ID 2", "...", "question ID 15"], // randomized and different for each user
28
+ "modes": [["e5", "colbert"], ["colbert", "e5"], ["colbert", "e5"], "..."], // randomized and different for each user
29
+ "current": 3, // index in "order" that the user has not yet completed (starts at 0) -> this user would log in at 3
30
+ "responses": [user_response, user_response] // list of user responses in the same order
31
+ }
32
+ // When the file exists, download it and make a LOCAL copy. Modify the local copy (e.g. increasing order
33
+ // and adding responses), and after each question, rewrite the original JSON object with the new data.
34
+ // To avoid losing data in the case of a bad overwrite, each individual user_response should also be added to
35
+ // the commit scheduler.