|
import html
from datetime import datetime

import gradio as gr
import pandas as pd
from datasets import load_dataset
|
|
|
|
|
# Load the "cases" configuration ("main" split) and hold it as a DataFrame.
ds = load_dataset("harshildarji/openlegaldata", "cases", split="main")
df = pd.DataFrame(ds)


def _court_field(court, field):
    """Return ``court[field]`` when *court* is a dict, otherwise "Unknown".

    A dict that lacks *field* also yields "Unknown".
    """
    if not isinstance(court, dict):
        return "Unknown"
    return court.get(field, "Unknown")


# Flatten the nested ``court`` record into plain columns used for filtering.
df["state"] = df["court"].apply(_court_field, field="state")
df["court_name"] = df["court"].apply(_court_field, field="name")

# Dropdown choices: the "All" sentinel first, then the distinct values sorted.
state_list = ["All", *sorted(df["state"].dropna().unique().tolist())]
court_list = ["All", *sorted(df["court_name"].dropna().unique().tolist())]
|
|
|
|
|
def _parse_date_bound(text, label):
    """Parse a ``YYYY-MM-DD`` filter value into a UTC ``pd.Timestamp``.

    Returns ``None`` when *text* is blank or malformed. A malformed value
    also raises a Gradio warning naming *label*, so the user learns that the
    bound was ignored instead of silently getting unfiltered results.
    """
    cleaned = str(text).strip() if text else ""
    if not cleaned:
        return None
    try:
        parsed = datetime.strptime(cleaned, "%Y-%m-%d")
    except ValueError:
        gr.Warning(f"Ignoring {label}: expected YYYY-MM-DD, got {cleaned!r}.")
        return None
    return pd.Timestamp(parsed, tz="UTC")


def filter_cases(state, court, date_from, date_to):
    """Filter the cases by state, court name, and an inclusive date range.

    Args:
        state: State to keep; a falsy value or "All" disables this filter.
        court: Court name to keep; a falsy value or "All" disables this filter.
        date_from: Lower bound as ``YYYY-MM-DD``; blank or malformed values
            are ignored (malformed ones with a warning).
        date_to: Upper bound as ``YYYY-MM-DD``, inclusive of that whole day;
            blank or malformed values are ignored (malformed ones with a
            warning).

    Returns:
        A DataFrame with the columns ``id``, ``file_number``, ``date``,
        ``court_name`` and ``type`` for the matching cases.
    """
    # Boolean indexing already yields new frames, so no up-front copy of the
    # module-level ``df`` is needed.
    filtered = df
    if state and state != "All":
        filtered = filtered[filtered["state"] == state]
    if court and court != "All":
        filtered = filtered[filtered["court_name"] == court]

    lower = _parse_date_bound(date_from, "From Date")
    upper = _parse_date_bound(date_to, "To Date")
    if lower is not None or upper is not None:
        # Convert the date column once for both bounds. ``errors="coerce"``
        # turns unparseable dates into NaT (excluded from a date-filtered
        # result) and ``utc=True`` makes every value tz-aware so the
        # comparisons below cannot fail on naive/aware mismatches.
        case_dates = pd.to_datetime(filtered["date"], errors="coerce", utc=True)
        in_range = case_dates.notna()
        if lower is not None:
            in_range &= case_dates >= lower
        if upper is not None:
            # Strictly before the next midnight keeps the whole "to" day.
            in_range &= case_dates < upper + pd.Timedelta(days=1)
        filtered = filtered[in_range]

    return filtered[["id", "file_number", "date", "court_name", "type"]]
|
|
|
|
|
# (key in the case record, heading shown to the user), in display order.
_CASE_SECTIONS = (
    ("tenor", "Tenor"),
    ("tatbestand", "Tatbestand"),
    ("gründe", "Gründe"),
    ("entscheidungsgründe", "Entscheidungsgründe"),
)

_SECTION_RULE = '<hr style="margin: 15px 0;">'


def _escape(value):
    """Return *value* as text that is safe to embed in HTML."""
    return html.escape(str(value))


def _section_paragraphs(value):
    """Normalize a section value to a list of paragraphs.

    ``None`` and non-iterable scalars (e.g. NaN) give an empty list, a plain
    string counts as a single paragraph, and any other iterable is expanded
    item by item.
    """
    if value is None:
        return []
    if isinstance(value, str):
        return [value] if value else []
    try:
        return list(value)
    except TypeError:
        return []


def get_case_details(case_id):
    """Return an HTML formatted string with details for a given case id.

    Args:
        case_id: The case identifier; anything ``int()`` accepts.

    Returns:
        An HTML fragment with the case header fields followed by each
        non-empty text section, or a red error paragraph when *case_id* is
        not an integer or no case has that id. All values taken from the
        dataset are HTML-escaped before being embedded.
    """
    try:
        case_id = int(case_id)
    except (TypeError, ValueError):
        return "<p style='color:red;'>Invalid case ID</p>"

    matches = df[df["id"] == case_id]
    if matches.empty:
        return "<p style='color:red;'>Case not found</p>"
    case_data = matches.iloc[0].to_dict()

    # The court record is not guaranteed to be a dict (the derived
    # state/court_name columns guard for the same thing), so fall back to an
    # empty mapping instead of failing on ``.get``.
    court_info = case_data.get("court")
    if not isinstance(court_info, dict):
        court_info = {}

    parts = [
        "<h2>Case Details</h2>",
        f"<p><strong>ID:</strong> {_escape(case_data.get('id'))}</p>",
        f"<p><strong>File Number:</strong> {_escape(case_data.get('file_number'))}</p>",
        f"<p><strong>Date:</strong> {_escape(case_data.get('date'))}</p>",
        f"<p><strong>Court:</strong> {_escape(court_info.get('name', 'N/A'))} ({_escape(court_info.get('state', 'N/A'))})</p>",
        f"<p><strong>Type:</strong> {_escape(case_data.get('type', 'N/A'))}</p>",
        _SECTION_RULE,
    ]

    for key, heading in _CASE_SECTIONS:
        paragraphs = _section_paragraphs(case_data.get(key))
        if not paragraphs:
            continue
        parts.append(f"<h3>{heading}</h3>")
        parts.extend(f"<p>{_escape(paragraph)}</p>" for paragraph in paragraphs)
        parts.append(_SECTION_RULE)

    return "".join(parts)
|
|
|
|
|
|
|
# Build the two-tab Gradio interface: one tab filters the case table, the
# other renders a single case as HTML.
# NOTE(review): the original indentation of this section was lost, so the
# nesting below (which widgets sit inside each gr.Row, and demo.launch()
# being outside the Blocks context) is reconstructed — confirm against the
# intended layout.
with gr.Blocks(title="German Legal Case Viewer", fill_width=True) as demo:
    gr.Markdown("# German Legal Case Viewer")
    gr.Markdown(
        "Explore case information from the processed [Open Legal Data dataset](https://huggingface.co/datasets/harshildarji/openlegaldata)."
    )

    with gr.Tabs():

        # Tab 1: filter controls feeding filter_cases, results shown in a table.
        with gr.Tab("Browse Cases"):
            gr.Markdown("## Filter Cases")
            with gr.Row():
                state_input = gr.Dropdown(
                    choices=state_list, label="State", value="All"
                )
                court_input = gr.Dropdown(
                    choices=court_list, label="Court", value="All"
                )
                date_from_input = gr.Textbox(
                    label="From Date (YYYY-MM-DD)", placeholder="2022-01-01"
                )
                date_to_input = gr.Textbox(
                    label="To Date (YYYY-MM-DD)", placeholder="2022-12-31"
                )
            filter_button = gr.Button("Apply Filters")
            output_table = gr.DataFrame(label="Cases Overview")
            # Input order must match filter_cases(state, court, date_from, date_to).
            filter_button.click(
                fn=filter_cases,
                inputs=[state_input, court_input, date_from_input, date_to_input],
                outputs=output_table,
            )

        # Tab 2: look up one case by id and show get_case_details' HTML.
        with gr.Tab("Case Details"):
            with gr.Row():
                case_id_input = gr.Textbox(
                    label="Enter Case ID", placeholder="e.g., 346915"
                )
                details_button = gr.Button("Get Details")
            case_details_output = gr.HTML(label="Case Details")
            details_button.click(
                fn=get_case_details,
                inputs=case_id_input,
                outputs=case_details_output,
            )

# Launch the interface when the script is run.
demo.launch()
|
|