Spaces:

legaltextai
/

summarizecase

Sleeping

App Files Files Community

legaltextai committed on Jun 4, 2024

Commit

ae8ef07

verified ·

1 Parent(s): b6150e7

Create main.py

Browse files

Files changed (1) hide show

main.py +117 -0

main.py ADDED Viewed

	@@ -0,0 +1,117 @@

+import streamlit as st
+from bs4 import BeautifulSoup
+import requests
+import os
+import anthropic
+from anthropic import Anthropic, HUMAN_PROMPT, AI_PROMPT
+from io import StringIO
+import time
+from io import BytesIO
+anthropic = Anthropic(
+   api_key="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",
+)
+headers = {
+    "User-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/70.0.3538.102 Safari/537.36 Edge/18.19582"
+}
+proxies = {"http": os.getenv("HTTP_PROXY")}
+@st.cache_data(ttl=3600)
+def search_legal_cases(query, num_results=10):
+    url = "https://scholar.google.com/scholar?hl=en&as_sdt=6"
+    headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/93.0.4577.63 Safari/537.3"
+    }
+    params = {
+        "q": query,
+        "hl": "en",
+        "num": num_results,
+        "as_sdt": "4",  # This parameter filters the search results to legal cases
+    }
+    response = requests.get(url, proxies=proxies, headers=headers, params=params)
+    soup = BeautifulSoup(response.text, "html.parser")
+    results = []
+    for result in soup.find_all("div", class_="gs_ri"):
+        title = result.find("h3", class_="gs_rt").text
+        base_url = "https://scholar.google.com"
+        link = base_url + result.find("a")["href"]
+        citation = result.find("div", class_="gs_a").text.replace(" - Google Scholar", "")
+        results.append((title, link, citation))
+    return results
+@st.cache_data(ttl=3600)
+def extract_text_from_link(url):
+    headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/93.0.4577.63 Safari/537.3"
+    }
+    response = requests.get(url, headers=headers, proxies=proxies)
+    soup = BeautifulSoup(response.content, "html.parser")
+    text = soup.get_text(separator="\n")
+    return text
+@st.cache_data(ttl=3600)
+def get_summary(text):
+    prompt = f'''{HUMAN_PROMPT}
+    You are a law professor specialized in legal writing and legal research.
+    Summarize the case in {text} in json format according to the following requirements:
+    Facts (name of the case and its parties, what happened factually).
+    Procedural history (what happened in the past procedurally, what were prior judgements).
+    Issues (what is in dispute).
+    Holding (the applied rule of law).
+    Rationale (reasons for the holding).
+    Decision (what did the court decide, e.g. affirmed, overruled).
+    Other opinions (if there are any dissenting or concurring opinions, summarize majority opinion, dissenting opinion and concurring opinion).
+    Cases cited (which cases the court cited and how it treated them):
+      - 'red flag' means some negative treatment — such as a cited case is being overruled, superseded, or not followed by this court for some reason.
+      - 'yellow flag' means the case has some negative treatment by this court but has not been reversed or overruled. For example, the reasoning of the decision was criticized or its holding was limited to a specific set of facts.
+      - 'blue flag' means the case has been appealed to the U.S. Court of Appeals or the U.S. Supreme Court (excluding appeals originating from agencies).
+   Present the summary in json format.
+    {AI_PROMPT}'''
+    completion = anthropic.completions.create(
+    #model="claude-2",
+    model = "claude-instant-1.2",
+    max_tokens_to_sample=2000,
+    prompt=prompt,
+)
+    response = completion.completion
+    return response
+search_query = st.text_input("case name, e.g. brown v board supreme, 372 US 335, google v oracle appeal")
+if search_query:
+    with st.spinner("Searching for cases..."):
+        results = search_legal_cases(search_query)
+    if results:
+        title, link, citation = results[0]
+        st.write("Title:\n", title)
+        #st.write("Link:\n", link)
+        st.write("Citation:\n", citation)
+        with st.spinner("Extracting text from case..."):
+            text = extract_text_from_link(link)
+        #st.write(text)
+    else:
+        st.write("No results found.")
+if search_query:
+    with st.spinner("Generating summary..."):
+        summary = get_summary(text)
+    st.write(summary)
+    # Convert the response to a file-like object for download
+    download_bytes = BytesIO(summary.encode())
+    st.download_button("Download the results", download_bytes, "summary.txt", "text/plain")