Spaces:

Cheselle
/

AIE4-Demo

Runtime error

App Files Files Community

Cheselle committed on Oct 8, 2024

Commit

43f37ba

verified ·

1 Parent(s): e0a8eac

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -8

app.py CHANGED Viewed

@@ -42,15 +42,19 @@ HF_TOKEN = os.environ["HF_TOKEN"]
 """
 ### 1. CREATE TEXT LOADER AND LOAD DOCUMENTS
 ### NOTE: PAY ATTENTION TO THE PATH THEY ARE IN.
-text_loader =
-documents =
 ### 2. CREATE TEXT SPLITTER AND SPLIT DOCUMENTS
-text_splitter =
-split_documents =
 ### 3. LOAD HUGGINGFACE EMBEDDINGS
-hf_embeddings =
 async def add_documents_async(vectorstore, documents):
     await vectorstore.aadd_documents(documents)
@@ -110,17 +114,39 @@ hf_retriever = asyncio.run(run())
 2. Create a Prompt Template from the String Template
 """
 ### 1. DEFINE STRING TEMPLATE
-RAG_PROMPT_TEMPLATE =
 ### 2. CREATE PROMPT TEMPLATE
-rag_prompt =
 # -- GENERATION -- #
 """
 1. Create a HuggingFaceEndpoint for the LLM
 """
 ### 1. CREATE HUGGINGFACE ENDPOINT FOR LLM
-hf_llm =
 @cl.author_rename
 def rename(original_author: str):

 """
 ### 1. CREATE TEXT LOADER AND LOAD DOCUMENTS
 ### NOTE: PAY ATTENTION TO THE PATH THEY ARE IN.
+text_loader = TextLoader("./paul-graham-to-kindle/paul_graham_essays.txt")
+documents = text_loader.load()
 ### 2. CREATE TEXT SPLITTER AND SPLIT DOCUMENTS
+text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=30)
+split_documents = text_splitter.split_documents(documents)
 ### 3. LOAD HUGGINGFACE EMBEDDINGS
+hf_embeddings = HuggingFaceEndpointEmbeddings(
+    model=YOUR_EMBED_MODEL_URL,
+    task="feature-extraction",
+    huggingfacehub_api_token=os.environ["HF_TOKEN"],
+)
 async def add_documents_async(vectorstore, documents):
     await vectorstore.aadd_documents(documents)
 2. Create a Prompt Template from the String Template
 """
 ### 1. DEFINE STRING TEMPLATE
+RAG_PROMPT_TEMPLATE = """\
+<|start_header_id|>system<|end_header_id|>
+You are a helpful assistant. You answer user questions based on provided context. If you can't answer the question with the provided context, say you don't know.<|eot_id|>
+<|start_header_id|>user<|end_header_id|>
+User Query:
+{query}
+Context:
+{context}<|eot_id|>
+<|start_header_id|>assistant<|end_header_id|>
+"""
 ### 2. CREATE PROMPT TEMPLATE
+rag_prompt = PromptTemplate.from_template(RAG_PROMPT_TEMPLATE)
 # -- GENERATION -- #
 """
 1. Create a HuggingFaceEndpoint for the LLM
 """
 ### 1. CREATE HUGGINGFACE ENDPOINT FOR LLM
+hf_llm = HuggingFaceEndpoint(
+    endpoint_url=f"{YOUR_LLM_ENDPOINT_URL}",
+    max_new_tokens=512,
+    top_k=10,
+    top_p=0.95,
+    typical_p=0.95,
+    temperature=0.01,
+    repetition_penalty=1.03,
+    huggingfacehub_api_token=os.environ["HF_TOKEN"]
+)
 @cl.author_rename
 def rename(original_author: str):