rag-tool

Running

Chris4K committed on Jan 20, 2024

Commit

42d7c62

verified ·

1 Parent(s): 4848d67

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,19 +24,14 @@ print("-----------")
 text_splitter = CharacterTextSplitter(chunk_size=100, chunk_overlap=0)
 vdocuments = text_splitter.split_documents(documents)
 # Extract the embedding arrays from the PDF documents
 embeddings = []
-for doc in documents:
-    embeddings.append(getattr(doc, 'embeddings'))
 # Create Chroma vector store for API embeddings
 api_db = Chroma.from_documents(vdocuments, HfApiEmbeddingRetriever, collection_name="api-collection")
-#api_db = Chroma.from_texts(embeddings, api_hf_embeddings, collection_name="api-collection")
 # Define the PDF retrieval function
 def pdf_retrieval(query):
     # Run the query through the retriever
@@ -55,4 +50,4 @@ api_tool = gr.Interface(
 )
 # Launch the Gradio interface
-#api_tool.launch()

 text_splitter = CharacterTextSplitter(chunk_size=100, chunk_overlap=0)
 vdocuments = text_splitter.split_documents(documents)
 # Extract the embedding arrays from the PDF documents
 embeddings = []
+for doc in vdocuments:
+    embeddings.extend(api_hf_embeddings.get_embeddings(doc))
 # Create Chroma vector store for API embeddings
 api_db = Chroma.from_documents(vdocuments, HfApiEmbeddingRetriever, collection_name="api-collection")
 # Define the PDF retrieval function
 def pdf_retrieval(query):
     # Run the query through the retriever
 )
 # Launch the Gradio interface
+api_tool.launch()