Update app.py
Browse files
app.py
CHANGED
@@ -46,27 +46,27 @@ def invoke(openai_api_key, use_rag, prompt):
|
|
46 |
temperature = 0)
|
47 |
if (use_rag):
|
48 |
# Document loading
|
49 |
-
docs = []
|
50 |
# Load PDF
|
51 |
-
loader = PyPDFLoader(PDF_URL)
|
52 |
-
docs.extend(loader.load())
|
53 |
# Load Web
|
54 |
-
loader = WebBaseLoader(WEB_URL)
|
55 |
-
docs.extend(loader.load())
|
56 |
# Load YouTube
|
57 |
-
loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,
|
58 |
-
|
59 |
-
|
60 |
-
|
61 |
-
docs.extend(loader.load())
|
62 |
# Document splitting
|
63 |
-
text_splitter = RecursiveCharacterTextSplitter(chunk_overlap = 150,
|
64 |
-
|
65 |
-
splits = text_splitter.split_documents(docs)
|
66 |
# Document storage
|
67 |
-
vector_db = Chroma.from_documents(documents = splits,
|
68 |
-
|
69 |
-
|
70 |
# Document retrieval
|
71 |
vector_db = Chroma(embedding_function = OpenAIEmbeddings(),
|
72 |
persist_directory = CHROMA_DIR)
|
|
|
46 |
temperature = 0)
|
47 |
if (use_rag):
|
48 |
# Document loading
|
49 |
+
#docs = []
|
50 |
# Load PDF
|
51 |
+
#loader = PyPDFLoader(PDF_URL)
|
52 |
+
#docs.extend(loader.load())
|
53 |
# Load Web
|
54 |
+
#loader = WebBaseLoader(WEB_URL)
|
55 |
+
#docs.extend(loader.load())
|
56 |
# Load YouTube
|
57 |
+
#loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,
|
58 |
+
# YOUTUBE_URL_2,
|
59 |
+
# YOUTUBE_URL_3], YOUTUBE_DIR),
|
60 |
+
# OpenAIWhisperParser())
|
61 |
+
#docs.extend(loader.load())
|
62 |
# Document splitting
|
63 |
+
#text_splitter = RecursiveCharacterTextSplitter(chunk_overlap = 150,
|
64 |
+
# chunk_size = 1500)
|
65 |
+
#splits = text_splitter.split_documents(docs)
|
66 |
# Document storage
|
67 |
+
#vector_db = Chroma.from_documents(documents = splits,
|
68 |
+
# embedding = OpenAIEmbeddings(disallowed_special = ()),
|
69 |
+
# persist_directory = CHROMA_DIR)
|
70 |
# Document retrieval
|
71 |
vector_db = Chroma(embedding_function = OpenAIEmbeddings(),
|
72 |
persist_directory = CHROMA_DIR)
|