bstraehle committed on
Commit
85e4f86
·
1 Parent(s): bfb520c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -16
app.py CHANGED
@@ -46,27 +46,27 @@ def invoke(openai_api_key, use_rag, prompt):
46
  temperature = 0)
47
  if (use_rag):
48
  # Document loading
49
- docs = []
50
  # Load PDF
51
- loader = PyPDFLoader(PDF_URL)
52
- docs.extend(loader.load())
53
  # Load Web
54
- loader = WebBaseLoader(WEB_URL)
55
- docs.extend(loader.load())
56
  # Load YouTube
57
- loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,
58
- YOUTUBE_URL_2,
59
- YOUTUBE_URL_3], YOUTUBE_DIR),
60
- OpenAIWhisperParser())
61
- docs.extend(loader.load())
62
  # Document splitting
63
- text_splitter = RecursiveCharacterTextSplitter(chunk_overlap = 150,
64
- chunk_size = 1500)
65
- splits = text_splitter.split_documents(docs)
66
  # Document storage
67
- vector_db = Chroma.from_documents(documents = splits,
68
- embedding = OpenAIEmbeddings(disallowed_special = ()),
69
- persist_directory = CHROMA_DIR)
70
  # Document retrieval
71
  vector_db = Chroma(embedding_function = OpenAIEmbeddings(),
72
  persist_directory = CHROMA_DIR)
 
46
  temperature = 0)
47
  if (use_rag):
48
  # Document loading
49
+ #docs = []
50
  # Load PDF
51
+ #loader = PyPDFLoader(PDF_URL)
52
+ #docs.extend(loader.load())
53
  # Load Web
54
+ #loader = WebBaseLoader(WEB_URL)
55
+ #docs.extend(loader.load())
56
  # Load YouTube
57
+ #loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,
58
+ # YOUTUBE_URL_2,
59
+ # YOUTUBE_URL_3], YOUTUBE_DIR),
60
+ # OpenAIWhisperParser())
61
+ #docs.extend(loader.load())
62
  # Document splitting
63
+ #text_splitter = RecursiveCharacterTextSplitter(chunk_overlap = 150,
64
+ # chunk_size = 1500)
65
+ #splits = text_splitter.split_documents(docs)
66
  # Document storage
67
+ #vector_db = Chroma.from_documents(documents = splits,
68
+ # embedding = OpenAIEmbeddings(disallowed_special = ()),
69
+ # persist_directory = CHROMA_DIR)
70
  # Document retrieval
71
  vector_db = Chroma(embedding_function = OpenAIEmbeddings(),
72
  persist_directory = CHROMA_DIR)