JinHyeong99 committed on
Commit
7d47c0f
·
1 Parent(s): 8c31276
Files changed (1) hide show
  1. app.py +10 -11
app.py CHANGED
@@ -34,14 +34,13 @@ def get_text_file(text_docs):
34
  return text_doc
35
 
36
  def get_csv_file(csv_docs):
37
- def get_csv_file(csv_docs):
38
- temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
39
- temp_filepath = os.path.join(temp_dir.name, csv_docs.name) # 임시 파일 경로를 생성합니다.
40
- with open(temp_filepath, "wb") as f: # 임시 파일을 바이너리 쓰기 모드로 엽니다.
41
- f.write(csv_docs.getvalue()) # CSV 문서의 내용을 임시 파일에 씁니다.
42
- csv_loader = CSVLoader(temp_filepath) # CSVLoader 인스턴스를 생성합니다.
43
- csv_doc = csv_loader.load() # 텍스트를 추출합니다.
44
- return csv_doc # 추출한 텍스트를 반환합니다.
45
 
46
 
47
  def get_json_file(json_docs):
@@ -52,8 +51,8 @@ def get_json_file(json_docs):
52
  jq_schema='.messages[].content',
53
  text_content=False)
54
 
55
- data = loader.load()
56
- return data
57
 
58
  # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
59
  def get_text_chunks(documents):
@@ -132,7 +131,7 @@ def main():
132
 
133
  st.subheader("문서 올리기")
134
  docs = st.file_uploader(
135
- "문서를 업로드 한 후 Process 버튼을 클릭하세요.'", accept_multiple_files=True)
136
  if st.button("Process"):
137
  with st.spinner("Processing"):
138
  # get pdf text
 
34
  return text_doc
35
 
36
  def get_csv_file(csv_docs):
37
+ temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
38
+ temp_filepath = os.path.join(temp_dir.name, csv_docs.name) # 임시 파일 경로를 생성합니다.
39
+ with open(temp_filepath, "wb") as f: # 임시 파일을 바이너리 쓰기 모드로 엽니다.
40
+ f.write(csv_docs.getvalue()) # CSV 문서의 내용을 임시 파일에 씁니다.
41
+ csv_loader = CSVLoader(temp_filepath) # CSVLoader 인스턴스를 생성합니다.
42
+ csv_doc = csv_loader.load() # 텍스트를 추출합니다.
43
+ return csv_doc # 추출한 텍스트를 반환합니다.
 
44
 
45
 
46
  def get_json_file(json_docs):
 
51
  jq_schema='.messages[].content',
52
  text_content=False)
53
 
54
+ json_doc = loader.load()
55
+ return json_doc
56
 
57
  # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
58
  def get_text_chunks(documents):
 
131
 
132
  st.subheader("문서 올리기")
133
  docs = st.file_uploader(
134
+ "문서를 업로드 한 후 Process 버튼을 클릭하세요.", accept_multiple_files=True)
135
  if st.button("Process"):
136
  with st.spinner("Processing"):
137
  # get pdf text