Moonjunho committed on
Commit
188da05
·
1 Parent(s): d55c1c9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +22 -3
app.py CHANGED
@@ -25,13 +25,32 @@ def get_pdf_text(pdf_docs):
25
  # 과제
26
  # 아래 텍스트 추출 함수를 작성
27
  def get_text_file(docs):
28
- pass
 
29
 
30
  def get_csv_file(docs):
31
- pass
 
 
 
 
 
 
 
 
 
32
 
33
  def get_json_file(docs):
34
- pass
 
 
 
 
 
 
 
 
 
35
 
36
 
37
  # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 
25
  # 과제
26
  # 아래 텍스트 추출 함수를 작성
27
  def get_text_file(docs):
28
+ text = file.getvalue().decode("utf-8") # 텍스트 파일을 문자열로 디코딩합니다.
29
+ return [text] # 텍스트를 리스트에 담아 반환합니다.
30
 
31
  def get_csv_file(docs):
32
+ import pandas as pd
33
+
34
+ # CSV ํŒŒ์ผ์„ Pandas DataFrame์œผ๋กœ ์ฝ์Šต๋‹ˆ๋‹ค.
35
+ df = pd.read_csv(file)
36
+
37
+ # 여기에서 원하는 열을 선택하거나 전체 파일을 읽어올 수 있습니다.
38
+ # 예를 들어, 'text_column' 열에서 텍스트를 추출하는 방법은 다음과 같습니다.
39
+ texts = df['text_column'].tolist()
40
+
41
+ return texts # ํ…์ŠคํŠธ ๋ฆฌ์ŠคํŠธ๋ฅผ ๋ฐ˜ํ™˜ํ•ฉ๋‹ˆ๋‹ค.
42
 
43
  def get_json_file(docs):
44
+ import json
45
+
46
+ # JSON 파일을 디코딩하여 데이터를 추출합니다.
47
+ data = json.load(file)
48
+
49
+ # 여기에서 적절한 방법으로 JSON 데이터에서 텍스트를 추출합니다.
50
+ # 예를 들어, 'text' 키에 해당하는 값을 추출하는 방법은 다음과 같습니다.
51
+ texts = [item['text'] for item in data]
52
+
53
+ return texts
54
 
55
 
56
  # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.