DDingcheol committed on
Commit
f7e4221
·
1 Parent(s): 19f561f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -10
app.py CHANGED
@@ -26,22 +26,13 @@ def get_pdf_text(pdf_docs):
26
  # 과제
27
  # 아래 텍스트 추출 함수를 작성
28
  def get_text_file(docs):
29
- # ํ…์ŠคํŠธ ์ƒ์„ฑ์„ ์œ„ํ•œ Hugging Face์˜ ํ…์ŠคํŠธ ์ƒ์„ฑ ํŒŒ์ดํ”„๋ผ์ธ ์ƒ์„ฑ
30
- text_generator = pipeline("text-generation", model="distilgpt2")
31
-
32
  # 텍스트 파일로부터 텍스트를 읽어와 리스트에 저장합니다.
33
  text_list = []
34
  for doc in docs:
35
  content = doc.getvalue().decode("utf-8") # 파일 내용을 가져와서 UTF-8로 디코딩하여 문자열로 변환
36
  text_list.append(content) # 텍스트를 리스트에 추가
37
 
38
- # 각 텍스트에 대해 허깅 페이스 모델을 사용하여 텍스트를 생성하고 결과를 저장합니다.
39
- generated_texts = []
40
- for text in text_list:
41
- generated_text = text_generator(text, max_length=50, num_return_sequences=1)
42
- generated_texts.append(generated_text[0]['generated_text'])
43
-
44
- return generated_texts # 생성된 텍스트 리스트 반환
45
 
46
 
47
  def get_csv_file(docs):
 
26
  # 과제
27
  # 아래 텍스트 추출 함수를 작성
28
  def get_text_file(docs):
 
 
 
29
  # 텍스트 파일로부터 텍스트를 읽어와 리스트에 저장합니다.
30
  text_list = []
31
  for doc in docs:
32
  content = doc.getvalue().decode("utf-8") # 파일 내용을 가져와서 UTF-8로 디코딩하여 문자열로 변환
33
  text_list.append(content) # 텍스트를 리스트에 추가
34
 
35
+ return text_list # 추출된 텍스트 리스트 반환
 
 
 
 
 
 
36
 
37
 
38
  def get_csv_file(docs):