Spaces:
Sleeping
Sleeping
Commit
·
755d925
1
Parent(s):
aa9b219
Update app.py
Browse files
app.py
CHANGED
@@ -12,6 +12,7 @@ import tempfile # 임시 파일을 생성하기 위한 라이브러리입니다.
|
|
12 |
import os
|
13 |
from huggingface_hub import hf_hub_download # Hugging Face Hub에서 모델을 다운로드하기 위한 함수입니다.
|
14 |
|
|
|
15 |
# PDF 문서로부터 텍스트를 추출하는 함수입니다.
|
16 |
def get_pdf_text(pdf_docs):
|
17 |
temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
|
@@ -27,12 +28,12 @@ def get_pdf_text(pdf_docs):
|
|
27 |
def get_text_file(docs):
|
28 |
text_list = []
|
29 |
for doc in docs:
|
30 |
-
|
31 |
-
|
32 |
text = doc.read().decode("utf-8") # 파일을 읽고 UTF-8로 디코딩하여 문자열로 변환합니다.
|
|
|
33 |
else:
|
34 |
-
|
35 |
-
text_list.append(text)
|
36 |
return text_list
|
37 |
|
38 |
|
|
|
12 |
import os
|
13 |
from huggingface_hub import hf_hub_download # Hugging Face Hub에서 모델을 다운로드하기 위한 함수입니다.
|
14 |
|
15 |
+
|
16 |
# PDF 문서로부터 텍스트를 추출하는 함수입니다.
|
17 |
def get_pdf_text(pdf_docs):
|
18 |
temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
|
|
|
28 |
def get_text_file(docs):
    """Collect the text content of every item in *docs*.

    An item that exposes a callable ``read`` method is treated as a
    file-like object: its content is read and, when it comes back as
    bytes, decoded as UTF-8. Any other item is converted with ``str()``.

    Args:
        docs: Iterable of file-like objects and/or arbitrary values.

    Returns:
        A list with one entry per item in ``docs``, in the same order.

    Raises:
        UnicodeDecodeError: If binary content is not valid UTF-8.
    """
    text_list = []
    for doc in docs:
        reader = getattr(doc, "read", None)
        if callable(reader):
            content = reader()
            # Binary streams yield bytes, but text-mode streams already
            # yield str, which has no .decode(); only decode bytes-like data.
            if isinstance(content, (bytes, bytearray)):
                content = content.decode("utf-8")
            text_list.append(content)
        else:
            # Not a file-like object: fall back to its string form.
            text_list.append(str(doc))
    return text_list
|
38 |
|
39 |
|