Spaces:

chojo12
/

task3

Sleeping

App Files Files Community

chojo12 committed on Nov 22, 2023

Commit

daae5fc

1 Parent(s): 9934126

Upload app.py

Browse files

Files changed (1) hide show

app.py +37 -7

app.py CHANGED Viewed

@@ -24,15 +24,45 @@ def get_pdf_text(pdf_docs):
 # 과제
 # 아래 텍스트 추출 함수를 작성
-def get_text_file(docs):
-    pass
-def get_csv_file(docs):
-    pass
-def get_json_file(docs):
-    pass
 # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 def get_text_chunks(documents):

 # 과제
 # 아래 텍스트 추출 함수를 작성
def get_text_file(txt_docs):
    """Return the text content of *txt_docs* as a single string.

    The text is extracted in memory; nothing is written to disk, so no
    temporary directory is left behind.

    Args:
        txt_docs: The document to read. May be a ``str``, a
            ``bytes``/``bytearray`` payload, or a file-like object that
            exposes ``getvalue()`` or ``read()`` (for example an uploaded
            file object).

    Returns:
        The document text, with CRLF and lone CR line endings normalised
        to LF.

    Raises:
        TypeError: If no text can be obtained from *txt_docs*.
        UnicodeDecodeError: If a bytes payload is not valid UTF-8.
    """
    payload = txt_docs

    # Unwrap file-like inputs first; getvalue() returns the whole buffer
    # regardless of the current read position.
    if hasattr(payload, "getvalue"):
        payload = payload.getvalue()
    elif hasattr(payload, "read"):
        payload = payload.read()

    if isinstance(payload, (bytes, bytearray)):
        # "utf-8-sig" decodes plain UTF-8 and drops a leading BOM if present.
        payload = bytes(payload).decode("utf-8-sig")

    if not isinstance(payload, str):
        raise TypeError(
            f"get_text_file expected str, bytes or a file-like object, "
            f"got {type(txt_docs).__name__}"
        )

    # Reading a file in text mode translates line endings to "\n";
    # keep that result now that the file round trip is gone.
    return payload.replace("\r\n", "\n").replace("\r", "\n")
def get_csv_file(csv_docs):
    """Flatten CSV content into plain text, one line per CSV row.

    The data is parsed in memory with ``csv.reader``; nothing is written
    to disk.

    Args:
        csv_docs: The CSV document. Usually a file-like object exposing
            ``getvalue()`` (returning either ``str`` or ``bytes``); objects
            with only ``read()``, and raw ``str``/``bytes`` payloads, are
            accepted as well.

    Returns:
        The rows joined with ``"\\n"``, each row's fields joined with
        ``","``. Quoting from the source is not re-applied, so the result
        is meant for text extraction rather than for re-parsing as CSV.
        An empty document yields ``""``.

    Raises:
        TypeError: If no text can be obtained from *csv_docs*.
        UnicodeDecodeError: If a bytes payload is not valid UTF-8.
    """
    import io  # local import: keeps this function self-contained

    payload = csv_docs
    if hasattr(payload, "getvalue"):
        payload = payload.getvalue()
    elif hasattr(payload, "read"):
        payload = payload.read()

    if isinstance(payload, (bytes, bytearray)):
        # "utf-8-sig" decodes plain UTF-8 and drops a leading BOM, which
        # would otherwise end up glued to the first field.
        payload = bytes(payload).decode("utf-8-sig")

    if not isinstance(payload, str):
        raise TypeError(
            f"get_csv_file expected a file-like object, str or bytes, "
            f"got {type(csv_docs).__name__}"
        )

    # newline="" hands line endings to csv.reader untranslated, as the csv
    # module documentation asks for.
    rows = csv.reader(io.StringIO(payload, newline=""))
    return "\n".join(",".join(fields) for fields in rows)
def get_json_file(json_docs, key_to_extract):
    """Extract the value stored under one top-level key of a JSON document.

    Args:
        json_docs: The JSON document as ``str``, ``bytes`` or ``bytearray``,
            or a file-like object exposing ``getvalue()`` or ``read()``.
        key_to_extract: Name of the top-level key whose value is wanted.

    Returns:
        The value stored under *key_to_extract*; ``''`` when the key is
        missing or the document's top-level value is not a JSON object;
        ``None`` when the document is not valid JSON (the decode error is
        printed).
    """
    payload = json_docs
    if hasattr(payload, "getvalue"):
        payload = payload.getvalue()
    elif hasattr(payload, "read"):
        payload = payload.read()

    # Only the parse itself sits inside the try, so unrelated errors are
    # not mistaken for malformed JSON.
    try:
        parsed = json.loads(payload)
    except json.JSONDecodeError as e:
        print(f"Error decoding JSON: {e}")
        return None

    # A top-level list/number/string has no keys; treat it like a missing
    # key instead of failing on a missing .get attribute.
    if not isinstance(parsed, dict):
        return ''
    return parsed.get(key_to_extract, '')
 # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 def get_text_chunks(documents):