Spaces:

panda47
/

lang

Runtime error

panda47 committed on Nov 21, 2023

Commit

ed17b64

1 Parent(s): aa04651

Upload app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -28,17 +28,35 @@ def get_pdf_text(pdf_docs):
 # 과제
 # 아래 텍스트 추출 함수를 작성
-def get_text_file(docs):
-    pass
-def get_csv_file(docs):
-    pass
-def get_json_file(docs):
-    pass
 # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 def get_text_chunks(documents):
     text_splitter = RecursiveCharacterTextSplitter(

 # 과제
 # 아래 텍스트 추출 함수를 작성
+def get_text_file(txt_docs):
+    temp_dir = tempfile.TemporaryDirectory()
+    temp_filepath = os.path.join(temp_dir.name, txt_docs.name)
+    with open(temp_filepath, "wb") as f:
+        f.write(txt_docs.getvalue())
+    txt_loader = TextLoader(temp_filepath)
+    txt_doc = txt_loader.load()
+    return txt_doc
+def get_csv_file(csv_docs):
+    temp_dir = tempfile.TemporaryDirectory()
+    temp_filepath = os.path.join(temp_dir.name, csv_docs.name)
+    with open(temp_filepath, "wb") as f:
+        f.write(csv_docs.getvalue())
+    csv_loader = CSVLoader(temp_filepath)
+    csv_doc = csv_loader.load()
+    return csv_doc
+def get_json_file(json_docs):
+    temp_dir = tempfile.TemporaryDirectory()
+    temp_filepath = os.path.join(temp_dir.name, json_docs.name)
+    with open(temp_filepath, "wb") as f:
+        f.write(json_docs.getvalue())
+    json_loader = JSONLoader(temp_filepath)
+    json_doc = json_loader.load()
+    return json_doc
 # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 def get_text_chunks(documents):
     text_splitter = RecursiveCharacterTextSplitter(