JinHyeong99 committed on
Commit
0cbb204
·
1 Parent(s): 5be23da
Files changed (1) hide show
  1. app.py +16 -7
app.py CHANGED
@@ -34,15 +34,24 @@ def get_text_file(text_docs):
34
  return text_doc
35
 
36
  def get_csv_file(csv_docs):
37
- csv_loader = CSVLoader(csv_docs.name)
38
- csv_doc = csv_loader.load()
39
- return csv_doc
 
 
 
 
40
 
41
  def get_json_file(json_docs):
42
- json_loader = JSONLoader(json_docs.name)
43
- json_doc = json_loader.load()
44
- return json_doc
45
-
 
 
 
 
 
46
 
47
  # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
48
  def get_text_chunks(documents):
 
34
  return text_doc
35
 
36
  def get_csv_file(csv_docs):
37
+ temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
38
+ temp_filepath = os.path.join(temp_dir.name, csv_docs.name) # 임시 파일 경로를 생성합니다.
39
+ with open(temp_filepath, "wb") as f: # 임시 파일을 바이너리 쓰기 모드로 엽니다.
40
+ f.write(csv_docs.getvalue()) # CSV 문서의 내용을 임시 파일에 씁니다.
41
+ csv_loader = CSVLoader(temp_filepath) # CSVLoader를 사용해 CSV를 로드합니다.
42
+ csv_doc = CSVLoader.load() # 텍스트를 추출합니다.
43
+ return csv_doc # 추출한 텍스트를 반환합니다.
44
 
45
  def get_json_file(json_docs):
46
+ temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
47
+ temp_filepath = os.path.join(temp_dir.name, json_docs.name) # 임시 파일 경로를 생성합니다.
48
+ loader = JSONLoader(
49
+ file_path=temp_filepath,
50
+ jq_schema='.messages[].content',
51
+ text_content=False)
52
+
53
+ data = loader.load()
54
+ return data
55
 
56
  # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
57
  def get_text_chunks(documents):