YchKhan committed on
Commit
e086aec
1 Parent(s): 64c4a07

Update split_files_to_excel.py

Browse files
Files changed (1) hide show
  1. split_files_to_excel.py +7 -6
split_files_to_excel.py CHANGED
@@ -481,16 +481,17 @@ def split_in_df(files):
481
  documents = split_doc_in_chunks(files)
482
  df = pd.DataFrame()
483
  for document in documents:
 
484
  content = document.page_content
485
 
486
- metadata = document.metadata
487
- metadata_keys = list(metadata.keys())
488
- metadata_values = list(metadata.values())
489
 
490
- doc_data = {'Content': content}
491
 
492
- for key, value in zip(metadata_keys, metadata_values):
493
- doc_data[key] = value
494
 
495
  df = pd.concat([df, pd.DataFrame([doc_data])], ignore_index=True)
496
 
 
481
  documents = split_doc_in_chunks(files)
482
  df = pd.DataFrame()
483
  for document in documents:
484
+ filename = document.metadata['filename']
485
  content = document.page_content
486
 
487
+ # metadata = document.metadata
488
+ # metadata_keys = list(metadata.keys())
489
+ # metadata_values = list(metadata.values())
490
 
491
+ doc_data = {'Filename': filename, 'Content': content}
492
 
493
+ # for key, value in zip(metadata_keys, metadata_values):
494
+ # doc_data[key] = value
495
 
496
  df = pd.concat([df, pd.DataFrame([doc_data])], ignore_index=True)
497