Spaces:

qingxu98
/

gpt-academic

Running

qingxu99 committed on Apr 13, 2023

Commit

98724cd

1 Parent(s): 8ac9b45

更新注释

Files changed (2) hide show

crazy_functional.py CHANGED Viewed

@@ -107,7 +107,7 @@ def get_crazy_functions():
             "Color": "stop",
             "Function": HotReload(总结word文档)
         },
-        "[测试功能] 理解PDF文档内容（通用接口，读取文件输入区）": {
             # HotReload 的意思是热更新，修改函数插件代码后，不需要重启程序，代码直接生效
             "Color": "stop",
             "AsButton": False,  # 加入下拉菜单中

             "Color": "stop",
             "Function": HotReload(总结word文档)
         },
+        "理解PDF文档内容 （模仿ChatPDF）": {
             # HotReload 的意思是热更新，修改函数插件代码后，不需要重启程序，代码直接生效
             "Color": "stop",
             "AsButton": False,  # 加入下拉菜单中

crazy_functions/理解PDF文档内容.py CHANGED Viewed

@@ -10,6 +10,7 @@ def 解析PDF(file_name, llm_kwargs, plugin_kwargs, chatbot, history, system_pro
     print('begin analysis on:', file_name)
     file_content, page_one = read_and_clean_pdf_text(file_name)
     # 递归地切割PDF文件，每一块（尽量是完整的一个section，比如introduction，experiment等，必要时再进行切割）
     # 的长度必须小于 2500 个 Token
     TOKEN_LIMIT_PER_FRAGMENT = 2500

     print('begin analysis on:', file_name)
     file_content, page_one = read_and_clean_pdf_text(file_name)
+    ############################## <第零步，从摘要中提取高价值信息，放到history中> ##################################
     # 递归地切割PDF文件，每一块（尽量是完整的一个section，比如introduction，experiment等，必要时再进行切割）
     # 的长度必须小于 2500 个 Token
     TOKEN_LIMIT_PER_FRAGMENT = 2500