Siyuan0730 committed • commit 9abc2ca • parent ae8b477
Update the tested code (OpenAI API update)

Files changed:
- app.py (+46 -34)
- requirements.txt (+1 -1)
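The commit migrates app.py from the pre-1.0 `openai` module to the 1.x client interface (`from openai import OpenAI`) and threads a `client` object through the generation helpers. A minimal sketch of the call pattern the new code relies on — the key string and prompt below are placeholders, the model name is the one the diff pins:

    from openai import OpenAI

    # the app builds the client from st.session_state["OPENAI_API_KEY"]
    client = OpenAI(api_key="sk-...")  # placeholder key
    completion = client.chat.completions.create(
        model="gpt-4-1106-preview",
        messages=[{"role": "user", "content": "Say hello in one word."}],
        temperature=0,
    )
    print(completion.choices[0].message.content)

This is the same pattern wrapped by the new get_completion_from_messages(client, messages, ...) helper in the diff below.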
app.py
CHANGED
@@ -1,7 +1,7 @@
 import pandas as pd
 import numpy as np
 import faiss
-import openai
+from openai import OpenAI
 import tempfile
 from PyPDF2 import PdfReader
 import io
@@ -16,8 +16,6 @@ from collections import Counter
 #import jieba.analyse
 import nltk
 
-
-
 @st.cache_data
 def download_nltk():
     nltk.download('punkt')
@@ -65,15 +63,16 @@ def get_keywords(file_paths): #这里的重点是,对每一个file做尽可能
     return keywords_list
 
 
-def get_completion_from_messages(messages, model="gpt-4", temperature=0):
-
-
-
-
-
-
+def get_completion_from_messages(client, messages, model="gpt-4-1106-preview", temperature=0):
+    client = client
+    completion = client.chat.completions.create(
+        model=model,
+        messages=messages,
+        temperature=temperature,
+    )
+    return completion.choices[0].message.content
 
-def genarating_outline(keywords, num_lessons,language):
+def genarating_outline(client, keywords, num_lessons,language):
     system_message = 'You are a great AI teacher and linguist, skilled at create course outline based on summarized knowledge materials.'
     user_message = f"""You are a great AI teacher and linguist,
     skilled at generating course outline based on keywords of the course.
@@ -96,7 +95,7 @@ def genarating_outline(keywords, num_lessons,language):
          'content': user_message},
     ]
 
-    response = get_completion_from_messages(messages)
+    response = get_completion_from_messages(client, messages)
 
     list_response = ['nothing in the answers..']
 
@@ -107,9 +106,9 @@ def genarating_outline(keywords, num_lessons,language):
 
     return list_response
 
-def courseOutlineGenerating(file_paths, num_lessons, language):
+def courseOutlineGenerating(client, file_paths, num_lessons, language):
     summarized_materials = get_keywords(file_paths)
-    course_outline = genarating_outline(summarized_materials, num_lessons, language)
+    course_outline = genarating_outline(client, summarized_materials, num_lessons, language)
     return course_outline
 
 def constructVDB(file_paths):
@@ -171,7 +170,7 @@ def searchVDB(search_sentence, paraphrase_embeddings_df, index):
 
     return retrieved_chunks_list
 
-def generateCourse(topic, materials, language, style_options):
+def generateCourse(client, topic, materials, language, style_options):
     system_message = 'You are a great AI teacher and linguist, skilled at writing informative and easy-to-understand course script based on given lesson topic and knowledge materials.'
 
     user_message = f"""You are a great AI teacher and linguist,
@@ -199,7 +198,7 @@ def generateCourse(topic, materials, language, style_options):
          'content': user_message},
     ]
 
-    response = get_completion_from_messages(messages)
+    response = get_completion_from_messages(client, messages)
     return response
 
 def decorate_user_question(user_question, retrieved_chunks_for_user):
@@ -236,9 +235,9 @@ def initialize_vdb(temp_file_paths):
     st.success("Constructing vector database from provided materials...Done")
     return embeddings_df, faiss_index
 
-def initialize_outline(temp_file_paths, num_lessons, language):
+def initialize_outline(client, temp_file_paths, num_lessons, language):
     with st.spinner('Generating Course Outline...'):
-        course_outline_list = courseOutlineGenerating(temp_file_paths, num_lessons, language)
+        course_outline_list = courseOutlineGenerating(client, temp_file_paths, num_lessons, language)
     st.success("Generating Course Outline...Done")
     course_outline_string = ''
     lessons_count = 0
@@ -251,14 +250,14 @@ def initialize_outline(temp_file_paths, num_lessons, language):
 
     return course_outline_list
 
-def initialize_content(course_outline_list, embeddings_df, faiss_index, language, style_options):
+def initialize_content(client, course_outline_list, embeddings_df, faiss_index, language, style_options):
     count_generating_content = 0
     course_content_list = []
     for lesson in course_outline_list:
         count_generating_content += 1
         with st.spinner(f"Writing content for lesson {count_generating_content}..."):
             retrievedChunksList = searchVDB(lesson, embeddings_df, faiss_index)
-            courseContent = generateCourse(lesson, retrievedChunksList, language, style_options)
+            courseContent = generateCourse(client, lesson, retrievedChunksList, language, style_options)
         course_content_list.append(courseContent)
         st.success(f"Writing content for lesson {count_generating_content}...Done")
         with st.expander(f"Learn the lesson {count_generating_content} ", expanded=False):
@@ -364,9 +363,12 @@ def app():
 
     if "OPENAI_API_KEY" not in st.session_state:
         st.session_state["OPENAI_API_KEY"] = ''
+    #if "client" not in st.session_state:
+    #    st.session_state["client"] = ''
     if "openai_model" not in st.session_state:
-        st.session_state["openai_model"] = "gpt-
-
+        st.session_state["openai_model"] = "gpt-4-1106-preview"
+    if "messages_ui" not in st.session_state:
+        st.session_state.messages_ui = []
     if "messages" not in st.session_state:
         st.session_state.messages = []
 
@@ -425,7 +427,6 @@ def app():
 
     ''', unsafe_allow_html=True)
 
-
    if btn:
        if api_key != "sk-..." and api_key !="" and api_key.startswith("sk-"):
            st.session_state.start_col1.empty()
@@ -438,10 +439,10 @@
            #initialize app
            temp_file_paths = initialize_file(added_files)
            st.session_state["OPENAI_API_KEY"] = api_key
-
+            client = OpenAI(api_key = st.session_state["OPENAI_API_KEY"])
            st.session_state.embeddings_df, st.session_state.faiss_index = initialize_vdb(temp_file_paths)
-            st.session_state.course_outline_list = initialize_outline(temp_file_paths, num_lessons, language)
-            st.session_state.course_content_list = initialize_content(st.session_state.course_outline_list, st.session_state.embeddings_df, st.session_state.faiss_index, language, style_options)
+            st.session_state.course_outline_list = initialize_outline(client, temp_file_paths, num_lessons, language)
+            st.session_state.course_content_list = initialize_content(client, st.session_state.course_outline_list, st.session_state.embeddings_df, st.session_state.faiss_index, language, style_options)
 
            st.markdown('''
            > 🤔 <font color = 'grey'> **Not satisfied with this course?** Simply click "Generate my course!" button to regenerate a new one! </font>
@@ -457,7 +458,7 @@
            st.session_state.case_pay.empty()
            announce.empty()
            divider.empty()
-            warning = st.write("请输入正确的API Key令牌")
+            warning = st.write("请输入正确的OpenAI API Key令牌")
 
 
    col1, col2 = st.columns([0.6,0.4])
@@ -485,10 +486,12 @@
            st.write("Hello👋, how can I help you today? 😄")
 
        # Display chat messages from history on app rerun
-        for message in st.session_state.messages:
+        for message in st.session_state.messages_ui:
            with st.chat_message(message["role"]):
-                st.markdown(message["content"]
+                st.markdown(message["content"])
 
+        #更新ui上显示的聊天记录
+        st.session_state.messages_ui.append({"role": "user", "content": user_question})
        # Display new user question.
        with st.chat_message("user"):
            st.markdown(user_question)
@@ -496,21 +499,30 @@
        #这里的session.state就是保存了这个对话会话的一些基本信息和设置
        retrieved_chunks_for_user = searchVDB(user_question, st.session_state.embeddings_df, st.session_state.faiss_index)
        prompt = decorate_user_question(user_question, retrieved_chunks_for_user)
-        st.session_state.messages.append({"role": "user", "content":
+        st.session_state.messages.append({"role": "user", "content": prompt})
 
        # Display assistant response in chat message container
        with st.chat_message("assistant"):
            message_placeholder = st.empty()
            full_response = ""
-
+            client = OpenAI(api_key = st.session_state["OPENAI_API_KEY"])
+            for response in client.chat.completions.create(
                model=st.session_state["openai_model"],
-                messages=[
+                messages=[
+                    {"role": m["role"], "content": m["content"]}
+                    for m in st.session_state.messages #用chatbot那边的隐藏消息记录
+                ],
                stream=True,
            ):
-
+                try:
+                    full_response += response.choices[0].delta.content
+                except:
+                    full_response += ""
                message_placeholder.markdown(full_response + "▌")
            message_placeholder.markdown(full_response)
-        st.session_state.messages.append({"role": "assistant", "content":
+        st.session_state.messages.append({"role": "assistant", "content": full_response})
+        st.session_state.messages_ui.append({"role": "assistant", "content": full_response})
+
 
 
 if __name__ == "__main__":
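Beyond the client migration, the chat handler above now keeps two histories: st.session_state.messages holds the decorated prompts (question plus retrieved chunks) actually sent to the model, while st.session_state.messages_ui holds only the plain questions and answers rendered in the chat window. A condensed sketch of the streaming pattern the new handler uses — the key and prompt are placeholders, names follow the diff:

    from openai import OpenAI

    client = OpenAI(api_key="sk-...")  # placeholder key
    full_response = ""
    for chunk in client.chat.completions.create(
        model="gpt-4-1106-preview",
        messages=[{"role": "user", "content": "Explain FAISS in one sentence."}],
        stream=True,
    ):
        delta = chunk.choices[0].delta.content  # can be None on chunks that carry no text
        if delta:
            full_response += delta
    print(full_response)

The explicit None check is one way to handle content-less chunks; the diff reaches the same result with its try/except around the string concatenation.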
requirements.txt
CHANGED
@@ -1,7 +1,7 @@
 faiss_cpu==1.7.3
 nltk==3.8.1
 numpy==1.25.0
-openai==
+openai==1.6.1
 pandas==2.0.2
 PyPDF2==3.0.1
 sentence_transformers==2.2.2
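The bump to openai==1.6.1 is what makes `from openai import OpenAI` available to app.py. A quick sanity check for the pinned environment (a sketch, not part of the commit):

    # confirm the installed SDK is the 1.x line that app.py now targets
    import openai
    from openai import OpenAI  # only present in openai>=1.0

    assert openai.__version__.startswith("1."), openai.__version__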