import logging
import os
from typing import Dict, Iterable, Iterator, List, Tuple

from openai import OpenAI

logger = logging.getLogger(__name__)


def _build_messages(
    message: str, history: Iterable[Tuple[str, str]]
) -> List[Dict[str, str]]:
    """Convert (user, assistant) history pairs plus a new message to chat format.

    Args:
        message: The new user message; appended last.
        history: Iterable of two-item (user_text, assistant_text) pairs, in
            chronological order.

    Returns:
        A list of ``{"role": ..., "content": ...}`` dicts alternating
        user/assistant for each history pair, followed by the new user message.
    """
    messages: List[Dict[str, str]] = []
    for human, assistant in history:
        messages.append({"role": "user", "content": human})
        messages.append({"role": "assistant", "content": assistant})
    messages.append({"role": "user", "content": message})
    return messages


def predict(
    message: str,
    history: Iterable[Tuple[str, str]],
    api_key: str,
    *,
    model: str = "gpt-4o",
    temperature: float = 1.0,
) -> Iterator[str]:
    """Stream a chat completion, yielding the reply accumulated so far.

    This is a generator: no client is created and no request is sent until
    the first item is requested.

    Args:
        message: The new user message.
        history: Prior turns as (user_text, assistant_text) pairs.
        api_key: Key passed to the ``OpenAI`` client.
        model: Model name sent with the request.
        temperature: Sampling temperature sent with the request.

    Yields:
        The cumulative reply text after each content-bearing chunk, so every
        yielded string is a prefix of the next one.
    """
    logger.debug("in predict")
    client = OpenAI(api_key=api_key)
    messages = _build_messages(message, history)
    logger.debug("messages=%s", messages)

    response = client.chat.completions.create(
        model=model,
        messages=messages,
        temperature=temperature,
        stream=True,
    )

    partial_message = ""
    for chunk in response:
        # Some stream chunks carry no choices at all (e.g. a trailing usage
        # chunk); indexing [0] on those would raise IndexError.
        if not chunk.choices:
            continue
        delta_text = chunk.choices[0].delta.content
        if delta_text:
            partial_message += delta_text
            yield partial_message


def main() -> None:
    """Run a one-message demo conversation, printing each partial reply."""
    # The key comes from the environment so it never lands in source control.
    # NOTE: a literal key was previously embedded in this file; treat that key
    # as compromised and revoke it.
    api_key = os.environ.get("OPENAI_API_KEY")
    if not api_key:
        raise SystemExit(
            "Set the OPENAI_API_KEY environment variable to run this demo."
        )
    for msg in predict("Hi", [], api_key):
        print(msg)


if __name__ == "__main__":
    main()