"""LLM-backed move planning and execution for a game of Nim.

Two few-shot prompts are defined here:

* a "plan" prompt that turns a textual game state into a natural-language
  move, and
* an "exec" prompt that turns a natural-language move into a
  ``"<pile index>,<stick count>"`` string that can be parsed and handed to a
  game environment.
"""
from langchain import OpenAI
from langchain.prompts import PromptTemplate, FewShotPromptTemplate
from langchain.chains import LLMChain

# Renders one few-shot example; shared by both few-shot prompts below.
EXAMPLES_PROMPT_TEMPLATE = PromptTemplate(
    input_variables=["input", "output"],
    template="Input: {input}\nOutput: {output}"
)

# Few-shot examples mapping a textual game state to a natural-language move.
# NOTE(review): the state "2, 5, 7" appears twice with different outputs and
# one output reads "five stick"; both are left untouched because editing
# prompt text changes what the model sees -- confirm whether intentional.
PLAN_MOVE_PROMPT_EXAMPLES = [
    {"input": "The piles contain 3, 5, 7 sticks", "output": "I'll take one stick from pile A"},
    {"input": "The piles contain 2, 5, 7 sticks", "output": "I'll take one stick from pile B"},
    {"input": "The piles contain 2, 5, 7 sticks", "output": "I'll take five stick from pile B"},
    {"input": "The piles contain 1, 2, 3 sticks", "output": "I'll take two sticks from pile C"},
    {"input": "The piles contain 0, 2, 3 sticks", "output": "I'll take one stick from pile C"},
    {"input": "The piles contain 0, 2, 0 sticks", "output": "I'll take two sticks from pile B"},
]

# Prompt asking the model to propose a move for the state in {text_game_state}.
PLAN_MOVE_PROMPT_FROM_STRING_EXAMPLES = FewShotPromptTemplate(
    examples=PLAN_MOVE_PROMPT_EXAMPLES,
    example_prompt=EXAMPLES_PROMPT_TEMPLATE,
    prefix="Nim is a two-player game of strategy in which players take turns removing objects from separate piles. "
           "The goal of the game is to remove the last sticks from a pile when the other piles contain 0 sticks. Each "
           "of these inputs represent a game state. For each of these game states please express a logical move that "
           "consists of taking some number of sticks from a pile. You may not take any sticks from a pile that "
           "contains 0 sticks.",
    suffix="Input: {text_game_state}\nOutput:",
    input_variables=["text_game_state"],
    example_separator="\n\n"
)

# Few-shot examples mapping a natural-language move to "pile_index,count".
EXEC_MOVE_PROMPT_EXAMPLES = [
    {"input": "I'll take two sticks from pile A", "output": "0,2"},
    {"input": "I'll take 3 sticks from the first pile", "output": "0,3"},
    {"input": "I'll take two sticks from pile C", "output": "2,2"},
    {"input": "I'll take one stick from the third pile", "output": "2,1"},
    {"input": "From pile B remove 2 sticks", "output": "1,2"},
    {"input": "I'll take the last stick from pile C", "output": "2,1"},
]

# Prompt asking the model to encode the move in {move_to_express} as two
# comma-separated integers.
EXEC_MOVE_PROMPT_FROM_STRING_EXAMPLES = FewShotPromptTemplate(
    examples=EXEC_MOVE_PROMPT_EXAMPLES,
    example_prompt=EXAMPLES_PROMPT_TEMPLATE,
    prefix="Express every input as two numbers separated by a comma, where the first number is the zero index pile "
           "number and the second number is the number of sticks to remove.",
    suffix="Input: {move_to_express}\nOutput:",
    input_variables=["move_to_express"],
    example_separator="\n\n"
)


def plan_move(text_game_state: str, temperature: float, api_key: str) -> str:
    """Ask the LLM for a natural-language move for the given game state.

    Args:
        text_game_state: Description of the piles, substituted into the
            ``{text_game_state}`` slot of the planning prompt.
        temperature: Sampling temperature passed to the OpenAI model.
        api_key: OpenAI API key.

    Returns:
        The model's completion with surrounding whitespace stripped.
    """
    llm = OpenAI(model_name='text-davinci-003', temperature=temperature, max_tokens=100, openai_api_key=api_key)
    llm_chain = LLMChain(llm=llm, prompt=PLAN_MOVE_PROMPT_FROM_STRING_EXAMPLES, verbose=False)
    planned_move = llm_chain.run({'text_game_state': text_game_state}).strip()
    return planned_move


def _parse_step_tuple(step_tuple_str: str) -> tuple:
    """Parse ``"<pile>,<count>"`` into a 2-tuple of ints, or raise ValueError."""
    step_tuple = tuple(int(x) for x in step_tuple_str.split(','))
    if len(step_tuple) != 2:
        # The exec prompt asks for exactly two numbers; anything else is not
        # a move we can interpret.
        raise ValueError(f"expected 'pile,count', got {step_tuple_str!r}")
    return step_tuple


def execute_move(move_to_express, nim_game_env, api_key):
    """Translate a natural-language move via the LLM and apply it to the env.

    Args:
        move_to_express: Natural-language move, substituted into the
            ``{move_to_express}`` slot of the exec prompt.
        nim_game_env: Object exposing ``step(step_tuple)``; its result is
            indexed at positions 0..3. Presumably a gym-style
            ``(piles, reward, done, info)`` sequence -- confirm against the
            environment implementation.
        api_key: OpenAI API key.

    Returns:
        A 5-tuple ``(text_observation, step_result[0], step_result[1],
        step_result[2], step_result[3])``. If the model's reply cannot be
        parsed as two integers, or ``nim_game_env.step`` raises
        ``ValueError``, returns
        ``("Invalid move!", [0, 0, 0], 0, True, None)`` instead.
    """
    # temperature=0.0: this is a translation step, so keep the output deterministic.
    llm = OpenAI(model_name='text-davinci-003', temperature=0.0, max_tokens=10, openai_api_key=api_key)
    llm_chain = LLMChain(llm=llm, prompt=EXEC_MOVE_PROMPT_FROM_STRING_EXAMPLES, verbose=False)
    step_tuple_str = llm_chain.run({'move_to_express': move_to_express})
    try:
        # Parsing sits inside the try so a malformed completion is reported
        # as an invalid move rather than escaping as an uncaught ValueError.
        step_tuple = _parse_step_tuple(step_tuple_str)
        step_result = nim_game_env.step(step_tuple)
    except ValueError:
        return "Invalid move!", [0, 0, 0], 0, True, None
    piles_text = ", ".join(str(x) for x in step_result[0])
    text_observation = f"The piles contain {piles_text} sticks."
    return text_observation, step_result[0], step_result[1], step_result[2], step_result[3]