acecalisto3 committed
Commit 350b121 · verified · 1 Parent(s): 3ae40d2

Update app.py

Files changed (1)
  1. app.py +229 -60
app.py CHANGED
@@ -13,9 +13,9 @@ import json
 now = datetime.now()
 date_time_str = now.strftime("%Y-%m-%d %H:%M:%S")
 
-# Define the model globally (or pass it as an argument to main)
-model = "mistralai/Mixtral-8x7B-Instruct-v0.1"
-client = InferenceClient(model)
+client = InferenceClient(
+    "mistralai/Mixtral-8x7B-Instruct-v0.1"
+)
 
 # --- Set up logging ---
 logging.basicConfig(
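
For reference, a minimal standalone sketch of the streaming huggingface_hub call this client is used for further down (assumes huggingface_hub is installed and the model endpoint is reachable; illustrative, not part of the commit):

    from huggingface_hub import InferenceClient

    client = InferenceClient("mistralai/Mixtral-8x7B-Instruct-v0.1")
    # With stream=True and details=True, text_generation yields token objects,
    # which is why the app reads response.token.text below.
    for chunk in client.text_generation("Hello", max_new_tokens=20, stream=True, details=True):
        print(chunk.token.text, end="")
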
@@ -24,7 +24,7 @@ logging.basicConfig(
     format="%(asctime)s - %(levelname)s - %(message)s",
 )
 
-agents =[
+agents = [
     "WEB_DEV",
     "AI_SYSTEM_PROMPT",
     "PYTHON_CODE_DEV"
@@ -33,7 +33,7 @@ agents =[
 
 VERBOSE = True
 MAX_HISTORY = 5
-#MODEL = "gpt-3.5-turbo" # "gpt-4"
+# MODEL = "gpt-3.5-turbo" # "gpt-4"
 
 PREFIX = """
 {date_time_str}
@@ -111,7 +111,200 @@ def run_gpt(
     logging.info(LOG_RESPONSE.format(resp)) # Log the response
     return resp
 
-def generate(prompt, history, agent_name=agents[0], sys_prompt="", temperature=0.7, max_new_tokens=2048, top_p=0.8, repetition_penalty=1.5):
+def generate(prompt, history, agent_name=agents[0], sys_prompt="", temperature=0.7, max_new_tokens=2048, top_p=0.8, repetition_penalty=1.5, model="mistralai/Mixtral-8x7B-Instruct-v0.1"):
+    content = PREFIX.format(
+        date_time_str=date_time_str,
+        purpose=purpose,
+        safe_search=safe_search,
+    ) + prompt_template.format(**prompt_kwargs)
+    if VERBOSE:
+        logging.info(LOG_PROMPT.format(content)) # Log the prompt
+
+    stream = client.text_generation(content, **generate_kwargs, stream=True, details=True, return_full_text=False)
+    resp = ""
+    for response in stream:
+        resp += response.token.text
+
+    if VERBOSE:
+        logging.info(LOG_RESPONSE.format(resp)) # Log the response
+    return resp
+
+
+def compress_history(purpose, task, history, directory):
+    resp = run_gpt(
+        COMPRESS_HISTORY_PROMPT,
+        stop_tokens=["observation:", "task:", "action:", "thought:"],
+        max_tokens=512,
+        purpose=purpose,
+        task=task,
+        history=history,
+    )
+    history = "observation: {}\n".format(resp)
+    return history
+
+def call_search(purpose, task, history, directory, action_input):
+    logging.info(f"CALLING SEARCH: {action_input}")
+    try:
+
+        if "http" in action_input:
+            if "<" in action_input:
+                action_input = action_input.strip("<")
+            if ">" in action_input:
+                action_input = action_input.strip(">")
+
+            response = i_s(action_input)
+            #response = google(search_return)
+            logging.info(f"Search Result: {response}")
+            history += "observation: search result is: {}\n".format(response)
+        else:
+            history += "observation: I need to provide a valid URL to 'action: SEARCH action_input=https://URL'\n"
+    except Exception as e:
+        history += "observation: {}'\n".format(e)
+    return "MAIN", None, history, task
+
+def call_main(purpose, task, history, directory, action_input):
+    logging.info(f"CALLING MAIN: {action_input}")
+    resp = run_gpt(
+        ACTION_PROMPT,
+        stop_tokens=["observation:", "task:", "action:","thought:"],
+        max_tokens=32000,
+        purpose=purpose,
+        task=task,
+        history=history,
+    )
+    lines = resp.strip().strip("\n").split("\n")
+    for line in lines:
+        if line == "":
+            continue
+        if line.startswith("thought: "):
+            history += "{}\n".format(line)
+            logging.info(f"Thought: {line}")
+        elif line.startswith("action: "):
+
+            action_name, action_input = parse_action(line)
+            logging.info(f"Action: {action_name} - {action_input}")
+            history += "{}\n".format(line)
+            if "COMPLETE" in action_name or "COMPLETE" in action_input:
+                task = "END"
+                return action_name, action_input, history, task
+            else:
+                return action_name, action_input, history, task
+        else:
+            history += "{}\n".format(line)
+            logging.info(f"Other Output: {line}")
+            #history += "observation: the following command did not produce any useful output: '{}', I need to check the commands syntax, or use a different command\n".format(line)
+
+            #return action_name, action_input, history, task
+            #assert False, "unknown action: {}".format(line)
+    return "MAIN", None, history, task
+
+
+def call_set_task(purpose, task, history, directory, action_input):
+    logging.info(f"CALLING SET_TASK: {action_input}")
+    task = run_gpt(
+        TASK_PROMPT,
+        stop_tokens=[],
+        max_tokens=64,
+        purpose=purpose,
+        task=task,
+        history=history,
+    ).strip("\n")
+    history += "observation: task has been updated to: {}\n".format(task)
+    return "MAIN", None, history, task
+
+def end_fn(purpose, task, history, directory, action_input):
+    logging.info(f"CALLING END_FN: {action_input}")
+    task = "END"
+    return "COMPLETE", "COMPLETE", history, task
+
+NAME_TO_FUNC = {
+    "MAIN": call_main,
+    "UPDATE-TASK": call_set_task,
+    "SEARCH": call_search,
+    "COMPLETE": end_fn,
+
+}
+
+def run_action(purpose, task, history, directory, action_name, action_input):
+    logging.info(f"RUNNING ACTION: {action_name} - {action_input}")
+    try:
+        if "RESPONSE" in action_name or "COMPLETE" in action_name:
+            action_name="COMPLETE"
+            task="END"
+            return action_name, "COMPLETE", history, task
+
+        # compress the history when it is long
+        if len(history.split("\n")) > MAX_HISTORY:
+            logging.info("COMPRESSING HISTORY")
+            history = compress_history(purpose, task, history, directory)
+        if not action_name in NAME_TO_FUNC:
+            action_name="MAIN"
+        if action_name == "" or action_name == None:
+            action_name="MAIN"
+        assert action_name in NAME_TO_FUNC
+
+        logging.info(f"RUN: {action_name} - {action_input}")
+        return NAME_TO_FUNC[action_name](purpose, task, history, directory, action_input)
+    except Exception as e:
+        history += "observation: the previous command did not produce any useful output, I need to check the commands syntax, or use a different command\n"
+        logging.error(f"Error in run_action: {e}")
+        return "MAIN", None, history, task
+
+def run(purpose, history):
+
+    #print(purpose)
+    #print(hist)
+    task=None
+    directory="./"
+    if history:
+        history=str(history).strip("[]")
+    if not history:
+        history = ""
+
+    action_name = "UPDATE-TASK" if task is None else "MAIN"
+    action_input = None
+    while True:
+        logging.info(f"---")
+        logging.info(f"Purpose: {purpose}")
+        logging.info(f"Task: {task}")
+        logging.info(f"---")
+        logging.info(f"History: {history}")
+        logging.info(f"---")
+
+        action_name, action_input, history, task = run_action(
+            purpose,
+            task,
+            history,
+            directory,
+            action_name,
+            action_input,
+        )
+        yield (history)
+        #yield ("",[(purpose,history)])
+        if task == "END":
+            return (history)
+            #return ("", [(purpose,history)])
+
+
+
+################################################
+
+def format_prompt(message, history, max_history_turns=5):
+    prompt = "<s>"
+    # Keep only the last 'max_history_turns' turns
+    for user_prompt, bot_response in history[-max_history_turns:]:
+        prompt += f"[INST] {user_prompt} [/INST]"
+        prompt += f" {bot_response}</s> "
+    prompt += f"[INST] {message} [/INST]"
+    return prompt
+agents =[
+    "WEB_DEV",
+    "AI_SYSTEM_PROMPT",
+    "PYTHON_CODE_DEV"
+]
+def generate(
+    prompt, history, agent_name=agents[0], sys_prompt="", temperature=0.9, max_new_tokens=2048, top_p=0.95, repetition_penalty=1.0, model="mistralai/Mixtral-8x7B-Instruct-v0.1"
+):
     seed = random.randint(1,1111111111111111)
 
     # Correct the line:
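
The format_prompt helper added in this hunk builds Mixtral's [INST] instruct template. A minimal sketch of the string it produces, using the same logic as above (illustrative call, not part of the commit):

    def format_prompt(message, history, max_history_turns=5):
        prompt = "<s>"
        for user_prompt, bot_response in history[-max_history_turns:]:
            prompt += f"[INST] {user_prompt} [/INST]"
            prompt += f" {bot_response}</s> "
        prompt += f"[INST] {message} [/INST]"
        return prompt

    print(format_prompt("And in Python?", [("Hi", "Hello!")]))
    # <s>[INST] Hi [/INST] Hello!</s> [INST] And in Python? [/INST]
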
@@ -127,21 +320,31 @@ def generate(prompt, history, agent_name=agents[0], sys_prompt="", temperature=0
     temperature = 1e-2
     top_p = float(top_p)
 
-    generate_kwargs = dict(
-        temperature=temperature,
-        max_new_tokens=max_new_tokens,
-        top_p=top_p,
-        repetition_penalty=repetition_penalty,
-        do_sample=True,
-        seed=seed,
-    )
 
-    formatted_prompt = format_prompt(prompt, history, max_history_turns=5) # Truncated history
-    logging.info(f"Formatted Prompt: {formatted_prompt}")
 
-    messages = [{"role": "user", "content": formatted_prompt}]
+def generate_text_chunked(input_text, model, generation_parameters, max_tokens_to_generate):
+    """Generates text in chunks to avoid token limit errors."""
+    sentences = nltk.sent_tokenize(input_text)
+    generated_text = []
+    generator = pipeline('text-generation', model=model)
+
+    for sentence in sentences:
+        # Tokenize the sentence and check if it's within the limit
+        tokens = generator.tokenizer(sentence).input_ids
+        if len(tokens) + max_tokens_to_generate <= 32768:
+            # Generate text for this chunk
+            response = generator(sentence, max_length=max_tokens_to_generate, **generation_parameters)
+            generated_text.append(response[0]['generated_text'])
+        else:
+            # Handle cases where the sentence is too long
+            # You could split the sentence further or skip it
+            print(f"Sentence too long: {sentence}")
+
+    return ''.join(generated_text)
 
-    stream = client.text_generation(messages, **generate_kwargs, stream=True, details=True, return_full_text=False)
+    formatted_prompt = format_prompt(prompt, history, max_history_turns=5) # Truncated history
+    logging.info(f"Formatted Prompt: {formatted_prompt}")
+    stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
 
     for response in stream:
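
generate_text_chunked above relies on nltk.sent_tokenize and a transformers pipeline, neither of which is imported in this hunk; a sketch of the setup they would need (assumption: the Space does not already bundle the 'punkt' tokenizer data):

    import nltk
    nltk.download("punkt")  # one-time download of the sentence tokenizer data

    from nltk import sent_tokenize
    print(sent_tokenize("First sentence. Second one."))
    # ['First sentence.', 'Second one.']
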
@@ -275,7 +478,8 @@ def project_explorer(path):
     tree = get_file_tree(path)
     display_file_tree(tree)
 
-def chat_app_logic(message, history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model): # Add 'model' as an argument
+def chat_app_logic(message, history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model):
+    # Your existing code here
 
     try:
         # Attempt to join the generator output
@@ -311,41 +515,7 @@ def chat_app_logic(message, history, purpose, agent_name, sys_prompt, temperatur
         max_new_tokens=max_new_tokens,
         top_p=top_p,
         repetition_penalty=repetition_penalty,
-    )
-    try:
-        # Attempt to join the generator output
-        response = ''.join(generate(
-            model=model, # Now you can use 'model' here
-            messages=messages,
-            stream=True,
-            temperature=0.7,
-            max_tokens=1500
-        ))
-    except TypeError:
-        # If joining fails, collect the output in a list
-        response_parts = []
-        for part in generate(
-            model=model, # Now you can use 'model' here
-            messages=messages,
-            stream=True,
-            temperature=0.7,
-            max_tokens=1500
-        ):
-            if isinstance(part, str):
-                response_parts.append(part)
-            elif isinstance(part, dict) and 'content' in part:
-                response_parts.append(part['content']),
-
-        response = ''.join(response_parts,
-        # Run the model and get the response (convert generator to string)
-        prompt=message,
-        history=history,
-        agent_name=agent_name,
-        sys_prompt=sys_prompt,
-        temperature=temperature,
-        max_new_tokens=max_new_tokens,
-        top_p=top_p,
-        repetition_penalty=repetition_penalty,
+        model=model # Pass the model argument here
     )
     history.append((message, response))
     return history
@@ -353,7 +523,6 @@ def chat_app_logic(message, history, purpose, agent_name, sys_prompt, temperatur
         return history
 
 def main():
-
     with gr.Blocks() as demo:
         gr.Markdown("## FragMixt")
         gr.Markdown("### Agents w/ Agents")
@@ -371,6 +540,7 @@ def main():
         max_new_tokens = gr.Slider(label="Max new tokens", value=1048*10, minimum=0, maximum=1048*10, step=64, interactive=True, info="The maximum numbers of new tokens")
         top_p = gr.Slider(label="Top-p (nucleus sampling)", value=0.90, minimum=0.0, maximum=1, step=0.05, interactive=True, info="Higher values sample more low-probability tokens")
         repetition_penalty = gr.Slider(label="Repetition penalty", value=1.2, minimum=1.0, maximum=2.0, step=0.05, interactive=True, info="Penalize repeated tokens")
+        model_input = gr.Textbox(label="Model", value="mistralai/Mixtral-8x7B-Instruct-v0.1", visible=False)
 
         # Button to submit the message
         submit_button = gr.Button(value="Send")
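
The hidden model_input textbox added here is a standard Gradio way to thread a fixed value into event handlers; a self-contained sketch of the pattern (illustrative echo handler, not from this app):

    import gradio as gr

    def echo(message, model):
        return f"[{model}] {message}"

    with gr.Blocks() as demo:
        # visible=False hides the widget, but its value is still passed as an input
        model_box = gr.Textbox(value="mistralai/Mixtral-8x7B-Instruct-v0.1", visible=False)
        msg = gr.Textbox(label="Message")
        out = gr.Textbox(label="Output")
        msg.submit(echo, inputs=[msg, model_box], outputs=out)

    demo.launch()
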
@@ -381,16 +551,15 @@ def main():
         explore_button = gr.Button(value="Explore")
         project_output = gr.Textbox(label="File Tree", lines=20)
 
-    # Chat App Logic Tab
+        # Chat App Logic Tab
         with gr.Tab("Chat App"):
             history = gr.State([])
             for example in examples:
-                gr.Button(value=example[0]).click(lambda: chat_app_logic(example[0], history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model), outputs=chatbot)
+                gr.Button(value=example[0]).click(lambda: chat_app_logic(example[0], history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model=model_input), outputs=chatbot)
 
             # Connect components to the chat app logic
-            submit_button.click(chat_app_logic, inputs=[message, history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model], outputs=chatbot) # Pass 'model'
-            message.submit(chat_app_logic, inputs=[message, history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model], outputs=chatbot) # Pass 'model'
-
+            submit_button.click(chat_app_logic, inputs=[message, history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model_input], outputs=chatbot)
+            message.submit(chat_app_logic, inputs=[message, history, purpose, agent_name, sys_prompt, temperature, max_new_tokens, top_p, repetition_penalty, model_input], outputs=chatbot)
 
         # Connect components to the project explorer
         explore_button.click(project_explorer, inputs=project_path, outputs=project_output)
 