Happzy-WHU committed
Commit 84a6c36
Parent: 6b39623

first commit.

Files changed (4)
  1. README.md +23 -5
  2. V3.py +37 -0
  3. app.py +91 -0
  4. requirements.txt +138 -0
README.md CHANGED
@@ -1,14 +1,32 @@
  ---
  title: Open O1
- emoji: 👁
- colorFrom: gray
- colorTo: green
+ emoji: 💬
+ colorFrom: yellow
+ colorTo: purple
  sdk: gradio
- sdk_version: 4.44.1
+ sdk_version: 4.36.1
  app_file: app.py
  pinned: false
  license: apache-2.0
  short_description: This is an official demo website for open-o1.
  ---

- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+ # open o1 deployment
+
+ 1. Git clone this repository.
+
+ ```shell
+ git clone https://huggingface.co/spaces/happzy2633/open-o1
+ ```
+
+ 2. Install the dependencies listed in requirements.txt.
+
+ 3. Replace the value of the use_auth_token variable with your own (a shell sketch follows this diff).
+
+ 4. Execute the script below.
+
+ ```shell
+ python app.py
+ ```
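For reference, steps 2-3 can also be done from the shell before launching. A minimal sketch, assuming the token is supplied through the `YOUR_AUTH_TOKEN` environment variable that `V3.py` reads (the token value `hf_xxx` is a placeholder):

```shell
# Step 2: install the pinned dependencies
pip install -r requirements.txt

# Step 3: V3.py reads the token via os.getenv("YOUR_AUTH_TOKEN")
export YOUR_AUTH_TOKEN=hf_xxx
```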
V3.py ADDED
@@ -0,0 +1,37 @@
+ import os
+
+ from transformers import AutoTokenizer
+ from vllm import LLM, SamplingParams
+ from huggingface_hub import snapshot_download
+
+ use_auth_token = os.getenv("YOUR_AUTH_TOKEN")
+
+ repo_id = "m-a-p/qwen2.5-7b-ins-v3"
+ local_dir = repo_id.rsplit("/")[-1]
+ snapshot_download(repo_id=repo_id, local_dir=local_dir, use_auth_token=use_auth_token, resume_download=True)
+
+ model_path = "qwen2.5-7b-ins-v3/checkpoint-1000"
+
+ tokenizer = AutoTokenizer.from_pretrained(model_path)
+ sampling_params = SamplingParams(temperature=0.7, top_p=0.8, repetition_penalty=1.05, max_tokens=8192)
+ llm = LLM(model=model_path)
+
+ def api_call_batch(batch_messages):
+     # Render each conversation with the chat template, then generate the whole batch at once.
+     text_list = [
+         tokenizer.apply_chat_template(conversation=messages, tokenize=False, add_generation_prompt=True)
+         for messages in batch_messages
+     ]
+     outputs = llm.generate(text_list, sampling_params)
+     result = [output.outputs[0].text for output in outputs]
+     return result
+
+ def api_call(messages):
+     return api_call_batch([messages])[0]
+
+ def call_gpt(history, prompt):
+     return api_call(history + [{"role": "user", "content": prompt}])
+
+ if __name__ == "__main__":
+     messages = [{"role": "user", "content": "Who are you?"}]
+     print(api_call_batch([messages] * 4))
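`V3.py` exposes `api_call_batch`, `api_call`, and `call_gpt` as the inference entry points. A brief usage sketch (the prompts are illustrative; importing the module loads the checkpoint, so this needs a GPU with vLLM set up):

```python
from V3 import api_call, call_gpt

# Single-turn call: api_call wraps the messages in a one-element batch.
print(api_call([{"role": "user", "content": "Who are you?"}]))

# Multi-turn call: call_gpt appends the new user prompt to an existing history.
history = [{"role": "system", "content": "You are open-o1, a helpful assistant."}]
print(call_gpt(history, "Introduce yourself in one sentence."))
```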
app.py ADDED
@@ -0,0 +1,91 @@
+ import gradio as gr
+ from loguru import logger
+ from V3 import call_gpt
+
+ class Conversation:
+     def __init__(self, max_history_len=10):
+         self.max_history_len = max_history_len
+
+     def pop_history(self, history):
+         while len(history) > self.max_history_len:  # drop the oldest user/assistant pair until the history fits
+             for item in history:
+                 if item["role"] == "user":
+                     history.remove(item)
+                     break
+             for item in history:
+                 if item["role"] == "assistant":
+                     history.remove(item)
+                     break
+         return history
+
+     def ask(self, history, prompt):
+         history = self.pop_history(history)
+         logger.info(history)
+         return call_gpt(history, prompt)
+
+ conv = Conversation()
+
+ def make_history(system_prompt, qa_list):
+     history = [{"role": "system", "content": system_prompt}]
+     for q, a in qa_list:
+         history.append({"role": "user", "content": q})
+         history.append({"role": "assistant", "content": a})
+     return history
+
+ def answer(system_prompt, prompt, history=[]):  # the mutable default is never shared: gr.State always supplies history
+     history.append(prompt)
+     qa_list = [(u, b) for u, b in zip(history[::2], history[1::2])]
+     message = conv.ask(make_history(system_prompt, qa_list), prompt)
+
+     # Escape backticks in the model output
+     message = message.replace("`", "\\`")
+
+     # Wrap the reply in a code block
+     message = f"```\n{message}\n```"
+
+     history.append(message)
+
+     chatbot_messages = []
+     for q, a in qa_list:
+         chatbot_messages.append((q, a))
+
+     chatbot_messages.append((prompt, message))
+
+     return "", chatbot_messages, history
+
+ def clear_history(state):
+     state.clear()
+     return state, []
+
+ with gr.Blocks(css="#chatbot{height:500px} .overflow-y-auto{height:500px}") as rxbot:
+     with gr.Row():
+         sys = gr.Textbox(show_label=False, value="You are open-o1, a helpful assistant.")
+     chatbot = gr.Chatbot()
+     state = gr.State([])
+
+     with gr.Row():
+         txt = gr.Textbox(show_label=False, placeholder="Please enter your question", max_lines=8)
+
+     with gr.Row():
+         clear_button = gr.Button("🧹Clear History")
+         send_button = gr.Button("🚀Send")
+
+     send_button.click(
+         fn=answer,
+         inputs=[sys, txt, state],
+         outputs=[txt, chatbot, state]
+     )
+
+     txt.submit(
+         fn=answer,
+         inputs=[sys, txt, state],
+         outputs=[txt, chatbot, state]
+     )
+
+     clear_button.click(
+         fn=clear_history,
+         inputs=[state],
+         outputs=[state, chatbot]
+     )
+
+ rxbot.launch()
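One subtlety in `answer`: the Gradio `state` is a flat list of alternating user/assistant strings, and the `zip` pairing deliberately drops the trailing prompt that has no answer yet. A minimal illustration of that pairing:

```python
# state after one full exchange, plus a fresh prompt appended by answer()
history = ["Hi", "Hello!", "What is open-o1?"]

# Pair even-indexed (user) with odd-indexed (assistant) entries;
# zip stops at the shorter list, so the unanswered prompt is excluded.
qa_list = [(u, b) for u, b in zip(history[::2], history[1::2])]
assert qa_list == [("Hi", "Hello!")]
```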
requirements.txt ADDED
@@ -0,0 +1,138 @@
+ aiofiles==23.2.1
+ aiohappyeyeballs==2.3.6
+ aiohttp==3.10.3
+ aiosignal==1.3.1
+ annotated-types==0.7.0
+ anyio==4.4.0
+ async-timeout==4.0.3
+ attrs==24.2.0
+ blinker==1.8.2
+ certifi==2024.7.4
+ charset-normalizer==3.3.2
+ click==8.1.7
+ cloudpickle==3.0.0
+ cmake==3.30.2
+ contourpy==1.3.0
+ cycler==0.12.1
+ datasets==2.21.0
+ dill==0.3.8
+ diskcache==5.6.3
+ distro==1.9.0
+ exceptiongroup==1.2.2
+ fastapi==0.112.1
+ ffmpy==0.4.0
+ filelock==3.15.4
+ Flask==3.0.3
+ Flask-Cors==4.0.1
+ fonttools==4.54.1
+ frozenlist==1.4.1
+ fsspec==2024.6.1
+ gradio==4.44.1
+ gradio_client==1.3.0
+ h11==0.14.0
+ httpcore==1.0.5
+ httptools==0.6.1
+ httpx==0.27.0
+ huggingface-hub==0.24.5
+ idna==3.7
+ importlib_resources==6.4.5
+ interegular==0.3.3
+ itsdangerous==2.2.0
+ Jinja2==3.1.4
+ jiter==0.5.0
+ jsonschema==4.23.0
+ jsonschema-specifications==2023.12.1
+ kiwisolver==1.4.7
+ lark==1.2.2
+ llvmlite==0.43.0
+ lm-format-enforcer==0.10.3
+ loguru==0.7.2
+ markdown-it-py==3.0.0
+ MarkupSafe==2.1.5
+ matplotlib==3.9.2
+ mdurl==0.1.2
+ mpmath==1.3.0
+ msgpack==1.0.8
+ multidict==6.0.5
+ multiprocess==0.70.16
+ nest-asyncio==1.6.0
+ networkx==3.3
+ ninja==1.11.1.1
+ numba==0.60.0
+ numpy==1.26.4
+ nvidia-cublas-cu12==12.1.3.1
+ nvidia-cuda-cupti-cu12==12.1.105
+ nvidia-cuda-nvrtc-cu12==12.1.105
+ nvidia-cuda-runtime-cu12==12.1.105
+ nvidia-cudnn-cu12==9.1.0.70
+ nvidia-cufft-cu12==11.0.2.54
+ nvidia-curand-cu12==10.3.2.106
+ nvidia-cusolver-cu12==11.4.5.107
+ nvidia-cusparse-cu12==12.1.0.106
+ nvidia-ml-py==12.560.30
+ nvidia-nccl-cu12==2.20.5
+ nvidia-nvjitlink-cu12==12.6.20
+ nvidia-nvtx-cu12==12.1.105
+ openai==1.40.8
+ orjson==3.10.7
+ outlines==0.0.46
+ packaging==24.1
+ pandas==2.2.2
+ pillow==10.4.0
+ prometheus-fastapi-instrumentator==7.0.0
+ prometheus_client==0.20.0
+ protobuf==5.27.3
+ psutil==6.0.0
+ py-cpuinfo==9.0.0
+ pyairports==2.1.1
+ pyarrow==17.0.0
+ pycountry==24.6.1
+ pydantic==2.8.2
+ pydantic_core==2.20.1
+ pydub==0.25.1
+ pyext==0.7
+ Pygments==2.18.0
+ pyparsing==3.1.4
+ python-dateutil==2.9.0.post0
+ python-dotenv==1.0.1
+ python-multipart==0.0.12
+ pytz==2024.1
+ PyYAML==6.0.2
+ pyzmq==26.1.0
+ ray==2.34.0
+ referencing==0.35.1
+ regex==2024.7.24
+ requests==2.32.3
+ rich==13.9.1
+ rpds-py==0.20.0
+ ruff==0.6.8
+ safetensors==0.4.4
+ semantic-version==2.10.0
+ sentencepiece==0.2.0
+ shellingham==1.5.4
+ six==1.16.0
+ sniffio==1.3.1
+ starlette==0.38.2
+ sympy==1.13.2
+ tiktoken==0.7.0
+ tokenizers==0.19.1
+ tomlkit==0.12.0
+ torch==2.4.0
+ torchvision==0.19.0
+ tqdm==4.66.5
+ transformers==4.44.0
+ triton==3.0.0
+ typer==0.12.5
+ typing_extensions==4.12.2
+ tzdata==2024.1
+ urllib3==2.2.2
+ uvicorn==0.30.6
+ uvloop==0.20.0
+ vllm==0.5.4
+ vllm-flash-attn==2.6.1
+ watchfiles==0.23.0
+ websockets==12.0
+ Werkzeug==3.0.3
+ xformers==0.0.27.post2
+ xxhash==3.4.1
+ yarl==1.9.4