Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -16,10 +16,20 @@ import os
|
|
16 |
|
17 |
def http_bot_yield(prompt):
|
18 |
headers = {"User-Agent": "vLLM Client"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
pload = {
|
20 |
-
"prompt": f"
|
21 |
"stream": True,
|
22 |
-
"max_tokens":
|
23 |
"temperature": 0.1
|
24 |
}
|
25 |
response = requests.post(
|
|
|
16 |
|
17 |
def http_bot_yield(prompt):
|
18 |
headers = {"User-Agent": "vLLM Client"}
|
19 |
+
system_message = """
|
20 |
+
Below is an instruction that describes a task. Write a response that appropriately completes the request.
|
21 |
+
"""
|
22 |
+
# pload = {
|
23 |
+
# "prompt": f"<s>[INST] {prompt} [/INST] ",
|
24 |
+
# "stream": True,
|
25 |
+
# "max_tokens": 1024,
|
26 |
+
# "temperature": 0.1
|
27 |
+
# }
|
28 |
+
|
29 |
pload = {
|
30 |
+
"prompt": f"### System:\n{system_message}\n\n\n\n### Instruction:\n{prompt}\n\n### Response:\n",
|
31 |
"stream": True,
|
32 |
+
"max_tokens": 2048,
|
33 |
"temperature": 0.1
|
34 |
}
|
35 |
response = requests.post(
|