Spaces:
Runtime error
Runtime error
Roger Condori
committed on
Commit
•
fc80b18
1
Parent(s):
0ce15d3
add description restriction maxtokens app.py
Browse files
app.py
CHANGED
@@ -130,7 +130,7 @@ with gr.Blocks(theme=theme, css=css) as demo:
|
|
130 |
gr.HTML("<h3>Only models from the GGML library are accepted.</h3>")
|
131 |
repo_ = gr.Textbox(label="Repository" ,value="TheBloke/Llama-2-7B-Chat-GGML")
|
132 |
file_ = gr.Textbox(label="File name" ,value="llama-2-7b-chat.ggmlv3.q2_K.bin")
|
133 |
-
max_tokens = gr.inputs.Slider(1, MAX_NEW_TOKENS, default=16, label="Max new tokens", step=1)
|
134 |
temperature = gr.inputs.Slider(0.1, 1., default=0.2, label="Temperature", step=0.1)
|
135 |
top_k = gr.inputs.Slider(0.01, 1., default=0.95, label="Top K", step=0.01)
|
136 |
top_p = gr.inputs.Slider(0, 100, default=50, label="Top P", step=1)
|
|
|
130 |
gr.HTML("<h3>Only models from the GGML library are accepted.</h3>")
|
131 |
repo_ = gr.Textbox(label="Repository" ,value="TheBloke/Llama-2-7B-Chat-GGML")
|
132 |
file_ = gr.Textbox(label="File name" ,value="llama-2-7b-chat.ggmlv3.q2_K.bin")
|
133 |
+
max_tokens = gr.inputs.Slider(1, MAX_NEW_TOKENS, default=16, label="Max new tokens; Limited due to excessively long inference times, use Colab or local to avoid these restrictions.", step=1)
|
134 |
temperature = gr.inputs.Slider(0.1, 1., default=0.2, label="Temperature", step=0.1)
|
135 |
top_k = gr.inputs.Slider(0.01, 1., default=0.95, label="Top K", step=0.01)
|
136 |
top_p = gr.inputs.Slider(0, 100, default=50, label="Top P", step=1)
|