Update app.py
Browse files
app.py
CHANGED
@@ -444,7 +444,7 @@ def generate_text (prompt, chatbot, history, rag_option, model_option, openai_ap
|
|
444 |
print("HF Anfrage.......................")
|
445 |
model_kwargs={"temperature": 0.5, "max_length": 512, "num_return_sequences": 1, "top_k": top_k, "top_p": top_p, "repetition_penalty": repetition_penalty}
|
446 |
#llm = HuggingFaceHub(repo_id=repo_id, model_kwargs=model_kwargs)
|
447 |
-
llm =
|
448 |
#llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
|
449 |
#llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
|
450 |
print("HF")
|
|
|
444 |
print("HF Anfrage.......................")
|
445 |
model_kwargs={"temperature": 0.5, "max_length": 512, "num_return_sequences": 1, "top_k": top_k, "top_p": top_p, "repetition_penalty": repetition_penalty}
|
446 |
#llm = HuggingFaceHub(repo_id=repo_id, model_kwargs=model_kwargs)
|
447 |
+
llm = HuggingFaceHub(model=MODEL_NAME_HF, model_kwargs={"temperature": 0.5, "max_length": 128})
|
448 |
#llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
|
449 |
#llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
|
450 |
print("HF")
|