Spaces:
Sleeping
Sleeping
HuggingFaceLLM
Browse files
- backend.py +1 -1
backend.py
CHANGED
@@ -66,7 +66,7 @@ llm = HuggingFaceLLM(
|
|
66 |
model_name=model_id,
|
67 |
device_map="auto",
|
68 |
# change these settings below depending on your GPU
|
69 |
- model_kwargs={"torch_dtype": torch.  [removed line is truncated in this capture]
|
70 |
)
|
71 |
|
72 |
#Settings.llm = GemmaLLMInterface()
|
|
|
66 |
model_name=model_id,
|
67 |
device_map="auto",
|
68 |
# change these settings below depending on your GPU
|
69 |
+ model_kwargs={"torch_dtype": torch.bfloat16, "load_in_8bit": True},
|
70 |
)
|
71 |
|
72 |
#Settings.llm = GemmaLLMInterface()
|