Update README.md
Browse files
README.md
CHANGED
@@ -184,6 +184,8 @@ model = AutoModel.from_pretrained(
|
|
184 |
low_cpu_mem_usage=True,
|
185 |
trust_remote_code=True).eval().cuda()
|
186 |
# Otherwise, you need to set device_map='auto' to use multiple GPUs for inference.
|
|
|
|
|
187 |
# model = AutoModel.from_pretrained(
|
188 |
# path,
|
189 |
# torch_dtype=torch.bfloat16,
|
|
|
184 |
low_cpu_mem_usage=True,
|
185 |
trust_remote_code=True).eval().cuda()
|
186 |
# Otherwise, you need to set device_map='auto' to use multiple GPUs for inference.
|
187 |
+
# import os
|
188 |
+
# os.environ["CUDA_LAUNCH_BLOCKING"] = "1"
|
189 |
# model = AutoModel.from_pretrained(
|
190 |
# path,
|
191 |
# torch_dtype=torch.bfloat16,
|