Spaces:

microsoft
/

MInference

Running on Zero

iofu728 committed on Jul 7, 2024

Commit

6c68933

1 Parent(s): 38dd464

Feature(MInference): add zeroGPU

Files changed (1) hide show

app.py CHANGED Viewed

@@ -73,7 +73,7 @@ if torch.cuda.is_available() and _is_package_available("pycuda"):
 terminators = [tokenizer.eos_token_id, tokenizer.convert_tokens_to_ids("<|eot_id|>")]
-# @spaces.GPU(duration=120)
 def chat_llama3_8b(
     message: str, history: list, temperature: float, max_new_tokens: int
 ) -> str:

 terminators = [tokenizer.eos_token_id, tokenizer.convert_tokens_to_ids("<|eot_id|>")]
+@spaces.GPU(duration=120)
 def chat_llama3_8b(
     message: str, history: list, temperature: float, max_new_tokens: int
 ) -> str: