mrfakename committed on
Commit
bd743d7
·
verified ·
1 Parent(s): 1c7a2ee

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -25,7 +25,7 @@ model = AutoModelForCausalLM.from_pretrained(
25
  device_map="cuda",
26
  trust_remote_code=True,
27
  torch_dtype="auto",
28
- _attn_implementation='flash_attention_2',
29
  load_in_4bit=True # Optional: Load model in 4-bit mode to save memory
30
  )
31
 
 
25
  device_map="cuda",
26
  trust_remote_code=True,
27
  torch_dtype="auto",
28
+ # _attn_implementation='flash_attention_2',
29
  load_in_4bit=True # Optional: Load model in 4-bit mode to save memory
30
  )
31