BramVanroy Rijgersberg committed on
Commit
04c2cc1
1 Parent(s): c071dea

Load model in bfloat16 (#2)

Browse files

- Load model in bfloat16 (2ee99b8b877e3e8442a123ea40045f11815cbc9a)


Co-authored-by: Edwin Rijgersberg <Rijgersberg@users.noreply.huggingface.co>

Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -17,7 +17,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "8192"))
17
 
18
  model_id = "BramVanroy/fietje-2b-chat"
19
  avatar_url = "https://huggingface.co/spaces/BramVanroy/fietje-2b/resolve/main/img/fietje-2b-avatar.png"
20
- model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
21
  tokenizer = AutoTokenizer.from_pretrained(model_id)
22
  tokenizer.pad_token_id = tokenizer.eos_token_id
23
 
 
17
 
18
  model_id = "BramVanroy/fietje-2b-chat"
19
  avatar_url = "https://huggingface.co/spaces/BramVanroy/fietje-2b/resolve/main/img/fietje-2b-avatar.png"
20
+ model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16, device_map="auto")
21
  tokenizer = AutoTokenizer.from_pretrained(model_id)
22
  tokenizer.pad_token_id = tokenizer.eos_token_id
23