oz1115 committed
Commit b878a39 · verified · 1 Parent(s): a0415e1

Upload GemmaForCausalLM

Files changed (3):
  1. config.json +3 -1
  2. generation_config.json +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -9,6 +9,7 @@
   "eos_token_id": 1,
   "head_dim": 256,
   "hidden_act": "gelu",
+  "hidden_activation": "gelu_pytorch_tanh",
   "hidden_size": 2048,
   "initializer_range": 0.02,
   "intermediate_size": 16384,
@@ -22,6 +23,7 @@
   "_load_in_4bit": true,
   "_load_in_8bit": false,
   "bnb_4bit_compute_dtype": "float16",
+  "bnb_4bit_quant_storage": "uint8",
   "bnb_4bit_quant_type": "nf4",
   "bnb_4bit_use_double_quant": false,
   "llm_int8_enable_fp32_cpu_offload": false,
@@ -36,7 +38,7 @@
   "rope_scaling": null,
   "rope_theta": 10000.0,
   "torch_dtype": "float16",
-  "transformers_version": "4.38.2",
+  "transformers_version": "4.43.4",
   "use_cache": true,
   "vocab_size": 256000
 }
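
The added "hidden_activation" key is the field newer transformers releases read for Gemma's activation, and the added "bnb_4bit_quant_storage" key plus the version bump indicate the checkpoint was re-saved with a transformers release from the 4.39+ line. A minimal loading sketch, assuming the transformers and bitsandbytes packages are installed; the repo id is a placeholder, since the commit page does not show the repository name:

# Sketch: load this 4-bit checkpoint, mirroring the quantization_config
# fields shown in the config.json diff above.
import torch
from transformers import AutoModelForCausalLM, BitsAndBytesConfig

bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,                     # "_load_in_4bit": true
    bnb_4bit_quant_type="nf4",             # "bnb_4bit_quant_type": "nf4"
    bnb_4bit_compute_dtype=torch.float16,  # "bnb_4bit_compute_dtype": "float16"
    bnb_4bit_use_double_quant=False,       # "bnb_4bit_use_double_quant": false
    bnb_4bit_quant_storage=torch.uint8,    # "bnb_4bit_quant_storage": "uint8"
)

# "oz1115/<repo-id>" is hypothetical; substitute the actual repository name.
model = AutoModelForCausalLM.from_pretrained(
    "oz1115/<repo-id>",
    quantization_config=bnb_config,
)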
generation_config.json CHANGED
@@ -3,5 +3,5 @@
   "bos_token_id": 2,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.38.2"
+  "transformers_version": "4.43.4"
 }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d54ff6fe08a88d60a94f4a0bb819b4d9c45be052854411605c6092207c220f97
+oid sha256:75a9ba07b3f54ecd552a161571f680fe11cfa9430ac17cc20f26c4533194c0e8
 size 2163577968
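
The weights file is stored via Git LFS, so the diff only changes the pointer (the sha256 oid) while the size stays the same, meaning the tensors were re-saved rather than resized. A small sketch, assuming model.safetensors has been downloaded to the working directory, for checking it against the new pointer:

# Sketch: verify a downloaded model.safetensors against the LFS pointer above.
import hashlib

EXPECTED_OID = "75a9ba07b3f54ecd552a161571f680fe11cfa9430ac17cc20f26c4533194c0e8"
EXPECTED_SIZE = 2163577968

h = hashlib.sha256()
size = 0
with open("model.safetensors", "rb") as f:
    # Hash in 1 MiB chunks to avoid loading the ~2 GB file into memory.
    for chunk in iter(lambda: f.read(1 << 20), b""):
        h.update(chunk)
        size += len(chunk)

assert size == EXPECTED_SIZE, f"size mismatch: {size}"
assert h.hexdigest() == EXPECTED_OID, "sha256 mismatch"
print("model.safetensors matches the LFS pointer")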