Roger Koranteng committed on
Commit
9c80998
1 Parent(s): 773553c

First model version

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.h5 filter=lfs diff=lfs merge=lfs -text
37
+ *.spm filter=lfs diff=lfs merge=lfs -text
assets/tokenizer/vocabulary.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61a7b147390c64585d6c3543dd6fc636906c9af3865a5548f27f31aee1d4c8e2
3
+ size 4241003
config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.gemma.gemma_backbone",
3
+ "class_name": "GemmaBackbone",
4
+ "config": {
5
+ "name": "gemma_backbone",
6
+ "trainable": true,
7
+ "vocabulary_size": 256000,
8
+ "num_layers": 18,
9
+ "num_query_heads": 8,
10
+ "num_key_value_heads": 1,
11
+ "hidden_dim": 2048,
12
+ "intermediate_dim": 32768,
13
+ "head_dim": 256,
14
+ "layer_norm_epsilon": 1e-06,
15
+ "dropout": 0
16
+ },
17
+ "registered_name": "keras_nlp>GemmaBackbone",
18
+ "assets": [],
19
+ "weights": "model.weights.h5"
20
+ }
metadata.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "keras_version": "3.0.3",
3
+ "keras_nlp_version": "0.7.0",
4
+ "parameter_count": 2506172416,
5
+ "date_saved": "2024-02-06@16:11:29"
6
+ }
model.weights.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ccbc6e4ab56b1d787310db33e06500d2a35688c625ef79d25231b92439b2bf
3
+ size 5013019984
tokenizer.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.gemma.gemma_tokenizer",
3
+ "class_name": "GemmaTokenizer",
4
+ "config": {
5
+ "name": "gemma_tokenizer",
6
+ "trainable": true,
7
+ "dtype": "int32",
8
+ "proto": null,
9
+ "sequence_length": null
10
+ },
11
+ "registered_name": "keras_nlp>GemmaTokenizer",
12
+ "assets": [
13
+ "assets/tokenizer/vocabulary.spm"
14
+ ],
15
+ "weights": null
16
+ }