maykcaldas committed on
Commit
ddb037c
·
1 Parent(s): 24ddeaf

Upload FlaxBertForPreTraining

Browse files
Files changed (2) hide show
  1. config.json +3 -3
  2. flax_model.msgpack +2 -2
config.json CHANGED
@@ -4,11 +4,11 @@
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
- "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
- "hidden_size": 2048,
10
  "initializer_range": 0.02,
11
- "intermediate_size": 1024,
12
  "layer_norm_eps": 1e-12,
13
  "max_position_embeddings": 512,
14
  "model_type": "bert",
 
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
+ "hidden_act": "swish",
8
  "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 512,
10
  "initializer_range": 0.02,
11
+ "intermediate_size": 256,
12
  "layer_norm_eps": 1e-12,
13
  "max_position_embeddings": 512,
14
  "model_type": "bert",
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6e537fe06ce6550c7613f73852e6118948327fee87eaf6cf44b91b9bc52b542
3
- size 545494790
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e5d438a3bbf1e3f2fe6cabda05870763b5087f4ad0637ce11446559a7631fed
3
+ size 35714822