mastavtsev
committed on
Commit
•
cebfbf0
1
Parent(s):
69156b3
SqueezeBERT model version for course project on CLR and PM
Browse files
This is a variant of the SqueezeBERT model that was trained from scratch for the task of unsupervised anomaly detection in logs of the .NET CLR environment. This model is part of my third-year course project at HSE FCS: https://github.com/mastavtsev/PM_NLP/tree/main
- config.json +28 -0
- model.safetensors +3 -0
- training_args.bin +3 -0
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"SqueezeBertForMaskedLM"
|
4 |
+
],
|
5 |
+
"attention_probs_dropout_prob": 0.1,
|
6 |
+
"embedding_size": 768,
|
7 |
+
"hidden_act": "gelu",
|
8 |
+
"hidden_dropout_prob": 0.1,
|
9 |
+
"hidden_size": 768,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_groups": 4,
|
12 |
+
"intermediate_size": 3072,
|
13 |
+
"k_groups": 4,
|
14 |
+
"layer_norm_eps": 1e-12,
|
15 |
+
"max_position_embeddings": 512,
|
16 |
+
"model_type": "squeezebert",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"output_groups": 4,
|
20 |
+
"pad_token_id": 0,
|
21 |
+
"post_attention_groups": 1,
|
22 |
+
"q_groups": 4,
|
23 |
+
"torch_dtype": "float32",
|
24 |
+
"transformers_version": "4.38.2",
|
25 |
+
"type_vocab_size": 2,
|
26 |
+
"v_groups": 4,
|
27 |
+
"vocab_size": 20000
|
28 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e78c311a87435e9b1089ba862b99393440f56c34887fbfcb21d8de23e07d71dd
|
3 |
+
size 174508672
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30bdd15fab99e68c6c4c82019ea86ca1941c15f607b2b7f263b7b7468a3d0203
|
3 |
+
size 5048
|