Update configuration_minGRULM.py
Browse files- configuration_minGRULM.py +9 -19
configuration_minGRULM.py
CHANGED
@@ -1,34 +1,24 @@
|
|
1 |
from transformers import PretrainedConfig
|
2 |
|
3 |
class MinGRULMConfig(PretrainedConfig):
|
4 |
-
model_type = "
|
5 |
|
6 |
def __init__(
|
7 |
self,
|
8 |
vocab_size=50257,
|
9 |
-
|
10 |
-
depth=12,
|
11 |
ff_mult=4,
|
12 |
min_gru_expansion=1.5,
|
13 |
-
|
14 |
-
initializer_range=0.02,
|
15 |
pad_vocab_size_multiple=8,
|
|
|
16 |
**kwargs,
|
17 |
):
|
18 |
self.vocab_size = vocab_size
|
19 |
-
self.
|
20 |
-
self.
|
21 |
-
self.
|
22 |
-
self.
|
23 |
-
self.enable_conv = enable_conv # Whether convolution is enabled
|
24 |
-
self.initializer_range = initializer_range
|
25 |
self.pad_vocab_size_multiple = pad_vocab_size_multiple
|
26 |
-
|
27 |
-
# Adjust vocab size to be a multiple of `pad_vocab_size_multiple`
|
28 |
-
if self.vocab_size % self.pad_vocab_size_multiple != 0:
|
29 |
-
self.vocab_size += (
|
30 |
-
self.pad_vocab_size_multiple
|
31 |
-
- self.vocab_size % self.pad_vocab_size_multiple
|
32 |
-
)
|
33 |
-
|
34 |
super().__init__(**kwargs)
|
|
|
1 |
from transformers import PretrainedConfig
|
2 |
|
3 |
class MinGRULMConfig(PretrainedConfig):
    """Configuration container for the minGRU language model.

    Every named constructor argument is stored unchanged as an instance
    attribute of the same name. Any additional keyword arguments are
    forwarded to ``PretrainedConfig.__init__``.

    Args:
        vocab_size: Stored as ``self.vocab_size`` (default 50257). It is
            kept exactly as given; this class does not round it up to a
            multiple of ``pad_vocab_size_multiple``.
        d_model: Stored as ``self.d_model`` (default 512). Presumably the
            model width -- confirm against the modeling code.
        ff_mult: Stored as ``self.ff_mult`` (default 4). Presumably the
            feed-forward width multiplier -- confirm against the modeling
            code.
        min_gru_expansion: Stored as ``self.min_gru_expansion``
            (default 1.5).
        depth: Stored as ``self.depth`` (default 12). Presumably the number
            of layers -- confirm against the modeling code.
        pad_vocab_size_multiple: Stored as ``self.pad_vocab_size_multiple``
            (default 8). Only recorded here; no padding is applied in this
            class.
        initializer_range: Stored as ``self.initializer_range``
            (default 0.02).
        **kwargs: Passed through to ``PretrainedConfig.__init__``.
    """

    model_type = "mingru"

    def __init__(
        self,
        vocab_size=50257,
        d_model=512,
        ff_mult=4,
        min_gru_expansion=1.5,
        depth=12,
        pad_vocab_size_multiple=8,
        initializer_range=0.02,
        **kwargs,
    ):
        self.vocab_size = vocab_size
        self.d_model = d_model
        self.ff_mult = ff_mult
        self.min_gru_expansion = min_gru_expansion
        self.depth = depth
        self.pad_vocab_size_multiple = pad_vocab_size_multiple
        self.initializer_range = initializer_range
        # Model-specific fields are set first; everything else is handed to
        # the base configuration class.
        super().__init__(**kwargs)
|