suayptalha committed on
Commit
1746bec
·
verified ·
1 Parent(s): d8426d7

Update configuration_minGRULM.py

Browse files
Files changed (1) hide show
  1. configuration_minGRULM.py +9 -19
configuration_minGRULM.py CHANGED
@@ -1,34 +1,24 @@
1
  from transformers import PretrainedConfig
2
 
3
  class MinGRULMConfig(PretrainedConfig):
4
- model_type = "mingru_lm" # Model type for registration in the Transformers library
5
 
6
  def __init__(
7
  self,
8
  vocab_size=50257,
9
- dim=512,
10
- depth=12,
11
  ff_mult=4,
12
  min_gru_expansion=1.5,
13
- enable_conv=False,
14
- initializer_range=0.02,
15
  pad_vocab_size_multiple=8,
 
16
  **kwargs,
17
  ):
18
  self.vocab_size = vocab_size
19
- self.dim = dim # Dimension of embeddings
20
- self.depth = depth # Number of layers
21
- self.ff_mult = ff_mult # Feed-forward multiplier
22
- self.min_gru_expansion = min_gru_expansion # Expansion factor for minGRU
23
- self.enable_conv = enable_conv # Whether convolution is enabled
24
- self.initializer_range = initializer_range
25
  self.pad_vocab_size_multiple = pad_vocab_size_multiple
26
-
27
- # Adjust vocab size to be a multiple of `pad_vocab_size_multiple`
28
- if self.vocab_size % self.pad_vocab_size_multiple != 0:
29
- self.vocab_size += (
30
- self.pad_vocab_size_multiple
31
- - self.vocab_size % self.pad_vocab_size_multiple
32
- )
33
-
34
  super().__init__(**kwargs)
 
1
  from transformers import PretrainedConfig
2
 
3
  class MinGRULMConfig(PretrainedConfig):
4
+ model_type = "mingru"
5
 
6
  def __init__(
7
  self,
8
  vocab_size=50257,
9
+ d_model=512, # Added 'd_model' here
 
10
  ff_mult=4,
11
  min_gru_expansion=1.5,
12
+ depth=12,
 
13
  pad_vocab_size_multiple=8,
14
+ initializer_range=0.02,
15
  **kwargs,
16
  ):
17
  self.vocab_size = vocab_size
18
+ self.d_model = d_model # Added the 'd_model' parameter here
19
+ self.ff_mult = ff_mult
20
+ self.min_gru_expansion = min_gru_expansion
21
+ self.depth = depth
 
 
22
  self.pad_vocab_size_multiple = pad_vocab_size_multiple
23
+ self.initializer_range = initializer_range
 
 
 
 
 
 
 
24
  super().__init__(**kwargs)