underspirit
committed on
Commit
•
ddaa64a
1
Parent(s):
a6d67b5
Update configuration_xverse.py
Browse files
- configuration_xverse.py +1 -1
configuration_xverse.py
CHANGED
@@ -97,7 +97,7 @@ class XverseConfig(PretrainedConfig):
|
|
97 |
Number of shared experts, None for no shared experts.
|
98 |
output_router_logits (`bool`, optional):
|
99 |
Whether or not to return the router logits.
|
100 |
-
router_aux_loss_coef (`float`, *optional*, defaults to 0.
|
101 |
The aux loss factor for the total loss.
|
102 |
Example:
|
103 |
|
|
|
97 |
Number of shared experts, None for no shared experts.
|
98 |
output_router_logits (`bool`, optional):
|
99 |
Whether or not to return the router logits.
|
100 |
+
router_aux_loss_coef (`float`, *optional*, defaults to 0.01):
|
101 |
The aux loss factor for the total loss.
|
102 |
Example:
|
103 |
|