mirror of
https://github.com/jingyaogong/minimind.git
synced 2026-05-01 19:58:15 +08:00
[fix] reduce aux_loss_alpha
This commit is contained in:
parent
5e1447b913
commit
ecd1ae1563
@@ -34,7 +34,7 @@ class MiniMindConfig(PretrainedConfig):
|
||||
n_routed_experts: int = 4,
|
||||
n_shared_experts: int = 1,
|
||||
scoring_func: str = 'softmax',
|
||||
- aux_loss_alpha: float = 0.1,
|
||||
+ aux_loss_alpha: float = 0.01,
|
||||
seq_aux: bool = True,
|
||||
norm_topk_prob: bool = True,
|
||||
**kwargs
|
||||
|
||||
Loading…
Reference in New Issue
Block a user