zhouzaida
committed on
Commit
·
31d002c
1
Parent(s):
14b9a5a
set alpha
Browse files
- modeling_kimi_vl.py +1 -0
modeling_kimi_vl.py
CHANGED
@@ -904,6 +904,7 @@ class MoEGate(nn.Module):
|
|
904 |
self.n_routed_experts = config.n_routed_experts
|
905 |
self.routed_scaling_factor = config.routed_scaling_factor
|
906 |
self.scoring_func = config.scoring_func
|
|
|
907 |
self.seq_aux = config.seq_aux
|
908 |
self.topk_method = config.topk_method
|
909 |
self.n_group = config.n_group
|
|
|
904 |
self.n_routed_experts = config.n_routed_experts
|
905 |
self.routed_scaling_factor = config.routed_scaling_factor
|
906 |
self.scoring_func = config.scoring_func
|
907 |
+
self.alpha = config.aux_loss_alpha
|
908 |
self.seq_aux = config.seq_aux
|
909 |
self.topk_method = config.topk_method
|
910 |
self.n_group = config.n_group
|