bzantium committed on
Commit
634c1d1
·
verified ·
1 Parent(s): 0840cea

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -23,7 +23,7 @@
23
  "model_type": "deepseek_v3",
24
  "moe_intermediate_size": 2048,
25
  "moe_layer_freq": 1,
26
- "n_group": 8,
27
  "n_routed_experts": 8,
28
  "n_shared_experts": 1,
29
  "norm_topk_prob": true,
@@ -51,7 +51,7 @@
51
  "scoring_func": "sigmoid",
52
  "seq_aux": true,
53
  "tie_word_embeddings": false,
54
- "topk_group": 4,
55
  "topk_method": "noaux_tc",
56
  "torch_dtype": "bfloat16",
57
  "transformers_version": "4.49.0.dev0",
 
23
  "model_type": "deepseek_v3",
24
  "moe_intermediate_size": 2048,
25
  "moe_layer_freq": 1,
26
+ "n_group": 2,
27
  "n_routed_experts": 8,
28
  "n_shared_experts": 1,
29
  "norm_topk_prob": true,
 
51
  "scoring_func": "sigmoid",
52
  "seq_aux": true,
53
  "tie_word_embeddings": false,
54
+ "topk_group": 2,
55
  "topk_method": "noaux_tc",
56
  "torch_dtype": "bfloat16",
57
  "transformers_version": "4.49.0.dev0",