|
{ |
|
"metadata": { |
|
"total_size": 107060958208 |
|
}, |
|
"weight_map": { |
|
"model.embed_tokens.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.0.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.0.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.0.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.1.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.2.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.3.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.4.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.5.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.6.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.input_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.down_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.down_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.gate_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.gate_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.up_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.up_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.post_attention_layernorm.weight": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.k_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.k_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.o_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.o_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.q_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.q_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.v_proj.suh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.v_proj.svh": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.down_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.gate_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.mlp.up_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.k_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.o_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.q_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.7.self_attn.v_proj.trellis": "model-00001-of-00015.safetensors", |
|
"model.layers.8.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.8.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.8.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.13.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.14.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.15.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.16.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.17.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.24.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.input_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.down_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.down_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.gate_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.gate_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.up_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.up_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.post_attention_layernorm.weight": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.k_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.k_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.o_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.o_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.q_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.q_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.v_proj.suh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.v_proj.svh": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.down_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.gate_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.mlp.up_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.k_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.o_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.q_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.25.self_attn.v_proj.trellis": "model-00002-of-00015.safetensors", |
|
"model.layers.26.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.26.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.26.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.32.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.33.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.34.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.35.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.39.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.40.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.input_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.k_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.k_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.o_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.o_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.q_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.q_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.v_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.v_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.k_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.o_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.q_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.41.self_attn.v_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.down_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.down_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.gate_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.gate_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.up_proj.suh": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.up_proj.svh": "model-00003-of-00015.safetensors", |
|
"model.layers.42.post_attention_layernorm.weight": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.down_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.gate_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.42.mlp.up_proj.trellis": "model-00003-of-00015.safetensors", |
|
"model.layers.43.input_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.down_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.down_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.gate_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.gate_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.up_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.up_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.post_attention_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.k_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.k_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.o_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.o_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.q_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.q_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.v_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.v_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.down_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.gate_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.43.mlp.up_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.k_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.o_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.q_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.43.self_attn.v_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.down_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.down_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.gate_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.gate_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.up_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.up_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.44.post_attention_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.down_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.gate_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.44.mlp.up_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.input_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.down_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.down_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.gate_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.gate_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.up_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.up_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.post_attention_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.k_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.k_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.o_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.o_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.q_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.q_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.v_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.v_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.down_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.gate_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.mlp.up_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.k_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.o_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.q_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.50.self_attn.v_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.input_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.down_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.down_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.gate_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.gate_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.up_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.up_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.post_attention_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.k_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.k_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.o_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.o_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.q_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.q_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.v_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.v_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.down_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.gate_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.mlp.up_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.k_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.o_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.q_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.51.self_attn.v_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.input_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.down_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.down_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.gate_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.gate_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.up_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.up_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.post_attention_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.k_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.k_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.o_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.o_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.q_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.q_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.v_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.v_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.down_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.gate_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.mlp.up_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.k_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.o_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.q_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.52.self_attn.v_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.input_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.down_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.down_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.gate_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.gate_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.up_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.up_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.post_attention_layernorm.weight": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.k_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.k_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.o_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.o_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.q_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.q_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.v_proj.suh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.v_proj.svh": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.down_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.gate_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.mlp.up_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.k_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.o_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.q_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.53.self_attn.v_proj.trellis": "model-00004-of-00015.safetensors", |
|
"model.layers.59.input_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.down_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.down_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.gate_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.gate_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.up_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.up_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.post_attention_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.k_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.k_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.o_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.o_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.q_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.q_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.v_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.v_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.down_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.gate_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.59.mlp.up_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.k_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.o_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.q_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.59.self_attn.v_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.input_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.down_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.down_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.gate_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.gate_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.up_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.up_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.post_attention_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.k_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.k_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.o_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.o_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.q_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.q_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.v_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.v_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.down_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.gate_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.mlp.up_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.k_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.o_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.q_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.60.self_attn.v_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.input_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.down_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.down_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.gate_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.gate_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.up_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.up_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.post_attention_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.k_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.k_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.o_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.o_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.q_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.q_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.v_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.v_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.down_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.gate_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.mlp.up_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.k_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.o_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.q_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.61.self_attn.v_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.input_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.down_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.down_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.gate_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.gate_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.up_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.up_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.post_attention_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.k_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.k_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.o_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.o_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.q_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.q_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.v_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.v_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.down_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.gate_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.mlp.up_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.k_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.o_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.q_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.62.self_attn.v_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.input_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.down_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.down_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.gate_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.gate_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.up_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.up_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.post_attention_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.k_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.k_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.o_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.o_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.q_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.q_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.v_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.v_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.down_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.gate_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.mlp.up_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.k_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.o_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.q_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.68.self_attn.v_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.input_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.down_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.down_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.gate_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.gate_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.up_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.up_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.post_attention_layernorm.weight": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.k_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.k_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.o_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.o_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.q_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.q_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.v_proj.suh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.v_proj.svh": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.down_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.gate_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.mlp.up_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.k_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.o_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.q_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.69.self_attn.v_proj.trellis": "model-00005-of-00015.safetensors", |
|
"model.layers.70.input_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.down_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.down_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.gate_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.gate_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.up_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.up_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.post_attention_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.k_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.k_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.o_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.o_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.q_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.q_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.v_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.v_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.down_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.gate_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.70.mlp.up_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.k_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.o_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.q_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.70.self_attn.v_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.input_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.down_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.down_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.gate_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.gate_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.up_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.up_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.post_attention_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.k_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.k_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.o_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.o_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.q_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.q_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.v_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.v_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.down_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.gate_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.mlp.up_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.k_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.o_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.q_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.71.self_attn.v_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.input_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.down_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.down_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.gate_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.gate_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.up_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.up_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.post_attention_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.k_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.k_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.o_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.o_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.q_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.q_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.v_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.v_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.down_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.gate_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.mlp.up_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.k_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.o_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.q_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.77.self_attn.v_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.input_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.down_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.down_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.gate_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.gate_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.up_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.up_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.post_attention_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.k_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.k_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.o_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.o_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.q_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.q_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.v_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.v_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.down_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.gate_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.mlp.up_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.k_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.o_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.q_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.78.self_attn.v_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.input_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.down_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.down_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.gate_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.gate_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.up_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.up_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.post_attention_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.k_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.k_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.o_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.o_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.q_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.q_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.v_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.v_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.down_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.gate_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.mlp.up_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.k_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.o_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.q_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.79.self_attn.v_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.input_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.down_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.down_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.gate_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.gate_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.up_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.up_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.post_attention_layernorm.weight": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.k_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.k_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.o_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.o_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.q_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.q_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.v_proj.suh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.v_proj.svh": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.down_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.gate_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.mlp.up_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.k_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.o_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.q_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.80.self_attn.v_proj.trellis": "model-00006-of-00015.safetensors", |
|
"model.layers.86.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.86.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.86.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.87.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.88.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.89.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.92.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.93.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.94.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.input_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.k_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.k_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.o_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.o_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.q_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.q_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.v_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.v_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.k_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.o_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.q_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.95.self_attn.v_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.96.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.96.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.down_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.down_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.gate_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.gate_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.up_proj.suh": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.up_proj.svh": "model-00007-of-00015.safetensors", |
|
"model.layers.97.post_attention_layernorm.weight": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.down_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.gate_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.97.mlp.up_proj.trellis": "model-00007-of-00015.safetensors", |
|
"model.layers.98.input_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.k_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.k_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.o_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.o_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.q_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.q_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.v_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.v_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.98.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.k_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.o_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.q_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.98.self_attn.v_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.100.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.100.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.101.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.101.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.102.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.102.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.103.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.103.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.104.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.104.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.105.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.105.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.106.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.106.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.input_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.k_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.k_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.o_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.o_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.q_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.q_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.v_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.v_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.k_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.o_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.q_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.107.self_attn.v_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.input_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.k_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.k_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.o_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.o_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.q_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.q_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.v_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.v_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.k_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.o_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.q_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.113.self_attn.v_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.input_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.k_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.k_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.o_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.o_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.q_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.q_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.v_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.v_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.k_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.o_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.q_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.114.self_attn.v_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.down_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.down_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.gate_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.gate_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.up_proj.suh": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.up_proj.svh": "model-00008-of-00015.safetensors", |
|
"model.layers.115.post_attention_layernorm.weight": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.down_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.gate_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.115.mlp.up_proj.trellis": "model-00008-of-00015.safetensors", |
|
"model.layers.116.input_layernorm.weight": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.down_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.down_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.gate_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.gate_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.up_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.up_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.post_attention_layernorm.weight": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.k_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.k_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.o_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.o_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.q_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.q_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.v_proj.suh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.v_proj.svh": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.down_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.gate_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.116.mlp.up_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.k_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.o_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.q_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.116.self_attn.v_proj.trellis": "model-00009-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.0.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.0.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.1.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.1.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.2.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.2.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.3.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.3.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.4.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.4.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.5.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.5.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.6.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.6.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.7.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.7.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.0.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.0.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.1.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.1.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.2.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.2.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.3.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.3.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.4.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.4.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.5.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.5.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.6.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.6.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.7.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.7.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.0.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.0.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.1.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.1.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.2.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.2.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.3.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.3.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.4.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.4.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.5.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.5.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.6.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.6.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.7.suh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.7.svh": "model-00010-of-00015.safetensors", |
|
"model.layers.125.post_attention_layernorm.weight": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.0.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.1.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.2.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.3.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.4.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.5.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.6.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.down_proj.slice.7.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.0.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.1.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.2.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.3.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.4.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.5.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.6.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.gate_proj.slice.7.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.0.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.1.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.2.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.3.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.4.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.5.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.6.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.125.mlp.up_proj.slice.7.trellis": "model-00010-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.0.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.0.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.1.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.1.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.2.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.2.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.3.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.3.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.4.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.4.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.5.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.5.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.6.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.6.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.7.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.7.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.0.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.0.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.1.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.1.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.2.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.2.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.3.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.3.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.4.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.4.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.5.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.5.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.6.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.6.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.7.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.7.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.0.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.0.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.1.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.1.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.2.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.2.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.3.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.3.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.4.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.4.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.5.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.5.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.6.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.6.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.7.suh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.7.svh": "model-00011-of-00015.safetensors", |
|
"model.layers.134.post_attention_layernorm.weight": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.0.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.1.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.2.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.3.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.4.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.5.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.6.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.down_proj.slice.7.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.0.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.1.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.2.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.3.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.4.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.5.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.6.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.gate_proj.slice.7.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.0.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.1.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.2.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.3.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.4.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.5.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.6.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.134.mlp.up_proj.slice.7.trellis": "model-00011-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.0.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.0.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.1.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.1.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.2.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.2.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.3.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.3.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.4.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.4.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.5.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.5.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.6.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.6.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.0.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.0.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.1.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.1.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.2.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.2.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.3.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.3.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.4.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.4.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.5.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.5.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.6.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.6.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.0.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.0.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.1.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.1.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.2.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.2.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.3.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.3.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.4.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.4.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.5.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.5.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.6.suh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.6.svh": "model-00012-of-00015.safetensors", |
|
"model.layers.143.post_attention_layernorm.weight": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.0.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.1.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.2.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.3.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.4.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.5.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.down_proj.slice.6.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.0.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.1.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.2.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.3.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.4.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.5.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.gate_proj.slice.6.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.0.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.1.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.2.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.3.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.4.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.5.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.143.mlp.up_proj.slice.6.trellis": "model-00012-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.0.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.0.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.1.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.1.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.2.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.2.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.3.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.3.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.4.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.4.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.5.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.5.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.0.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.0.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.1.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.1.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.2.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.2.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.3.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.3.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.4.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.4.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.5.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.5.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.0.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.0.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.1.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.1.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.2.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.2.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.3.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.3.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.4.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.4.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.5.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.5.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.149.post_attention_layernorm.weight": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.0.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.1.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.2.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.3.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.4.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.down_proj.slice.5.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.0.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.1.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.2.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.3.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.4.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.gate_proj.slice.5.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.0.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.1.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.2.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.3.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.4.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.149.mlp.up_proj.slice.5.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.down_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.down_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.gate_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.gate_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.up_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.up_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.150.post_attention_layernorm.weight": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.down_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.gate_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.150.mlp.up_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.input_layernorm.weight": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.down_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.down_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.gate_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.gate_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.up_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.up_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.post_attention_layernorm.weight": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.k_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.k_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.o_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.o_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.q_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.q_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.v_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.v_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.down_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.gate_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.mlp.up_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.k_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.o_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.q_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.151.self_attn.v_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.input_layernorm.weight": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.down_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.down_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.gate_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.gate_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.up_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.up_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.post_attention_layernorm.weight": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.k_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.k_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.o_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.o_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.q_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.q_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.v_proj.suh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.v_proj.svh": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.down_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.gate_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.mlp.up_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.k_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.o_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.q_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.152.self_attn.v_proj.trellis": "model-00013-of-00015.safetensors", |
|
"model.layers.154.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.154.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.154.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.155.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.156.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.157.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.158.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.159.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.160.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.input_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.down_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.down_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.gate_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.gate_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.up_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.up_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.post_attention_layernorm.weight": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.k_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.k_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.o_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.o_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.q_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.q_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.v_proj.suh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.v_proj.svh": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.down_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.gate_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.mlp.up_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.k_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.o_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.q_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.layers.161.self_attn.v_proj.trellis": "model-00014-of-00015.safetensors", |
|
"model.norm.weight": "model-00014-of-00015.safetensors", |
|
"lm_head.suh": "model-00015-of-00015.safetensors", |
|
"lm_head.svh": "model-00015-of-00015.safetensors", |
|
"lm_head.trellis": "model-00015-of-00015.safetensors" |
|
} |
|
} |