File size: 376 Bytes
da3d5c4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
from transformers.models.qwen2.configuration_qwen2 import Qwen2Config
class MiMoConfig(Qwen2Config):
    """Qwen2-derived configuration registered under the ``"mimo"`` model type.

    Adds one setting on top of ``Qwen2Config``: ``num_nextn_predict_layers``.
    Every other positional or keyword argument is handed to the parent
    constructor unchanged.
    """

    model_type = "mimo"

    def __init__(self, *args, num_nextn_predict_layers=0, **kwargs):
        """Store the extra setting, then defer to ``Qwen2Config.__init__``.

        Args:
            *args: Positional arguments forwarded as-is to ``Qwen2Config``.
            num_nextn_predict_layers: Keyword-only value kept on the instance
                under the same name; defaults to ``0``.
                NOTE(review): presumably the number of extra next-token
                prediction layers -- confirm against the modeling code.
            **kwargs: Remaining keyword arguments forwarded as-is to
                ``Qwen2Config``.
        """
        # The attribute is assigned before the parent constructor runs;
        # keep this ordering.
        self.num_nextn_predict_layers = num_nextn_predict_layers
        super().__init__(*args, **kwargs)
|