MiMo-7B-Base / configuration_mimo.py
bwshen-mi's picture
init Xiaomi-MiMo
da3d5c4 verified
raw
history blame contribute delete
376 Bytes
from transformers.models.qwen2.configuration_qwen2 import Qwen2Config
class MiMoConfig(Qwen2Config):
    """Configuration class for MiMo models, built on top of ``Qwen2Config``.

    The only addition over the parent configuration is the
    ``num_nextn_predict_layers`` attribute (default ``0``). All other
    positional and keyword arguments are passed through to ``Qwen2Config``
    untouched.

    NOTE(review): judging by its name, ``num_nextn_predict_layers`` is
    presumably the number of next-N-token prediction layers; confirm against
    the modeling code, which is not visible here.
    """

    model_type = "mimo"

    def __init__(self, *args, num_nextn_predict_layers=0, **kwargs):
        # Record the MiMo-specific field first, then let the parent
        # initializer consume every remaining argument unchanged.
        self.num_nextn_predict_layers = num_nextn_predict_layers
        super().__init__(*args, **kwargs)