Files
MiMo-7B-RL/configuration_mimo.py
2025-04-30 04:29:39 +00:00

17 lines
376 B
Python

from transformers.models.qwen2.configuration_qwen2 import Qwen2Config
class MiMoConfig(Qwen2Config):
    """Qwen2 configuration extended with one extra field, registered as "mimo".

    Every argument other than ``num_nextn_predict_layers`` is handed to
    ``Qwen2Config.__init__`` unchanged.

    Args:
        *args: Positional arguments forwarded to ``Qwen2Config``.
        num_nextn_predict_layers: Keyword-only value stored on the instance
            under the same name; defaults to 0. Presumably the number of
            additional next-N-token prediction layers -- TODO confirm
            against the modeling code.
        **kwargs: Keyword arguments forwarded to ``Qwen2Config``.
    """

    model_type = "mimo"

    def __init__(self, *args, num_nextn_predict_layers: int = 0, **kwargs) -> None:
        # Assigned before delegating, so the attribute already exists on the
        # instance while the parent initializer runs.
        self.num_nextn_predict_layers = num_nextn_predict_layers
        super().__init__(*args, **kwargs)