mirror of
https://www.modelscope.cn/XiaomiMiMo/MiMo-7B-RL.git
synced 2026-04-02 19:52:52 +08:00
17 lines
376 B
Python
17 lines
376 B
Python
from transformers.models.qwen2.configuration_qwen2 import Qwen2Config
|
|
|
|
class MiMoConfig(Qwen2Config):
    """Configuration for MiMo models, extending ``Qwen2Config``.

    Adds one field on top of the parent configuration,
    ``num_nextn_predict_layers`` (default ``0``). Every other positional and
    keyword argument is forwarded unchanged to ``Qwen2Config.__init__``.
    """

    model_type = "mimo"

    def __init__(self, *args, num_nextn_predict_layers=0, **kwargs):
        """Store the MiMo-specific field, then defer to the parent initializer.

        Args:
            *args: Positional arguments passed through to ``Qwen2Config``.
            num_nextn_predict_layers: Value saved on the instance under the
                same name. NOTE(review): presumably the number of extra
                next-token-prediction layers -- confirm against the model code.
            **kwargs: Keyword arguments passed through to ``Qwen2Config``.
        """
        # Set before the parent initializer runs; this ordering is kept
        # exactly as in the original implementation.
        self.num_nextn_predict_layers = num_nextn_predict_layers
        super().__init__(*args, **kwargs)
|