from transformers.models.qwen2.configuration_qwen2 import Qwen2Config


class MiMoConfig(Qwen2Config):
    """Qwen2-derived configuration identified by ``model_type = "mimo"``.

    Accepts everything ``Qwen2Config`` accepts, plus one extra keyword-only
    field that is stored directly on the instance.

    Args:
        *args: Positional arguments passed through unchanged to
            ``Qwen2Config.__init__``.
        num_nextn_predict_layers: Value stored as
            ``self.num_nextn_predict_layers``. Defaults to 0.
            NOTE(review): presumably the number of additional next-n-token
            prediction layers -- confirm against the modeling code.
        **kwargs: Remaining keyword arguments passed through unchanged to
            ``Qwen2Config.__init__``.
    """

    model_type = "mimo"

    def __init__(self, *args, num_nextn_predict_layers=0, **kwargs):
        # Store the MiMo-specific field before delegating, so the attribute
        # already exists while the parent constructor runs.
        self.num_nextn_predict_layers = num_nextn_predict_layers
        super().__init__(*args, **kwargs)