mirror of
https://www.modelscope.cn/XiaomiMiMo/MiMo-7B-RL.git
synced 2026-04-02 19:52:52 +08:00
Update README.md
This commit is contained in:
12
README.md
12
README.md
@ -28,7 +28,7 @@ library_name: transformers
|
|||||||
|
|
|
|
||||||
<a href="https://www.modelscope.cn/organization/XiaomiMiMo" target="_blank">🤖️ ModelScope</a>
|
<a href="https://www.modelscope.cn/organization/XiaomiMiMo" target="_blank">🤖️ ModelScope</a>
|
||||||
|
|
|
|
||||||
<a href="https://github.com/XiaomiMiMo/MiMo/blob/main/MiMo-7B-Technical-Report.pdf" target="_blank">📔 Technical Report</a>
|
<a href="https://arxiv.org/abs/2505.07608" target="_blank">📔 Technical Report</a>
|
||||||
|
|
|
|
||||||
<br/>
|
<br/>
|
||||||
</div>
|
</div>
|
||||||
@ -203,7 +203,7 @@ Example script
|
|||||||
```py
|
```py
|
||||||
from transformers import AutoModel, AutoModelForCausalLM, AutoTokenizer
|
from transformers import AutoModel, AutoModelForCausalLM, AutoTokenizer
|
||||||
|
|
||||||
model_id = "XiaomiMiMo/MiMo-7B-Base"
|
model_id = "XiaomiMiMo/MiMo-7B-RL"
|
||||||
model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
|
model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
|
||||||
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
||||||
inputs = tokenizer(["Today is"], return_tensors='pt')
|
inputs = tokenizer(["Today is"], return_tensors='pt')
|
||||||
@ -221,12 +221,14 @@ print(tokenizer.decode(output.tolist()[0]))
|
|||||||
## V. Citation
|
## V. Citation
|
||||||
|
|
||||||
```bibtex
|
```bibtex
|
||||||
@misc{xiaomi2025mimo,
|
@misc{coreteam2025mimounlockingreasoningpotential,
|
||||||
title={MiMo: Unlocking the Reasoning Potential of Language Model – From Pretraining to Posttraining},
|
title={MiMo: Unlocking the Reasoning Potential of Language Model -- From Pretraining to Posttraining},
|
||||||
author={{Xiaomi LLM-Core Team}},
|
author={{Xiaomi LLM-Core Team}},
|
||||||
year={2025},
|
year={2025},
|
||||||
|
eprint={2505.07608},
|
||||||
|
archivePrefix={arXiv},
|
||||||
primaryClass={cs.CL},
|
primaryClass={cs.CL},
|
||||||
url={https://github.com/XiaomiMiMo/MiMo},
|
url={https://arxiv.org/abs/2505.07608},
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
@ -2,6 +2,9 @@
|
|||||||
"architectures": [
|
"architectures": [
|
||||||
"MiMoForCausalLM"
|
"MiMoForCausalLM"
|
||||||
],
|
],
|
||||||
|
"tokenizer_class":[
|
||||||
|
"Qwen2Tokenizer"
|
||||||
|
],
|
||||||
"auto_map": {
|
"auto_map": {
|
||||||
"AutoConfig": "configuration_mimo.MiMoConfig",
|
"AutoConfig": "configuration_mimo.MiMoConfig",
|
||||||
"AutoModel": "modeling_mimo.MiMoModel",
|
"AutoModel": "modeling_mimo.MiMoModel",
|
||||||
|
|||||||
Reference in New Issue
Block a user