152 Commits

Author SHA1 Message Date
62ee2f8ebd update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-11 18:32:54 +00:00
fd92a094c2 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-10 18:21:31 +00:00
1c97e7adee update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-09 18:45:52 +00:00
257979fd39 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-08 15:29:39 +00:00
0dabdef802 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-07 13:14:39 +00:00
2236e0b1af update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-06 17:02:53 +00:00
b0872b7794 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-05 16:08:37 +00:00
35bfb6657d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-04 20:44:25 +00:00
0613213f11 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-03 18:50:26 +00:00
09c913ff71 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-02 16:28:03 +00:00
f2e8f73ada update for new format config of transformers lib / sglang lib (batch 1/1) 2026-06-01 16:01:40 +00:00
2c5a0c61dd update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-31 16:01:58 +00:00
d2d32cfcb1 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-30 18:54:27 +00:00
7db4ca304d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-29 18:13:03 +00:00
435419c52d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-28 13:20:02 +00:00
5db418414d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-27 16:40:14 +00:00
c8a7d0963f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-26 16:41:18 +00:00
31b66e679d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-25 18:38:09 +00:00
7051418798 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-24 18:40:11 +00:00
f9a9b744a3 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-23 18:13:05 +00:00
07a5204d7c update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-21 15:32:16 +00:00
9355dcde75 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-21 00:05:35 +00:00
71fced2779 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-19 05:05:57 +00:00
f36b3e1114 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-16 15:40:02 +00:00
5770a2c93f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-15 22:27:26 +00:00
eea3d25a9d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-15 00:30:19 +00:00
5181066a32 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-13 23:17:49 +00:00
af10462fe9 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-12 21:15:20 +00:00
a1b9d15988 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-11 21:56:56 +00:00
8256a4e5ac update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-10 21:54:00 +00:00
8707695690 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-09 19:43:17 +00:00
ea5103057f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-08 22:42:38 +00:00
07d57847a7 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-07 20:52:26 +00:00
3fb7c80c22 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-06 21:38:45 +00:00
6cf7fec891 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-05 21:09:31 +00:00
5a87b42726 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-04 23:05:33 +00:00
26a6379252 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-03 20:07:13 +00:00
bf670f6e47 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-02 19:31:43 +00:00
f3e92c6283 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-05-01 21:24:32 +00:00
68e1a18c4f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-30 22:19:58 +00:00
15caa86165 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-29 19:43:12 +00:00
78170a76d4 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-28 23:16:33 +00:00
a96c62f3c6 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-27 19:16:24 +00:00
c9b0a3712a update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-26 17:45:55 +00:00
513122fb6b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-25 21:58:51 +00:00
e634423499 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-24 19:08:46 +00:00
4189e78e82 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-23 18:57:25 +00:00
b9962d86d7 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-22 17:36:16 +00:00
5b54a2c8a4 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-21 18:26:46 +00:00
5627c3e221 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-20 18:14:34 +00:00
d1fa1eb77b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-19 20:50:37 +00:00
1dd5dea5c8 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-18 19:59:59 +00:00
1f96a11038 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-16 22:50:40 +00:00
c0c8ab6b12 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-15 21:21:52 +00:00
12953d1d55 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-14 03:46:10 +00:00
109e69fbb4 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-13 07:41:18 +00:00
1ec558733e update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-12 04:16:10 +00:00
171de346d2 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-10 18:48:11 +00:00
50bc379f48 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-09 21:19:30 +00:00
43562b321f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-09 09:22:24 +00:00
27c94755b7 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-08 04:35:16 +00:00
90735b4930 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-07 06:52:02 +00:00
a14b7ee944 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-05 22:42:04 +00:00
1888286b6f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-04 19:27:50 +00:00
fe9c2f230c update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-03 13:10:17 +00:00
7393bf6a0b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-02 13:53:16 +00:00
a28562c226 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-04-01 13:47:20 +00:00
dcfce55c4c update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-31 14:22:09 +00:00
399a51fb2b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-30 15:26:16 +00:00
4f6de1dca6 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-29 13:54:01 +00:00
6d685baab9 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-28 13:55:25 +00:00
a380d4601a update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-27 13:51:06 +00:00
7cc2ae24b1 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-26 14:01:00 +00:00
ada03b9d38 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-25 14:00:06 +00:00
9db7824676 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-24 13:51:49 +00:00
18ab00aa7b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-23 13:33:55 +00:00
6778c7a8fc update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-22 14:00:51 +00:00
88676c1db0 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-21 14:10:44 +00:00
08cf4d93a2 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-20 14:14:14 +00:00
23ff5af1e9 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-19 13:56:55 +00:00
14051cc226 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-18 13:39:17 +00:00
fc732bbad2 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-17 14:01:41 +00:00
55bab11e83 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-16 14:06:18 +00:00
b15d4c2292 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-15 13:53:52 +00:00
3906a4d8e3 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-14 13:46:32 +00:00
e9892c8226 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-13 14:40:38 +00:00
86a914356f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-12 13:51:58 +00:00
c6e72bdcc5 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-11 14:04:05 +00:00
94ac4ea6d5 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-10 13:28:37 +00:00
5eab5eb239 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-09 13:49:03 +00:00
5fd252ce8c update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-08 13:37:51 +00:00
dfe3b94896 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-07 13:48:50 +00:00
84f7e07a2d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-06 14:32:04 +00:00
6f6848583d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-05 13:21:53 +00:00
87fe415681 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-04 13:43:29 +00:00
58136e3240 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-03 14:10:57 +00:00
3e3a7e75b1 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-02 14:02:40 +00:00
a99b3355e6 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-03-01 13:21:00 +00:00
cf29e981de update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-28 13:38:04 +00:00
79b0bc60b2 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-27 13:29:49 +00:00
33d0975fe7 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-26 13:13:31 +00:00
195967d00f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-25 14:04:21 +00:00
3c235c94e6 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-24 14:32:54 +00:00
b0c6621429 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-23 14:17:59 +00:00
999651e2f7 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-22 14:15:45 +00:00
402fa3b8b3 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-21 15:21:35 +00:00
620e3ee2c5 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-20 13:44:30 +00:00
c7bd410da1 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-19 13:56:09 +00:00
322cd74896 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-18 14:00:45 +00:00
f0527e343d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-17 14:33:37 +00:00
317dd3f01a update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-16 14:06:52 +00:00
1d4e1ae616 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-15 14:03:35 +00:00
131977428a update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-14 14:08:03 +00:00
1178fdc33b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-13 14:26:12 +00:00
255d2cc26f update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-12 13:47:04 +00:00
9972904e1b update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-11 14:24:03 +00:00
4102f1dfd5 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-10 13:40:49 +00:00
2346111083 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-09 14:28:48 +00:00
a133dac63c update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-08 14:15:36 +00:00
585c678101 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-07 14:35:48 +00:00
c4691f2c54 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-06 13:57:55 +00:00
524e92f1a4 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-05 14:43:38 +00:00
e4a6856510 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-04 13:56:56 +00:00
3afb88eaef update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-03 14:21:34 +00:00
8622a64f24 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-02 14:08:05 +00:00
75575e9ac7 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-02-01 13:54:00 +00:00
b7009ea267 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-31 13:49:59 +00:00
09c074da7e update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-30 13:55:08 +00:00
284d3287fd update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-29 14:43:14 +00:00
ce20c8a020 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-28 14:03:54 +00:00
af35d9190e update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-27 13:44:44 +00:00
19c96042e9 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-26 13:49:05 +00:00
1033d7d688 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-25 13:46:42 +00:00
8e4962743d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-24 13:25:12 +00:00
1001265d1d update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-23 13:34:40 +00:00
026f8b735a update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-22 13:46:40 +00:00
a38b10913a update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-21 13:50:45 +00:00
93431ca8e5 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-20 13:43:16 +00:00
2ebbeacb86 update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-20 02:52:00 +00:00
c4bf60a31e update for new format config of transformers lib / sglang lib (batch 1/1) 2026-01-20 02:51:58 +00:00
9ad8636d9b update for new format config of transformers lib / sglang lib 2025-10-25 21:28:26 +08:00
06910fdafb update for new format config of transformers lib / sglang lib 2025-10-25 21:28:01 +08:00
45fd0841b8 update for new format config of transformers lib / sglang lib 2025-10-25 21:27:31 +08:00
f221c89443 Merge branch 'master' of https://www.modelscope.cn/ZhipuAI/GLM-4.1V-9B-Thinking 2025-08-28 21:18:31 +08:00
f58a52db7a update 2025-08-28 21:18:25 +08:00
5b849bb3a9 Update README.md 2025-07-07 03:27:08 +00:00
ddd07b32b8 set 64000 to 65536 2025-07-03 16:38:32 +08:00
591f89245d update 2025-07-03 16:32:29 +08:00
bc64e132a0 update 2025-07-02 17:01:59 +08:00
b1abac70a1 Merge branch 'master' of https://www.modelscope.cn/ZhipuAI/GLM-4.1V-9B-Thinking 2025-07-02 16:40:32 +08:00
c886823f1d update 2025-07-02 16:40:17 +08:00
c5166d0d5c Update README.md 2025-07-02 07:44:30 +00:00
6 changed files with 177 additions and 143 deletions

4
.gitattributes vendored
View File

@ -11,7 +11,7 @@
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
@ -45,3 +45,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
notebook.ipynb filter=lfs diff=lfs merge=lfs -text

View File

@ -1,60 +1,78 @@
---
license: mit
language:
- en
- zh
base_model:
- zai-org/GLM-4-9B-0414
pipeline_tag: image-text-to-text
library_name: transformers
tags:
- reasoning
---
# GLM-4.1V-9B-Thinking
<div align="center">
<img src=https://raw.githubusercontent.com/THUDM/GLM-4.1V-Thinking/99c5eb6563236f0ff43605d91d107544da9863b2/resources/logo.svg width="40%"/>
<img src=https://raw.githubusercontent.com/zai-org/GLM-4.1V-Thinking/99c5eb6563236f0ff43605d91d107544da9863b2/resources/logo.svg width="40%"/>
</div>
<p align="center">
📖 查看 GLM-4.1V-9B-Thinking <a href="https://arxiv.org/abs/2507.01006" target="_blank">论文</a>
📖 View the GLM-4.1V-9B-Thinking <a href="https://arxiv.org/abs/2507.01006" target="_blank">paper</a>.
<br>
💡 立即在线体验 <a href="https://huggingface.co/spaces/THUDM/GLM-4.1V-9B-Thinking-Demo" target="_blank">Hugging Face</a> 或 <a href="https://modelscope.cn/studios/ZhipuAI/GLM-4.1V-9B-Thinking-Demo" target="_blank">ModelScope</a> 上的 GLM-4.1V-9B-Thinking。
<br>
📍 在 <a href="https://www.bigmodel.cn/dev/api/visual-reasoning-model/GLM-4.1V-Thinking">智谱大模型开放平台</a> 使用 GLM-4.1V-9B-Thinking 的API服务。
📍 Use the GLM-4.1V-9B-Thinking API on the <a href="https://www.bigmodel.cn/dev/api/visual-reasoning-model/GLM-4.1V-Thinking">Zhipu Foundation Model Open Platform</a>.
</p>
## 模型介绍
视觉语言大模型（VLM）已经成为智能系统的关键基石。随着真实世界的智能任务越来越复杂，VLM模型也亟需在基本的多模态感知之外，
逐渐增强复杂任务中的推理能力,提升自身的准确性、全面性和智能化程度,使得复杂问题解决、长上下文理解、多模态智能体等智能任务成为可能。
## Model Introduction
基于 [GLM-4-9B-0414](https://github.com/THUDM/GLM-4) 基座模型，我们推出新版VLM开源模型 **GLM-4.1V-9B-Thinking**
，引入思考范式，通过课程采样强化学习 RLCS（Reinforcement Learning with Curriculum Sampling）全面提升模型能力，
达到 10B 参数级别的视觉语言模型的最强性能，在18个榜单任务中持平甚至超过8倍参数量的 Qwen-2.5-VL-72B。
我们同步开源基座模型 **GLM-4.1V-9B-Base**,希望能够帮助更多研究者探索视觉语言模型的能力边界。
Vision-Language Models (VLMs) have become foundational components of intelligent systems. As real-world AI tasks grow
increasingly complex, VLMs must evolve beyond basic multimodal perception to enhance their reasoning capabilities in
complex tasks. This involves improving accuracy, comprehensiveness, and intelligence, enabling applications such as
complex problem solving, long-context understanding, and multimodal agents.
![rl](https://raw.githubusercontent.com/THUDM/GLM-4.1V-Thinking/refs/heads/main/resources/rl.jpeg)
Based on the [GLM-4-9B-0414](https://github.com/zai-org/GLM-4) foundation model, we present the new open-source VLM model
**GLM-4.1V-9B-Thinking**, designed to explore the upper limits of reasoning in vision-language models. By introducing
a "thinking paradigm" and leveraging reinforcement learning, the model significantly enhances its capabilities. It
achieves state-of-the-art performance among 10B-parameter VLMs, matching or even surpassing the 72B-parameter
Qwen-2.5-VL-72B on 18 benchmark tasks. We are also open-sourcing the base model GLM-4.1V-9B-Base to
support further research into the boundaries of VLM capabilities.
与上一代的 CogVLM2 及 GLM-4V 系列模型相比,**GLM-4.1V-Thinking** 有如下改进:
![rl](https://raw.githubusercontent.com/zai-org/GLM-4.1V-Thinking/refs/heads/main/resources/rl.jpeg)
1. 系列中首个推理模型,不仅仅停留在数学领域,在多个子领域均达到世界前列的水平。
2. 支持 **64k** 上下文长度。
3. 支持**任意长宽比**和高达 **4k** 的图像分辨率。
4. 提供支持**中英文双语**的开源模型版本。
Compared to the previous generation models CogVLM2 and the GLM-4V series, **GLM-4.1V-Thinking** offers the
following improvements:
## 榜单信息
1. The first reasoning-focused model in the series, achieving world-leading performance not only in mathematics but also
across various sub-domains.
2. Supports **64k** context length.
3. Handles **arbitrary aspect ratios** and up to **4K** image resolution.
4. Provides an open-source model version with **bilingual Chinese and English** support.
GLM-4.1V-9B-Thinking 通过引入「思维链」（Chain-of-Thought）推理机制，在回答准确性、内容丰富度与可解释性方面，
全面超越传统的非推理式视觉模型。在28项评测任务中有23项达到10B级别模型最佳，甚至有18项任务超过8倍参数量的Qwen-2.5-VL-72B。
## Benchmark Performance
![bench](https://raw.githubusercontent.com/THUDM/GLM-4.1V-Thinking/refs/heads/main/resources/bench.jpeg)
By incorporating the Chain-of-Thought reasoning paradigm, GLM-4.1V-9B-Thinking significantly improves answer accuracy,
richness, and interpretability. It comprehensively surpasses traditional non-reasoning visual models.
Out of 28 benchmark tasks, it achieves the best performance among 10B-level models on 23 tasks,
and even outperforms the 72B-parameter Qwen-2.5-VL-72B on 18 tasks.
## 快速推理
![bench](https://raw.githubusercontent.com/zai-org/GLM-4.1V-Thinking/refs/heads/main/resources/bench.jpeg)
## Quick Inference
This is a simple example of running single-image inference using the `transformers` library.
First, install the `transformers` library (version 4.57.1 or later):
这里展现了一个使用`transformers`进行单张图片推理的代码。首先,从源代码安装`transformers`库。
```
pip install git+https://github.com/huggingface/transformers.git
pip install "transformers>=4.57.1"
```
接着按照以下代码运行:
Then, run the following code:
```python
from transformers import AutoProcessor, Glm4vForConditionalGeneration
import torch
MODEL_PATH = "THUDM/GLM-4.1V-9B-Thinking"
MODEL_PATH = "zai-org/GLM-4.1V-9B-Thinking"
messages = [
{
"role": "user",
@ -88,6 +106,5 @@ output_text = processor.decode(generated_ids[0][inputs["input_ids"].shape[1]:],
print(output_text)
```
视频推理、网页端Demo部署等更多代码，请查看我们的 [github](https://github.com/THUDM/GLM-4.1V-Thinking)。
For video reasoning, web demo deployment, and more code, please check
our [GitHub](https://github.com/zai-org/GLM-V).

View File

@ -3,38 +3,50 @@
"Glm4vForConditionalGeneration"
],
"model_type": "glm4v",
"attention_bias": true,
"attention_dropout": 0.0,
"pad_token_id": 151329,
"eos_token_id": [
151329,
151336,
151338,
151348
],
"image_start_token_id": 151339,
"image_end_token_id": 151340,
"video_start_token_id": 151341,
"video_end_token_id": 151342,
"image_token_id": 151343,
"video_token_id": 151344,
"hidden_act": "silu",
"hidden_size": 4096,
"initializer_range": 0.02,
"intermediate_size": 13696,
"max_position_embeddings": 32768,
"num_attention_heads": 32,
"num_hidden_layers": 40,
"num_key_value_heads": 2,
"rms_norm_eps": 1e-05,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "bfloat16",
"transformers_version": "4.53.0dev",
"use_cache": true,
"vocab_size": 151552,
"partial_rotary_factor": 0.5,
"transformers_version": "4.57.1",
"text_config": {
"model_type": "glm4v_text",
"attention_bias": true,
"attention_dropout": 0.0,
"pad_token_id": 151329,
"eos_token_id": [
151329,
151336,
151338,
151348
],
"hidden_act": "silu",
"hidden_size": 4096,
"initializer_range": 0.02,
"intermediate_size": 13696,
"max_position_embeddings": 65536,
"num_attention_heads": 32,
"num_hidden_layers": 40,
"num_key_value_heads": 2,
"rms_norm_eps": 1e-05,
"dtype": "bfloat16",
"use_cache": true,
"vocab_size": 151552,
"partial_rotary_factor": 0.5,
"rope_theta": 10000,
"rope_scaling": {
"rope_type": "default",
"mrope_section": [
8,
12,
12
]
}
},
"vision_config": {
"model_type": "glm4v",
"hidden_size": 1536,
"depth": 24,
"num_heads": 12,
@ -49,13 +61,5 @@
"rms_norm_eps": 1e-05,
"spatial_merge_size": 2,
"temporal_patch_size": 2
},
"rope_scaling": {
"type": "default",
"mrope_section": [
8,
12,
12
]
}
}

15
generation_config.json Normal file
View File

@ -0,0 +1,15 @@
{
"_from_model_config": true,
"do_sample": true,
"eos_token_id": [
151329,
151336,
151338,
151348
],
"pad_token_id": 151329,
"top_p": 0.6,
"temperature": 0.8,
"top_k": 2,
"transformers_version": "4.57.1"
}

BIN
notebook.ipynb (Stored with Git LFS) Normal file

Binary file not shown.

View File

@ -134,7 +134,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
},
"151346": {
"content": "</think>",
@ -142,7 +142,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
},
"151347": {
"content": "<answer>",
@ -150,7 +150,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
},
"151348": {
"content": "</answer>",
@ -158,7 +158,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
},
"151349": {
"content": "<|begin_of_box|>",
@ -166,7 +166,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
},
"151350": {
"content": "<|end_of_box|>",
@ -174,7 +174,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
},
"151351": {
"content": "<|sep|>",
@ -182,7 +182,7 @@
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
"special": false
}
},
"additional_special_tokens": [
@ -200,15 +200,8 @@
"<|end_of_image|>",
"<|begin_of_video|>",
"<|end_of_video|>",
"<|begin_of_box|>",
"<|end_of_box|>",
"<|sep|>",
"<|image|>",
"<|video|>",
"<think>",
"</think>",
"<answer>",
"</answer>"
"<|video|>"
],
"clean_up_tokenization_spaces": false,
"do_lower_case": false,
@ -218,7 +211,7 @@
"input_ids",
"attention_mask"
],
"model_max_length": 64000,
"model_max_length": 65536,
"padding_side": "left",
"remove_space": false,
"tokenizer_class": "PreTrainedTokenizer"