mirror of
https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B.git
synced 2026-04-02 21:52:53 +08:00
Small fix
This commit is contained in:
@ -21,7 +21,8 @@
|
||||
"rope_scaling": {
|
||||
"rope_type": "yarn",
|
||||
"factor": 4.0,
|
||||
"original_max_position_embeddings": 32768
|
||||
"original_max_position_embeddings": 32768,
|
||||
"attn_factor": 0.8782488562869419
|
||||
},
|
||||
"rope_theta": 1000000,
|
||||
"sliding_window": null,
|
||||
|
||||
Reference in New Issue
Block a user