[{"data":1,"prerenderedAt":582},["ShallowReactive",2],{"content-query-EGcy0qAfRv":3},{"_path":4,"_dir":5,"_draft":6,"_partial":6,"_locale":7,"title":8,"description":9,"date":10,"cover":11,"type":12,"body":13,"_type":576,"_id":577,"_source":578,"_file":579,"_stem":580,"_extension":581},"/news/zh/3700","zh",false,"","同步首发！智谱开源GLM-4-0414全部6个模型并上线昇思、魔乐开源社区","4月15日，昇思MindSpore开源社区、魔乐社区第一时间上架智谱全新开源的GLM-4-0414 32B/9B模型，并完成精度测试。","2025-04-15","https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/18/41ef5be4e88a42409163e69636e3e12e.png","news",{"type":14,"children":15,"toc":570},"root",[16,24,45,50,58,68,73,80,90,95,102,107,114,145,150,155,216,224,232,240,245,253,261,266,276,284,292,297,305,310,323,331,339,344,352,357,365,370,378,382,395,403,411,418,426,431,439,446,454,459,467,472,485,490,498,503,510,518,523,531,548,553,565],{"type":17,"tag":18,"props":19,"children":21},"element","h1",{"id":20},"同步首发智谱开源glm-4-0414全部6个模型并上线昇思魔乐开源社区",[22],{"type":23,"value":8},"text",{"type":17,"tag":25,"props":26,"children":27},"p",{},[28,30,36,38,43],{"type":23,"value":29},"4月15日，昇思MindSpore开源社区、魔乐社区第一时间上架",{"type":17,"tag":31,"props":32,"children":33},"strong",{},[34],{"type":23,"value":35},"智谱全新开源的GLM-4-0414 32B/9B模型",{"type":23,"value":37},"，并完成精度测试。智谱",{"type":17,"tag":31,"props":39,"children":40},{},[41],{"type":23,"value":42},"GLM-4-0414拥有",{"type":23,"value":44}," 32B/9B两个尺寸，涵盖基座、推理、沉思模型，均遵循 MIT 许可协议。其中，推理模型 GLM-Z1-32B-0414 性能媲美 DeepSeek-R1 等顶尖模型，实测推理速度可达 200 Tokens/秒。",{"type":17,"tag":25,"props":46,"children":47},{},[48],{"type":23,"value":49},"模型介绍：",{"type":17,"tag":25,"props":51,"children":52},{},[53],{"type":17,"tag":54,"props":55,"children":57},"img",{"alt":7,"src":56},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/18/badad5c858644d75900c51e191ce728c.png",[],{"type":17,"tag":25,"props":59,"children":60},{},[61,66],{"type":17,"tag":31,"props":62,"children":63},{},[64],{"type":23,"value":65},"基座模型 GLM-4-32B-0414",{"type":23,"value":67}," 拥有 320 亿参数，其性能可与国内、外参数量更大的主流模型相媲美。该模型利用 15T 高质量数据进行预训练，特别纳入了丰富的推理类合成数据，为后续的强化学习扩展奠定了基础。在后训练阶段，除了进行面向对话场景的人类偏好对齐，还通过拒绝采样和强化学习等技术，重点增强了模型在指令遵循、工程代码生成、函数调用等任务上的表现，以强化智能体任务所需的原子能力。",{"type":17,"tag":25,"props":69,"children":70},{},[71],{"type":23,"value":72},"GLM-4-32B-0414 在工程代码、Artifacts生成、函数调用、搜索问答及报告撰写等任务上均表现出色，部分 Benchmark 指标已接近甚至超越**GPT-4o、DeepSeek-V3-0324（671B）**等更大模型的水平。",{"type":17,"tag":25,"props":74,"children":75},{},[76],{"type":17,"tag":54,"props":77,"children":79},{"alt":7,"src":78},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/18/ae37f6a839e04c52bd31954785544a4e.png",[],{"type":17,"tag":25,"props":81,"children":82},{},[83,88],{"type":17,"tag":31,"props":84,"children":85},{},[86],{"type":23,"value":87},"GLM-Z1-32B-0414",{"type":23,"value":89}," 是一款具备深度思考能力的推理模型。该模型在 GLM-4-32B-0414 的基础上，采用了冷启动与扩展强化学习策略，并针对数学、代码、逻辑等关键任务进行了深度优化训练。与基础模型相比，GLM-Z1-32B-0414 的数理能力和复杂问题解决能力得到显著增强。此外，训练中整合了基于对战排序反馈的通用强化学习技术，有效提升了模型的通用能力。",{"type":17,"tag":25,"props":91,"children":92},{},[93],{"type":23,"value":94},"在部分任务上，**GLM-Z1-32B-0414 凭借 32B 参数，其性能已能与拥有 671B 参数的 DeepSeek-R1 相媲美。**通过在 AIME 24/25、LiveCodeBench、GPQA 等基准测试中的评估，GLM-Z1-32B-0414 展现了较强的数理推理能力，能够支持解决更广泛复杂任务。",{"type":17,"tag":25,"props":96,"children":97},{},[98],{"type":17,"tag":54,"props":99,"children":101},{"alt":7,"src":100},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/18/98c13a631cdb411fab363991cc509eab.png",[],{"type":17,"tag":25,"props":103,"children":104},{},[105],{"type":23,"value":106},"GLM-Z1-9B-0414是沿用了上述一系列技术，训练出的一个 9B 的小尺寸模型。虽然参数量更少，但GLM-Z1-9B-0414 在数学推理及通用任务上依然表现出色，整体性能已跻身同尺寸开源模型的领先水平。特别是在资源受限的场景下，该模型可以很好地在效率与效果之间取得平衡，为需要轻量化部署的用户提供强有力的选择。",{"type":17,"tag":25,"props":108,"children":109},{},[110],{"type":17,"tag":54,"props":111,"children":113},{"alt":7,"src":112},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/18/37df67c5503d47a69532bff4b969c221.png",[],{"type":17,"tag":25,"props":115,"children":116},{},[117,122,124,129,131,136,138,143],{"type":17,"tag":31,"props":118,"children":119},{},[120],{"type":23,"value":121},"沉思模型GLM-Z1-Rumination-32B-0414",{"type":23,"value":123},"代表了智谱对 AGI 未来形态的下一步探索。与一般推理模型不同，沉思模型通过更多步骤的深度思考来解决高度开放与复杂的问题。其关键创新在于，它能在深度思考过程中整合搜索工具处理复杂任务，并运用多种规则型奖励机制来指导和扩展端到端的强化学习训练。该模型支持“",{"type":17,"tag":31,"props":125,"children":126},{},[127],{"type":23,"value":128},"自主提出问题—搜索信息—构建分析—完成任务",{"type":23,"value":130},"”的完整研究闭环，从而在",{"type":17,"tag":31,"props":132,"children":133},{},[134],{"type":23,"value":135},"研究型写作",{"type":23,"value":137},"和",{"type":17,"tag":31,"props":139,"children":140},{},[141],{"type":23,"value":142},"复杂检索任务",{"type":23,"value":144},"上的能力得到了显著提升。",{"type":17,"tag":25,"props":146,"children":147},{},[148],{"type":23,"value":149},"欢迎广大开发者下载体验！",{"type":17,"tag":25,"props":151,"children":152},{},[153],{"type":23,"value":154},"魔乐社区模型下载链接：",{"type":17,"tag":156,"props":157,"children":158},"ul",{},[159,171,180,189,198,207],{"type":17,"tag":160,"props":161,"children":162},"li",{},[163],{"type":17,"tag":164,"props":165,"children":169},"a",{"href":166,"rel":167},"https://modelers.cn/models/MindSpore-Lab/GLM-4-32B-Base-0414",[168],"nofollow",[170],{"type":23,"value":166},{"type":17,"tag":160,"props":172,"children":173},{},[174],{"type":17,"tag":164,"props":175,"children":178},{"href":176,"rel":177},"https://modelers.cn/models/MindSpore-Lab/GLM-Z1-Rumination-32B-0414",[168],[179],{"type":23,"value":176},{"type":17,"tag":160,"props":181,"children":182},{},[183],{"type":17,"tag":164,"props":184,"children":187},{"href":185,"rel":186},"https://modelers.cn/models/MindSpore-Lab/GLM-Z1-32B-0414",[168],[188],{"type":23,"value":185},{"type":17,"tag":160,"props":190,"children":191},{},[192],{"type":17,"tag":164,"props":193,"children":196},{"href":194,"rel":195},"https://modelers.cn/models/MindSpore-Lab/GLM-Z1-9B-0414",[168],[197],{"type":23,"value":194},{"type":17,"tag":160,"props":199,"children":200},{},[201],{"type":17,"tag":164,"props":202,"children":205},{"href":203,"rel":204},"https://modelers.cn/models/MindSpore-Lab/GLM-4-32B-0414",[168],[206],{"type":23,"value":203},{"type":17,"tag":160,"props":208,"children":209},{},[210],{"type":17,"tag":164,"props":211,"children":214},{"href":212,"rel":213},"https://modelers.cn/models/MindSpore-Lab/GLM-4-9B-0414",[168],[215],{"type":23,"value":212},{"type":17,"tag":25,"props":217,"children":218},{},[219],{"type":17,"tag":31,"props":220,"children":221},{},[222],{"type":23,"value":223},"以下为手把手教程：（以GLM-Z1-9B-0414+昇思MindSpore基于昇腾推理为例）",{"type":17,"tag":25,"props":225,"children":226},{},[227],{"type":17,"tag":31,"props":228,"children":229},{},[230],{"type":23,"value":231},"# 01",{"type":17,"tag":25,"props":233,"children":234},{},[235],{"type":17,"tag":31,"props":236,"children":237},{},[238],{"type":23,"value":239},"快速开始",{"type":17,"tag":25,"props":241,"children":242},{},[243],{"type":23,"value":244},"GLM-Z1-9B-0414推理至少需要1台（1卡）Atlas 800T A2（64G）服务器（基于BF16权重）。昇思MindSpore提供了GLM-Z1-9B-0414推理可用的Docker容器镜像，供开发者快速体验。",{"type":17,"tag":25,"props":246,"children":247},{},[248],{"type":17,"tag":31,"props":249,"children":250},{},[251],{"type":23,"value":252},"1",{"type":17,"tag":25,"props":254,"children":255},{},[256],{"type":17,"tag":31,"props":257,"children":258},{},[259],{"type":23,"value":260},"下载昇思MindSpore推理容器镜像",{"type":17,"tag":25,"props":262,"children":263},{},[264],{"type":23,"value":265},"执行以下 Shell 命令，拉取昇思 MindSpore GLM-Z1 推理容器镜像：",{"type":17,"tag":267,"props":268,"children":270},"pre",{"code":269},"\ndocker pull swr.cn-central-221.ovaijisuan.com/mindformers/mindspore_glm_z1:20250414\n",[271],{"type":17,"tag":272,"props":273,"children":274},"code",{"__ignoreMap":7},[275],{"type":23,"value":269},{"type":17,"tag":25,"props":277,"children":278},{},[279],{"type":17,"tag":31,"props":280,"children":281},{},[282],{"type":23,"value":283},"2",{"type":17,"tag":25,"props":285,"children":286},{},[287],{"type":17,"tag":31,"props":288,"children":289},{},[290],{"type":23,"value":291},"启动容器",{"type":17,"tag":25,"props":293,"children":294},{},[295],{"type":23,"value":296},"执行以下命令创建并启动容器：",{"type":17,"tag":267,"props":298,"children":300},{"code":299},"docker run -it --privileged  --name=GLM-Z1 --net=host \\\n   --shm-size 500g \\\n   --device=/dev/davinci0 \\\n   --device=/dev/davinci1 \\\n   --device=/dev/davinci2 \\\n   --device=/dev/davinci3 \\\n   --device=/dev/davinci4 \\\n   --device=/dev/davinci5 \\\n   --device=/dev/davinci6 \\\n   --device=/dev/davinci7 \\\n   --device=/dev/davinci_manager \\\n   --device=/dev/hisi_hdc \\\n   --device /dev/devmm_svm \\\n   -v /usr/local/Ascend/driver:/usr/local/Ascend/driver \\\n   -v /usr/local/Ascend/firmware:/usr/local/Ascend/firmware \\\n   -v /usr/local/sbin/npu-smi:/usr/local/sbin/npu-smi \\\n   -v /usr/local/sbin:/usr/local/sbin \\\n   -v /etc/hccn.conf:/etc/hccn.conf \\\n   swr.cn-central-221.ovaijisuan.com/mindformers/mindspore_glm_z1:20250414\n   /bin/bash\n",[301],{"type":17,"tag":272,"props":302,"children":303},{"__ignoreMap":7},[304],{"type":23,"value":299},{"type":17,"tag":25,"props":306,"children":307},{},[308],{"type":23,"value":309},"注意事项：",{"type":17,"tag":156,"props":311,"children":312},{},[313,318],{"type":17,"tag":160,"props":314,"children":315},{},[316],{"type":23,"value":317},"如果部署在多机上，每台机器中容器的hostname不能重复。如果有部分宿主机的hostname是一致的，需要在起容器的时候修改容器的hostname。",{"type":17,"tag":160,"props":319,"children":320},{},[321],{"type":23,"value":322},"后续所有操作均在容器内操作。",{"type":17,"tag":25,"props":324,"children":325},{},[326],{"type":17,"tag":31,"props":327,"children":328},{},[329],{"type":23,"value":330},"3",{"type":17,"tag":25,"props":332,"children":333},{},[334],{"type":17,"tag":31,"props":335,"children":336},{},[337],{"type":23,"value":338},"模型下载",{"type":17,"tag":25,"props":340,"children":341},{},[342],{"type":23,"value":343},"执行以下命令为自定义下载路径 /home/work/GLM-Z1-9B-0414 添加白名单：",{"type":17,"tag":267,"props":345,"children":347},{"code":346},"export HUB_WHITE_LIST_PATHS=/home/work/GLM-Z1-9B-0414\n",[348],{"type":17,"tag":272,"props":349,"children":350},{"__ignoreMap":7},[351],{"type":23,"value":346},{"type":17,"tag":25,"props":353,"children":354},{},[355],{"type":23,"value":356},"执行以下 Python 脚本从魔乐社区下载昇思 MindSpore 版本的 GLM-Z1-9B-0414 文件至指定路径 /home/work/GLM-Z1-9B-0414 。下载的文件包含模型代码、权重、分词模型和示例代码，占用约18GB 的磁盘空间：",{"type":17,"tag":267,"props":358,"children":360},{"code":359},"from openmind_hub import snapshot_download\nsnapshot_download(\n    repo_id=\"MindSpore-Lab/GLM-Z1-9B-0414\",\n    local_dir=\"/home/work/GLM-Z1-9B-0414\",\n    local_dir_use_symlink=False\n)\n",[361],{"type":17,"tag":272,"props":362,"children":363},{"__ignoreMap":7},[364],{"type":23,"value":359},{"type":17,"tag":25,"props":366,"children":367},{},[368],{"type":23,"value":369},"下载完成的 /home/work/GLM-Z1-9B-0414 文件夹目录结构如下：",{"type":17,"tag":267,"props":371,"children":373},{"code":372},"GLM-Z1-9B-0414\n  ├── config.json                               # 模型json配置文件\n  ├── tokenizer.model                           # 词表model文件\n  ├── tokenizer_config.json                     # 词表配置文件\n  ├── predict_glm4_z1_9b.yaml                   # 模型yaml配置文件\n  └── weights\n        ├── model-xxxxx-of-xxxxx.safetensors    # 模型权重文件\n        ├── tokenizer.json                      # 模型词表文件\n        ├── xxxxx                               # 若干其他文件\n        └── model.safetensors.index.json        # 模型权重映射文件\n",[374],{"type":17,"tag":272,"props":375,"children":376},{"__ignoreMap":7},[377],{"type":23,"value":372},{"type":17,"tag":25,"props":379,"children":380},{},[381],{"type":23,"value":309},{"type":17,"tag":156,"props":383,"children":384},{},[385,390],{"type":17,"tag":160,"props":386,"children":387},{},[388],{"type":23,"value":389},"/home/work/GLM-Z1-9B-0414 可修改为自定义路径，确保该路径有足够的磁盘空间（约 18GB）。",{"type":17,"tag":160,"props":391,"children":392},{},[393],{"type":23,"value":394},"下载时间可能因网络环境而异，建议在稳定的网络环境下操作。",{"type":17,"tag":25,"props":396,"children":397},{},[398],{"type":17,"tag":31,"props":399,"children":400},{},[401],{"type":23,"value":402},"# 02",{"type":17,"tag":25,"props":404,"children":405},{},[406],{"type":17,"tag":31,"props":407,"children":408},{},[409],{"type":23,"value":410},"服务化部署",{"type":17,"tag":25,"props":412,"children":413},{},[414],{"type":17,"tag":31,"props":415,"children":416},{},[417],{"type":23,"value":252},{"type":17,"tag":25,"props":419,"children":420},{},[421],{"type":17,"tag":31,"props":422,"children":423},{},[424],{"type":23,"value":425},"修改模型配置文件",{"type":17,"tag":25,"props":427,"children":428},{},[429],{"type":23,"value":430},"在 predict_glm4_z1_9b.yaml 中对以下配置进行修改（若为默认路径则无需修改）：",{"type":17,"tag":267,"props":432,"children":434},{"code":433},"\nload_checkpoint: '/home/work/GLM-Z1-9B-0414/weights'         # 配置为实际的模型绝对路径\nauto_trans_ckpt: True                                  # 打开权重自动切分，自动将权重转换为分布式任务所需的形式\nload_ckpt_format: 'safetensors'\nprocessor:\n  tokenizer:\n    vocab_file: \"/home/work/GLM-Z1-9B-0414/tokenizer.model\"  # 配置为tokenizer文件的绝对路径\n",[435],{"type":17,"tag":272,"props":436,"children":437},{"__ignoreMap":7},[438],{"type":23,"value":433},{"type":17,"tag":25,"props":440,"children":441},{},[442],{"type":17,"tag":31,"props":443,"children":444},{},[445],{"type":23,"value":283},{"type":17,"tag":25,"props":447,"children":448},{},[449],{"type":17,"tag":31,"props":450,"children":451},{},[452],{"type":23,"value":453},"一键启动MindIE",{"type":17,"tag":25,"props":455,"children":456},{},[457],{"type":23,"value":458},"MindSpore Transformers提供了一键拉起MindIE脚本，脚本中已预置环境变量设置和服务化配置，仅需输入模型文件目录后即可快速拉起服务。 进入 mindformers/scripts 目录下，执行MindIE启动脚本：",{"type":17,"tag":267,"props":460,"children":462},{"code":461},"\ncd /home/work/mindformers/scripts\nbash run_mindie.sh --model-name GLM-Z1-9B-0414 --model-path /home/work/GLM-Z1-9B-0414 --max-prefill-batch-size 1\n",[463],{"type":17,"tag":272,"props":464,"children":465},{"__ignoreMap":7},[466],{"type":23,"value":461},{"type":17,"tag":25,"props":468,"children":469},{},[470],{"type":23,"value":471},"参数说明：",{"type":17,"tag":156,"props":473,"children":474},{},[475,480],{"type":17,"tag":160,"props":476,"children":477},{},[478],{"type":23,"value":479},"--model-name：设置模型名称",{"type":17,"tag":160,"props":481,"children":482},{},[483],{"type":23,"value":484},"--model-path：设置模型目录路径",{"type":17,"tag":25,"props":486,"children":487},{},[488],{"type":23,"value":489},"查看日志：",{"type":17,"tag":267,"props":491,"children":493},{"code":492},"\ntail -f output.log\n",[494],{"type":17,"tag":272,"props":495,"children":496},{"__ignoreMap":7},[497],{"type":23,"value":492},{"type":17,"tag":25,"props":499,"children":500},{},[501],{"type":23,"value":502},"当log日志中出现 `Daemon start success!` ，表示服务启动成功。",{"type":17,"tag":25,"props":504,"children":505},{},[506],{"type":17,"tag":31,"props":507,"children":508},{},[509],{"type":23,"value":330},{"type":17,"tag":25,"props":511,"children":512},{},[513],{"type":17,"tag":31,"props":514,"children":515},{},[516],{"type":23,"value":517},"执行推理请求测试",{"type":17,"tag":25,"props":519,"children":520},{},[521],{"type":23,"value":522},"执行以下命令发送流式推理请求进行测试：",{"type":17,"tag":267,"props":524,"children":526},{"code":525},"\ncurl -w \"\\ntime_total=%{time_total}\\n\" -H \"Accept: application/json\" -H \"Content-type: application/json\" -X POST -d '{\"inputs\": \"请介绍一个北京的景点\", \"parameters\": {\"do_sample\": false, \"max_new_tokens\": 128}, \"stream\": false}' http://127.0.0.1:1025/generate_stream &\n",[527],{"type":17,"tag":272,"props":528,"children":529},{"__ignoreMap":7},[530],{"type":23,"value":525},{"type":17,"tag":532,"props":533,"children":535},"h3",{"id":534},"_03-声明",[536,541,543],{"type":17,"tag":31,"props":537,"children":538},{},[539],{"type":23,"value":540},"# 03",{"type":23,"value":542}," ",{"type":17,"tag":31,"props":544,"children":545},{},[546],{"type":23,"value":547},"声明",{"type":17,"tag":25,"props":549,"children":550},{},[551],{"type":23,"value":552},"本文档提供的模型代码、权重文件和部署镜像，当前仅限于基于昇思MindSpore AI框架体验 GLM-Z1-9B-0414 的部署效果，不支持生产环境部署。",{"type":17,"tag":25,"props":554,"children":555},{},[556,558],{"type":23,"value":557},"相关使用问题请反馈至ISSUE（链接：",{"type":17,"tag":164,"props":559,"children":562},{"href":560,"rel":561},"https://gitee.com/mindspore/mindformers/issues%EF%BC%89%E3%80%82",[168],[563],{"type":23,"value":564},"https://gitee.com/mindspore/mindformers/issues）。",{"type":17,"tag":25,"props":566,"children":567},{},[568],{"type":23,"value":569},"昇思MindSpore AI框架将持续支持相关主流模型演进，并根据开源情况面向全体开发者提供镜像与支持。",{"title":7,"searchDepth":571,"depth":571,"links":572},4,[573],{"id":534,"depth":574,"text":575},3,"# 03 声明","markdown","content:news:zh:3700.md","content","news/zh/3700.md","news/zh/3700","md",1776506087887]