[{"data":1,"prerenderedAt":379},["ShallowReactive",2],{"content-query-KUUDJ7IFVe":3},{"_path":4,"_dir":5,"_draft":6,"_partial":6,"_locale":7,"title":8,"description":9,"date":10,"cover":11,"type":12,"category":13,"body":14,"_type":373,"_id":374,"_source":375,"_file":376,"_stem":377,"_extension":378},"/technology-blogs/zh/3745","zh",false,"","不到10行代码、小时级完成适配！昇思版本DeepSeek-R1-0528上线开源社区","2025年5月28日深夜，DeepSeek 官方在用户群中宣布完成“小版本试升级”，发布DeepSeek-R1-0528，昇思MindSpore开源社区开发者基于已支持的DeepSeek V3进行快速适配，1小时内完成开发，修改代码小于10行，实现镜像替换、推理任务拉起，经测试验证，模型精度与官方开源版本一致。","2025-06-03","https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/06/06/8375ffdf90244bc0a732a34f47853e81.png","technology-blogs","实践",{"type":15,"children":16,"toc":370},"root",[17,25,31,36,41,46,51,64,69,78,83,92,97,106,111,116,124,129,134,142,147,152,157,165,175,183,191,196,201,211,216,224,229,234,242,250,258,263,271,276,284,292,300,305,313,318,323,331,336,344,349,357,362],{"type":18,"tag":19,"props":20,"children":22},"element","h1",{"id":21},"不到10行代码小时级完成适配昇思版本deepseek-r1-0528上线开源社区",[23],{"type":24,"value":8},"text",{"type":18,"tag":26,"props":27,"children":28},"p",{},[29],{"type":24,"value":30},"2025年5月28日深夜，DeepSeek 官方在用户群中宣布完成“小版本试升级”，发布DeepSeek-R1-0528，昇思MindSpore开源社区开发者基于已支持的DeepSeek V3进行快速适配，1小时内完成开发，修改",{"type":18,"tag":26,"props":32,"children":33},{},[34],{"type":24,"value":35},"代码小于10行，实现镜像替换、推理任务拉起，经测试验证，模型精度与官方开源版本一致。",{"type":18,"tag":26,"props":37,"children":38},{},[39],{"type":24,"value":40},"基于昇思版本适配的DeepSeek-R1-0528已上架开源社区代码仓及魔乐社区，面向开发者提供开箱即用的模型，便于开发者直接使用或二次开发。",{"type":18,"tag":26,"props":42,"children":43},{},[44],{"type":24,"value":45},"本次快速适配应用了MindSpore Transformers大模型使能套件，该套件依托MindSpore AI框架提供的丰富的多维混合并行能力，亲和开源工具与通用数据格式，原生支持大模型蒸馏的端到端全流程开发，提供了高效、便捷的开发能力",{"type":18,"tag":26,"props":47,"children":48},{},[49],{"type":24,"value":50},"同时，本次推理服务的拉起与部署应用了MindSpore-vLLM插件，支持基于vLLM框架部署MindSpore模型的推理服务。",{"type":18,"tag":26,"props":52,"children":53},{},[54,56],{"type":24,"value":55},"MindSpore 
Transformers代码仓：",{"type":18,"tag":57,"props":58,"children":62},"a",{"href":59,"rel":60},"https://gitee.com/mindspore/mindformers",[61],"nofollow",[63],{"type":24,"value":59},{"type":18,"tag":26,"props":65,"children":66},{},[67],{"type":24,"value":68},"MindSpore-vLLM代码仓：",{"type":18,"tag":26,"props":70,"children":71},{},[72],{"type":18,"tag":57,"props":73,"children":76},{"href":74,"rel":75},"https://gitee.com/mindspore/vllm-mindspore",[61],[77],{"type":24,"value":74},{"type":18,"tag":26,"props":79,"children":80},{},[81],{"type":24,"value":82},"魔乐社区代码仓：",{"type":18,"tag":26,"props":84,"children":85},{},[86],{"type":18,"tag":57,"props":87,"children":90},{"href":88,"rel":89},"https://modelers.cn/models/MindSpore-Lab/DeepSeek-R1-0528",[61],[91],{"type":24,"value":88},{"type":18,"tag":26,"props":93,"children":94},{},[95],{"type":24,"value":96},"本次发布的DeepSeek-R1-0528主要升级以下能力：",{"type":18,"tag":26,"props":98,"children":99},{},[100],{"type":18,"tag":101,"props":102,"children":103},"strong",{},[104],{"type":24,"value":105},"1、推理与思维深度增强",{"type":18,"tag":26,"props":107,"children":108},{},[109],{"type":24,"value":110},"思考长度翻倍：平均每题推理token从12K增至23K，解题步骤更详尽（如AIME数学题准确率从70%→87.5%）。",{"type":18,"tag":26,"props":112,"children":113},{},[114],{"type":24,"value":115},"幻觉率降低45~50%：在摘要、改写等任务中输出更可靠。",{"type":18,"tag":26,"props":117,"children":118},{},[119],{"type":18,"tag":101,"props":120,"children":121},{},[122],{"type":24,"value":123},"2、编程能力突破",{"type":18,"tag":26,"props":125,"children":126},{},[127],{"type":24,"value":128},"前端代码生成：可一次性生成超千行无Bug代码，支持复杂动态效果（如天气动画、数据可视化）。",{"type":18,"tag":26,"props":130,"children":131},{},[132],{"type":24,"value":133},"多语言支持：在LiveCodeBench测试中Pass@1从63.5%→73.3%，媲美OpenAI o3高版本。",{"type":18,"tag":26,"props":135,"children":136},{},[137],{"type":18,"tag":101,"props":138,"children":139},{},[140],{"type":24,"value":141},"3、新增功能与体验优化",{"type":18,"tag":26,"props":143,"children":144},{},[145],{"type":24,"value":146},"工具调用（Function 
Calling）：支持外部API调用，Tau-Bench成绩达OpenAI o1-high水平。",{"type":18,"tag":26,"props":148,"children":149},{},[150],{"type":24,"value":151},"创意写作提升：长文本结构更完整，更贴近人类风格。",{"type":18,"tag":26,"props":153,"children":154},{},[155],{"type":24,"value":156},"API兼容性：接口不变，新增JSON输出支持。",{"type":18,"tag":26,"props":158,"children":159},{},[160],{"type":18,"tag":101,"props":161,"children":162},{},[163],{"type":24,"value":164},"手把手教程：DeepSeek-R1-0528 vLLM-MindSpore 使用指南",{"type":18,"tag":166,"props":167,"children":168},"ul",{},[169],{"type":18,"tag":170,"props":171,"children":172},"li",{},[173],{"type":24,"value":174},"本项目中提供的DeepSeek-R1-0528模型权重已反量化为BF16，权重文件大小1.3T。",{"type":18,"tag":26,"props":176,"children":177},{},[178],{"type":18,"tag":101,"props":179,"children":180},{},[181],{"type":24,"value":182},"# 01",{"type":18,"tag":26,"props":184,"children":185},{},[186],{"type":18,"tag":101,"props":187,"children":188},{},[189],{"type":24,"value":190},"环境搭建",{"type":18,"tag":26,"props":192,"children":193},{},[194],{"type":24,"value":195},"环境准备：四台Atlas 800I A2 (64G)，并配置好组网，四台设备的卡与卡之间能够互相ping通。",{"type":18,"tag":26,"props":197,"children":198},{},[199],{"type":24,"value":200},"四台设备分别拉取镜像：",{"type":18,"tag":202,"props":203,"children":205},"pre",{"code":204},"docker pull hub.oepkgs.net/oedeploy/openeuler/aarch64/mindspore:20250529\n",[206],{"type":18,"tag":207,"props":208,"children":209},"code",{"__ignoreMap":7},[210],{"type":24,"value":204},{"type":18,"tag":26,"props":212,"children":213},{},[214],{"type":24,"value":215},"四台设备分别杀进程，避免其他进程影响：",{"type":18,"tag":202,"props":217,"children":219},{"code":218},"pkill -9 python\npkill -9 mindie\npkill -9 
ray\n",[220],{"type":18,"tag":207,"props":221,"children":222},{"__ignoreMap":7},[223],{"type":24,"value":218},{"type":18,"tag":26,"props":225,"children":226},{},[227],{"type":24,"value":228},"四台设备分别启动容器，四台设备的hostname需要不同，但容器名称需要一致。",{"type":18,"tag":26,"props":230,"children":231},{},[232],{"type":24,"value":233},"/data/deeepseek_r1_0528/用于存放权重及yaml配置文件。四台服务器都需要下载权重，而且存放路径需要一致，权重文件大小1.3T，需要预留足够磁盘空间。",{"type":18,"tag":202,"props":235,"children":237},{"code":236},"docker run -it --name=DSR10528 --ipc=host --network=host --privileged=true --hostname=worker23 \\\n        --device=/dev/davinci0 \\\n        --device=/dev/davinci1 \\\n        --device=/dev/davinci2 \\\n        --device=/dev/davinci3 \\\n        --device=/dev/davinci4 \\\n        --device=/dev/davinci5 \\\n        --device=/dev/davinci6 \\\n        --device=/dev/davinci7 \\\n        --device=/dev/davinci_manager \\\n        --device=/dev/devmm_svm \\\n        --device=/dev/hisi_hdc \\\n        -v /usr/local/sbin/:/usr/local/sbin/ \\\n        -v /etc/hccn.conf:/etc/hccn.conf \\\n        -v /usr/local/bin/npu-smi:/usr/local/bin/npu-smi \\\n        -v /usr/local/dcmi:/usr/local/dcmi \\\n        -v /usr/local/Ascend/driver:/usr/local/Ascend/driver \\\n        -v /etc/ascend_install.info:/etc/ascend_install.info \\\n        -v /etc/vnpu.cfg:/etc/vnpu.cfg \\\n        -v /data/deeepseek_r1_0528/:/data/deeepseek_r1_0528/ \\\n        hub.oepkgs.net/oedeploy/openeuler/aarch64/mindspore:20250529 \\\n        /bin/bash\n",[238],{"type":18,"tag":207,"props":239,"children":240},{"__ignoreMap":7},[241],{"type":24,"value":236},{"type":18,"tag":26,"props":243,"children":244},{},[245],{"type":18,"tag":101,"props":246,"children":247},{},[248],{"type":24,"value":249},"# 
02",{"type":18,"tag":26,"props":251,"children":252},{},[253],{"type":18,"tag":101,"props":254,"children":255},{},[256],{"type":24,"value":257},"下载权重及yaml配置文件",{"type":18,"tag":26,"props":259,"children":260},{},[261],{"type":24,"value":262},"四台设备分别从魔乐社区下载权重及yaml配置文件。",{"type":18,"tag":202,"props":264,"children":266},{"code":265},"pip install openmind_hub\nexport HUB_WHITE_LIST_PATHS=/data/deeepseek_r1_0528\npython\nfrom openmind_hub import snapshot_download\n \nsnapshot_download(  \n    repo_id=\"MindSpore-Lab/DeepSeek-R1-0528\",  \n    local_dir=\"/data/deeepseek_r1_0528\", \n    local_dir_use_symlinks=False\n)\nexit()\n",[267],{"type":18,"tag":207,"props":268,"children":269},{"__ignoreMap":7},[270],{"type":24,"value":265},{"type":18,"tag":26,"props":272,"children":273},{},[274],{"type":24,"value":275},"四台设备分别修改yaml配置文件：",{"type":18,"tag":202,"props":277,"children":279},{"code":278},"\n# 修改为模型权重路径 \nload_checkpoint: '/data/deeepseek_r1_0528/'\n \n# 修改为模型tokenizer.json文件所在路径\nvocab_file: '/data/deeepseek_r1_0528/tokenizer.json'\n \n# 修改为模型tokenizer.json文件所在路径\ntokenizer_file: '/data/deeepseek_r1_0528/tokenizer.json'\n",[280],{"type":18,"tag":207,"props":281,"children":282},{"__ignoreMap":7},[283],{"type":24,"value":278},{"type":18,"tag":26,"props":285,"children":286},{},[287],{"type":18,"tag":101,"props":288,"children":289},{},[290],{"type":24,"value":291},"# 03",{"type":18,"tag":26,"props":293,"children":294},{},[295],{"type":18,"tag":101,"props":296,"children":297},{},[298],{"type":24,"value":299},"启动",{"type":18,"tag":26,"props":301,"children":302},{},[303],{"type":24,"value":304},"四台设备的容器中分别添加环境变量。enp189s0f0是ifconfig命令显示的网卡名称，根据需要调整。",{"type":18,"tag":202,"props":306,"children":308},{"code":307},"\nexport MINDFORMERS_MODEL_CONFIG=/data/deeepseek_r1_0528/peizhi/predict_deepseek_r1__671b.yaml\nexport ASCEND_CUSTOM_PATH=$ASCEND_HOME_PATH/../\nexport vLLM_MODEL_BACKEND=MindFormers\nexport MS_ENABLE_LCCL=off\nexport HCCL_OP_EXPANSION_MODE=AIV\nexport 
HCCL_SOCKET_IFNAME=enp189s0f0\nexport GLOO_SOCKET_IFNAME=enp189s0f0\nexport TP_SOCKET_IFNAME=enp189s0f0\nexport HCCL_CONNECT_TIMEOUT=3600\nexport ASCEND_RT_VISIBLE_DEVICES=0,1,2,3,4,5,6,7\n",[309],{"type":18,"tag":207,"props":310,"children":311},{"__ignoreMap":7},[312],{"type":24,"value":307},{"type":18,"tag":26,"props":314,"children":315},{},[316],{"type":24,"value":317},"主机及辅机设置。",{"type":18,"tag":26,"props":319,"children":320},{},[321],{"type":24,"value":322},"选择一台设备作为主节点，执行如下命令：",{"type":18,"tag":202,"props":324,"children":326},{"code":325},"\nray stop\nray start --head --port=6380\n",[327],{"type":18,"tag":207,"props":328,"children":329},{"__ignoreMap":7},[330],{"type":24,"value":325},{"type":18,"tag":26,"props":332,"children":333},{},[334],{"type":24,"value":335},"其他三台设备作为辅节点，依次执行如下命令：",{"type":18,"tag":202,"props":337,"children":339},{"code":338},"ray stop\nray start --address=主节点IP:6380\n",[340],{"type":18,"tag":207,"props":341,"children":342},{"__ignoreMap":7},[343],{"type":24,"value":338},{"type":18,"tag":26,"props":345,"children":346},{},[347],{"type":24,"value":348},"在主节点容器中拉起服务，其他节点不需要。模型路径根据需要调整。",{"type":18,"tag":202,"props":350,"children":352},{"code":351},"python3 -m vllm_mindspore.entrypoints vllm.entrypoints.openai.api_server \\\n    --model \"/data/deepseek_r1_0528_bf16\" --trust_remote_code \\\n    --tensor_parallel_size=32 --max-num-seqs=256 --block-size=32 \\\n    --max_model_len=16384 --max-num-batched-tokens=4096 \\\n    --distributed-executor-backend=ray --gpu-memory-utilization=0.93\n",[353],{"type":18,"tag":207,"props":354,"children":355},{"__ignoreMap":7},[356],{"type":24,"value":351},{"type":18,"tag":26,"props":358,"children":359},{},[360],{"type":24,"value":361},"发起推理服务请求，若在主节点发起请求，新开一个终端，IP地址是0.0.0.0或者localhost。",{"type":18,"tag":202,"props":363,"children":365},{"code":364},"curl http://localhost:8000/v1/chat/completions \\\n  -H \"Content-Type: application/json\" \\\n  -d '{\n     \"model\": \"/data/deepseek_r1_0528_bf16\",\n   \n     \"messages\": [  
\n      {\"role\": \"user\", \"content\": \"请介绍下北京的top景点\"}\n    ], \n    \"temperature\": 0.1, \n    \"max_tokens\": 4096, \n    \"top_p\": 0.9,\n    \"repetition_penalty\": 1.2\n  }' \n",[366],{"type":18,"tag":207,"props":367,"children":368},{"__ignoreMap":7},[369],{"type":24,"value":364},{"title":7,"searchDepth":371,"depth":371,"links":372},4,[],"markdown","content:technology-blogs:zh:3745.md","content","technology-blogs/zh/3745.md","technology-blogs/zh/3745","md",1776506134280]