[{"data":1,"prerenderedAt":173},["ShallowReactive",2],{"content-query-JnSF9cPOJW":3},{"_path":4,"_dir":5,"_draft":6,"_partial":6,"_locale":7,"title":8,"description":9,"date":10,"cover":11,"type":12,"body":13,"_type":167,"_id":168,"_source":169,"_file":170,"_stem":171,"_extension":172},"/news/zh/3683","zh",false,"","使能AI智能体算法性能倍增！昇思多维混合并行等技术助力小艺语音交互、AI修图体验升级","3月20日华为发布阔折叠屏手机Pura X，发布会上首发了鸿蒙AI，全新小艺焕新登场，实现更拟人的自然语音交互。","2025-04-03","https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/11/7354d85c170647199405a3dfe4130cac.png","news",{"type":14,"children":15,"toc":155},"root",[16,24,30,48,53,58,66,81,86,93,108,113,118,123,130,145,150],{"type":17,"tag":18,"props":19,"children":21},"element","h1",{"id":20},"使能ai智能体算法性能倍增昇思多维混合并行等技术助力小艺语音交互ai修图体验升级",[22],{"type":23,"value":8},"text",{"type":17,"tag":25,"props":26,"children":27},"p",{},[28],{"type":23,"value":29},"3月20日华为发布阔折叠屏手机Pura X，发布会上首发了鸿蒙AI，全新小艺焕新登场，实现更拟人的自然语音交互。全新小艺基于昇思MindSpore，实现小艺语音合成算法推理性能提升30%，AI人像精修算法推理性能倍增，提升用户对话体验的实时性与修图效率。",{"type":17,"tag":31,"props":32,"children":34},"h3",{"id":33},"_01-提升语音输出响应效率生成性能",[35,41,43],{"type":17,"tag":36,"props":37,"children":38},"strong",{},[39],{"type":23,"value":40},"# 01",{"type":23,"value":42}," ",{"type":17,"tag":36,"props":44,"children":45},{},[46],{"type":23,"value":47},"提升语音输出响应效率、生成性能",{"type":17,"tag":25,"props":49,"children":50},{},[51],{"type":23,"value":52},"语音合成算法中，存在Decode算法模型多次迭代的场景，导致在不同次迭代过程中，需要拷贝上一次的模型输出作为下一次的模型输入，因此Device到Host的数据拷贝以及Host到Device的数据拷贝存在性能瓶颈。",{"type":17,"tag":25,"props":54,"children":55},{},[56],{"type":23,"value":57},"小艺研发团队基于昇思MindSpore 
AI框架，通过使用模型运算结果Cache缓存机制，支持将模型输出缓存在Device侧，在下次迭代直接使用Device侧数据，有效解决语音类模型在迭代过程中Device侧和Host侧间的数据拷贝时延问题，语音输出首响效率提升20%。昇思MindSpore联合算法团队深度优化Decode模型结构，并构建使能Attention、RotaryMul等融合算子，语音生成性能综合提升10%。",{"type":17,"tag":25,"props":59,"children":60},{},[61],{"type":17,"tag":62,"props":63,"children":65},"img",{"alt":7,"src":64},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/11/60dd44a8224c467493e28ac4fd3031ff.png",[],{"type":17,"tag":31,"props":67,"children":69},{"id":68},"_02-实现小艺语音双麦降噪算法的极低时延推理",[70,75,76],{"type":17,"tag":36,"props":71,"children":72},{},[73],{"type":23,"value":74},"# 02",{"type":23,"value":42},{"type":17,"tag":36,"props":77,"children":78},{},[79],{"type":23,"value":80},"实现小艺语音双麦降噪算法的极低时延推理",{"type":17,"tag":25,"props":82,"children":83},{},[84],{"type":23,"value":85},"告别传统机械问答，小艺凭借“打断不中断”的全双工技术，带来无缝、流畅的语音交互。全双工离不开声音的精准捕捉，双麦降噪业务算法团队实现HAL层极近调用MindSpore Lite超轻量端侧AI框架，降低传输时延和推理底噪，利用多音频流批次推理，高效发挥硬件算力，实现毫秒级超低时延降噪，让全双工对话轻松实现。",{"type":17,"tag":25,"props":87,"children":88},{},[89],{"type":17,"tag":62,"props":90,"children":92},{"alt":7,"src":91},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/11/cbfc069e3972488fb302053edfe78cab.png",[],{"type":17,"tag":31,"props":94,"children":96},{"id":95},"_03-多维混合并行图结构融合优化实现ai修图效率倍增",[97,102,103],{"type":17,"tag":36,"props":98,"children":99},{},[100],{"type":23,"value":101},"# 
03",{"type":23,"value":42},{"type":17,"tag":36,"props":104,"children":105},{},[106],{"type":23,"value":107},"多维混合并行、图结构融合优化实现AI修图效率倍增",{"type":17,"tag":25,"props":109,"children":110},{},[111],{"type":23,"value":112},"AI人像精修算法中，为得到更高质量的人像精修效果，算法扩大图片分辨率，导致模型推理过程中Attention模块的序列长度增加。因此，业务模型推理过程中，Attention模块的计算量成倍增加。",{"type":17,"tag":25,"props":114,"children":115},{},[116],{"type":23,"value":117},"昇思MindSpore通过构建TP/CP等多维混合并行策略，针对Conv算子，将算子输出特征图进行多份切分，实现多卡并行计算。针对Matmul类算子通过权重与特征图的切分，实现多卡并行，通过不同的并行策略实现AIGC类大模型出图效率倍增。",{"type":17,"tag":25,"props":119,"children":120},{},[121],{"type":23,"value":122},"为进一步提升业务模型推理性能，针对AI生成式算法模型结构，昇思MindSpore通过构建自动图结构融合优化能力，将模型中Attention结构的小算子结合成昇腾硬件支持的PromptFlashAttention大算子、以及将算法中的GroupNorm算子与激活算子融合成GroupNormSilu大算子，出图效率提升20%。",{"type":17,"tag":25,"props":124,"children":125},{},[126],{"type":17,"tag":62,"props":127,"children":129},{"alt":7,"src":128},"https://obs-mindspore-file.obs.cn-north-4.myhuaweicloud.com/file/2025/04/11/91d975e9fb8248a484ccfe743721c0d9.png",[],{"type":17,"tag":31,"props":131,"children":133},{"id":132},"_04-ai人像精修算法业务部署优化",[134,139,140],{"type":17,"tag":36,"props":135,"children":136},{},[137],{"type":23,"value":138},"# 04",{"type":23,"value":42},{"type":17,"tag":36,"props":141,"children":142},{},[143],{"type":23,"value":144},"AI人像精修算法业务部署优化",{"type":17,"tag":25,"props":146,"children":147},{},[148],{"type":23,"value":149},"AI人像精修算法业务复杂，在线部署过程中存在多个业务模型，导致业务部署加载时间长达小时级别。MindSpore联合业务深入优化部署方案，通过使能图编译缓存能力，业务在部署过程中直接使用编译缓存，部署加载时延从小时级优化到分钟级，极大方便业务服务化部署。",{"type":17,"tag":25,"props":151,"children":152},{},[153],{"type":23,"value":154},"未来，昇思MindSpore将持续助力小艺优化AI智能体能力，提升AI落地应用体验，加速行业应用创新。",{"title":7,"searchDepth":156,"depth":156,"links":157},4,[158,161,163,165],{"id":33,"depth":159,"text":160},3,"# 01 提升语音输出响应效率、生成性能",{"id":68,"depth":159,"text":162},"# 02 实现小艺语音双麦降噪算法的极低时延推理",{"id":95,"depth":159,"text":164},"# 03 多维混合并行、图结构融合优化实现AI修图效率倍增",{"id":132,"depth":159,"text":166},"# 04 
AI人像精修算法业务部署优化","markdown","content:news:zh:3683.md","content","news/zh/3683.md","news/zh/3683","md",1776506087593]