[{"data":1,"prerenderedAt":307},["ShallowReactive",2],{"content-doc-\u002Fzh\u002Fblogs\u002Fopen-A-IInfra-summit-review":3,"surround-\u002Fzh\u002Fblogs\u002Fopen-A-IInfra-summit-review":305},{"_path":4,"_dir":5,"_draft":6,"_partial":6,"_locale":7,"title":8,"description":9,"date":10,"category":11,"author":12,"body":16,"_type":297,"_id":298,"_source":299,"_file":300,"_stem":301,"_extension":302,"coverImage":36,"plainText":303,"authorNames":304},"\u002Fzh\u002Fblogs\u002Fopen-A-IInfra-summit-review","blogs",false,"","Open AI Infra Summit 2026｜openUBMC以架构创新和开源标准破解智算集群运维痛点","2026年4月9-10日，2026 Open AI Infra Summit 在北京举办。\nopenUBMC 社区技术委员会委员 & iBMC 集群管理软件专家黄晗，在超节点生态分论坛发表《基于 openUBMC 打造超节点硬件智能管理平台》主题演讲，分享开源体系下硬件智能管理最新实践，以标准化方案破解智算集群运维痛点，引发行业广泛关注。\n","2026\u002F05\u002F06","essentials",[13],{"name":14,"description":15},"黄晗","openUBMC 社区技术委员会委员& iBMC 集群管理软件专家",{"type":17,"children":18,"toc":288},"root",[19,27,38,44,57,66,71,76,83,88,102,111,136,142,154,159,165,177,224,229,247,252,257,262,267,272],{"type":20,"tag":21,"props":22,"children":24},"element","h2",{"id":23},"分论坛回顾",[25],{"type":26,"value":23},"text",{"type":20,"tag":28,"props":29,"children":30},"p",{},[31,32],{"type":26,"value":9},{"type":20,"tag":33,"props":34,"children":37},"img",{"alt":35,"src":36},"alt text","\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F640.webp",[],{"type":20,"tag":21,"props":39,"children":41},{"id":40},"智算规模化发展运维标准供需失衡凸显",[42],{"type":26,"value":43},"智算规模化发展，运维标准供需失衡凸显",{"type":20,"tag":28,"props":45,"children":46},{},[47,49,55],{"type":26,"value":48},"随着智算集群快速扩张，",{"type":20,"tag":50,"props":51,"children":52},"strong",{},[53],{"type":26,"value":54},"硬件模块化、供应多元化",{"type":26,"value":56},"趋势明显，也对 BMC 带外管理提出新要求：",{"type":20,"tag":28,"props":58,"children":59},{},[60,62],{"type":26,"value":61},"以灵衢为代表的高速互联技术普及，推动超节点Scale-up架构快速落地，统一内存语义技术进一步实现硬件资源池化，BMC随之面临可组合解耦基础设施（CDI）的管理挑战，以Redfish、Sunfish等BMC北向模型，正在突破传统单机管理的物理边界，为超节点多设备协同管理提供了技术基础。\n",{"type":20,"tag":33,"props":63,"children":65},{"alt":35,"src":64},"\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F%E5%9B%BE1.jpg",[],{"type":20,"tag":28,"props":67,"children":68},{},[69],{"type":26,"value":70},"与此同时，用户对统一设备北向运维接入能力的需求日益迫切，但现有标准难以适配新一代智算硬件的复杂场景：整机与部件厂商虽希望通过差异化构建竞争力，却因缺乏统一规范导致北向接口参差不齐，形成用户统一运维诉求与厂商差异化规划之间的行业鸿沟。",{"type":20,"tag":28,"props":72,"children":73},{},[74],{"type":26,"value":75},"以互联网为代表的客户趋向硬件与BMC固件规范白盒化，却未形成全行业统一标准，一方面导致各厂商需基于同一代码基线适配多套客户规范，代码复用率极低，研发与适配成本居高不下；另一方面，用户运维系统仍需针对设备能力差异做定制化适配（如屏蔽不支持的功能），进一步推高设备接入与运维开发成本。",{"type":20,"tag":28,"props":77,"children":78},{},[79],{"type":20,"tag":33,"props":80,"children":82},{"alt":35,"src":81},"\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F%E5%9B%BE%E7%89%87%202.png",[],{"type":20,"tag":28,"props":84,"children":85},{},[86],{"type":26,"value":87},"以服务器硬件指标采集为例，不同客户在采集范围上各有定义，采集方式也呈现碎片化：",{"type":20,"tag":28,"props":89,"children":90},{},[91,93,98],{"type":26,"value":92},"➣ ",{"type":20,"tag":50,"props":94,"children":95},{},[96],{"type":26,"value":97},"采集范围：无统一界定",{"type":20,"tag":33,"props":99,"children":101},{"alt":35,"src":100},"\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F%E5%9B%BE%E7%89%87%203.png",[],{"type":20,"tag":28,"props":103,"children":104},{},[105,106],{"type":26,"value":92},{"type":20,"tag":50,"props":107,"children":108},{},[109],{"type":26,"value":110},"采集方式：",{"type":20,"tag":112,"props":113,"children":114},"ul",{},[115,121,126,131],{"type":20,"tag":116,"props":117,"children":118},"li",{},[119],{"type":26,"value":120},"IPMI传感器",{"type":20,"tag":116,"props":122,"children":123},{},[124],{"type":26,"value":125},"自定义rest接口下载csv文件",{"type":20,"tag":116,"props":127,"children":128},{},[129],{"type":26,"value":130},"自定义redfish查询接口",{"type":20,"tag":116,"props":132,"children":133},{},[134],{"type":26,"value":135},"其他定制化方式",{"type":20,"tag":21,"props":137,"children":139},{"id":138},"构建超节点多bmc协同底座cdi资源透明管理",[140],{"type":26,"value":141},"构建超节点多BMC协同底座，CDI资源透明管理",{"type":20,"tag":28,"props":143,"children":144},{},[145,147,152],{"type":26,"value":146},"针对超节点管理的核心痛点，openUBMC 从",{"type":20,"tag":50,"props":148,"children":149},{},[150],{"type":26,"value":151},"软件架构层面",{"type":26,"value":153},"给出针对性解决方案：",{"type":20,"tag":28,"props":155,"children":156},{},[157],{"type":26,"value":158},"统一超节点计算域与交换域的设备管理对象模型，并基于统一模型实现高性能数据同步，进而实现超节点系统在资产、故障、能效等维度的多节点协同管理，让 CDI 资源可被上层运维系统透明感知、统一调度。\n图三",{"type":20,"tag":21,"props":160,"children":162},{"id":161},"以标准筑基以社区赋能-ai-智能运维",[163],{"type":26,"value":164},"以标准筑基，以社区赋能 AI 智能运维",{"type":20,"tag":28,"props":166,"children":167},{},[168,170,175],{"type":26,"value":169},"面对行业痛点，openUBMC 以开源生态为底座，从标准协同与技术实现",{"type":20,"tag":50,"props":171,"children":172},{},[173],{"type":26,"value":174},"双重维度",{"type":26,"value":176},"给出系统性解决方案：",{"type":20,"tag":112,"props":178,"children":179},{},[180,190,204],{"type":20,"tag":116,"props":181,"children":182},{},[183,188],{"type":20,"tag":50,"props":184,"children":185},{},[186],{"type":26,"value":187},"接轨国际标准",{"type":26,"value":189},"\nopenUBMC社区提前布局技术预研，平台满足国际主流标准，为北向运维接入提供稳定、通用的基础能力。",{"type":20,"tag":116,"props":191,"children":192},{},[193,198,200],{"type":20,"tag":50,"props":194,"children":195},{},[196],{"type":26,"value":197},"共建行业统一标准",{"type":26,"value":199},"\n联合行业标准组织、用户、整机及部件厂商共建统一北向标准，当前正在围绕灵衢部件、DPU等关键部件制定管理接口规范，同步搭建测评认证体系，相关标准在社区优先落地并实现 100% 复用，以“社区 + 标准”推动产业协同创新。\n",{"type":20,"tag":33,"props":201,"children":203},{"alt":35,"src":202},"\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F%E5%9B%BE%E7%89%87%204.png",[],{"type":20,"tag":116,"props":205,"children":206},{},[207,212,214,218,220],{"type":20,"tag":50,"props":208,"children":209},{},[210],{"type":26,"value":211},"标准化遥测接口，赋能 AI 运维闭环",{"type":26,"value":213},"\n通过标准化流式遥测接口与统一指标定义，用户运维系统可以无缝对接不同厂商的设备，采集高精准、低时延的数据，支撑 AI 运维系统完成 “收集–分析–决策–执行”全流程闭环。\n",{"type":20,"tag":33,"props":215,"children":217},{"alt":35,"src":216},"\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F%E5%9B%BE%E7%89%87%206.png",[],{"type":26,"value":219},"\n数据主动推送，重构硬件运维效能\n",{"type":20,"tag":33,"props":221,"children":223},{"alt":35,"src":222},"\u002Fcategory\u002Fblog\u002Fopen%20A%20IInfra%20summit-review\u002F%E5%9B%BE%E7%89%87%207.png",[],{"type":20,"tag":28,"props":225,"children":226},{},[227],{"type":26,"value":228},"相比传统轮询模式，openUBMC采用的主动推送模式优势显著：",{"type":20,"tag":112,"props":230,"children":231},{},[232,237,242],{"type":20,"tag":116,"props":233,"children":234},{},[235],{"type":26,"value":236},"分层架构，被采集侧主动上报，无需采集侧频繁轮询；",{"type":20,"tag":116,"props":238,"children":239},{},[240],{"type":26,"value":241},"采集侧与被采集侧仅一次订阅交互，大幅降低交互开销；",{"type":20,"tag":116,"props":243,"children":244},{},[245],{"type":26,"value":246},"亚秒级实时采集并推送，无采样盲区，保障数据实时性；",{"type":20,"tag":28,"props":248,"children":249},{},[250],{"type":26,"value":251},"通过数据主动推送，用户运维系统可实现从硬件到固件的全方位可观测，经过LLM训练推理，硬件运维管理从传统的故障被动响应升级为主动预防，同时支撑系统负载与能耗的深度调优，为智算集群高效稳定运行提供坚实保障。",{"type":20,"tag":21,"props":253,"children":255},{"id":254},"携手共筑硬件管理统一标准",[256],{"type":26,"value":254},{"type":20,"tag":28,"props":258,"children":259},{},[260],{"type":26,"value":261},"openUBMC 社区诚邀整机、部件、云厂商及行业用户：",{"type":20,"tag":28,"props":263,"children":264},{},[265],{"type":26,"value":266},"携手共建算力基础设施硬件管理北向统一标准，使能产业高质量发展！",{"type":20,"tag":28,"props":268,"children":269},{},[270],{"type":26,"value":271},"欢迎加入openUBMC社区Interface SIG，共商标准、共建生态、共启智算硬件管理新未来。",{"type":20,"tag":112,"props":273,"children":274},{},[275],{"type":20,"tag":116,"props":276,"children":277},{},[278,280],{"type":26,"value":279},"Interface SIG：",{"type":20,"tag":281,"props":282,"children":286},"a",{"href":283,"rel":284},"https:\u002F\u002Fwww.openubmc.cn\u002Fzh\u002Fsig\u002Fsig-interface",[285],"nofollow",[287],{"type":26,"value":283},{"title":7,"searchDepth":289,"depth":289,"links":290},4,[291,293,294,295,296],{"id":23,"depth":292,"text":23},2,{"id":40,"depth":292,"text":43},{"id":138,"depth":292,"text":141},{"id":161,"depth":292,"text":164},{"id":254,"depth":292,"text":254},"markdown","content:zh:blogs:open A IInfra summit-review.md","content","zh\u002Fblogs\u002Fopen A IInfra summit-review.md","zh\u002Fblogs\u002Fopen A IInfra summit-review","md","分论坛回顾 2026年4月9-10日，2026 Open AI Infra Summit 在北京举办。\nopenUBMC 社区技术委员会委员 & iBMC 集群管理软件专家黄晗，在超节点生态分论坛发表《基于 openUBMC 打造超节点硬件智能管理平台》主题演讲，分享开源体系下硬件智能管理最新实践，以标准化方案破解智算集群运维痛点，引发行业广泛关注。\n  智算规模化发展，运维标准供需失衡凸显 随着智算集群快速扩张， 硬件模块化、供应多元化 趋势明显，也对 BMC 带外管理提出新要求： 以灵衢为代表的高速互联技术普及，推动超节点Scale-up架构快速落地，统一内存语义技术进一步实现硬件资源池化，BMC随之面临可组合解耦基础设施（CDI）的管理挑战，以Redfish、Sunfish等BMC北向模型，正在突破传统单机管理的物理边界，为超节点多设备协同管理提供了技术基础。\n  与此同时，用户对统一设备北向运维接入能力的需求日益迫切，但现有标准难以适配新一代智算硬件的复杂场景：整机与部件厂商虽希望通过差异化构建竞争力，却因缺乏统一规范导致北向接口参差不齐，形成用户统一运维诉求与厂商差异化规划之间的行业鸿沟。 以互联网为代表的客户趋向硬件与BMC固件规范白盒化，却未形成全行业统一标准，一方面导致各厂商需基于同一代码基线适配多套客户规范，代码复用率极低，研发与适配成本居高不下；另一方面，用户运维系统仍需针对设备能力差异做定制化适配（如屏蔽不支持的功能），进一步推高设备接入与运维开发成本。  以服务器硬件指标采集为例，不同客户在采集范围上各有定义，采集方式也呈现碎片化： ➣  采集范围：无统一界定  ➣  采集方式： IPMI传感器 自定义rest接口下载csv文件 自定义redfish查询接口 其他定制化方式 构建超节点多BMC协同底座，CDI资源透明管理 针对超节点管理的核心痛点，openUBMC 从 软件架构层面 给出针对性解决方案： 统一超节点计算域与交换域的设备管理对象模型，并基于统一模型实现高性能数据同步，进而实现超节点系统在资产、故障、能效等维度的多节点协同管理，让 CDI 资源可被上层运维系统透明感知、统一调度。\n图三 以标准筑基，以社区赋能 AI 智能运维 面对行业痛点，openUBMC 以开源生态为底座，从标准协同与技术实现 双重维度 给出系统性解决方案： 接轨国际标准 \nopenUBMC社区提前布局技术预研，平台满足国际主流标准，为北向运维接入提供稳定、通用的基础能力。 共建行业统一标准 \n联合行业标准组织、用户、整机及部件厂商共建统一北向标准，当前正在围绕灵衢部件、DPU等关键部件制定管理接口规范，同步搭建测评认证体系，相关标准在社区优先落地并实现 100% 复用，以“社区 + 标准”推动产业协同创新。\n  标准化遥测接口，赋能 AI 运维闭环 \n通过标准化流式遥测接口与统一指标定义，用户运维系统可以无缝对接不同厂商的设备，采集高精准、低时延的数据，支撑 AI 运维系统完成 “收集–分析–决策–执行”全流程闭环。\n  \n数据主动推送，重构硬件运维效能\n  相比传统轮询模式，openUBMC采用的主动推送模式优势显著： 分层架构，被采集侧主动上报，无需采集侧频繁轮询； 采集侧与被采集侧仅一次订阅交互，大幅降低交互开销； 亚秒级实时采集并推送，无采样盲区，保障数据实时性； 通过数据主动推送，用户运维系统可实现从硬件到固件的全方位可观测，经过LLM训练推理，硬件运维管理从传统的故障被动响应升级为主动预防，同时支撑系统负载与能耗的深度调优，为智算集群高效稳定运行提供坚实保障。 携手共筑硬件管理统一标准 openUBMC 社区诚邀整机、部件、云厂商及行业用户： 携手共建算力基础设施硬件管理北向统一标准，使能产业高质量发展！ 欢迎加入openUBMC社区Interface SIG，共商标准、共建生态、共启智算硬件管理新未来。 Interface SIG： https:\u002F\u002Fwww.openubmc.cn\u002Fzh\u002Fsig\u002Fsig-interface",[14],[306,306],null,1782831329641]