<?xml version="1.0" encoding="utf-8"?>
<!--
  RSS 2.0 feed for the tag page "动态批处理" (dynamic batching) of socake.github.io.
  The generator element below names Hugo, so this file is presumably build output;
  confirm before hand-editing, since a site rebuild may overwrite changes.
  All namespace prefixes used in the document (atom, media) are declared once on
  the root element.
-->
<rss version="2.0"
     xmlns:atom="http://www.w3.org/2005/Atom"
     xmlns:media="http://search.yahoo.com/mrss/">
  <channel>
    <title>动态批处理 on 黄文卓 | DevOps Engineer</title>
    <link>https://socake.github.io/tags/%E5%8A%A8%E6%80%81%E6%89%B9%E5%A4%84%E7%90%86/</link>
    <description>Recent content in 动态批处理 on 黄文卓 | DevOps Engineer</description>
    <generator>Hugo -- gohugo.io</generator>
    <language>zh-CN</language>
    <managingEditor>17691281867@163.com (Wenzhuo Huang)</managingEditor>
    <webMaster>17691281867@163.com (Wenzhuo Huang)</webMaster>
    <copyright>© 2026 Wenzhuo Huang</copyright>
    <lastBuildDate>Wed, 11 Mar 2026 10:00:00 +0800</lastBuildDate>
    <!-- Self link: the URL of this feed document (rel="self"). -->
    <atom:link href="https://socake.github.io/tags/%E5%8A%A8%E6%80%81%E6%89%B9%E5%A4%84%E7%90%86/index.xml" rel="self" type="application/rss+xml"/>

    <item>
      <title>Triton Inference Server 生产部署：模型编排、动态批处理与多框架混部</title>
      <link>https://socake.github.io/posts/triton-inference-server-production/</link>
      <pubDate>Wed, 11 Mar 2026 10:00:00 +0800</pubDate>
      <author>17691281867@163.com (Wenzhuo Huang)</author>
      <!-- guid carries the same URL as link above. -->
      <guid>https://socake.github.io/posts/triton-inference-server-production/</guid>
      <description>把 Triton 从一个陌生的 NVIDIA 推理服务器讲清楚：model repository、backend、动态批处理、ensemble、BLS、Python backend、生产监控和踩坑实录。</description>
      <!-- Media RSS attachment for the post; the URL points at featured.jpg. -->
      <media:content url="https://socake.github.io/posts/triton-inference-server-production/featured.jpg"/>
    </item>
  </channel>
</rss>
