<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>Michał Wojdylak — Blog</title>
    <link>https://michalwojdylak.com/blog</link>
    <description>Building production AI systems, LLM infrastructure, inference platforms and cloud-native ML solutions.</description>
    <language>en</language>
    <lastBuildDate>Wed, 10 Jun 2026 00:00:00 GMT</lastBuildDate>
    <atom:link href="https://michalwojdylak.com/rss.xml" rel="self" type="application/rss+xml" />
    <item>
      <title>Deploying LLMs in Production: An Infrastructure Playbook</title>
      <link>https://michalwojdylak.com/blog/first-post</link>
      <guid isPermaLink="true">https://michalwojdylak.com/blog/first-post</guid>
      <description>A practical walkthrough of the infrastructure decisions behind serving large language models reliably — from GPU selection to batching, autoscaling, and observability.</description>
      <pubDate>Wed, 10 Jun 2026 00:00:00 GMT</pubDate>
      <category>LLM</category>
      <category>Infrastructure</category>
      <category>Inference</category>
    </item>
    <item>
      <title>Cutting GPU Inference Costs Without Hurting Latency</title>
      <link>https://michalwojdylak.com/blog/optimizing-gpu-inference-costs</link>
      <guid isPermaLink="true">https://michalwojdylak.com/blog/optimizing-gpu-inference-costs</guid>
      <description>Quantization, batching, and right-sizing strategies that reduced our inference bill by 60% while keeping p99 latency flat.</description>
      <pubDate>Fri, 22 May 2026 00:00:00 GMT</pubDate>
      <category>Inference</category>
      <category>Optimization</category>
      <category>Cost</category>
    </item>
    <item>
      <title>Building an MLOps Platform on Kubernetes from Scratch</title>
      <link>https://michalwojdylak.com/blog/building-mlops-platform-kubernetes</link>
      <guid isPermaLink="true">https://michalwojdylak.com/blog/building-mlops-platform-kubernetes</guid>
      <description>The core building blocks of a production MLOps platform — model registry, CI/CD for models, and safe rollouts with canaries and shadow deployments.</description>
      <pubDate>Thu, 30 Apr 2026 00:00:00 GMT</pubDate>
      <category>MLOps</category>
      <category>Kubernetes</category>
      <category>Infrastructure</category>
    </item>
  </channel>
</rss>