<?xml version="1.0" encoding="UTF-8"?>
<!--
  XML sitemap listing the crawlable pages under https://hongping-zh.github.io/.

  Namespaces (both declared once on the root element):
    default  sitemaps.org sitemap protocol 0.9
    image    Google image sitemap extension 1.1 (used by the first two entries)

  Every <url> entry carries, in this order: <loc>, <lastmod> (YYYY-MM-DD),
  <changefreq>, <priority>; image metadata, where present, follows them.

  NOTE(review): Google's sitemap documentation is understood to say that it
  ignores <changefreq> and <priority>, and that <image:title> and
  <image:caption> are deprecated. Confirm against the current docs, and check
  whether any other consumer relies on these tags, before removing them.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:image="http://www.google.com/schemas/sitemap-image/1.1">
  <!-- Site root: the only entry at priority 1.0; references og-image.png with a title and a caption. -->
  <url>
    <loc>https://hongping-zh.github.io/</loc>
    <lastmod>2026-06-22</lastmod>
    <changefreq>weekly</changefreq>
    <priority>1.0</priority>
    <image:image>
      <image:loc>https://hongping-zh.github.io/og-image.png</image:loc>
      <image:title>LLM Energy Benchmark — Quantization Energy-Accuracy Trade-offs</image:title>
      <image:caption>Real GPU power measurements for INT8, NF4, and FP16 LLM inference across 4 NVIDIA architectures, with perplexity accuracy data.</image:caption>
    </image:image>
  </url>
  <!-- Paper page: reuses the same og-image.png as the site root, with its own title and no caption. -->
  <url>
    <loc>https://hongping-zh.github.io/paper/</loc>
    <lastmod>2026-06-22</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.9</priority>
    <image:image>
      <image:loc>https://hongping-zh.github.io/og-image.png</image:loc>
      <image:title>Weight-Only Quantization Does Not Always Save Energy</image:title>
    </image:image>
  </url>
  <!-- Direct link to a PDF file; note the path segment is /papers/ (plural), unlike the /paper/ page above. -->
  <url>
    <loc>https://hongping-zh.github.io/papers/ssrn-6854700.pdf</loc>
    <lastmod>2026-06-22</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.8</priority>
  </url>
  <!-- Standalone compare.html page. -->
  <url>
    <loc>https://hongping-zh.github.io/compare.html</loc>
    <lastmod>2026-06-22</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.8</priority>
  </url>
  <!-- Updates index: its lastmod equals that of the newest update entry listed below (2026-06-08). -->
  <url>
    <loc>https://hongping-zh.github.io/updates/</loc>
    <lastmod>2026-06-08</lastmod>
    <changefreq>weekly</changefreq>
    <priority>0.6</priority>
  </url>
  <!-- Individual update pages, newest first; each lastmod matches the date prefix in its URL slug. -->
  <url>
    <loc>https://hongping-zh.github.io/updates/2026-06-08-rtx-pro6000-fp16-e2e/</loc>
    <lastmod>2026-06-08</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://hongping-zh.github.io/updates/2026-06-03-rtx-pro6000-blackwell-phase/</loc>
    <lastmod>2026-06-03</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.7</priority>
  </url>
  <!-- Oldest listed update; priority is 0.6 rather than the 0.7 used by the two newer ones. -->
  <url>
    <loc>https://hongping-zh.github.io/updates/2026-04-18-qwen25-3b-t4/</loc>
    <lastmod>2026-04-18</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.6</priority>
  </url>
  <!-- bot-landing page: lowest priority in this file (0.3). -->
  <url>
    <loc>https://hongping-zh.github.io/bot-landing/</loc>
    <lastmod>2026-06-22</lastmod>
    <changefreq>monthly</changefreq>
    <priority>0.3</priority>
  </url>
</urlset>
