<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
    
  <url>
    <loc>https://mintlify.wiki/pytorch/rl/advanced/llm-post-training</loc>
    <lastmod>2026-06-28T06:45:38.361Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/advanced/model-based-rl</loc>
    <lastmod>2026-06-28T06:23:50.891Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/advanced/offline-rl</loc>
    <lastmod>2026-06-28T06:45:38.366Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/advanced/performance-optimization</loc>
    <lastmod>2026-06-28T06:23:50.891Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/concepts/collectors</loc>
    <lastmod>2026-06-28T06:45:38.367Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/concepts/environments</loc>
    <lastmod>2026-06-28T06:45:38.364Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/concepts/modules-policies</loc>
    <lastmod>2026-06-28T06:45:38.365Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/concepts/objectives-losses</loc>
    <lastmod>2026-06-28T06:45:38.362Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/concepts/replay-buffers</loc>
    <lastmod>2026-06-28T06:45:38.365Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/concepts/tensordict-model</loc>
    <lastmod>2026-06-28T06:45:38.363Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/installation</loc>
    <lastmod>2026-06-28T06:45:38.360Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/introduction</loc>
    <lastmod>2026-06-28T06:45:38.362Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/quickstart</loc>
    <lastmod>2026-06-28T06:45:40.796Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/collectors/distributed</loc>
    <lastmod>2026-06-28T06:45:40.789Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/collectors/single</loc>
    <lastmod>2026-06-28T06:45:40.792Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/data/datasets</loc>
    <lastmod>2026-06-28T06:45:40.797Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/data/replay-buffers</loc>
    <lastmod>2026-06-28T06:45:40.791Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/data/specs</loc>
    <lastmod>2026-06-28T06:45:40.790Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/envs/overview</loc>
    <lastmod>2026-06-28T06:45:40.789Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/envs/third-party-libs</loc>
    <lastmod>2026-06-28T06:45:40.797Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/envs/transforms</loc>
    <lastmod>2026-06-28T06:45:40.795Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/envs/vectorized</loc>
    <lastmod>2026-06-28T06:45:40.793Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/modules/actors-critics</loc>
    <lastmod>2026-06-28T06:45:42.699Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/modules/distributions</loc>
    <lastmod>2026-06-28T06:45:42.699Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/modules/exploration</loc>
    <lastmod>2026-06-28T06:45:42.702Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/modules/recurrent</loc>
    <lastmod>2026-06-28T06:45:42.695Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/objectives/multi-agent</loc>
    <lastmod>2026-06-28T06:45:42.698Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/objectives/offline-imitation</loc>
    <lastmod>2026-06-28T06:45:42.695Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/objectives/policy-gradient</loc>
    <lastmod>2026-06-28T06:24:02.008Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/objectives/value-based</loc>
    <lastmod>2026-06-28T06:45:42.697Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/reference/objectives/value-estimators</loc>
    <lastmod>2026-06-28T06:45:42.694Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/tutorials/custom-environment</loc>
    <lastmod>2026-06-28T06:45:42.700Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/tutorials/distributed-training</loc>
    <lastmod>2026-06-28T06:45:42.696Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/tutorials/first-training-loop</loc>
    <lastmod>2026-06-28T06:45:44.242Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/tutorials/multi-agent-training</loc>
    <lastmod>2026-06-28T06:45:44.236Z</lastmod>
  </url>

  <url>
    <loc>https://mintlify.wiki/pytorch/rl/tutorials/recurrent-policies</loc>
    <lastmod>2026-06-28T06:45:44.238Z</lastmod>
  </url>
</urlset>