<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap (sitemaps.org 0.9 protocol) for https://stable-lab.github.io/stable-learning/.
  Each <url> entry carries only a <loc>; no lastmod, changefreq or priority is given.
  Every <loc> value must stay on a single line with no surrounding or embedded
  whitespace: <loc> is text content, so any line break inside it becomes part of the URL.
  The news, xhtml, image and video prefixes are declared on the root but no element
  in this document uses them; they are kept so the root element is unchanged.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:news="http://www.google.com/schemas/sitemap-news/0.9"
        xmlns:xhtml="http://www.w3.org/1999/xhtml"
        xmlns:image="http://www.google.com/schemas/sitemap-image/1.1"
        xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">
  <!-- Site root -->
  <url>
    <loc>https://stable-lab.github.io/stable-learning/</loc>
  </url>

  <!-- Pages under /cache/ -->
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/01-fundamentals/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/01-fundamentals/cache-operations/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/01-fundamentals/cache-organization/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/02-coherence-protocols/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/02-coherence-protocols/mesi-moesi/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/02-coherence-protocols/msi-protocol/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/03-consistency-models/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/03-consistency-models/sequential-consistency/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/03-consistency-models/tso-relaxed/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/04-modern-systems/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/04-modern-systems/directory-protocol/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/cache/04-modern-systems/fences-barriers/</loc>
  </url>

  <!-- Pages under /rl/ -->
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/01-action-chain-rewards/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/01-action-chain-rewards/rewards-and-return/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/01-action-chain-rewards/states-and-actions/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/02-policy-gradient/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/02-policy-gradient/baseline-variance/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/02-policy-gradient/reinforce/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/03-ppo/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/03-ppo/clipped-surrogate/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/03-ppo/gae/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/04-grpo/</loc>
  </url>
  <url>
    <loc>https://stable-lab.github.io/stable-learning/rl/04-grpo/group-relative-policy/</loc>
  </url>
</urlset>