<?xml version="1.0" encoding="UTF-8"?><urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xhtml="http://www.w3.org/1999/xhtml" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xmlns:video="http://www.google.com/schemas/sitemap-video/1.1"><url><loc>https://rl-and-control-guide.brandon-behring.dev/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch01-mdp-dp/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch02-async-dp/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch03-monte-carlo/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch04-td-learning/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch05-function-approx/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch06-dqn/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch07-policy-gradient/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch08-actor-critic-ppo/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch09-continuous-control/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch10-rl-robotics-survey/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch11-state-space/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch12-stability-controllability/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch13-lqr-lqg/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/chapters/ch14-nonlinear-control/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/references/</loc></url><url><loc>https://rl-and-control-guide.brandon-behring.dev/search/</loc></url></urlset>