<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="https://thenlpstudent.github.io/sitemap.xsl"?>
<!-- Sitemap root element. xsi:schemaLocation pairs each namespace used in this
     document (core sitemap and image extension) with its XSD so that
     schema-aware validators can check both vocabularies. -->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:image="http://www.google.com/schemas/sitemap-image/1.1"
        xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd
                            http://www.google.com/schemas/sitemap-image/1.1 http://www.google.com/schemas/sitemap-image/1.1/sitemap-image.xsd">
<!-- Site root URL; no lastmod is recorded for this entry. -->
<url>
  <loc>https://thenlpstudent.github.io/</loc>
</url>
<!-- Page entry with 4 associated images. image:title is optional and is
     emitted only when an image actually has a title. -->
<url>
  <loc>https://thenlpstudent.github.io/deep-reinforcement-learning-from-human-preferences-paper-explained.html</loc>
  <lastmod>2023-04-12T22:12:34+05:30</lastmod>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/9/sss.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/9/Group-14.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/9/Group-15.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/9/Group-3.png</image:loc>
  </image:image>
</url>
<!-- Page entry with 20 associated images. image:title is optional and is
     emitted only when an image actually has a title (one image here). -->
<url>
  <loc>https://thenlpstudent.github.io/introduction-to-reinforcement-learning.html</loc>
  <lastmod>2021-10-21T07:51:32+05:30</lastmod>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/returneq.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/returnmodified.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/returnwhole.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/Group-5-2.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/bellman_1.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/bellman_2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/bellman_5.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/bellman_6.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/bellman_7.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/bellamn_3.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/v_policy_s.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/v_policy_s_s.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/q_policy_s_a.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/optimal_val_policy.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/optimal_q_value.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/q_optimal_s_a_expe-2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/big_equ.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/q_optimal_stup.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/policyexample.PNG</image:loc>
    <image:title>Reinforcement Learning: 2nd Edition (Finite Markov Decision Processes)</image:title>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/2/gridworld2.PNG</image:loc>
  </image:image>
</url>
<!-- Page entry with 5 associated images. image:title is optional and is
     emitted only when an image actually has a title. -->
<url>
  <loc>https://thenlpstudent.github.io/looking-at-entropy.html</loc>
  <lastmod>2023-04-06T13:45:35+05:30</lastmod>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/7/Group-12.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/7/Group-2.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/7/gg22.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/7/sss.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/7/ludecomp.gif</image:loc>
  </image:image>
</url>
<!-- Page entry with 16 associated images. image:title is optional and is
     emitted only when an image actually has a title. -->
<url>
  <loc>https://thenlpstudent.github.io/new-post-2.html</loc>
  <lastmod>2023-04-05T15:40:27+05:30</lastmod>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/Capture-2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/Group-11.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/test2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/sim-2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/ss.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/qq.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/tttt.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/sigmod.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/sigmoidgg-3.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/ttttt.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/gra1.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/grr.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/ggg22.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/ggrr.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/anchor2-2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/4/graph3d.PNG</image:loc>
  </image:image>
</url>
<!-- Entry for /page/2/; no lastmod is recorded for this entry. -->
<url>
  <loc>https://thenlpstudent.github.io/page/2/</loc>
</url>
<!-- Page entry with a last-modified timestamp and no image metadata. -->
<url>
  <loc>https://thenlpstudent.github.io/summary-of-the-generalization-bounds-via-convex-analysis-paper.html</loc>
  <lastmod>2023-05-27T10:26:18+05:30</lastmod>
</url>
<!-- Page entry with 9 associated images. image:title is optional and is
     emitted only when an image actually has a title. -->
<url>
  <loc>https://thenlpstudent.github.io/the-multi-armed-bandits-problem.html</loc>
  <lastmod>2021-10-27T08:04:03+05:30</lastmod>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/captur1.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/captur2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/incremental-2.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/updaterule.PNG</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/carbon7-2.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/maincode1-2.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/stepsize.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/f22.png</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://thenlpstudent.github.io/media/posts/3/f2.png</image:loc>
  </image:image>
</url>
<!-- Page entry with a last-modified timestamp and no image metadata. -->
<url>
  <loc>https://thenlpstudent.github.io/transformers-and-attention.html</loc>
  <lastmod>2021-09-09T17:11:20+05:30</lastmod>
</url>
</urlset>