<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="FeedCreator 1.8" -->
<?xml-stylesheet href="https://www.daiphys.com/portal/lib/exe/css.php?s=feed" type="text/css"?>
<rdf:RDF
    xmlns="http://purl.org/rss/1.0/"
    xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
    xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
    xmlns:dc="http://purl.org/dc/elements/1.1/">
    <!--
      Channel metadata for the ml:rl feed.
      RSS 1.0 requires a channel description, so it is populated rather than left empty.
      Each rdf:li in the rdf:Seq below carries the same URI as the rdf:about of one
      <item> element in this document; keep the two in sync when entries change.
    -->
    <channel rdf:about="https://www.daiphys.com/portal/feed.php">
        <title>Daiphys Tech Portal - ml:rl</title>
        <description>Pages in the ml:rl section of the Daiphys Tech Portal</description>
        <link>https://www.daiphys.com/portal/</link>
        <!-- Points at the top-level <image> element with the same URI in rdf:about. -->
        <image rdf:resource="https://www.daiphys.com/portal/_media/wiki/dokuwiki.svg" />
        <dc:date>2026-04-30T21:20:44+00:00</dc:date>
        <items>
            <rdf:Seq>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/breakout.html?rev=1697169260&amp;do=diff"/>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/cartpole.html?rev=1697169237&amp;do=diff"/>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/index.html?rev=1680827153&amp;do=diff"/>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/mountaincar.html?rev=1697169199&amp;do=diff"/>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/quest-track.html?rev=1697169191&amp;do=diff"/>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/quest.html?rev=1697169170&amp;do=diff"/>
                <rdf:li rdf:resource="https://www.daiphys.com/portal/ml/rl/sealane.html?rev=1697169160&amp;do=diff"/>
            </rdf:Seq>
        </items>
    </channel>
    <!--
      Feed logo. The rdf:about URI is the one the channel references through
      its <image rdf:resource="..."/> child, and it is repeated in <url> below.
    -->
    <image rdf:about="https://www.daiphys.com/portal/_media/wiki/dokuwiki.svg">
        <title>Daiphys Tech Portal</title>
        <link>https://www.daiphys.com/portal/</link>
        <url>https://www.daiphys.com/portal/_media/wiki/dokuwiki.svg</url>
    </image>
    <!--
      Entry for the "Breakout" page. rdf:about and <link> carry the same URL,
      which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is entity-escaped plain text; its line breaks are part of
      the value, so do not re-indent it. It ends with an ellipsis in the middle
      of a URL, so it appears to be a truncated excerpt (not confirmed here).
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/breakout.html?rev=1697169260&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-10-13T03:54:20+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Breakout</title>
        <link>https://www.daiphys.com/portal/ml/rl/breakout.html?rev=1697169260&amp;do=diff</link>
        <description>Breakout

Tutorials

Google Colaboratory - Dueling DQN/CNN

&lt;https://colab.research.google.com/drive/1cD2S8dvnRVJmSrbLpR56ZVOHD88qZUpV&gt;

Results

Dueling DQN/CNN - to be trained...




Video



References

&lt;https://gymnasium.farama.org/environments/atari/breakout/&gt;

&lt;https://storage.googleapis.com/deepmind-data/assets/papers/DeepMindNature14236Paper.pdf&gt;

&lt;https://arxiv.org/abs/1511.06581&gt;

&lt;https://www.datahubbs.com/deepmind-dqn/&gt;

&lt;https://www.dskomei.com/entry/2021/10/05/140156&gt;

&lt;https://qii…</description>
    </item>
    <!--
      Entry for the "Cart Pole" page. rdf:about and <link> carry the same URL,
      which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is entity-escaped plain text; its line breaks are part of
      the value, so do not re-indent it.
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/cartpole.html?rev=1697169237&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-10-13T03:53:57+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Cart Pole</title>
        <link>https://www.daiphys.com/portal/ml/rl/cartpole.html?rev=1697169237&amp;do=diff</link>
        <description>Cart Pole

Tutorials

Google Colaboratory - DQN/MLP

&lt;https://colab.research.google.com/drive/1goyULtqCz8FKjc7-RYww2Y2_B3OTs8f3&gt;

Google Colaboratory - Rainbow/MLP (RLlib)

&lt;https://colab.research.google.com/drive/1xuJyTHinhJABp9ct9tCy17GbnuP9JE1b&gt;

Google Colaboratory - PPO/MLP (Stable Baselines 3)

&lt;https://colab.research.google.com/drive/1s7ycZBPAojJqHOmZE0fq7PtMZOqUNot9&gt;

Trained Models





Results

DQN/MLP




Rainbow/MLP (RLlib) - to be tuned...




PPO/MLP (Stable Baselines 3)</description>
    </item>
    <!--
      Entry for the "Reinforcement Learning" index page. rdf:about and <link>
      carry the same URL, which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is plain text whose line breaks and leading tab characters
      are part of the value, so do not re-indent it. Its bullet list names the
      same six page titles that the other items in this feed use.
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/index.html?rev=1680827153&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-04-07T00:25:53+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Reinforcement Learning</title>
        <link>https://www.daiphys.com/portal/ml/rl/index.html?rev=1680827153&amp;do=diff</link>
        <description>Reinforcement Learning


	* Breakout
	* Cart Pole
	* Mountain Car
	* Quest
	* Quest Track
	* Sea Lane</description>
    </item>
    <!--
      Entry for the "Mountain Car" page. rdf:about and <link> carry the same URL,
      which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is entity-escaped plain text; its line breaks are part of
      the value, so do not re-indent it. It ends with an ellipsis inside an
      unclosed URL, so it appears to be a truncated excerpt (not confirmed here).
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/mountaincar.html?rev=1697169199&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-10-13T03:53:19+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Mountain Car</title>
        <link>https://www.daiphys.com/portal/ml/rl/mountaincar.html?rev=1697169199&amp;do=diff</link>
        <description>Mountain Car

Tutorials

Google Colaboratory - DQN/MLP

&lt;https://colab.research.google.com/drive/1T9UGr7vdXj1HYE_4qo8KXptIwCS7S-3v&gt;

Trained Model



Results

DQN/MLP




Video



References

&lt;https://pytorch.org/tutorials/intermediate/reinforcement_q_learning.html&gt;

&lt;https://sebarnold.net/tutorials/intermediate/reinforcement_q_learning.html&gt;

&lt;https://www.gymlibrary.dev/&gt;

&lt;https://www.gymlibrary.dev/environments/classic_control/mountain_car/&gt;

&lt;https://github.com/openai/gym/wiki/MountainCar-v0…</description>
    </item>
    <!--
      Entry for the "Quest Track" page. rdf:about and <link> carry the same URL,
      which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is entity-escaped plain text; its line breaks are part of
      the value, so do not re-indent it. It ends with an ellipsis in the middle
      of a URL, so it appears to be a truncated excerpt (not confirmed here).
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/quest-track.html?rev=1697169191&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-10-13T03:53:11+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Quest Track</title>
        <link>https://www.daiphys.com/portal/ml/rl/quest-track.html?rev=1697169191&amp;do=diff</link>
        <description>Quest Track

Tutorials

Google Colaboratory - DQN/MLP

&lt;https://colab.research.google.com/drive/1FbKXzS9xNcw1SDmqHv5rHmSWl8Z50WS1&gt;

Google Colaboratory - PPO/MLP (Stable Baselines 3)

&lt;https://colab.research.google.com/drive/1ke5bsYQjV_xWNU9SfDPM20OxUKKYvc9K&gt;

Trained Models





Results

DQN/MLP




PPO/MLP (Stable Baselines 3)




Video



References

&lt;https://agirobots.com/openai-gym-custom-env/&gt;

&lt;https://github.com/openai/gym/blob/master/gym/envs/classic_control/mountain_car.py&gt;

&lt;https://r…</description>
    </item>
    <!--
      Entry for the "Quest" page. rdf:about and <link> carry the same URL,
      which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is entity-escaped plain text; its line breaks are part of
      the value, so do not re-indent it.
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/quest.html?rev=1697169170&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-10-13T03:52:50+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Quest</title>
        <link>https://www.daiphys.com/portal/ml/rl/quest.html?rev=1697169170&amp;do=diff</link>
        <description>Quest

Tutorials

Google Colaboratory - DQN/MLP

&lt;https://colab.research.google.com/drive/1kSVYB1l2xez2ozAd6qL_nBEPCkRwpdyH&gt;

Google Colaboratory - Dueling DQN/MLP

&lt;https://colab.research.google.com/drive/1NCcUATL0o01HH23wEtRVGrFUEM6MmLEo&gt;

Google Colaboratory - PPO/MLP (Stable Baselines 3)

&lt;https://colab.research.google.com/drive/1yo9sojEF8U7OmjwxPmhPMGl48P5HZf8x&gt;

Trained Model







Results

DQN/MLP




Dueling DQN/MLP




PPO/MLP (Stable Baselines 3)




Video



References</description>
    </item>
    <!--
      Entry for the "Sea Lane" page. rdf:about and <link> carry the same URL,
      which is also listed as an rdf:li in the channel's rdf:Seq.
      The description is entity-escaped plain text; its line breaks are part of
      the value, so do not re-indent it.
    -->
    <item rdf:about="https://www.daiphys.com/portal/ml/rl/sealane.html?rev=1697169160&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-10-13T03:52:40+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>Sea Lane</title>
        <link>https://www.daiphys.com/portal/ml/rl/sealane.html?rev=1697169160&amp;do=diff</link>
        <description>Sea Lane

Tutorials

Google Colaboratory - DQN/MLP (Stable Baselines 3)

&lt;https://colab.research.google.com/drive/1hBgYbzpZr5TAyaXmBocxZXdYmQ9zBh26&gt;

Google Colaboratory - PPO/MLP (Stable Baselines 3)

&lt;https://colab.research.google.com/drive/1KhqJ4mtMD0oL16Us45JX3i-d-mkBWJRj&gt;

Google Colaboratory - Recurrent PPO/MLP (Stable Baselines 3 - Contrib)

&lt;https://colab.research.google.com/drive/13PNP10S-7HaKwDhC4g886jizpL4-ZTsR&gt;

Google Colaboratory - ARS/MLP (Stable Baselines 3 - Contrib)</description>
    </item>
</rdf:RDF>
