d4l3k
diff --git a/‎.circleci/scripts/build_for_windows.sh
Lines changed: 1 addition & 1 deletion b/‎.circleci/scripts/build_for_windows.sh
Lines changed: 1 addition & 1 deletion
diff --git a/‎_static/img/mario.gif
4.89 MB b/‎_static/img/mario.gif
4.89 MB
diff --git a/‎_static/img/mario_env.png
38.7 KB b/‎_static/img/mario_env.png
38.7 KB
diff --git a/‎index.rst
Lines changed: 10 additions & 1 deletion b/‎index.rst
Lines changed: 10 additions & 1 deletion
@@ -32,7 +32,7 @@ conda create -qyn testenv python=3.7
 conda activate testenv
 
 conda install sphinx
-pip install sphinx_gallery==0.3.1 sphinx-copybutton flask pandas spacy ipython scipy pySoundFile scikit-image
+pip install sphinx_gallery==0.3.1 sphinx-copybutton flask pandas spacy ipython scipy pySoundFile scikit-image gym gym-super-mario-bros==7.3.0
 pip install -e git+git://github.com/pytorch/pytorch_sphinx_theme.git#egg=pytorch_sphinx_theme
 pip install ray[tune] tabulate
 conda install -yq -c pytorch "cudatoolkit=10.1" pytorch torchvision torchtext
 
@@ -177,6 +177,14 @@ Welcome to PyTorch Tutorials
    :link: intermediate/reinforcement_q_learning.html
    :tags: Reinforcement-Learning
 
+.. customcarditem::
+   :header: Game-playing AI (Mario)
+   :card_description: Use PyTorch to train a Double Q-learning agent to play Mario.
+   :image: _static/img/mario.gif
+   :link: intermediate/mario_rl_tutorial.html
+   :tags: Reinforcement-Learning
+
+
 .. Deploying PyTorch Models in Production
 
 .. customcarditem::
@@ -366,7 +374,7 @@ Welcome to PyTorch Tutorials
    :image: _static/img/thumbnails/cropped/Implementing-Batch-RPC-Processing-Using-Asynchronous-Executions.png
    :link: intermediate/rpc_async_execution.html
    :tags: Parallel-and-Distributed-Training
-   
+
 .. customcarditem::
    :header: Combining Distributed DataParallel with Distributed RPC Framework
    :card_description: Walk through a simple example of how to combine distributed data parallelism with distributed model parallelism.
@@ -491,6 +499,7 @@ Additional Resources
    :caption: Reinforcement Learning
 
    intermediate/reinforcement_q_learning
+   intermediate/mario_rl_tutorial
 
 .. toctree::
    :maxdepth: 2