File tree Expand file tree Collapse file tree 6 files changed +799
-2
lines changed Expand file tree Collapse file tree 6 files changed +799
-2
lines changed Original file line number Diff line number Diff line change @@ -32,7 +32,7 @@ conda create -qyn testenv python=3.7
32
32
conda activate testenv
33
33
34
34
conda install sphinx
35
- pip install sphinx_gallery==0.3.1 sphinx-copybutton flask pandas spacy ipython scipy pySoundFile scikit-image
35
+ pip install sphinx_gallery==0.3.1 sphinx-copybutton flask pandas spacy ipython scipy pySoundFile scikit-image gym gym-super-mario-bros==7.3.0
36
36
pip install -e git+git://github.com/pytorch/pytorch_sphinx_theme.git#egg=pytorch_sphinx_theme
37
37
pip install ray[tune] tabulate
38
38
conda install -yq -c pytorch " cudatoolkit=10.1" pytorch torchvision torchtext
Original file line number Diff line number Diff line change @@ -177,6 +177,14 @@ Welcome to PyTorch Tutorials
177
177
:link: intermediate/reinforcement_q_learning.html
178
178
:tags: Reinforcement-Learning
179
179
180
+ .. customcarditem ::
181
+ :header: Game-playing AI (Mario)
182
+ :card_description: Use PyTorch to train a Double Q-learning agent to play Mario.
183
+ :image: _static/img/mario.gif
184
+ :link: intermediate/mario_rl_tutorial.html
185
+ :tags: Reinforcement-Learning
186
+
187
+
180
188
.. Deploying PyTorch Models in Production
181
189
182
190
.. customcarditem ::
@@ -366,7 +374,7 @@ Welcome to PyTorch Tutorials
366
374
:image: _static/img/thumbnails/cropped/Implementing-Batch-RPC-Processing-Using-Asynchronous-Executions.png
367
375
:link: intermediate/rpc_async_execution.html
368
376
:tags: Parallel-and-Distributed-Training
369
-
377
+
370
378
.. customcarditem ::
371
379
:header: Combining Distributed DataParallel with Distributed RPC Framework
372
380
:card_description: Walk through a simple example of how to combine distributed data parallelism with distributed model parallelism.
@@ -491,6 +499,7 @@ Additional Resources
491
499
:caption: Reinforcement Learning
492
500
493
501
intermediate/reinforcement_q_learning
502
+ intermediate/mario_rl_tutorial
494
503
495
504
.. toctree ::
496
505
:maxdepth: 2
You can’t perform that action at this time.
0 commit comments