File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -32,7 +32,7 @@ conda create -qyn testenv python=3.7
3232conda activate testenv
3333
3434conda install sphinx
35- pip install sphinx_gallery==0.3.1 sphinx-copybutton flask pandas spacy ipython scipy pySoundFile scikit-image
35+ pip install sphinx_gallery==0.3.1 sphinx-copybutton flask pandas spacy ipython scipy pySoundFile scikit-image gym gym-super-mario-bros==7.3.0
3636pip install -e git+git://github.com/pytorch/pytorch_sphinx_theme.git#egg=pytorch_sphinx_theme
3737pip install ray[tune] tabulate
3838conda install -yq -c pytorch "cudatoolkit=10.1" pytorch torchvision torchtext
Original file line number Diff line number Diff line change @@ -177,6 +177,14 @@ Welcome to PyTorch Tutorials
177177 :link: intermediate/reinforcement_q_learning.html
178178 :tags: Reinforcement-Learning
179179
180+ .. customcarditem ::
181+ :header: Game-playing AI (Mario)
182+ :card_description: Use PyTorch to train a Double Q-learning agent to play Mario.
183+ :image: _static/img/mario.gif
184+ :link: intermediate/mario_rl_tutorial.html
185+ :tags: Reinforcement-Learning
186+
187+
180188.. Deploying PyTorch Models in Production
181189
182190 .. customcarditem ::
@@ -366,7 +374,7 @@ Welcome to PyTorch Tutorials
366374 :image: _static/img/thumbnails/cropped/Implementing-Batch-RPC-Processing-Using-Asynchronous-Executions.png
367375 :link: intermediate/rpc_async_execution.html
368376 :tags: Parallel-and-Distributed-Training
369-
377+
370378.. customcarditem ::
371379 :header: Combining Distributed DataParallel with Distributed RPC Framework
372380 :card_description: Walk through a simple example of how to combine distributed data parallelism with distributed model parallelism.
@@ -491,6 +499,7 @@ Additional Resources
491499 :caption: Reinforcement Learning
492500
493501 intermediate/reinforcement_q_learning
502+ intermediate/mario_rl_tutorial
494503
495504.. toctree ::
496505 :maxdepth: 2
You can’t perform that action at this time.
0 commit comments