diff --git a/intermediate_source/reinforcement_ppo.py b/intermediate_source/reinforcement_ppo.py index 44d5c05a8a..c707c0ebb1 100644 --- a/intermediate_source/reinforcement_ppo.py +++ b/intermediate_source/reinforcement_ppo.py @@ -25,12 +25,12 @@ We will cover six crucial components of TorchRL: -* `environments `__ -* `transforms `__ -* `models (policy and value function) `__ -* `loss modules `__ -* `data collectors `__ -* `replay buffers `__ +* `environments `__ +* `transforms `__ +* `models (policy and value function) `__ +* `loss modules `__ +* `data collectors `__ +* `replay buffers `__ """ @@ -466,7 +466,7 @@ # Data collector # -------------- # -# TorchRL provides a set of `DataCollector classes `__. +# TorchRL provides a set of `DataCollector classes `__. # Briefly, these classes execute three operations: reset an environment, # compute an action given the latest observation, execute a step in the environment, # and repeat the last two steps until the environment signals a stop (or reaches