diff options
Diffstat (limited to 'rl/tutorials/actor_critic.ipynb')
| -rw-r--r-- | rl/tutorials/actor_critic.ipynb | 8 |
1 file changed, 7 insertions, 1 deletion
diff --git a/rl/tutorials/actor_critic.ipynb b/rl/tutorials/actor_critic.ipynb
index 32e28ad..0b357d7 100644
--- a/rl/tutorials/actor_critic.ipynb
+++ b/rl/tutorials/actor_critic.ipynb
@@ -14,7 +14,13 @@
 "metadata": {},
 "source": [
 "- references\n",
- " - https://github.com/pytorch/examples/tree/main/reinforcement_learning"
+ " - https://github.com/pytorch/examples/tree/main/reinforcement_learning\n",
+ " - https://towardsdatascience.com/understanding-actor-critic-methods-931b97b6df3f\n",
+ " - https://lilianweng.github.io/posts/2018-04-08-policy-gradient/\n",
+ "- Actor - Critic\n",
+ " - Actor\n",
+ " - The policy gradient method is also the “actor” part of Actor-Critic methods \n",
+ " - Critic"
 ]
 }
 ],
