summary | refs | log | tree | commit | diff
path: root/rl/tutorials
diff options
context:
space:
mode:
Diffstat (limited to 'rl/tutorials')
-rw-r--r-- rl/tutorials/actor_critic.ipynb 8
1 file changed, 7 insertions, 1 deletion
diff --git a/rl/tutorials/actor_critic.ipynb b/rl/tutorials/actor_critic.ipynb
index 32e28ad..0b357d7 100644
--- a/rl/tutorials/actor_critic.ipynb
+++ b/rl/tutorials/actor_critic.ipynb
@@ -14,7 +14,13 @@
"metadata": {},
"source": [
"- references\n",
- " - https://github.com/pytorch/examples/tree/main/reinforcement_learning"
+ " - https://github.com/pytorch/examples/tree/main/reinforcement_learning\n",
+ " - https://towardsdatascience.com/understanding-actor-critic-methods-931b97b6df3f\n",
+ " - https://lilianweng.github.io/posts/2018-04-08-policy-gradient/\n",
+ "- Actor-Critic\n",
+ " - Actor\n",
+ " - The policy gradient method is also the “actor” part of Actor-Critic methods.\n",
+ " - Critic"
]
}
],