1 files changed, 7 insertions, 1 deletions
diff --git a/rl/tutorials/actor_critic.ipynb b/rl/tutorials/actor_critic.ipynb
index 32e28ad..0b357d7 100644
--- a/rl/tutorials/actor_critic.ipynb
+++ b/rl/tutorials/actor_critic.ipynb
@@ -14,7 +14,13 @@
    "metadata": {},
    "source": [
     "- references\n",
-    "    - https://github.com/pytorch/examples/tree/main/reinforcement_learning"
+    "    - https://github.com/pytorch/examples/tree/main/reinforcement_learning\n",
+    "    - https://towardsdatascience.com/understanding-actor-critic-methods-931b97b6df3f\n",
+    "    - https://lilianweng.github.io/posts/2018-04-08-policy-gradient/\n",
+    "- Actor-Critic\n",
+    "    - Actor\n",
+    "        - The policy gradient method is also the “actor” part of Actor-Critic methods.\n",
+    "    - Critic"
    ]
   }
  ],