From c41ea8629ce1351e415cce1551a7b52260a66790 Mon Sep 17 00:00:00 2001
From: haoyuren <13851610112@163.com>
Date: Sun, 22 Feb 2026 12:14:42 -0600
Subject: Add training curve plots to Colab notebook

Co-Authored-By: Claude Opus 4.6
---
 train_colab.ipynb | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/train_colab.ipynb b/train_colab.ipynb
index 2a092d7..66b244e 100644
--- a/train_colab.ipynb
+++ b/train_colab.ipynb
@@ -64,6 +64,13 @@
    "execution_count": null,
    "outputs": []
   },
+  {
+   "cell_type": "code",
+   "source": "# Plot training curves from the log CSV: win rate vs. greedy (left) and average game length (right).\nimport matplotlib.pyplot as plt\nimport pandas as pd  # imported here so the cell does not rely on an earlier cell having defined pd\n\ndf = pd.read_csv(\"blazing_ppo_2p_log.csv\")\n\nfig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 4))\n\n# vs_greedy_wr is multiplied by 100 to plot it on a percent axis (assumes a 0-1 fraction; TODO confirm).\nax1.plot(df[\"episode\"], df[\"vs_greedy_wr\"] * 100, \"o-\", color=\"tab:blue\", markersize=3)\n# NOTE(review): the dashed line sits at 50% win rate against the greedy opponent; confirm the legend label says what is intended.\nax1.axhline(50, color=\"gray\", linestyle=\"--\", alpha=0.5, label=\"random baseline\")\nax1.set_xlabel(\"Episode\")\nax1.set_ylabel(\"Win Rate vs Greedy (%)\")\nax1.set_title(\"Win Rate\")\nax1.legend()\nax1.grid(alpha=0.3)\n\nax2.plot(df[\"episode\"], df[\"avg_len\"], \"o-\", color=\"tab:orange\", markersize=3)\nax2.set_xlabel(\"Episode\")\nax2.set_ylabel(\"Avg Game Length (steps)\")\nax2.set_title(\"Game Length\")\nax2.grid(alpha=0.3)\n\n# Tighten the layout before rendering so the two panels' labels do not overlap.\nfig.tight_layout()\nplt.show()",
+   "metadata": {},
+   "execution_count": null,
+   "outputs": []
+  },
   {
    "cell_type": "markdown",
    "source": "## 3. Download model & logs",
-- 
cgit v1.2.3