From d022688ea9fcfcb81f900751ee92e35597ef19b8 Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Wed, 8 Apr 2026 19:11:40 -0500 Subject: paper v2.32: BP+penalty multi-seeded (was single-seed s42) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit The §5 ¶3 BP+penalty value (0.530, +18.1 pp margin) was single-seed s42. Ran s123 and s456 to multi-seed it, matching the BP-no-pen 3-seed control. 3-seed BP+pen 30ep results (lam=0.01, AdamW lr=1e-3 wd=0.01, cosine, batch 128): s42: 0.5303, +18.13 pp vs frozen s123: 0.5262, +17.72 pp s456: 0.5397, +19.07 pp 3-seed mean: 0.5321 ± 0.0057 (population std, ddof=0), +18.31 pp Updates: - §5 ¶3: BP+pen "0.530 (single seed)" → "0.532 ± 0.006" (3-seed) - §5 ¶3: BP penalty cost -5.5 pp → -5.3 pp - §5 ¶3: BP+pen margin +18.1 → +18.3 pp - §5 ¶3: BP-to-DFA gap 17.0 → 17.2 pp - §4 ¶4: BP+pen +18.1 → +18.3 pp comparison - Figure 3 panel C bar values: BP with_pen 0.530 → 0.532 - Figure 3 panel C title: BP-pen-cost -5.5pp → -5.3pp The +18.3 pp 3-seed mean is essentially the same as the s42 single-seed +18.13 pp, so the headline conclusion (BP+pen far above frozen baseline, huge gap vs DFA+pen) is unchanged. This commit removes the last single-seed value labeled as a key control. New auditable file: results/bp_with_penalty_3seed_summary.json Page layout preserved: 9 pages main, refs p10, 0 overfull boxes. 
Co-Authored-By: Claude Opus 4.6 (1M context) --- results/bp_with_penalty/bp_pen_lam0.01_s456.json | 42 ++++++++++++++++++++++++ 1 file changed, 42 insertions(+) create mode 100644 results/bp_with_penalty/bp_pen_lam0.01_s456.json (limited to 'results/bp_with_penalty/bp_pen_lam0.01_s456.json') diff --git a/results/bp_with_penalty/bp_pen_lam0.01_s456.json b/results/bp_with_penalty/bp_pen_lam0.01_s456.json new file mode 100644 index 0000000..225c109 --- /dev/null +++ b/results/bp_with_penalty/bp_pen_lam0.01_s456.json @@ -0,0 +1,42 @@ +{ + "config": { + "seed": 456, + "epochs": 30, + "lr": 0.001, + "wd": 0.01, + "lam": 0.01, + "output_dir": "results/bp_with_penalty" + }, + "final_acc": 0.5397, + "log": [ + { + "epoch": 1, + "test_acc": 0.3652 + }, + { + "epoch": 5, + "test_acc": 0.4027 + }, + { + "epoch": 10, + "test_acc": 0.4639 + }, + { + "epoch": 15, + "test_acc": 0.4963 + }, + { + "epoch": 20, + "test_acc": 0.5189 + }, + { + "epoch": 25, + "test_acc": 0.5345 + }, + { + "epoch": 30, + "test_acc": 0.5397 + } + ], + "margin_pp": 19.069999999999997 +} \ No newline at end of file -- cgit v1.2.3