From fe36805c894671b571f0dd573185394ca2e88c8d Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Thu, 2 Apr 2026 14:42:02 -0500 Subject: Add EP baseline (5 seeds), GELU ablation (20 runs), CNN BP+DFA (10 runs) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit EP (L=4 d=256): acc≈30%, Gamma≈0, rho≈0 — EP credit signal weak on feedforward MLP GELU ablation (ReLU variant): 4 methods × 5 seeds complete CNN BP+DFA: 5 seeds each, BP + DFA on SmallCNN Co-Authored-By: Claude Opus 4.6 (1M context) --- results/cnn_baseline/bp_s1024.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/bp_s123.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/bp_s42.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/bp_s456.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/bp_s789.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/dfa_s1024.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/dfa_s123.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/dfa_s42.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/dfa_s456.json | 25 +++++++++++++++++++++++++ results/cnn_baseline/dfa_s789.json | 25 +++++++++++++++++++++++++ 10 files changed, 250 insertions(+) create mode 100644 results/cnn_baseline/bp_s1024.json create mode 100644 results/cnn_baseline/bp_s123.json create mode 100644 results/cnn_baseline/bp_s42.json create mode 100644 results/cnn_baseline/bp_s456.json create mode 100644 results/cnn_baseline/bp_s789.json create mode 100644 results/cnn_baseline/dfa_s1024.json create mode 100644 results/cnn_baseline/dfa_s123.json create mode 100644 results/cnn_baseline/dfa_s42.json create mode 100644 results/cnn_baseline/dfa_s456.json create mode 100644 results/cnn_baseline/dfa_s789.json (limited to 'results/cnn_baseline') diff --git a/results/cnn_baseline/bp_s1024.json b/results/cnn_baseline/bp_s1024.json new file mode 100644 index 0000000..0965221 --- /dev/null +++ b/results/cnn_baseline/bp_s1024.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 1024, + "acc": 0.8716, + "Gamma": 0.23036077618598938, + "rho": 0.24998444318771362, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9214431047439575 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9999377727508545 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/bp_s123.json b/results/cnn_baseline/bp_s123.json new file mode 100644 index 0000000..6f9812b --- /dev/null +++ b/results/cnn_baseline/bp_s123.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 123, + "acc": 0.8683, + "Gamma": 0.24026203155517578, + "rho": 0.2499578297138214, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9610481262207031 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9998313188552856 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/bp_s42.json b/results/cnn_baseline/bp_s42.json new file mode 100644 index 0000000..1f1e041 --- /dev/null +++ b/results/cnn_baseline/bp_s42.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 42, + "acc": 0.8621, + "Gamma": 0.2417115569114685, + "rho": 0.24997350573539734, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.966846227645874 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9998940229415894 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/bp_s456.json b/results/cnn_baseline/bp_s456.json new file mode 100644 index 0000000..6e358c1 --- /dev/null +++ b/results/cnn_baseline/bp_s456.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 456, + "acc": 0.8681, + "Gamma": 0.24036112427711487, + "rho": 0.24996760487556458, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9614444971084595 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9998704195022583 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/bp_s789.json b/results/cnn_baseline/bp_s789.json new file mode 100644 index 0000000..4e913d8 --- /dev/null +++ b/results/cnn_baseline/bp_s789.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 789, + "acc": 0.8677, + "Gamma": 0.23751218616962433, + "rho": 0.24997900426387787, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9500487446784973 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9999160170555115 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/dfa_s1024.json b/results/cnn_baseline/dfa_s1024.json new file mode 100644 index 0000000..64755e1 --- /dev/null +++ b/results/cnn_baseline/dfa_s1024.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 1024, + "acc": 0.5868, + "Gamma": 0.22504013776779175, + "rho": 0.01557417493313551, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.900160551071167 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.06229669973254204 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/dfa_s123.json b/results/cnn_baseline/dfa_s123.json new file mode 100644 index 0000000..179cbe3 --- /dev/null +++ b/results/cnn_baseline/dfa_s123.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 123, + "acc": 0.5501, + "Gamma": 0.21116971969604492, + "rho": 0.03002248704433441, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.8446788787841797 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.12008994817733765 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/dfa_s42.json b/results/cnn_baseline/dfa_s42.json new file mode 100644 index 0000000..dbc1099 --- /dev/null +++ b/results/cnn_baseline/dfa_s42.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 42, + "acc": 0.5527, + "Gamma": 0.22270919382572174, + "rho": 0.011658251285552979, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.890836775302887 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.046633005142211914 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/dfa_s456.json b/results/cnn_baseline/dfa_s456.json new file mode 100644 index 0000000..30de9b1 --- /dev/null +++ b/results/cnn_baseline/dfa_s456.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 456, + "acc": 0.5954, + "Gamma": 0.2133052498102188, + "rho": 0.01581542007625103, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.8532209992408752 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.06326168030500412 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file diff --git a/results/cnn_baseline/dfa_s789.json b/results/cnn_baseline/dfa_s789.json new file mode 100644 index 0000000..5c030df --- /dev/null +++ b/results/cnn_baseline/dfa_s789.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 789, + "acc": 0.5481, + "Gamma": 0.20736519992351532, + "rho": 0.01041002944111824, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.8294607996940613 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.04164011776447296 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +} \ No newline at end of file -- cgit v1.2.3