diff options
| author | YurenHao0426 <Blackhao0426@gmail.com> | 2026-04-02 14:42:02 -0500 |
|---|---|---|
| committer | YurenHao0426 <Blackhao0426@gmail.com> | 2026-04-02 14:42:02 -0500 |
| commit | fe36805c894671b571f0dd573185394ca2e88c8d (patch) | |
| tree | dc04ab3d0057f50d0d2392904198a8a800c4c092 /results | |
| parent | 100ae0eb429774ae9cd4f3085de7c87bf9d56d45 (diff) | |
Add EP baseline (5 seeds), GELU ablation (20 runs), CNN BP+DFA (10 runs)
EP (L=4 d=256): acc≈30%, Gamma≈0, rho≈0 — EP credit signal weak on feedforward MLP
GELU ablation (ReLU variant): 4 methods × 5 seeds complete
CNN BP+DFA: 5 seeds each, BP + DFA on SmallCNN
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
Diffstat (limited to 'results')
35 files changed, 565 insertions, 0 deletions
diff --git a/results/cnn_baseline/bp_s1024.json b/results/cnn_baseline/bp_s1024.json new file mode 100644 index 0000000..0965221 --- /dev/null +++ b/results/cnn_baseline/bp_s1024.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 1024, + "acc": 0.8716, + "Gamma": 0.23036077618598938, + "rho": 0.24998444318771362, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9214431047439575 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9999377727508545 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/bp_s123.json b/results/cnn_baseline/bp_s123.json new file mode 100644 index 0000000..6f9812b --- /dev/null +++ b/results/cnn_baseline/bp_s123.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 123, + "acc": 0.8683, + "Gamma": 0.24026203155517578, + "rho": 0.2499578297138214, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9610481262207031 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9998313188552856 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/bp_s42.json b/results/cnn_baseline/bp_s42.json new file mode 100644 index 0000000..1f1e041 --- /dev/null +++ b/results/cnn_baseline/bp_s42.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 42, + "acc": 0.8621, + "Gamma": 0.2417115569114685, + "rho": 0.24997350573539734, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.966846227645874 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9998940229415894 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/bp_s456.json b/results/cnn_baseline/bp_s456.json new file mode 100644 index 0000000..6e358c1 --- /dev/null +++ b/results/cnn_baseline/bp_s456.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 456, + "acc": 0.8681, + "Gamma": 0.24036112427711487, + "rho": 0.24996760487556458, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9614444971084595 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9998704195022583 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/bp_s789.json b/results/cnn_baseline/bp_s789.json new file mode 100644 index 0000000..4e913d8 --- /dev/null +++ b/results/cnn_baseline/bp_s789.json @@ -0,0 +1,25 @@ +{ + "method": "bp", + "seed": 789, + "acc": 0.8677, + "Gamma": 0.23751218616962433, + "rho": 0.24997900426387787, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9500487446784973 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.9999160170555115 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/dfa_s1024.json b/results/cnn_baseline/dfa_s1024.json new file mode 100644 index 0000000..64755e1 --- /dev/null +++ b/results/cnn_baseline/dfa_s1024.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 1024, + "acc": 0.5868, + "Gamma": 0.22504013776779175, + "rho": 0.01557417493313551, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.900160551071167 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.06229669973254204 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/dfa_s123.json b/results/cnn_baseline/dfa_s123.json new file mode 100644 index 0000000..179cbe3 --- /dev/null +++ b/results/cnn_baseline/dfa_s123.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 123, + "acc": 0.5501, + "Gamma": 0.21116971969604492, + "rho": 0.03002248704433441, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.8446788787841797 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.12008994817733765 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/dfa_s42.json b/results/cnn_baseline/dfa_s42.json new file mode 100644 index 0000000..dbc1099 --- /dev/null +++ b/results/cnn_baseline/dfa_s42.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 42, + "acc": 0.5527, + "Gamma": 0.22270919382572174, + "rho": 0.011658251285552979, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.890836775302887 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.046633005142211914 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/dfa_s456.json b/results/cnn_baseline/dfa_s456.json new file mode 100644 index 0000000..30de9b1 --- /dev/null +++ b/results/cnn_baseline/dfa_s456.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 456, + "acc": 0.5954, + "Gamma": 0.2133052498102188, + "rho": 0.01581542007625103, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.8532209992408752 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.06326168030500412 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/cnn_baseline/dfa_s789.json b/results/cnn_baseline/dfa_s789.json new file mode 100644 index 0000000..5c030df --- /dev/null +++ b/results/cnn_baseline/dfa_s789.json @@ -0,0 +1,25 @@ +{ + "method": "dfa", + "seed": 789, + "acc": 0.5481, + "Gamma": 0.20736519992351532, + "rho": 0.01041002944111824, + "gammas_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.8294607996940613 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.04164011776447296 + ], + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.05 +}
\ No newline at end of file diff --git a/results/ep_baseline/ep_s1024.json b/results/ep_baseline/ep_s1024.json new file mode 100644 index 0000000..a6f16e2 --- /dev/null +++ b/results/ep_baseline/ep_s1024.json @@ -0,0 +1,23 @@ +{ + "method": "ep", + "seed": 1024, + "acc": 0.2981, + "Gamma": -0.001718481391435489, + "rho": 0.0012313337065279484, + "naive_StateErr": 0.804000735282898, + "gammas_per_layer": [ + 0.0, + 0.004800701513886452, + -0.00025482603814452887, + -0.011419801041483879 + ], + "rhos_per_layer": [ + 0.0, + -0.01354932226240635, + 0.03151280805468559, + -0.01303815096616745 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +}
\ No newline at end of file diff --git a/results/ep_baseline/ep_s123.json b/results/ep_baseline/ep_s123.json new file mode 100644 index 0000000..7924a39 --- /dev/null +++ b/results/ep_baseline/ep_s123.json @@ -0,0 +1,23 @@ +{ + "method": "ep", + "seed": 123, + "acc": 0.2924, + "Gamma": -0.010700209351853118, + "rho": -0.01468805002514273, + "naive_StateErr": 0.21454104781150818, + "gammas_per_layer": [ + 0.0, + -0.00011013347102561966, + 7.618003292009234e-05, + -0.042766883969306946 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.003175207879394293, + -0.06192740797996521 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +}
\ No newline at end of file diff --git a/results/ep_baseline/ep_s42.json b/results/ep_baseline/ep_s42.json new file mode 100644 index 0000000..b60502b --- /dev/null +++ b/results/ep_baseline/ep_s42.json @@ -0,0 +1,23 @@ +{ + "method": "ep", + "seed": 42, + "acc": 0.359, + "Gamma": -0.007905199148808606, + "rho": -0.07944288477301598, + "naive_StateErr": 0.5929934978485107, + "gammas_per_layer": [ + 0.0, + -0.0006224570679478347, + -0.000845100381411612, + -0.030153239145874977 + ], + "rhos_per_layer": [ + 0.0, + -0.025672510266304016, + 0.0, + -0.2920990288257599 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +}
\ No newline at end of file diff --git a/results/ep_baseline/ep_s456.json b/results/ep_baseline/ep_s456.json new file mode 100644 index 0000000..3a04367 --- /dev/null +++ b/results/ep_baseline/ep_s456.json @@ -0,0 +1,23 @@ +{ + "method": "ep", + "seed": 456, + "acc": 0.2976, + "Gamma": -0.01223632060282398, + "rho": -0.07857450563460588, + "naive_StateErr": 1.5853830575942993, + "gammas_per_layer": [ + 0.0, + -0.00014890515012666583, + -0.0018156982259824872, + -0.04698067903518677 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + -0.03213520720601082, + -0.2821628153324127 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +}
\ No newline at end of file diff --git a/results/ep_baseline/ep_s789.json b/results/ep_baseline/ep_s789.json new file mode 100644 index 0000000..587aeca --- /dev/null +++ b/results/ep_baseline/ep_s789.json @@ -0,0 +1,23 @@ +{ + "method": "ep", + "seed": 789, + "acc": 0.3458, + "Gamma": -0.00443847177666612, + "rho": -0.011359908618032932, + "naive_StateErr": 0.8419253826141357, + "gammas_per_layer": [ + 0.0, + 0.0016552513698115945, + 0.0009475427214056253, + -0.0203566811978817 + ], + "rhos_per_layer": [ + 0.0, + 0.0253923200070858, + 0.0, + -0.07083195447921753 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_bp_s1024.json b/results/gelu_ablation/relu_bp_s1024.json new file mode 100644 index 0000000..aa8d306 --- /dev/null +++ b/results/gelu_ablation/relu_bp_s1024.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "bp", + "seed": 1024, + "acc": 0.6097, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.9974461048841476, + "naive_StateErr": 0.4324362277984619 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_bp_s123.json b/results/gelu_ablation/relu_bp_s123.json new file mode 100644 index 0000000..e3ffbd2 --- /dev/null +++ b/results/gelu_ablation/relu_bp_s123.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "bp", + "seed": 123, + "acc": 0.613, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.997876763343811, + "naive_StateErr": 0.5002583861351013 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_bp_s42.json b/results/gelu_ablation/relu_bp_s42.json new file mode 100644 index 0000000..d35d1b6 --- /dev/null +++ b/results/gelu_ablation/relu_bp_s42.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "bp", + "seed": 42, + "acc": 0.6129, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.9975161552429199, + "naive_StateErr": 0.6057583093643188 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_bp_s456.json b/results/gelu_ablation/relu_bp_s456.json new file mode 100644 index 0000000..0ddf182 --- /dev/null +++ b/results/gelu_ablation/relu_bp_s456.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "bp", + "seed": 456, + "acc": 0.608, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.9971267879009247, + "naive_StateErr": 0.3411523401737213 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_bp_s789.json b/results/gelu_ablation/relu_bp_s789.json new file mode 100644 index 0000000..f845b43 --- /dev/null +++ b/results/gelu_ablation/relu_bp_s789.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "bp", + "seed": 789, + "acc": 0.6095, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.9979429095983505, + "naive_StateErr": 0.27360349893569946 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_credit_bridge_s1024.json b/results/gelu_ablation/relu_credit_bridge_s1024.json new file mode 100644 index 0000000..fd55fa1 --- /dev/null +++ b/results/gelu_ablation/relu_credit_bridge_s1024.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "credit_bridge", + "seed": 1024, + "acc": 0.2969, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.008778431452810764, + "naive_StateErr": 1.527748942375183 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_credit_bridge_s123.json b/results/gelu_ablation/relu_credit_bridge_s123.json new file mode 100644 index 0000000..8d311e8 --- /dev/null +++ b/results/gelu_ablation/relu_credit_bridge_s123.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "credit_bridge", + "seed": 123, + "acc": 0.2644, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.004790207836776972, + "naive_StateErr": 0.1871446669101715 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_credit_bridge_s42.json b/results/gelu_ablation/relu_credit_bridge_s42.json new file mode 100644 index 0000000..38fc810 --- /dev/null +++ b/results/gelu_ablation/relu_credit_bridge_s42.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "credit_bridge", + "seed": 42, + "acc": 0.3021, + "StateErr": null, + "Gamma": 1.0, + "rho": -0.008028814569115639, + "naive_StateErr": 0.27361318469047546 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_credit_bridge_s456.json b/results/gelu_ablation/relu_credit_bridge_s456.json new file mode 100644 index 0000000..a6934ba --- /dev/null +++ b/results/gelu_ablation/relu_credit_bridge_s456.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "credit_bridge", + "seed": 456, + "acc": 0.2842, + "StateErr": null, + "Gamma": 1.0, + "rho": -0.0007395216962322593, + "naive_StateErr": 1.9933160543441772 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_credit_bridge_s789.json b/results/gelu_ablation/relu_credit_bridge_s789.json new file mode 100644 index 0000000..4f3ff0d --- /dev/null +++ b/results/gelu_ablation/relu_credit_bridge_s789.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "credit_bridge", + "seed": 789, + "acc": 0.2898, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.01000211015343666, + "naive_StateErr": 0.6378490328788757 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_dfa_s1024.json b/results/gelu_ablation/relu_dfa_s1024.json new file mode 100644 index 0000000..12efe95 --- /dev/null +++ b/results/gelu_ablation/relu_dfa_s1024.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "dfa", + "seed": 1024, + "acc": 0.312, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.005766347981989384, + "naive_StateErr": 1.1434805393218994 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_dfa_s123.json b/results/gelu_ablation/relu_dfa_s123.json new file mode 100644 index 0000000..717abcc --- /dev/null +++ b/results/gelu_ablation/relu_dfa_s123.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "dfa", + "seed": 123, + "acc": 0.3072, + "StateErr": null, + "Gamma": 1.0, + "rho": -0.00010712328366935253, + "naive_StateErr": 53.51875686645508 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_dfa_s42.json b/results/gelu_ablation/relu_dfa_s42.json new file mode 100644 index 0000000..ae9b9da --- /dev/null +++ b/results/gelu_ablation/relu_dfa_s42.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "dfa", + "seed": 42, + "acc": 0.3113, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.010042589157819748, + "naive_StateErr": 1.0625700950622559 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_dfa_s456.json b/results/gelu_ablation/relu_dfa_s456.json new file mode 100644 index 0000000..85404d8 --- /dev/null +++ b/results/gelu_ablation/relu_dfa_s456.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "dfa", + "seed": 456, + "acc": 0.2991, + "StateErr": null, + "Gamma": 1.0, + "rho": -0.00946012232452631, + "naive_StateErr": 0.08919885009527206 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_dfa_s789.json b/results/gelu_ablation/relu_dfa_s789.json new file mode 100644 index 0000000..bc16a09 --- /dev/null +++ b/results/gelu_ablation/relu_dfa_s789.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "dfa", + "seed": 789, + "acc": 0.3065, + "StateErr": null, + "Gamma": 1.0, + "rho": 0.012797923758625984, + "naive_StateErr": 1.1228328943252563 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_state_bridge_s1024.json b/results/gelu_ablation/relu_state_bridge_s1024.json new file mode 100644 index 0000000..a70242b --- /dev/null +++ b/results/gelu_ablation/relu_state_bridge_s1024.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "state_bridge", + "seed": 1024, + "acc": 0.1478, + "StateErr": 98715213479.28064, + "Gamma": 1.0, + "rho": -0.0005375983892008662, + "naive_StateErr": 0.06271713972091675 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_state_bridge_s123.json b/results/gelu_ablation/relu_state_bridge_s123.json new file mode 100644 index 0000000..f56548e --- /dev/null +++ b/results/gelu_ablation/relu_state_bridge_s123.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "state_bridge", + "seed": 123, + "acc": 0.1868, + "StateErr": 537733263750.59454, + "Gamma": 1.0, + "rho": 0.13547618687152863, + "naive_StateErr": 16.496652603149414 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_state_bridge_s42.json b/results/gelu_ablation/relu_state_bridge_s42.json new file mode 100644 index 0000000..e3c1036 --- /dev/null +++ b/results/gelu_ablation/relu_state_bridge_s42.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "state_bridge", + "seed": 42, + "acc": 0.0797, + "StateErr": 94040208847.33952, + "Gamma": 1.0, + "rho": 0.22764702141284943, + "naive_StateErr": 1.150978446006775 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_state_bridge_s456.json b/results/gelu_ablation/relu_state_bridge_s456.json new file mode 100644 index 0000000..0f50fc8 --- /dev/null +++ b/results/gelu_ablation/relu_state_bridge_s456.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "state_bridge", + "seed": 456, + "acc": 0.1848, + "StateErr": 18242855682493.645, + "Gamma": 1.0, + "rho": 0.27895813807845116, + "naive_StateErr": 0.9801409244537354 +}
\ No newline at end of file diff --git a/results/gelu_ablation/relu_state_bridge_s789.json b/results/gelu_ablation/relu_state_bridge_s789.json new file mode 100644 index 0000000..427e444 --- /dev/null +++ b/results/gelu_ablation/relu_state_bridge_s789.json @@ -0,0 +1,10 @@ +{ + "activation": "relu", + "method": "state_bridge", + "seed": 789, + "acc": 0.1761, + "StateErr": 9722809715963.986, + "Gamma": 1.0, + "rho": 0.1464090496301651, + "naive_StateErr": 1.3677430152893066 +}
\ No newline at end of file |
