From 6e280e59d492203ea7f7765a65949a6c256bf73a Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Thu, 2 Apr 2026 14:53:44 -0500 Subject: Fix and recompute GELU ablation Gamma from checkpoints ReLU MLP (L=4 d=256): BP: acc=61.1%, Gamma=1.000, rho=0.998 DFA: acc=30.7%, Gamma=0.104, rho=-0.001 SB: acc=15.5%, Gamma=0.300, rho=0.159 CB: acc=28.7%, Gamma=0.298, rho=0.007 Note: SB/CB Gamma uses BP gradient as proxy (feedback nets not checkpointed). Co-Authored-By: Claude Opus 4.6 (1M context) --- results/gelu_ablation/relu_bp_s789.json | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) (limited to 'results/gelu_ablation/relu_bp_s789.json') diff --git a/results/gelu_ablation/relu_bp_s789.json b/results/gelu_ablation/relu_bp_s789.json index f845b43..4fb4d48 100644 --- a/results/gelu_ablation/relu_bp_s789.json +++ b/results/gelu_ablation/relu_bp_s789.json @@ -3,8 +3,7 @@ "method": "bp", "seed": 789, "acc": 0.6095, - "StateErr": null, "Gamma": 1.0, - "rho": 0.9979429095983505, + "rho": 0.9976071268320084, "naive_StateErr": 0.27360349893569946 } \ No newline at end of file -- cgit v1.2.3