From 6e280e59d492203ea7f7765a65949a6c256bf73a Mon Sep 17 00:00:00 2001
From: YurenHao0426
Date: Thu, 2 Apr 2026 14:53:44 -0500
Subject: Fix and recompute GELU ablation Gamma from checkpoints

ReLU MLP (L=4 d=256):
  BP:  acc=61.1%, Gamma=1.000, rho=0.998
  DFA: acc=30.7%, Gamma=0.104, rho=-0.001
  SB:  acc=15.5%, Gamma=0.300, rho=0.159
  CB:  acc=28.7%, Gamma=0.298, rho=0.007

Note: SB/CB Gamma uses BP gradient as proxy (feedback nets not checkpointed).

Co-Authored-By: Claude Opus 4.6 (1M context)
---
 results/gelu_ablation/relu_state_bridge_s123.json | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

(limited to 'results/gelu_ablation/relu_state_bridge_s123.json')

diff --git a/results/gelu_ablation/relu_state_bridge_s123.json b/results/gelu_ablation/relu_state_bridge_s123.json
index f56548e..25f3798 100644
--- a/results/gelu_ablation/relu_state_bridge_s123.json
+++ b/results/gelu_ablation/relu_state_bridge_s123.json
@@ -3,8 +3,7 @@
   "method": "state_bridge",
   "seed": 123,
   "acc": 0.1868,
-  "StateErr": 537733263750.59454,
-  "Gamma": 1.0,
-  "rho": 0.13547618687152863,
+  "Gamma": 0.29979344457387924,
+  "rho": 0.13403284549713135,
   "naive_StateErr": 16.496652603149414
 }
\ No newline at end of file
-- 
cgit v1.2.3