From 6e280e59d492203ea7f7765a65949a6c256bf73a Mon Sep 17 00:00:00 2001
From: YurenHao0426
Date: Thu, 2 Apr 2026 14:53:44 -0500
Subject: Fix and recompute GELU ablation Gamma from checkpoints

ReLU MLP (L=4 d=256):
BP: acc=61.1%, Gamma=1.000, rho=0.998
DFA: acc=30.7%, Gamma=0.104, rho=-0.001
SB: acc=15.5%, Gamma=0.300, rho=0.159
CB: acc=28.7%, Gamma=0.298, rho=0.007

Note: SB/CB Gamma uses BP gradient as proxy (feedback nets not checkpointed).

Co-Authored-By: Claude Opus 4.6 (1M context)
---
 results/gelu_ablation/relu_dfa_s456.json | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

(limited to 'results/gelu_ablation/relu_dfa_s456.json')

diff --git a/results/gelu_ablation/relu_dfa_s456.json b/results/gelu_ablation/relu_dfa_s456.json
index 85404d8..bf9c40e 100644
--- a/results/gelu_ablation/relu_dfa_s456.json
+++ b/results/gelu_ablation/relu_dfa_s456.json
@@ -3,8 +3,7 @@
   "method": "dfa",
   "seed": 456,
   "acc": 0.2991,
-  "StateErr": null,
-  "Gamma": 1.0,
-  "rho": -0.00946012232452631,
+  "Gamma": 0.10119568518712185,
+  "rho": 0.004686151631176472,
   "naive_StateErr": 0.08919885009527206
 }
\ No newline at end of file
-- 
cgit v1.2.3