diff options
Diffstat (limited to 'results/nudging_test_3seed_summary.json')
| -rw-r--r-- | results/nudging_test_3seed_summary.json | 122 |
1 files changed, 122 insertions, 0 deletions
diff --git a/results/nudging_test_3seed_summary.json b/results/nudging_test_3seed_summary.json new file mode 100644 index 0000000..b970c59 --- /dev/null +++ b/results/nudging_test_3seed_summary.json @@ -0,0 +1,122 @@ +{ + "description": "Nudging test 3-seed values for \u00a74 \u00b64 cross-method functional dissociation. Each value is the test-loss change after a single step of size eta=0.01 along the per-layer credit direction at the converged checkpoint.", + "eta": 0.01, + "epochs": 30, + "arch": "4-block d=256 pre-LN ResMLP", + "penalty_lam": 0.01, + "methods": { + "state_bridge": { + "per_seed": { + "42": { + "per_block": [ + -0.0035966814029961824, + -0.0023783869110047817, + -0.0017011994495987892, + -0.0012592736165970564 + ], + "deep_mean": -0.0017796199924002092, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + }, + "123": { + "per_block": [ + -0.003914414905011654, + -0.002520129084587097, + -0.0018878313712775707, + -0.0014582867734134197 + ], + "deep_mean": -0.0019554157430926957, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + }, + "456": { + "per_block": [ + -0.004026009701192379, + -0.0028109778650105, + -0.001904117758385837, + -0.0014447440626099706 + ], + "deep_mean": -0.002053279895335436, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + } + }, + "three_seed_deep_mean": -0.0019294385436094469, + "three_seed_deep_std_ddof0": 0.00011322116053216024 + }, + "credit_bridge": { + "per_seed": { + "42": { + "per_block": [ + -0.0005118446424603462, + -0.0004658599500544369, + -0.00044331286335363984, + -0.00042594311526045203 + ], + "deep_mean": -0.0004450386428895096, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + }, + "123": { + "per_block": [ + -0.00045391899766400456, + -0.00041642854921519756, + -0.00038977732765488327, + -0.00037192515446804464 + ], + "deep_mean": -0.00039271034377937514, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + }, + "456": { + "per_block": [ + -0.00048537791008129716, + -0.00046242878306657076, + -0.00043993344297632575, + -0.00042223266791552305 + ], + "deep_mean": -0.0004415316313194732, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + } + }, + "three_seed_deep_mean": -0.000426426872662786, + "three_seed_deep_std_ddof0": 2.3884137309066322e-05 + }, + "dfa": { + "per_seed": { + "42": { + "per_block": [ + -0.00013115769252181053, + -5.455967038869858e-05, + -5.524198058992624e-05, + -5.596294067800045e-05 + ], + "deep_mean": -5.525486388554176e-05, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + }, + "123": { + "per_block": [ + -0.00010294892126694322, + -3.057112917304039e-05, + -4.6447094064205885e-05, + -5.68098621442914e-05 + ], + "deep_mean": -4.460936179384589e-05, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + }, + "456": { + "per_block": [ + -0.00014482333790510893, + -4.394981078803539e-05, + -4.4448592234402895e-05, + -5.99866034463048e-05 + ], + "deep_mean": -4.946166882291436e-05, + "note": "deep = blocks l1, l2, l3 (excluding l0)" + } + }, + "three_seed_deep_mean": -4.9775298167434004e-05, + "three_seed_deep_std_ddof0": 4.3516626110321815e-06 + } + }, + "ratios_3seed_means": { + "SB / CB": 4.5246645258569975, + "SB / DFA": 38.76297309398745, + "CB / DFA": 8.56703803618358 + } +}
\ No newline at end of file |
