diff options
| author | YurenHao0426 <Blackhao0426@gmail.com> | 2026-04-08 02:01:21 -0500 |
|---|---|---|
| committer | YurenHao0426 <Blackhao0426@gmail.com> | 2026-04-08 02:01:21 -0500 |
| commit | 55deb9a7d500a30557d901be09848fa430a32d80 (patch) | |
| tree | 9fcdeb536f3bd4d0d9100b907f9a0d5d56f69424 /results | |
| parent | 032afbfc3ec3961748cc557f428d2fd6e4eda5d9 (diff) | |
Multi-seed vanilla DFA early-epoch cos: lock-in for round 19 disambiguation
Round 20's minimal lock-in experiment: 3 seeds × {ep 1, ep 2} vanilla
DFA cosine. Closes the 'single-seed fluke' objection.
Vanilla DFA early-epoch deep cosines (l1-l4):
| seed | ep | \|\|g\|\| | deep mean |
|---|---|---|---|
| 42 | 1 | 6.7e-7 | -0.025 |
| 42 | 2 | 1.5e-7 | -0.038 |
| 123 | 1 | 6.5e-7 | +0.002 |
| 123 | 2 | 1.4e-7 | -0.006 |
| 456 | 1 | 3.9e-7 | +0.000 |
| 456 | 2 | 8.5e-8 | -0.009 |
3-seed mean at ep 1 (most meaningful regime): -0.008 ± 0.013
3-seed mean at ep 2: -0.018 ± 0.018
ALL 24 measurements (3 seeds × 2 ep × 4 deep layers) are in [-0.04, +0.02].
Compare to penalized DFA 3-seed mean +0.155 ± 0.025.
The finding that the penalty CREATES deep alignment is now seed-robust. Three
seeds × two early epochs all show vanilla deep cos essentially zero
even when ||g|| is in the meaningful regime.
This is the round 20 lock-in. Framing is locked.
Diffstat (limited to 'results')
| -rw-r--r-- | results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_log.json | 66 | ||||
| -rw-r--r-- | results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_log.json | 66 | ||||
| -rw-r--r-- | results/vanilla_dfa_early_s123.log | 7 | ||||
| -rw-r--r-- | results/vanilla_dfa_early_s456.log | 7 |
4 files changed, 146 insertions, 0 deletions
diff --git a/results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_log.json b/results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_log.json new file mode 100644 index 0000000..68883a5 --- /dev/null +++ b/results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_log.json @@ -0,0 +1,66 @@ +{ + "config": { + "seed": 123, + "max_epoch": 2, + "lr": 0.001, + "wd": 0.01, + "save_at": [ + 1, + 2 + ], + "output_dir": "results/vanilla_dfa_early_ckpts" + }, + "log": [ + { + "epoch": 0, + "h_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "g_norms": [ + 0.0009977436857298017, + 0.000992251792922616, + 0.0009848480112850666, + 0.0009761073160916567, + 0.0009735578205436468 + ] + }, + { + "epoch": 1, + "h_norms": [ + 861.2440185546875, + 2373.370849609375, + 4675.99951171875, + 6090.40869140625, + 6962.984375 + ], + "g_norms": [ + 2.380779051236459e-06, + 1.3197138741816161e-06, + 1.3154849511920474e-06, + 1.3285966815601569e-06, + 1.3258621720524388e-06 + ] + }, + { + "epoch": 2, + "h_norms": [ + 1679.3353271484375, + 8852.6904296875, + 31685.556640625, + 40725.1484375, + 45390.203125 + ], + "g_norms": [ + 1.1121658189949812e-06, + 2.7321576112626644e-07, + 2.7429715032667445e-07, + 2.751477552465076e-07, + 2.743622644629795e-07 + ] + } + ] +}
\ No newline at end of file diff --git a/results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_log.json b/results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_log.json new file mode 100644 index 0000000..1208df9 --- /dev/null +++ b/results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_log.json @@ -0,0 +1,66 @@ +{ + "config": { + "seed": 456, + "max_epoch": 2, + "lr": 0.001, + "wd": 0.01, + "save_at": [ + 1, + 2 + ], + "output_dir": "results/vanilla_dfa_early_ckpts" + }, + "log": [ + { + "epoch": 0, + "h_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "g_norms": [ + 0.0010079912608489394, + 0.0010035138111561537, + 0.0009970925748348236, + 0.0009936393471434712, + 0.000986678060144186 + ] + }, + { + "epoch": 1, + "h_norms": [ + 900.3377685546875, + 3463.92626953125, + 6660.5166015625, + 10478.5126953125, + 13466.513671875 + ], + "g_norms": [ + 2.017142833210528e-06, + 7.972002435963077e-07, + 7.783806381667091e-07, + 7.758338256280695e-07, + 7.810436954969191e-07 + ] + }, + { + "epoch": 2, + "h_norms": [ + 1785.048828125, + 14088.892578125, + 36535.42578125, + 61441.53515625, + 73892.0078125 + ], + "g_norms": [ + 9.084495218303346e-07, + 1.7716872946493822e-07, + 1.705153493958278e-07, + 1.7151720044239482e-07, + 1.728312355453454e-07 + ] + } + ] +}
\ No newline at end of file diff --git a/results/vanilla_dfa_early_s123.log b/results/vanilla_dfa_early_s123.log new file mode 100644 index 0000000..b51cc7b --- /dev/null +++ b/results/vanilla_dfa_early_s123.log @@ -0,0 +1,7 @@ +Vanilla DFA early-epoch checkpoint sweep: seed=123, max_epoch=2 + ep 0: h_norms=['8.69e+00', '8.72e+00', '8.73e+00', '8.76e+00', '8.79e+00'], g_norms=['9.98e-04', '9.92e-04', '9.85e-04', '9.76e-04', '9.74e-04'] + ep 1: h_norms=['8.61e+02', '2.37e+03', '4.68e+03', '6.09e+03', '6.96e+03'], g_norms=['2.38e-06', '1.32e-06', '1.32e-06', '1.33e-06', '1.33e-06'] + saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_ep1.pt + ep 2: h_norms=['1.68e+03', '8.85e+03', '3.17e+04', '4.07e+04', '4.54e+04'], g_norms=['1.11e-06', '2.73e-07', '2.74e-07', '2.75e-07', '2.74e-07'] + saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_ep2.pt +Saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s123_log.json diff --git a/results/vanilla_dfa_early_s456.log b/results/vanilla_dfa_early_s456.log new file mode 100644 index 0000000..68afc35 --- /dev/null +++ b/results/vanilla_dfa_early_s456.log @@ -0,0 +1,7 @@ +Vanilla DFA early-epoch checkpoint sweep: seed=456, max_epoch=2 + ep 0: h_norms=['8.70e+00', '8.74e+00', '8.81e+00', '8.84e+00', '8.89e+00'], g_norms=['1.01e-03', '1.00e-03', '9.97e-04', '9.94e-04', '9.87e-04'] + ep 1: h_norms=['9.00e+02', '3.46e+03', '6.66e+03', '1.05e+04', '1.35e+04'], g_norms=['2.02e-06', '7.97e-07', '7.78e-07', '7.76e-07', '7.81e-07'] + saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_ep1.pt + ep 2: h_norms=['1.79e+03', '1.41e+04', '3.65e+04', '6.14e+04', '7.39e+04'], g_norms=['9.08e-07', '1.77e-07', '1.71e-07', '1.72e-07', '1.73e-07'] + saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_ep2.pt +Saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s456_log.json |
