Vanilla DFA early-epoch checkpoint sweep: seed=42, max_epoch=5 ep 0: h_norms=['8.72e+00', '8.78e+00', '8.81e+00', '8.83e+00', '8.89e+00'], g_norms=['1.01e-03', '9.97e-04', '9.93e-04', '9.87e-04', '9.83e-04'] ep 1: h_norms=['8.02e+02', '3.06e+03', '4.91e+03', '6.49e+03', '7.30e+03'], g_norms=['2.53e-06', '1.36e-06', '1.37e-06', '1.38e-06', '1.39e-06'] saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep1.pt ep 2: h_norms=['1.58e+03', '1.33e+04', '2.28e+04', '3.24e+04', '3.78e+04'], g_norms=['1.14e-06', '3.09e-07', '3.11e-07', '3.14e-07', '3.17e-07'] saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep2.pt ep 3: h_norms=['2.34e+03', '3.25e+04', '5.82e+04', '8.73e+04', '1.05e+05'], g_norms=['8.22e-07', '1.30e-07', '1.27e-07', '1.29e-07', '1.29e-07'] saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep3.pt ep 4: h_norms=['3.13e+03', '6.29e+04', '1.18e+05', '1.83e+05', '2.24e+05'], g_norms=['6.48e-07', '7.03e-08', '6.72e-08', '6.80e-08', '6.81e-08'] saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep4.pt ep 5: h_norms=['3.95e+03', '1.09e+05', '2.04e+05', '3.30e+05', '4.06e+05'], g_norms=['5.14e-07', '4.36e-08', '4.20e-08', '4.26e-08', '4.25e-08'] saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep5.pt Saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_log.json