1
2
3
4
5
6
7
8
9
10
11
12
13
|
Vanilla DFA early-epoch checkpoint sweep: seed=42, max_epoch=5
ep 0: h_norms=['8.72e+00', '8.78e+00', '8.81e+00', '8.83e+00', '8.89e+00'], g_norms=['1.01e-03', '9.97e-04', '9.93e-04', '9.87e-04', '9.83e-04']
ep 1: h_norms=['8.02e+02', '3.06e+03', '4.91e+03', '6.49e+03', '7.30e+03'], g_norms=['2.53e-06', '1.36e-06', '1.37e-06', '1.38e-06', '1.39e-06']
saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep1.pt
ep 2: h_norms=['1.58e+03', '1.33e+04', '2.28e+04', '3.24e+04', '3.78e+04'], g_norms=['1.14e-06', '3.09e-07', '3.11e-07', '3.14e-07', '3.17e-07']
saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep2.pt
ep 3: h_norms=['2.34e+03', '3.25e+04', '5.82e+04', '8.73e+04', '1.05e+05'], g_norms=['8.22e-07', '1.30e-07', '1.27e-07', '1.29e-07', '1.29e-07']
saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep3.pt
ep 4: h_norms=['3.13e+03', '6.29e+04', '1.18e+05', '1.83e+05', '2.24e+05'], g_norms=['6.48e-07', '7.03e-08', '6.72e-08', '6.80e-08', '6.81e-08']
saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep4.pt
ep 5: h_norms=['3.95e+03', '1.09e+05', '2.04e+05', '3.30e+05', '4.06e+05'], g_norms=['5.14e-07', '4.36e-08', '4.20e-08', '4.26e-08', '4.25e-08']
saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_ep5.pt
Saved results/vanilla_dfa_early_ckpts/vanilla_dfa_s42_log.json
|