diff options
Diffstat (limited to 'results/snapshot_synth_v1/run_a1.0_s42.log')
| -rw-r--r-- | results/snapshot_synth_v1/run_a1.0_s42.log | 44 |
1 files changed, 44 insertions, 0 deletions
diff --git a/results/snapshot_synth_v1/run_a1.0_s42.log b/results/snapshot_synth_v1/run_a1.0_s42.log new file mode 100644 index 0000000..d1e834a --- /dev/null +++ b/results/snapshot_synth_v1/run_a1.0_s42.log @@ -0,0 +1,44 @@ +device=cuda:0, alpha=1.0, depth=4, d_hidden=128, epochs=80, seed=42 +train: torch.Size([12800, 128]), test eval buffer: torch.Size([2000, 128]) + +=== BP training === + [BP] Ep 0: ||h_L||=1.140e+01 ||g||=2.816e-04 acc=0.0845 + [BP] Ep 1: ||h_L||=1.393e+01 ||g||=3.616e-04 acc=0.7095 + [BP] Ep 5: ||h_L||=2.067e+01 ||g||=2.195e-04 acc=0.7855 + [BP] Ep 10: ||h_L||=2.332e+01 ||g||=1.576e-04 acc=0.7915 + [BP] Ep 15: ||h_L||=2.609e+01 ||g||=9.301e-05 acc=0.8000 + [BP] Ep 20: ||h_L||=2.880e+01 ||g||=4.764e-05 acc=0.7950 + [BP] Ep 25: ||h_L||=3.096e+01 ||g||=3.036e-05 acc=0.7995 + [BP] Ep 30: ||h_L||=3.235e+01 ||g||=1.972e-05 acc=0.7975 + [BP] Ep 35: ||h_L||=3.329e+01 ||g||=1.527e-05 acc=0.8000 + [BP] Ep 40: ||h_L||=3.398e+01 ||g||=1.181e-05 acc=0.7975 + [BP] Ep 45: ||h_L||=3.449e+01 ||g||=1.028e-05 acc=0.7980 + [BP] Ep 50: ||h_L||=3.489e+01 ||g||=9.180e-06 acc=0.7980 + [BP] Ep 55: ||h_L||=3.516e+01 ||g||=8.594e-06 acc=0.7975 + [BP] Ep 60: ||h_L||=3.538e+01 ||g||=8.124e-06 acc=0.7960 + [BP] Ep 65: ||h_L||=3.553e+01 ||g||=7.551e-06 acc=0.7960 + [BP] Ep 70: ||h_L||=3.561e+01 ||g||=7.443e-06 acc=0.7960 + [BP] Ep 75: ||h_L||=3.565e+01 ||g||=7.344e-06 acc=0.7960 + [BP] Ep 80: ||h_L||=3.565e+01 ||g||=7.323e-06 acc=0.7960 + +=== DFA training === + [DFA] Ep 0: ||h_L||=1.140e+01 ||g||=2.816e-04 acc=0.0845 + [DFA] Ep 1: ||h_L||=1.244e+01 ||g||=2.737e-04 acc=0.3775 γ_dfa=0.1151 + [DFA] Ep 5: ||h_L||=5.072e+01 ||g||=1.943e-04 acc=0.7350 γ_dfa=0.1674 + [DFA] Ep 10: ||h_L||=1.381e+02 ||g||=1.229e-04 acc=0.7175 γ_dfa=0.1132 + [DFA] Ep 15: ||h_L||=2.302e+02 ||g||=1.030e-04 acc=0.7110 γ_dfa=0.0913 + [DFA] Ep 20: ||h_L||=3.213e+02 ||g||=1.112e-04 acc=0.7070 γ_dfa=0.0795 + [DFA] Ep 25: ||h_L||=4.041e+02 ||g||=1.027e-04 acc=0.7035 γ_dfa=0.0709 + [DFA] Ep 30: ||h_L||=4.810e+02 ||g||=1.014e-04 acc=0.6845 γ_dfa=0.0650 + [DFA] Ep 35: ||h_L||=5.483e+02 ||g||=1.116e-04 acc=0.6955 γ_dfa=0.0630 + [DFA] Ep 40: ||h_L||=6.078e+02 ||g||=1.203e-04 acc=0.6880 γ_dfa=0.0578 + [DFA] Ep 45: ||h_L||=6.578e+02 ||g||=1.118e-04 acc=0.6845 γ_dfa=0.0563 + [DFA] Ep 50: ||h_L||=6.988e+02 ||g||=1.262e-04 acc=0.6945 γ_dfa=0.0562 + [DFA] Ep 55: ||h_L||=7.301e+02 ||g||=1.428e-04 acc=0.6720 γ_dfa=0.0559 + [DFA] Ep 60: ||h_L||=7.519e+02 ||g||=1.238e-04 acc=0.6910 γ_dfa=0.0542 + [DFA] Ep 65: ||h_L||=7.678e+02 ||g||=1.230e-04 acc=0.6895 γ_dfa=0.0530 + [DFA] Ep 70: ||h_L||=7.757e+02 ||g||=1.224e-04 acc=0.6950 γ_dfa=0.0530 + [DFA] Ep 75: ||h_L||=7.791e+02 ||g||=1.214e-04 acc=0.6915 γ_dfa=0.0526 + [DFA] Ep 80: ||h_L||=7.797e+02 ||g||=1.203e-04 acc=0.6930 γ_dfa=0.0526 + +Saved results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json |
