diff options
Diffstat (limited to 'results/h2_no_residual_full_s456.log')
| -rw-r--r-- | results/h2_no_residual_full_s456.log | 107 |
1 files changed, 107 insertions, 0 deletions
diff --git a/results/h2_no_residual_full_s456.log b/results/h2_no_residual_full_s456.log new file mode 100644 index 0000000..d0f198c --- /dev/null +++ b/results/h2_no_residual_full_s456.log @@ -0,0 +1,107 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=456 +eval buffer: torch.Size([1024, 3072]) + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.696551322937012, 42.47159957885742, 42.67432403564453, 45.272701263427734, 43.449092864990234] ||g||_med=[0.0011182057205587626, 0.00021166827355045825, 0.00014748115791007876, 0.00011803740198956802, 0.00010102539090439677] acc=0.1143 + [DFA] Ep 1: ||h_L||=9.975e+03 ||g_2||=4.843e-07 acc=0.1113 gamma_dfa=0.0185 + [DFA] Ep 2: ||h_L||=4.258e+04 ||g_2||=8.536e-08 acc=0.1006 gamma_dfa=0.0173 + [DFA] Ep 3: ||h_L||=9.508e+04 ||g_2||=3.481e-08 acc=0.0801 gamma_dfa=0.0150 + [DFA] Ep 4: ||h_L||=1.685e+05 ||g_2||=1.968e-08 acc=0.0654 gamma_dfa=0.0208 + [DFA] Ep 5: ||h_L||=2.704e+05 ||g_2||=1.294e-08 acc=0.0732 gamma_dfa=0.0239 + [DFA] Ep 6: ||h_L||=4.002e+05 ||g_2||=9.634e-09 acc=0.1064 gamma_dfa=0.0241 + [DFA] Ep 7: ||h_L||=5.563e+05 ||g_2||=7.954e-09 acc=0.1123 gamma_dfa=0.0292 + [DFA] Ep 8: ||h_L||=7.605e+05 ||g_2||=6.522e-09 acc=0.1152 gamma_dfa=0.0312 + [DFA] Ep 9: ||h_L||=1.011e+06 ||g_2||=5.556e-09 acc=0.1162 gamma_dfa=0.0348 + [DFA] Ep 10: ||h_L||=1.307e+06 ||g_2||=4.731e-09 acc=0.1152 gamma_dfa=0.0403 + [DFA] Ep 11: ||h_L||=1.643e+06 ||g_2||=4.127e-09 acc=0.1162 gamma_dfa=0.0408 + [DFA] Ep 12: ||h_L||=2.047e+06 ||g_2||=3.521e-09 acc=0.1123 gamma_dfa=0.0411 + [DFA] Ep 13: ||h_L||=2.529e+06 ||g_2||=3.068e-09 acc=0.1143 gamma_dfa=0.0436 + [DFA] Ep 14: ||h_L||=3.069e+06 ||g_2||=2.661e-09 acc=0.1152 gamma_dfa=0.0434 + [DFA] Ep 15: ||h_L||=3.672e+06 ||g_2||=2.340e-09 acc=0.1123 gamma_dfa=0.0459 + [DFA] Ep 16: ||h_L||=4.363e+06 ||g_2||=2.085e-09 acc=0.1104 gamma_dfa=0.0443 + [DFA] Ep 17: ||h_L||=5.116e+06 ||g_2||=1.862e-09 acc=0.1035 gamma_dfa=0.0453 + [DFA] Ep 18: ||h_L||=5.947e+06 ||g_2||=1.664e-09 acc=0.0859 gamma_dfa=0.0454 + [DFA] Ep 19: ||h_L||=6.799e+06 ||g_2||=1.496e-09 acc=0.0762 gamma_dfa=0.0448 + [DFA] Ep 20: ||h_L||=7.803e+06 ||g_2||=1.355e-09 acc=0.0801 gamma_dfa=0.0458 + [DFA] Ep 21: ||h_L||=8.837e+06 ||g_2||=1.236e-09 acc=0.0928 gamma_dfa=0.0458 + [DFA] Ep 22: ||h_L||=9.928e+06 ||g_2||=1.132e-09 acc=0.1045 gamma_dfa=0.0462 + [DFA] Ep 23: ||h_L||=1.110e+07 ||g_2||=1.038e-09 acc=0.1055 gamma_dfa=0.0465 + [DFA] Ep 24: ||h_L||=1.236e+07 ||g_2||=9.618e-10 acc=0.1055 gamma_dfa=0.0462 + [DFA] Ep 25: ||h_L||=1.366e+07 ||g_2||=8.898e-10 acc=0.1055 gamma_dfa=0.0468 + [DFA] Ep 26: ||h_L||=1.500e+07 ||g_2||=8.268e-10 acc=0.1055 gamma_dfa=0.0475 + [DFA] Ep 27: ||h_L||=1.650e+07 ||g_2||=7.703e-10 acc=0.1064 gamma_dfa=0.0474 + [DFA] Ep 28: ||h_L||=1.811e+07 ||g_2||=7.228e-10 acc=0.1055 gamma_dfa=0.0473 + [DFA] Ep 29: ||h_L||=1.965e+07 ||g_2||=6.773e-10 acc=0.1055 gamma_dfa=0.0472 + [DFA] Ep 30: ||h_L||=2.139e+07 ||g_2||=6.385e-10 acc=0.1055 gamma_dfa=0.0478 + [DFA] Ep 31: ||h_L||=2.306e+07 ||g_2||=6.001e-10 acc=0.1055 gamma_dfa=0.0481 + [DFA] Ep 32: ||h_L||=2.490e+07 ||g_2||=5.676e-10 acc=0.1064 gamma_dfa=0.0476 + [DFA] Ep 33: ||h_L||=2.693e+07 ||g_2||=5.345e-10 acc=0.1055 gamma_dfa=0.0476 + [DFA] Ep 34: ||h_L||=2.880e+07 ||g_2||=5.057e-10 acc=0.1055 gamma_dfa=0.0481 + [DFA] Ep 35: ||h_L||=3.075e+07 ||g_2||=4.826e-10 acc=0.1055 gamma_dfa=0.0478 + [DFA] Ep 36: ||h_L||=3.269e+07 ||g_2||=4.582e-10 acc=0.1055 gamma_dfa=0.0478 + [DFA] Ep 37: ||h_L||=3.458e+07 ||g_2||=4.370e-10 acc=0.1055 gamma_dfa=0.0480 + [DFA] Ep 38: ||h_L||=3.663e+07 ||g_2||=4.178e-10 acc=0.1055 gamma_dfa=0.0481 + [DFA] Ep 39: ||h_L||=3.877e+07 ||g_2||=4.003e-10 acc=0.1055 gamma_dfa=0.0479 + [DFA] Ep 40: ||h_L||=4.085e+07 ||g_2||=3.838e-10 acc=0.1055 gamma_dfa=0.0483 + [DFA] Ep 41: ||h_L||=4.301e+07 ||g_2||=3.697e-10 acc=0.1055 gamma_dfa=0.0488 + [DFA] Ep 42: ||h_L||=4.527e+07 ||g_2||=3.547e-10 acc=0.1055 gamma_dfa=0.0488 + [DFA] Ep 43: ||h_L||=4.735e+07 ||g_2||=3.417e-10 acc=0.1055 gamma_dfa=0.0487 + [DFA] Ep 44: ||h_L||=4.957e+07 ||g_2||=3.287e-10 acc=0.1055 gamma_dfa=0.0491 + [DFA] Ep 45: ||h_L||=5.152e+07 ||g_2||=3.176e-10 acc=0.1055 gamma_dfa=0.0493 + [DFA] Ep 46: ||h_L||=5.370e+07 ||g_2||=3.079e-10 acc=0.1055 gamma_dfa=0.0490 + [DFA] Ep 47: ||h_L||=5.579e+07 ||g_2||=2.985e-10 acc=0.1055 gamma_dfa=0.0497 + [DFA] Ep 48: ||h_L||=5.788e+07 ||g_2||=2.902e-10 acc=0.1055 gamma_dfa=0.0495 + [DFA] Ep 49: ||h_L||=6.001e+07 ||g_2||=2.819e-10 acc=0.1055 gamma_dfa=0.0495 + [DFA] Ep 50: ||h_L||=6.212e+07 ||g_2||=2.740e-10 acc=0.1055 gamma_dfa=0.0500 + [DFA] Ep 51: ||h_L||=6.409e+07 ||g_2||=2.676e-10 acc=0.1055 gamma_dfa=0.0503 + [DFA] Ep 52: ||h_L||=6.611e+07 ||g_2||=2.606e-10 acc=0.1055 gamma_dfa=0.0498 + [DFA] Ep 53: ||h_L||=6.824e+07 ||g_2||=2.535e-10 acc=0.1055 gamma_dfa=0.0503 + [DFA] Ep 54: ||h_L||=7.033e+07 ||g_2||=2.483e-10 acc=0.1055 gamma_dfa=0.0506 + [DFA] Ep 55: ||h_L||=7.230e+07 ||g_2||=2.428e-10 acc=0.1055 gamma_dfa=0.0507 + [DFA] Ep 56: ||h_L||=7.415e+07 ||g_2||=2.379e-10 acc=0.1055 gamma_dfa=0.0508 + [DFA] Ep 57: ||h_L||=7.599e+07 ||g_2||=2.338e-10 acc=0.1055 gamma_dfa=0.0508 + [DFA] Ep 58: ||h_L||=7.792e+07 ||g_2||=2.293e-10 acc=0.1055 gamma_dfa=0.0510 + [DFA] Ep 59: ||h_L||=7.974e+07 ||g_2||=2.247e-10 acc=0.1055 gamma_dfa=0.0511 + [DFA] Ep 60: ||h_L||=8.161e+07 ||g_2||=2.218e-10 acc=0.1055 gamma_dfa=0.0513 + [DFA] Ep 61: ||h_L||=8.329e+07 ||g_2||=2.178e-10 acc=0.1055 gamma_dfa=0.0515 + [DFA] Ep 62: ||h_L||=8.490e+07 ||g_2||=2.139e-10 acc=0.1055 gamma_dfa=0.0518 + [DFA] Ep 63: ||h_L||=8.655e+07 ||g_2||=2.119e-10 acc=0.1055 gamma_dfa=0.0518 + [DFA] Ep 64: ||h_L||=8.808e+07 ||g_2||=2.085e-10 acc=0.1055 gamma_dfa=0.0519 + [DFA] Ep 65: ||h_L||=8.967e+07 ||g_2||=2.067e-10 acc=0.1055 gamma_dfa=0.0517 + [DFA] Ep 66: ||h_L||=9.106e+07 ||g_2||=2.040e-10 acc=0.1055 gamma_dfa=0.0519 + [DFA] Ep 67: ||h_L||=9.243e+07 ||g_2||=2.017e-10 acc=0.1055 gamma_dfa=0.0520 + [DFA] Ep 68: ||h_L||=9.373e+07 ||g_2||=1.995e-10 acc=0.1055 gamma_dfa=0.0521 + [DFA] Ep 69: ||h_L||=9.486e+07 ||g_2||=1.975e-10 acc=0.1055 gamma_dfa=0.0522 + [DFA] Ep 70: ||h_L||=9.607e+07 ||g_2||=1.956e-10 acc=0.1055 gamma_dfa=0.0521 + [DFA] Ep 71: ||h_L||=9.723e+07 ||g_2||=1.938e-10 acc=0.1055 gamma_dfa=0.0521 + [DFA] Ep 72: ||h_L||=9.818e+07 ||g_2||=1.921e-10 acc=0.1055 gamma_dfa=0.0522 + [DFA] Ep 73: ||h_L||=9.925e+07 ||g_2||=1.908e-10 acc=0.1055 gamma_dfa=0.0523 + [DFA] Ep 74: ||h_L||=1.003e+08 ||g_2||=1.891e-10 acc=0.1055 gamma_dfa=0.0523 + [DFA] Ep 75: ||h_L||=1.012e+08 ||g_2||=1.877e-10 acc=0.1055 gamma_dfa=0.0524 + [DFA] Ep 76: ||h_L||=1.020e+08 ||g_2||=1.867e-10 acc=0.1055 gamma_dfa=0.0523 + [DFA] Ep 77: ||h_L||=1.028e+08 ||g_2||=1.857e-10 acc=0.1055 gamma_dfa=0.0524 + [DFA] Ep 78: ||h_L||=1.035e+08 ||g_2||=1.846e-10 acc=0.1055 gamma_dfa=0.0524 + [DFA] Ep 79: ||h_L||=1.041e+08 ||g_2||=1.838e-10 acc=0.1055 gamma_dfa=0.0525 + [DFA] Ep 80: ||h_L||=1.047e+08 ||g_2||=1.829e-10 acc=0.1055 gamma_dfa=0.0526 + [DFA] Ep 81: ||h_L||=1.052e+08 ||g_2||=1.821e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 82: ||h_L||=1.057e+08 ||g_2||=1.815e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 83: ||h_L||=1.062e+08 ||g_2||=1.808e-10 acc=0.1055 gamma_dfa=0.0526 + [DFA] Ep 84: ||h_L||=1.066e+08 ||g_2||=1.802e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 85: ||h_L||=1.070e+08 ||g_2||=1.797e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 86: ||h_L||=1.073e+08 ||g_2||=1.794e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 87: ||h_L||=1.076e+08 ||g_2||=1.790e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 88: ||h_L||=1.079e+08 ||g_2||=1.787e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 89: ||h_L||=1.081e+08 ||g_2||=1.784e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 90: ||h_L||=1.082e+08 ||g_2||=1.782e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 91: ||h_L||=1.084e+08 ||g_2||=1.780e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 92: ||h_L||=1.085e+08 ||g_2||=1.778e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 93: ||h_L||=1.086e+08 ||g_2||=1.777e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 94: ||h_L||=1.087e+08 ||g_2||=1.776e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 95: ||h_L||=1.087e+08 ||g_2||=1.776e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 96: ||h_L||=1.087e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 97: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 98: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 99: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 100: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + +Saved results/h2_no_residual_full_s456/snapshot_evolution_s456.json |
