diff options
Diffstat (limited to 'results/fa_depth_scan_d512_L12/results_cifar10.json')
| -rw-r--r-- | results/fa_depth_scan_d512_L12/results_cifar10.json | 499 |
1 files changed, 499 insertions, 0 deletions
diff --git a/results/fa_depth_scan_d512_L12/results_cifar10.json b/results/fa_depth_scan_d512_L12/results_cifar10.json new file mode 100644 index 0000000..15a5792 --- /dev/null +++ b/results/fa_depth_scan_d512_L12/results_cifar10.json @@ -0,0 +1,499 @@ +{ + "42": { + "fa": { + "log": { + "train_loss": [ + 2.0427230606079103, + 1.9547925742340089, + 1.9269662255096436, + 1.9024112060546876, + 1.88389292137146, + 1.874641305809021, + 1.8671076870727539, + 1.8585125997543335, + 1.8507517318725586, + 1.8509845052719116, + 1.8455515924835204, + 1.8402700800323486, + 1.8322524318695068, + 1.8287768964385986, + 1.824175419845581, + 1.8240570126342774, + 1.817736747970581, + 1.8165113877105712, + 1.8092418829345702, + 1.8068542711639404, + 1.8066692431640625, + 1.8037006209945678, + 1.7959260940551758, + 1.797553392868042, + 1.7958658642196654, + 1.7940396698379517, + 1.7932731056976319, + 1.7874454331207275, + 1.7880735418319702, + 1.7836660583496093, + 1.7832960818862915, + 1.7804118716812134, + 1.7788523398208618, + 1.772011728515625, + 1.7708375668716432, + 1.7682569339370728, + 1.7717147860336304, + 1.7703663568115235, + 1.7637487329864503, + 1.7676782482910156, + 1.7649735053253175, + 1.7634011583709717, + 1.7645813860702515, + 1.7605182119369507, + 1.7599670697021483, + 1.7621903922271729, + 1.756671106300354, + 1.7577124716949464, + 1.7564089126205444, + 1.7521357986450194, + 1.7525928847885133, + 1.7497260301971436, + 1.7528332720184325, + 1.7475884844207763, + 1.7469696446990968, + 1.7445055263519287, + 1.752090754776001, + 1.7456406805038451, + 1.747734097251892, + 1.7441029932403564, + 1.743490291824341, + 1.7414577841949463, + 1.742126556777954, + 1.7391094409942627, + 1.7401588076019288, + 1.7370625415420533, + 1.7388630017471314, + 1.7353392750930785, + 1.736816965751648, + 1.7355695288085937, + 1.73539924369812, + 1.7323005257797242, + 1.7321935805511475, + 1.7312652449798585, + 1.7298928540420533, + 1.73121183719635, + 1.7288608194351196, + 1.7294834777069092, + 1.726299252166748, + 1.73074989528656, + 1.7293904189682008, + 1.7276834594345092, + 1.7300372393035888, + 1.731684062461853, + 1.7275019702529908, + 1.729561651916504, + 1.7284230736923218, + 1.7257295697021484, + 1.7226565048217772, + 1.726801979408264, + 1.7250631372833252, + 1.7279036038970947, + 1.726708238143921, + 1.7242388882064819, + 1.7248469045257568, + 1.7260398196411133, + 1.721121542892456, + 1.7220706603240967, + 1.7268135174942016, + 1.729515742111206 + ], + "train_acc": [ + 0.24062, + 0.28346, + 0.2951, + 0.30692, + 0.31778, + 0.3211, + 0.32388, + 0.32854, + 0.33456, + 0.33332, + 0.33668, + 0.33984, + 0.34108, + 0.34376, + 0.346, + 0.34636, + 0.35004, + 0.34922, + 0.35104, + 0.35196, + 0.35292, + 0.35532, + 0.3572, + 0.35614, + 0.3578, + 0.35934, + 0.35694, + 0.35918, + 0.36018, + 0.35928, + 0.3622, + 0.362, + 0.36236, + 0.36548, + 0.36778, + 0.36536, + 0.36884, + 0.367, + 0.36852, + 0.36842, + 0.36944, + 0.36784, + 0.3697, + 0.37156, + 0.37064, + 0.3725, + 0.37072, + 0.37062, + 0.37082, + 0.37298, + 0.37268, + 0.37554, + 0.3732, + 0.3752, + 0.37724, + 0.37652, + 0.37506, + 0.37708, + 0.37712, + 0.37668, + 0.37814, + 0.37944, + 0.37878, + 0.37886, + 0.38042, + 0.3778, + 0.38022, + 0.37988, + 0.38096, + 0.3807, + 0.3811, + 0.38084, + 0.37994, + 0.37914, + 0.38104, + 0.38152, + 0.38376, + 0.38158, + 0.38472, + 0.38244, + 0.38066, + 0.38392, + 0.3839, + 0.38222, + 0.38382, + 0.38384, + 0.38472, + 0.385, + 0.38792, + 0.3839, + 0.38516, + 0.3858, + 0.38262, + 0.38758, + 0.38396, + 0.38268, + 0.38628, + 0.38618, + 0.3846, + 0.38336 + ], + "test_acc": [ + 0.2963, + 0.3132, + 0.3406, + 0.3377, + 0.3353, + 0.3407, + 0.3367, + 0.3657, + 0.3618, + 0.3712, + 0.3519, + 0.3722, + 0.371, + 0.379, + 0.3666, + 0.372, + 0.3674, + 0.3754, + 0.3733, + 0.3747, + 0.3712, + 0.3772, + 0.3792, + 0.3804, + 0.3742, + 0.3852, + 0.3864, + 0.3907, + 0.3861, + 0.3827, + 0.3852, + 0.3833, + 0.3885, + 0.3865, + 0.3933, + 0.391, + 0.3837, + 0.3915, + 0.4, + 0.4088, + 0.3956, + 0.3878, + 0.407, + 0.3928, + 0.3983, + 0.4042, + 0.4064, + 0.4019, + 0.3975, + 0.3905, + 0.399, + 0.3953, + 0.3981, + 0.3986, + 0.399, + 0.3963, + 0.4013, + 0.3988, + 0.401, + 0.4042, + 0.3978, + 0.399, + 0.4035, + 0.4022, + 0.4052, + 0.4033, + 0.4035, + 0.4041, + 0.4026, + 0.4046, + 0.4012, + 0.3996, + 0.4052, + 0.4034, + 0.3962, + 0.4036, + 0.3996, + 0.4008, + 0.4053, + 0.4037, + 0.4033, + 0.4058, + 0.408, + 0.4066, + 0.4017, + 0.4038, + 0.4015, + 0.4035, + 0.4052, + 0.4014, + 0.4046, + 0.4027, + 0.4046, + 0.4036, + 0.4035, + 0.4042, + 0.4039, + 0.4033, + 0.4034, + 0.4035 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.04570477455854416, + 0.10783404111862183, + -0.03488321602344513, + -0.0594203844666481, + -0.04577865079045296, + -0.024857502430677414, + -0.03406952694058418, + 0.030555542558431625, + -0.00125521095469594, + 0.010614164173603058, + 0.05838795006275177, + 0.9949829578399658 + ], + "perturbation_rho": [ + -0.010346438735723495, + 0.04423713684082031, + 0.01146540604531765, + 0.03663264587521553, + -0.011911284178495407, + 0.0016591008752584457, + -0.02494950033724308, + 0.02218942530453205, + 0.0039163315668702126, + 0.07129630446434021, + 0.00445366557687521, + -0.01873880997300148 + ], + "nudging": { + "0.001": [ + -2.829881850630045e-06, + -3.539607860147953e-07, + 7.35744833946228e-08, + 8.218921720981598e-08, + 4.21423465013504e-08, + 2.7241185307502747e-08, + 7.008202373981476e-08, + -3.632158041000366e-08, + -3.958120942115784e-09, + -3.073364496231079e-08, + -9.918585419654846e-08, + -1.0794028639793396e-06 + ], + "0.003": [ + -8.66112532094121e-06, + -9.669456630945206e-07, + 1.387670636177063e-07, + 2.7869828045368195e-07, + 1.7974525690078735e-07, + 1.0058283805847168e-07, + 1.448206603527069e-07, + -2.1746382117271423e-07, + -1.0011717677116394e-08, + -1.1711381375789642e-07, + -2.377200871706009e-07, + -3.898283466696739e-06 + ], + "0.01": [ + -2.8825539629906416e-05, + -3.2445532269775867e-06, + 4.411558620631695e-07, + 9.136274456977844e-07, + 6.3673360273242e-07, + 3.696768544614315e-07, + 4.895846359431744e-07, + -5.699694156646729e-07, + -7.869675755500793e-08, + -1.8370337784290314e-07, + -8.582137525081635e-07, + -1.4071993064135313e-05 + ] + }, + "hidden_norms_per_layer": [ + 7405.54296875, + 126799.640625, + 722124.125, + 1197351.125, + 1311770.625, + 1445317.875, + 1575290.0, + 1646774.0, + 1672649.625, + 1692752.625, + 1726090.75, + 1747446.5, + 1108917.0 + ], + "bp_grad_norms_per_layer": [ + 2.2136026018415578e-05, + 1.0887044936680468e-06, + 6.514224537568225e-07, + 6.450830483117898e-07, + 6.397550009751285e-07, + 6.399715175575693e-07, + 6.393033231688605e-07, + 6.382227297763166e-07, + 6.320739203147241e-07, + 6.241282335395226e-07, + 6.161063197396288e-07, + 6.117401767369302e-07, + 5.839314667355211e-07 + ] + }, + "drift": { + "embed.weight": 52.2471866434948, + "embed.bias": 18.97250327390356, + "blocks.0.ln.weight": 1.2566883045780834, + "blocks.0.w1.weight": 17.12006786604635, + "blocks.0.w1.bias": 14.342858083073688, + "blocks.0.w2.weight": 63.004850525998116, + "blocks.1.ln.weight": 1.0284467630081824, + "blocks.1.w1.weight": 21.225831949490352, + "blocks.1.w1.bias": 18.554260026881323, + "blocks.1.w2.weight": 42.67940842745791, + "blocks.2.ln.weight": 0.5431388174757359, + "blocks.2.w1.weight": 20.036899880398536, + "blocks.2.w1.bias": 21.66446091790098, + "blocks.2.w2.weight": 26.571695423395656, + "blocks.3.ln.weight": 0.4791053623183397, + "blocks.3.w1.weight": 17.857825652507895, + "blocks.3.w1.bias": 19.196407269205075, + "blocks.3.w2.weight": 24.453272281036483, + "blocks.4.ln.weight": 0.40179147711472446, + "blocks.4.w1.weight": 16.142007729189494, + "blocks.4.w1.bias": 18.38189338630125, + "blocks.4.w2.weight": 22.251118320035413, + "blocks.5.ln.weight": 0.3999388280630244, + "blocks.5.w1.weight": 16.08867610628456, + "blocks.5.w1.bias": 18.228301269113516, + "blocks.5.w2.weight": 22.282579138688718, + "blocks.6.ln.weight": 0.5139340433841122, + "blocks.6.w1.weight": 16.498928955337856, + "blocks.6.w1.bias": 17.341930385247757, + "blocks.6.w2.weight": 44.47264444577482, + "blocks.7.ln.weight": 0.5190564871460961, + "blocks.7.w1.weight": 15.921519106035, + "blocks.7.w1.bias": 13.554678640598476, + "blocks.7.w2.weight": 55.375944465972985, + "blocks.8.ln.weight": 0.5783217006624557, + "blocks.8.w1.weight": 15.308415657722076, + "blocks.8.w1.bias": 12.359797369765815, + "blocks.8.w2.weight": 60.55354023990087, + "blocks.9.ln.weight": 0.5265177438656736, + "blocks.9.w1.weight": 14.699539264919315, + "blocks.9.w1.bias": 12.199485985244364, + "blocks.9.w2.weight": 53.496852348666465, + "blocks.10.ln.weight": 0.5541756864436261, + "blocks.10.w1.weight": 14.732920668123558, + "blocks.10.w1.bias": 10.868519121164393, + "blocks.10.w2.weight": 61.24451839129346, + "blocks.11.ln.weight": 0.6274670342096703, + "blocks.11.w1.weight": 18.31665424290367, + "blocks.11.w1.bias": 18.6607903814988, + "blocks.11.w2.weight": 57.15975509546593, + "out_ln.weight": 0.317930900746446, + "out_head.weight": 6.3670164706750825, + "out_head.bias": 0.940628348025828 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 12, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/fa_depth_scan_d512", + "methods": [ + "fa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
