{ "42": { "fa": { "log": { "train_loss": [ 2.0427230606079103, 1.9547925742340089, 1.9269662255096436, 1.9024112060546876, 1.88389292137146, 1.874641305809021, 1.8671076870727539, 1.8585125997543335, 1.8507517318725586, 1.8509845052719116, 1.8455515924835204, 1.8402700800323486, 1.8322524318695068, 1.8287768964385986, 1.824175419845581, 1.8240570126342774, 1.817736747970581, 1.8165113877105712, 1.8092418829345702, 1.8068542711639404, 1.8066692431640625, 1.8037006209945678, 1.7959260940551758, 1.797553392868042, 1.7958658642196654, 1.7940396698379517, 1.7932731056976319, 1.7874454331207275, 1.7880735418319702, 1.7836660583496093, 1.7832960818862915, 1.7804118716812134, 1.7788523398208618, 1.772011728515625, 1.7708375668716432, 1.7682569339370728, 1.7717147860336304, 1.7703663568115235, 1.7637487329864503, 1.7676782482910156, 1.7649735053253175, 1.7634011583709717, 1.7645813860702515, 1.7605182119369507, 1.7599670697021483, 1.7621903922271729, 1.756671106300354, 1.7577124716949464, 1.7564089126205444, 1.7521357986450194, 1.7525928847885133, 1.7497260301971436, 1.7528332720184325, 1.7475884844207763, 1.7469696446990968, 1.7445055263519287, 1.752090754776001, 1.7456406805038451, 1.747734097251892, 1.7441029932403564, 1.743490291824341, 1.7414577841949463, 1.742126556777954, 1.7391094409942627, 1.7401588076019288, 1.7370625415420533, 1.7388630017471314, 1.7353392750930785, 1.736816965751648, 1.7355695288085937, 1.73539924369812, 1.7323005257797242, 1.7321935805511475, 1.7312652449798585, 1.7298928540420533, 1.73121183719635, 1.7288608194351196, 1.7294834777069092, 1.726299252166748, 1.73074989528656, 1.7293904189682008, 1.7276834594345092, 1.7300372393035888, 1.731684062461853, 1.7275019702529908, 1.729561651916504, 1.7284230736923218, 1.7257295697021484, 1.7226565048217772, 1.726801979408264, 1.7250631372833252, 1.7279036038970947, 1.726708238143921, 1.7242388882064819, 1.7248469045257568, 1.7260398196411133, 1.721121542892456, 1.7220706603240967, 1.7268135174942016, 1.729515742111206 ], "train_acc": [ 0.24062, 0.28346, 0.2951, 0.30692, 0.31778, 0.3211, 0.32388, 0.32854, 0.33456, 0.33332, 0.33668, 0.33984, 0.34108, 0.34376, 0.346, 0.34636, 0.35004, 0.34922, 0.35104, 0.35196, 0.35292, 0.35532, 0.3572, 0.35614, 0.3578, 0.35934, 0.35694, 0.35918, 0.36018, 0.35928, 0.3622, 0.362, 0.36236, 0.36548, 0.36778, 0.36536, 0.36884, 0.367, 0.36852, 0.36842, 0.36944, 0.36784, 0.3697, 0.37156, 0.37064, 0.3725, 0.37072, 0.37062, 0.37082, 0.37298, 0.37268, 0.37554, 0.3732, 0.3752, 0.37724, 0.37652, 0.37506, 0.37708, 0.37712, 0.37668, 0.37814, 0.37944, 0.37878, 0.37886, 0.38042, 0.3778, 0.38022, 0.37988, 0.38096, 0.3807, 0.3811, 0.38084, 0.37994, 0.37914, 0.38104, 0.38152, 0.38376, 0.38158, 0.38472, 0.38244, 0.38066, 0.38392, 0.3839, 0.38222, 0.38382, 0.38384, 0.38472, 0.385, 0.38792, 0.3839, 0.38516, 0.3858, 0.38262, 0.38758, 0.38396, 0.38268, 0.38628, 0.38618, 0.3846, 0.38336 ], "test_acc": [ 0.2963, 0.3132, 0.3406, 0.3377, 0.3353, 0.3407, 0.3367, 0.3657, 0.3618, 0.3712, 0.3519, 0.3722, 0.371, 0.379, 0.3666, 0.372, 0.3674, 0.3754, 0.3733, 0.3747, 0.3712, 0.3772, 0.3792, 0.3804, 0.3742, 0.3852, 0.3864, 0.3907, 0.3861, 0.3827, 0.3852, 0.3833, 0.3885, 0.3865, 0.3933, 0.391, 0.3837, 0.3915, 0.4, 0.4088, 0.3956, 0.3878, 0.407, 0.3928, 0.3983, 0.4042, 0.4064, 0.4019, 0.3975, 0.3905, 0.399, 0.3953, 0.3981, 0.3986, 0.399, 0.3963, 0.4013, 0.3988, 0.401, 0.4042, 0.3978, 0.399, 0.4035, 0.4022, 0.4052, 0.4033, 0.4035, 0.4041, 0.4026, 0.4046, 0.4012, 0.3996, 0.4052, 0.4034, 0.3962, 0.4036, 0.3996, 0.4008, 0.4053, 0.4037, 0.4033, 0.4058, 0.408, 0.4066, 0.4017, 0.4038, 0.4015, 0.4035, 0.4052, 0.4014, 0.4046, 0.4027, 0.4046, 0.4036, 0.4035, 0.4042, 0.4039, 0.4033, 0.4034, 0.4035 ] }, "diagnostics": { "bp_cosine": [ 0.04570477455854416, 0.10783404111862183, -0.03488321602344513, -0.0594203844666481, -0.04577865079045296, -0.024857502430677414, -0.03406952694058418, 0.030555542558431625, -0.00125521095469594, 0.010614164173603058, 0.05838795006275177, 0.9949829578399658 ], "perturbation_rho": [ -0.010346438735723495, 0.04423713684082031, 0.01146540604531765, 0.03663264587521553, -0.011911284178495407, 0.0016591008752584457, -0.02494950033724308, 0.02218942530453205, 0.0039163315668702126, 0.07129630446434021, 0.00445366557687521, -0.01873880997300148 ], "nudging": { "0.001": [ -2.829881850630045e-06, -3.539607860147953e-07, 7.35744833946228e-08, 8.218921720981598e-08, 4.21423465013504e-08, 2.7241185307502747e-08, 7.008202373981476e-08, -3.632158041000366e-08, -3.958120942115784e-09, -3.073364496231079e-08, -9.918585419654846e-08, -1.0794028639793396e-06 ], "0.003": [ -8.66112532094121e-06, -9.669456630945206e-07, 1.387670636177063e-07, 2.7869828045368195e-07, 1.7974525690078735e-07, 1.0058283805847168e-07, 1.448206603527069e-07, -2.1746382117271423e-07, -1.0011717677116394e-08, -1.1711381375789642e-07, -2.377200871706009e-07, -3.898283466696739e-06 ], "0.01": [ -2.8825539629906416e-05, -3.2445532269775867e-06, 4.411558620631695e-07, 9.136274456977844e-07, 6.3673360273242e-07, 3.696768544614315e-07, 4.895846359431744e-07, -5.699694156646729e-07, -7.869675755500793e-08, -1.8370337784290314e-07, -8.582137525081635e-07, -1.4071993064135313e-05 ] }, "hidden_norms_per_layer": [ 7405.54296875, 126799.640625, 722124.125, 1197351.125, 1311770.625, 1445317.875, 1575290.0, 1646774.0, 1672649.625, 1692752.625, 1726090.75, 1747446.5, 1108917.0 ], "bp_grad_norms_per_layer": [ 2.2136026018415578e-05, 1.0887044936680468e-06, 6.514224537568225e-07, 6.450830483117898e-07, 6.397550009751285e-07, 6.399715175575693e-07, 6.393033231688605e-07, 6.382227297763166e-07, 6.320739203147241e-07, 6.241282335395226e-07, 6.161063197396288e-07, 6.117401767369302e-07, 5.839314667355211e-07 ] }, "drift": { "embed.weight": 52.2471866434948, "embed.bias": 18.97250327390356, "blocks.0.ln.weight": 1.2566883045780834, "blocks.0.w1.weight": 17.12006786604635, "blocks.0.w1.bias": 14.342858083073688, "blocks.0.w2.weight": 63.004850525998116, "blocks.1.ln.weight": 1.0284467630081824, "blocks.1.w1.weight": 21.225831949490352, "blocks.1.w1.bias": 18.554260026881323, "blocks.1.w2.weight": 42.67940842745791, "blocks.2.ln.weight": 0.5431388174757359, "blocks.2.w1.weight": 20.036899880398536, "blocks.2.w1.bias": 21.66446091790098, "blocks.2.w2.weight": 26.571695423395656, "blocks.3.ln.weight": 0.4791053623183397, "blocks.3.w1.weight": 17.857825652507895, "blocks.3.w1.bias": 19.196407269205075, "blocks.3.w2.weight": 24.453272281036483, "blocks.4.ln.weight": 0.40179147711472446, "blocks.4.w1.weight": 16.142007729189494, "blocks.4.w1.bias": 18.38189338630125, "blocks.4.w2.weight": 22.251118320035413, "blocks.5.ln.weight": 0.3999388280630244, "blocks.5.w1.weight": 16.08867610628456, "blocks.5.w1.bias": 18.228301269113516, "blocks.5.w2.weight": 22.282579138688718, "blocks.6.ln.weight": 0.5139340433841122, "blocks.6.w1.weight": 16.498928955337856, "blocks.6.w1.bias": 17.341930385247757, "blocks.6.w2.weight": 44.47264444577482, "blocks.7.ln.weight": 0.5190564871460961, "blocks.7.w1.weight": 15.921519106035, "blocks.7.w1.bias": 13.554678640598476, "blocks.7.w2.weight": 55.375944465972985, "blocks.8.ln.weight": 0.5783217006624557, "blocks.8.w1.weight": 15.308415657722076, "blocks.8.w1.bias": 12.359797369765815, "blocks.8.w2.weight": 60.55354023990087, "blocks.9.ln.weight": 0.5265177438656736, "blocks.9.w1.weight": 14.699539264919315, "blocks.9.w1.bias": 12.199485985244364, "blocks.9.w2.weight": 53.496852348666465, "blocks.10.ln.weight": 0.5541756864436261, "blocks.10.w1.weight": 14.732920668123558, "blocks.10.w1.bias": 10.868519121164393, "blocks.10.w2.weight": 61.24451839129346, "blocks.11.ln.weight": 0.6274670342096703, "blocks.11.w1.weight": 18.31665424290367, "blocks.11.w1.bias": 18.6607903814988, "blocks.11.w2.weight": 57.15975509546593, "out_ln.weight": 0.317930900746446, "out_head.weight": 6.3670164706750825, "out_head.bias": 0.940628348025828 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 12, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 42 ], "gpu": 0, "output_dir": "results/fa_depth_scan_d512", "methods": [ "fa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }