{ "42": { "fa": { "log": { "train_loss": [ 2.061217526626587, 1.9565438193130493, 1.9224825448608398, 1.9001438703155518, 1.8821109796524047, 1.8704035317230225, 1.857736103477478, 1.844048505897522, 1.8342980657958985, 1.8290129190063475, 1.8224646506118773, 1.8214716808319091, 1.8136491051483155, 1.8157705508041382, 1.8199064575195312, 1.816836177368164, 1.8065774325180053, 1.8125089934921266, 1.8090396573638916, 1.81023629032135, 1.8082425650787353, 1.8127569119644165, 1.808132509727478, 1.8062178915405274, 1.8039376613998412, 1.8006342431259155, 1.797272424888611, 1.795366856956482, 1.795199264755249, 1.796318228149414, 1.7931722381973267, 1.790380922317505, 1.787453678970337, 1.7863555522918702, 1.7848892670059204, 1.782602568359375, 1.7844260739135742, 1.7822325122833251, 1.7821675496673584, 1.7775094485092162, 1.775276083984375, 1.772415744934082, 1.771381389389038, 1.7729799353790283, 1.7665789907073974, 1.7650687371063232, 1.7673343083953856, 1.7628559505844117, 1.7635160286712646, 1.7610479801177978, 1.757714970741272, 1.7587621269989013, 1.75955526802063, 1.7605536008453369, 1.7632213006973267, 1.7597938927459718, 1.764720836868286, 1.7602048022460937, 1.7601288507843018, 1.7592250678253174, 1.763182290611267, 1.7588830117034913, 1.7620349166107179, 1.762400091934204, 1.7608643816375733, 1.7610327990341186, 1.7634911743164063, 1.761160830154419, 1.7584447234344482, 1.758816735496521, 1.7580244549560546, 1.758498070678711, 1.757904008178711, 1.7605663097381592, 1.7611833373260497, 1.7573552610778809, 1.7571686492538452, 1.7577348608016967, 1.7563239881134034, 1.7563734949493408, 1.757859500465393, 1.7567143533325196, 1.7577434346771241, 1.75511939453125, 1.7555543961334228, 1.756235351524353, 1.7555060604095458, 1.7561510982894897, 1.7538081964874268, 1.7542751317977905, 1.7549605862426758, 1.7509819832611084, 1.755103257446289, 1.7511512590789795, 1.7497140390396118, 1.755158496170044, 1.7556276675033569, 1.7520254708862304, 1.7512920989227294, 1.7526899521255492 ], "train_acc": [ 0.24758, 0.29054, 0.30476, 0.31646, 0.3238, 0.33244, 0.334, 0.33794, 0.34238, 0.34354, 0.3469, 0.34778, 0.34922, 0.34738, 0.34754, 0.3477, 0.3522, 0.35128, 0.3501, 0.34894, 0.3502, 0.34714, 0.35396, 0.35312, 0.35266, 0.35432, 0.35642, 0.35256, 0.35418, 0.35464, 0.35604, 0.35646, 0.35824, 0.35708, 0.35856, 0.35934, 0.35824, 0.35668, 0.36006, 0.36048, 0.36242, 0.3658, 0.36572, 0.36512, 0.36582, 0.36634, 0.36442, 0.36774, 0.3675, 0.36846, 0.36932, 0.36868, 0.3692, 0.36584, 0.36652, 0.3708, 0.36522, 0.36784, 0.36796, 0.37036, 0.36874, 0.37152, 0.37144, 0.37078, 0.36992, 0.37114, 0.3711, 0.37028, 0.37068, 0.37472, 0.3726, 0.372, 0.37436, 0.37286, 0.37184, 0.37572, 0.37322, 0.37538, 0.37558, 0.37514, 0.37416, 0.37244, 0.37488, 0.3776, 0.37426, 0.37688, 0.37648, 0.3746, 0.37672, 0.37686, 0.3762, 0.37536, 0.3752, 0.37636, 0.37886, 0.37486, 0.3733, 0.37878, 0.3779, 0.37676 ], "test_acc": [ 0.3028, 0.3196, 0.3402, 0.3524, 0.3584, 0.3591, 0.3566, 0.3543, 0.3712, 0.3705, 0.3579, 0.3373, 0.3627, 0.3557, 0.3414, 0.3688, 0.3572, 0.3632, 0.354, 0.3634, 0.362, 0.3549, 0.363, 0.3531, 0.345, 0.3459, 0.3517, 0.3421, 0.3294, 0.3398, 0.3294, 0.3409, 0.3476, 0.3318, 0.3477, 0.3302, 0.3283, 0.3309, 0.3337, 0.3497, 0.3314, 0.3292, 0.3374, 0.3361, 0.3335, 0.3461, 0.3254, 0.3366, 0.3353, 0.3288, 0.3467, 0.3374, 0.3445, 0.3415, 0.3358, 0.3474, 0.3382, 0.333, 0.3356, 0.3376, 0.3356, 0.3418, 0.3358, 0.3446, 0.35, 0.3412, 0.3452, 0.3429, 0.3438, 0.3421, 0.3477, 0.3497, 0.3499, 0.3473, 0.3451, 0.3504, 0.3474, 0.3503, 0.344, 0.3497, 0.3487, 0.3488, 0.3521, 0.3509, 0.3455, 0.3511, 0.3469, 0.3474, 0.353, 0.3472, 0.3472, 0.3501, 0.3493, 0.3492, 0.349, 0.3496, 0.3496, 0.3494, 0.3494, 0.3495 ] }, "diagnostics": { "bp_cosine": [ 0.03441809490323067, 0.955886721611023 ], "perturbation_rho": [ 0.04754525423049927, 0.05055658146739006 ], "nudging": { "0.001": [ -5.270587280392647e-06, -7.06920400261879e-06 ], "0.003": [ -1.57852191478014e-05, -2.1289335563778877e-05 ], "0.01": [ -5.261087790131569e-05, -7.100868970155716e-05 ] }, "hidden_norms_per_layer": [ 4686.95556640625, 94784.5546875, 138362.359375 ], "bp_grad_norms_per_layer": [ 1.9998093193862587e-05, 1.4634815670433454e-06, 1.188113401440205e-06 ] }, "drift": { "embed.weight": 28.586715545463985, "embed.bias": 19.716378864552336, "blocks.0.ln.weight": 1.4738119287890208, "blocks.0.w1.weight": 26.045392429453724, "blocks.0.w1.bias": 15.939058582542359, "blocks.0.w2.weight": 59.12906119267325, "blocks.1.ln.weight": 1.2124303196678357, "blocks.1.w1.weight": 16.696964117465345, "blocks.1.w1.bias": 8.535990814749171, "blocks.1.w2.weight": 37.85731940298285, "out_ln.weight": 0.5125606883018807, "out_head.weight": 3.721893823331011, "out_head.bias": 11.592811594248388 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 2, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 42 ], "gpu": 0, "output_dir": "results/fa_depth_scan_d512_L2", "methods": [ "fa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }