diff options
Diffstat (limited to 'results/cifar100_d256_L4_s42/results_cifar100.json')
| -rw-r--r-- | results/cifar100_d256_L4_s42/results_cifar100.json | 1175 |
1 files changed, 1175 insertions, 0 deletions
diff --git a/results/cifar100_d256_L4_s42/results_cifar100.json b/results/cifar100_d256_L4_s42/results_cifar100.json new file mode 100644 index 0000000..d7c1337 --- /dev/null +++ b/results/cifar100_d256_L4_s42/results_cifar100.json @@ -0,0 +1,1175 @@ +{ + "42": { + "bp": { + "log": { + "train_loss": [ + 3.975249941253662, + 3.6423986249542235, + 3.4934494227600097, + 3.3944045304870607, + 3.3128096391296387, + 3.249527327423096, + 3.202136681060791, + 3.1545809954071045, + 3.118299830780029, + 3.08477955947876, + 3.05101420211792, + 3.014707311477661, + 2.9815688012695314, + 2.9542644719696045, + 2.917737830657959, + 2.8987481777954103, + 2.877259644317627, + 2.8476891691589357, + 2.826910527801514, + 2.8041292054748537, + 2.7817903074645995, + 2.7624645190429686, + 2.736394059448242, + 2.7153989936065672, + 2.6938070545959474, + 2.6722896592712404, + 2.656808620452881, + 2.6342206648254396, + 2.6130940935516356, + 2.601909016876221, + 2.5847591175842286, + 2.5616293630218507, + 2.540946982421875, + 2.528531006851196, + 2.508262563323975, + 2.494774736251831, + 2.471127844619751, + 2.455823439178467, + 2.443439641647339, + 2.419278503417969, + 2.409900106124878, + 2.3866433473205566, + 2.3731185454559327, + 2.348314314727783, + 2.336296524658203, + 2.3228698544311523, + 2.299138896865845, + 2.2919679093933105, + 2.271020979156494, + 2.263141948699951, + 2.242116179199219, + 2.2228171809387205, + 2.210650175628662, + 2.1947706311798094, + 2.1783614316558837, + 2.1615723634338377, + 2.152301993675232, + 2.139739892730713, + 2.11690347366333, + 2.1134400886535643, + 2.0890519944000245, + 2.076347621765137, + 2.067469055480957, + 2.0518165933990478, + 2.041287666015625, + 2.027727124786377, + 2.0111099968719484, + 1.9989793057250977, + 1.991382496948242, + 1.9685791171264648, + 1.966265661239624, + 1.9562527508544922, + 1.942470475769043, + 1.9250774355316163, + 1.9187585319137572, + 1.9093894129943847, + 1.9017769010162353, + 1.8909222549438476, + 1.8789906490707398, + 1.87238977394104, + 1.876755567703247, + 1.8579993398284913, + 1.8549057474517823, + 1.8437388555145264, + 1.83396729637146, + 1.8345417359161378, + 1.83224958152771, + 1.8185578295516969, + 1.8260858072280883, + 1.8161109666442872, + 1.8139908428573608, + 1.8139760601043702, + 1.8037351627349854, + 1.8002028354644775, + 1.8035412215423583, + 1.8000410940933227, + 1.7957222201156615, + 1.79567547290802, + 1.7953530138397218, + 1.7897127409744262 + ], + "train_acc": [ + 0.09828, + 0.14442, + 0.16788, + 0.18412, + 0.1995, + 0.21148, + 0.21652, + 0.2278, + 0.23422, + 0.24242, + 0.24772, + 0.25402, + 0.26126, + 0.2639, + 0.27258, + 0.27642, + 0.2808, + 0.28564, + 0.2893, + 0.29352, + 0.29922, + 0.3014, + 0.30794, + 0.31222, + 0.31722, + 0.322, + 0.32392, + 0.32726, + 0.33092, + 0.3352, + 0.33782, + 0.34382, + 0.34482, + 0.34966, + 0.3531, + 0.35308, + 0.36068, + 0.36312, + 0.36942, + 0.37268, + 0.3705, + 0.3762, + 0.38242, + 0.38778, + 0.38854, + 0.39198, + 0.3985, + 0.39664, + 0.4058, + 0.40534, + 0.40916, + 0.41304, + 0.41528, + 0.42002, + 0.42598, + 0.4278, + 0.42834, + 0.43244, + 0.43612, + 0.43712, + 0.4414, + 0.44592, + 0.44574, + 0.44904, + 0.4551, + 0.45958, + 0.46296, + 0.4616, + 0.46646, + 0.47288, + 0.4693, + 0.47354, + 0.47626, + 0.48042, + 0.4848, + 0.48688, + 0.4857, + 0.4874, + 0.49078, + 0.49406, + 0.49478, + 0.49768, + 0.49744, + 0.50144, + 0.50262, + 0.5014, + 0.50426, + 0.5064, + 0.5074, + 0.50692, + 0.50832, + 0.50964, + 0.5119, + 0.51018, + 0.5099, + 0.51064, + 0.51258, + 0.515, + 0.51522, + 0.5126 + ], + "test_acc": [ + 0.1432, + 0.181, + 0.1871, + 0.212, + 0.2185, + 0.2122, + 0.2368, + 0.2466, + 0.241, + 0.2492, + 0.2563, + 0.2629, + 0.2656, + 0.2695, + 0.2731, + 0.2753, + 0.2737, + 0.2823, + 0.2832, + 0.2883, + 0.2946, + 0.2915, + 0.2957, + 0.2922, + 0.2981, + 0.294, + 0.2961, + 0.301, + 0.3015, + 0.3078, + 0.3127, + 0.3097, + 0.308, + 0.3058, + 0.3138, + 0.3098, + 0.3114, + 0.3129, + 0.3126, + 0.3158, + 0.3146, + 0.3119, + 0.313, + 0.3137, + 0.3127, + 0.3167, + 0.3186, + 0.3181, + 0.3165, + 0.316, + 0.3222, + 0.3188, + 0.3228, + 0.3173, + 0.3178, + 0.3174, + 0.3217, + 0.3173, + 0.3196, + 0.3223, + 0.3181, + 0.3186, + 0.3196, + 0.3161, + 0.3202, + 0.314, + 0.3178, + 0.3172, + 0.3174, + 0.3207, + 0.3193, + 0.3214, + 0.3213, + 0.3175, + 0.3228, + 0.3207, + 0.3208, + 0.3213, + 0.3187, + 0.3197, + 0.3226, + 0.32, + 0.3205, + 0.3213, + 0.3217, + 0.3192, + 0.3203, + 0.3207, + 0.3209, + 0.3197, + 0.3207, + 0.3195, + 0.3192, + 0.3186, + 0.3178, + 0.3191, + 0.3189, + 0.3193, + 0.3189, + 0.3192 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.9980340600013733, + 0.9982945919036865, + 0.9984437227249146, + 0.9987074136734009 + ], + "nudging": { + "0.001": [ + -0.0022835906129330397, + -0.0023387258406728506, + -0.002373999450355768, + -0.002260879147797823 + ], + "0.003": [ + -0.006846790201961994, + -0.007012245710939169, + -0.007117925677448511, + -0.006779024377465248 + ], + "0.01": [ + -0.022776642814278603, + -0.02332628145813942, + -0.023679494857788086, + -0.02255532145500183 + ] + }, + "hidden_norms_per_layer": [ + 236.57855224609375, + 217.48927307128906, + 197.1617889404297, + 187.24839782714844, + 191.277587890625 + ], + "bp_grad_norms_per_layer": [ + 0.0010384325869381428, + 0.0010872395941987634, + 0.0011213896796107292, + 0.001103188842535019, + 0.0009315301431342959 + ] + }, + "drift": { + "embed.weight": 7.433656905137662, + "embed.bias": 13.602162006682997, + "blocks.0.ln.weight": 0.14788760244846344, + "blocks.0.w1.weight": 3.605816897627063, + "blocks.0.w1.bias": 5.290238058535016, + "blocks.0.w2.weight": 13.310045077395138, + "blocks.1.ln.weight": 0.2914122939109802, + "blocks.1.w1.weight": 3.997572101972956, + "blocks.1.w1.bias": 4.732854205627193, + "blocks.1.w2.weight": 14.921397012401421, + "blocks.2.ln.weight": 0.35930144786834717, + "blocks.2.w1.weight": 4.149029664687284, + "blocks.2.w1.bias": 3.8845074849434162, + "blocks.2.w2.weight": 16.00171210299565, + "blocks.3.ln.weight": 0.5467617511749268, + "blocks.3.w1.weight": 4.475958556672767, + "blocks.3.w1.bias": 3.7954587976923664, + "blocks.3.w2.weight": 17.52879838948756, + "out_ln.weight": 0.1443399339914322, + "out_head.weight": 2.871805586504566, + "out_head.bias": 3.1293217686796893 + } + }, + "dfa": { + "log": { + "train_loss": [ + 4.17356710144043, + 4.045213865203857, + 4.0394830491638185, + 4.052726871032715, + 4.062585520324707, + 4.077131650848389, + 4.081288940353393, + 4.082902023620606, + 4.082292946929932, + 4.084377682189942, + 4.082009593811035, + 4.078371176147461, + 4.0787283967590335, + 4.0781014080810545, + 4.071053223266602, + 4.073739369049072, + 4.070565816497803, + 4.068224396362305, + 4.064294567718506, + 4.062663984680176, + 4.060789375686645, + 4.060499965057373, + 4.05942348953247, + 4.05340063583374, + 4.054450568389893, + 4.051036394500732, + 4.052292782592773, + 4.04923277923584, + 4.047891028900146, + 4.046583199005127, + 4.046011067352295, + 4.0444303074646, + 4.045907030334472, + 4.044839619445801, + 4.03859343673706, + 4.043664588165283, + 4.0400294355773925, + 4.035496199493408, + 4.038207025909424, + 4.035675854187012, + 4.037980937347412, + 4.038932502746582, + 4.036024468383789, + 4.037031109313965, + 4.034120268630981, + 4.036895367584228, + 4.037431150054932, + 4.033238902282715, + 4.036427326049805, + 4.03467604888916, + 4.03339782157898, + 4.0328554144287105, + 4.031013775024414, + 4.031612381286621, + 4.0287201686096195, + 4.031132036132813, + 4.029230642242432, + 4.029863064575196, + 4.03147859588623, + 4.029825403366089, + 4.030359633789063, + 4.028107041168213, + 4.02976943069458, + 4.029035094909668, + 4.028509668731689, + 4.0304917379760745, + 4.030941032562255, + 4.026340734710693, + 4.027734536590576, + 4.024428620147705, + 4.025526253967286, + 4.025494504394532, + 4.026692573547363, + 4.0229616456604, + 4.026408356018067, + 4.024612335662842, + 4.023342019500732, + 4.024318858337402, + 4.023249450683593, + 4.023151823806763, + 4.026289680709839, + 4.023877305831909, + 4.023189326248169, + 4.022549798278809, + 4.024784528045655, + 4.022774189758301, + 4.024208254547119, + 4.023730496368408, + 4.02367640625, + 4.021903743209839, + 4.02390080947876, + 4.022859935150146, + 4.023393632354736, + 4.021766328201294, + 4.02325630645752, + 4.023518178710938, + 4.021166778717041, + 4.023976897583008, + 4.023609465179443, + 4.024444749069214 + ], + "train_acc": [ + 0.06788, + 0.08332, + 0.08406, + 0.0818, + 0.08046, + 0.08148, + 0.07862, + 0.07956, + 0.08038, + 0.07976, + 0.08042, + 0.0808, + 0.08058, + 0.08086, + 0.08006, + 0.08136, + 0.08244, + 0.08388, + 0.08354, + 0.084, + 0.08448, + 0.08518, + 0.08594, + 0.08624, + 0.08568, + 0.08764, + 0.08492, + 0.08604, + 0.08814, + 0.0876, + 0.08836, + 0.08956, + 0.08702, + 0.08854, + 0.08976, + 0.08954, + 0.0895, + 0.09006, + 0.0894, + 0.08964, + 0.09064, + 0.09034, + 0.09288, + 0.0913, + 0.0914, + 0.09116, + 0.09094, + 0.09192, + 0.09044, + 0.0909, + 0.09252, + 0.09214, + 0.09332, + 0.0931, + 0.09364, + 0.09176, + 0.09246, + 0.09302, + 0.09276, + 0.09334, + 0.09404, + 0.0942, + 0.09392, + 0.09358, + 0.09336, + 0.09392, + 0.09252, + 0.0949, + 0.09444, + 0.0958, + 0.09542, + 0.0949, + 0.0954, + 0.09438, + 0.09338, + 0.0958, + 0.09376, + 0.0959, + 0.09448, + 0.09388, + 0.09458, + 0.09422, + 0.09542, + 0.09522, + 0.09468, + 0.0951, + 0.09564, + 0.09586, + 0.09536, + 0.09624, + 0.09588, + 0.09594, + 0.09642, + 0.09588, + 0.09496, + 0.09496, + 0.096, + 0.09454, + 0.09542, + 0.09488 + ], + "test_acc": [ + 0.0775, + 0.0794, + 0.0808, + 0.0828, + 0.0742, + 0.0795, + 0.0788, + 0.0855, + 0.0809, + 0.0819, + 0.0767, + 0.0826, + 0.0854, + 0.0752, + 0.0798, + 0.0796, + 0.0813, + 0.0771, + 0.0823, + 0.0759, + 0.0814, + 0.0772, + 0.0826, + 0.079, + 0.0803, + 0.0815, + 0.0818, + 0.0819, + 0.0818, + 0.084, + 0.0853, + 0.0855, + 0.0875, + 0.0818, + 0.0861, + 0.0827, + 0.0847, + 0.0825, + 0.0853, + 0.0862, + 0.0841, + 0.0857, + 0.0852, + 0.0852, + 0.0827, + 0.0863, + 0.0878, + 0.0858, + 0.0857, + 0.0879, + 0.0888, + 0.088, + 0.0878, + 0.0871, + 0.0878, + 0.0845, + 0.0863, + 0.0852, + 0.0872, + 0.0879, + 0.086, + 0.0878, + 0.0851, + 0.0863, + 0.0877, + 0.0861, + 0.0889, + 0.0839, + 0.0893, + 0.0883, + 0.0867, + 0.0855, + 0.0878, + 0.086, + 0.0876, + 0.0882, + 0.0895, + 0.0877, + 0.0876, + 0.0871, + 0.088, + 0.0876, + 0.088, + 0.0885, + 0.0879, + 0.0888, + 0.0882, + 0.0876, + 0.0882, + 0.087, + 0.0873, + 0.0877, + 0.0876, + 0.0882, + 0.0878, + 0.0876, + 0.0877, + 0.0876, + 0.0875, + 0.0875 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.14061881601810455, + 0.0022556069307029247, + -0.009000124409794807, + -0.013949227519333363 + ], + "perturbation_rho": [ + 0.04333949834108353, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -5.513429641723633e-07, + 0.0, + 0.0, + -3.725290298461914e-09 + ], + "0.003": [ + -1.7480924725532532e-06, + -1.4901161193847656e-08, + 0.0, + -1.862645149230957e-09 + ], + "0.01": [ + -5.760230123996735e-06, + 2.3283064365386963e-08, + -1.862645149230957e-09, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 20187.3125, + 13252251.0, + 93144488.0, + 163952208.0, + 202900624.0 + ], + "bp_grad_norms_per_layer": [ + 1.3867399957234738e-06, + 9.786202070927175e-09, + 9.394233835280374e-09, + 9.39475075512064e-09, + 9.382485899323001e-09 + ] + }, + "drift": { + "embed.weight": 164.5243882671684, + "embed.bias": 86.31975598233767, + "blocks.0.ln.weight": 9.94965648651123, + "blocks.0.w1.weight": 116.60864500939675, + "blocks.0.w1.bias": 119.5896283256837, + "blocks.0.w2.weight": 139.89574047116318, + "blocks.1.ln.weight": 6.952559471130371, + "blocks.1.w1.weight": 171.01066211955538, + "blocks.1.w1.bias": 184.66872276388008, + "blocks.1.w2.weight": 113.70390206644275, + "blocks.2.ln.weight": 8.037435531616211, + "blocks.2.w1.weight": 204.0534914689403, + "blocks.2.w1.bias": 205.1741516813065, + "blocks.2.w2.weight": 112.9529550385935, + "blocks.3.ln.weight": 7.489717483520508, + "blocks.3.w1.weight": 199.12470243900225, + "blocks.3.w1.bias": 198.81992912624156, + "blocks.3.w2.weight": 104.7339169635497, + "out_ln.weight": 1.6446622610092163, + "out_head.weight": 8.633984180685534, + "out_head.bias": 0.8233496742420285 + } + }, + "fa": { + "log": { + "train_loss": [ + 4.184186522827148, + 4.179929753265381, + 4.089846964416504, + 4.048904882202148, + 4.019415323638916, + 4.003474291839599, + 3.9891197368621825, + 3.9800468362426757, + 3.9685846406555174, + 3.9551162309265138, + 3.942166231536865, + 3.9271056993865967, + 3.915979294891357, + 3.9063652964782714, + 3.8933532473754884, + 3.892304434890747, + 3.8851386541748045, + 3.880706764526367, + 3.8791183966064455, + 3.874532577972412, + 3.870268273162842, + 3.8705162049865725, + 3.8667305128479006, + 3.8626690478515626, + 3.8593408808898926, + 3.8570751000213623, + 3.858237083206177, + 3.8517847180938722, + 3.8476831745910642, + 3.8457262559509275, + 3.840909554901123, + 3.835939132537842, + 3.834127527542114, + 3.830621910324097, + 3.8192956964874267, + 3.8194126902770997, + 3.8129332183074953, + 3.803470793991089, + 3.8037892980194092, + 3.7975124457550047, + 3.7967339707946777, + 3.7944636122131348, + 3.786077890625, + 3.7846675917053223, + 3.7791504066467283, + 3.7762106622314455, + 3.777709127731323, + 3.7638775648498535, + 3.765332045440674, + 3.7623159846496583, + 3.761364775314331, + 3.7529254064178468, + 3.749479592971802, + 3.744997635345459, + 3.7406992932128906, + 3.74050118598938, + 3.740082041091919, + 3.7403511964416505, + 3.7391156189727783, + 3.7338412855529786, + 3.733470021286011, + 3.726227327346802, + 3.7261299742889404, + 3.722200173187256, + 3.7222453344726563, + 3.7236415620422365, + 3.720610160598755, + 3.71873546585083, + 3.7171892735290526, + 3.710947210006714, + 3.7083427098846435, + 3.7072678149414062, + 3.70656751663208, + 3.704509799041748, + 3.7028028456115725, + 3.7015775603485106, + 3.7001070789337156, + 3.6981460167694093, + 3.696165197067261, + 3.6909815367889403, + 3.6975155518341065, + 3.693085638427734, + 3.6924814643096924, + 3.6891826426696777, + 3.688821280517578, + 3.689004655685425, + 3.6925391107177736, + 3.6897733489990236, + 3.687680895843506, + 3.6844489430236815, + 3.688553215789795, + 3.6839564624023438, + 3.685328346557617, + 3.6844889741516114, + 3.682617470626831, + 3.685823777923584, + 3.6817508575439453, + 3.6835061328125, + 3.683719411773682, + 3.685913360671997 + ], + "train_acc": [ + 0.06392, + 0.06052, + 0.07254, + 0.0799, + 0.0863, + 0.08926, + 0.09172, + 0.09366, + 0.0967, + 0.09784, + 0.10026, + 0.10226, + 0.10344, + 0.10226, + 0.10548, + 0.10614, + 0.10576, + 0.1094, + 0.10852, + 0.11026, + 0.1109, + 0.1113, + 0.11464, + 0.11204, + 0.114, + 0.11382, + 0.11484, + 0.11308, + 0.11652, + 0.116, + 0.11544, + 0.11934, + 0.1164, + 0.11756, + 0.12118, + 0.12098, + 0.1208, + 0.1226, + 0.12196, + 0.12346, + 0.1241, + 0.12418, + 0.12376, + 0.12556, + 0.12682, + 0.12578, + 0.12646, + 0.12802, + 0.12834, + 0.12896, + 0.1285, + 0.13022, + 0.13064, + 0.13266, + 0.132, + 0.13304, + 0.13302, + 0.13274, + 0.13234, + 0.13406, + 0.1352, + 0.1352, + 0.13452, + 0.13546, + 0.1378, + 0.1353, + 0.13576, + 0.13548, + 0.13744, + 0.1404, + 0.13826, + 0.13848, + 0.14008, + 0.13914, + 0.13812, + 0.14022, + 0.14048, + 0.14066, + 0.14008, + 0.1426, + 0.1408, + 0.1407, + 0.1429, + 0.14204, + 0.14294, + 0.14272, + 0.14102, + 0.14226, + 0.14414, + 0.1436, + 0.14408, + 0.14312, + 0.1434, + 0.14338, + 0.14488, + 0.14448, + 0.14394, + 0.1426, + 0.14502, + 0.14398 + ], + "test_acc": [ + 0.0598, + 0.0694, + 0.069, + 0.0805, + 0.086, + 0.0911, + 0.0953, + 0.0986, + 0.0954, + 0.0949, + 0.0993, + 0.1051, + 0.1069, + 0.1004, + 0.1066, + 0.11, + 0.1087, + 0.1039, + 0.1151, + 0.1101, + 0.1136, + 0.1096, + 0.1118, + 0.1138, + 0.1155, + 0.1151, + 0.1171, + 0.1197, + 0.1188, + 0.1212, + 0.1182, + 0.1194, + 0.12, + 0.122, + 0.1259, + 0.1204, + 0.1205, + 0.1259, + 0.1231, + 0.1247, + 0.1263, + 0.1294, + 0.1233, + 0.1265, + 0.1299, + 0.1267, + 0.1297, + 0.1338, + 0.1276, + 0.1332, + 0.1337, + 0.1302, + 0.1399, + 0.1354, + 0.1322, + 0.1382, + 0.1372, + 0.1363, + 0.1369, + 0.1397, + 0.1357, + 0.1394, + 0.144, + 0.1395, + 0.1448, + 0.1373, + 0.1435, + 0.1417, + 0.1398, + 0.14, + 0.1409, + 0.1409, + 0.1408, + 0.141, + 0.145, + 0.1425, + 0.1425, + 0.1452, + 0.1449, + 0.1457, + 0.1432, + 0.1449, + 0.1446, + 0.1486, + 0.1429, + 0.1477, + 0.1458, + 0.146, + 0.1449, + 0.1455, + 0.1442, + 0.1453, + 0.1458, + 0.1462, + 0.1468, + 0.1456, + 0.1462, + 0.1464, + 0.1465, + 0.1464 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.032749101519584656, + -0.02806573174893856, + -0.13188865780830383, + 0.9981366395950317 + ], + "perturbation_rho": [ + 0.023128217086195946, + -0.033153705298900604, + -0.03114410489797592, + -0.04209538549184799 + ], + "nudging": { + "0.001": [ + -3.4319236874580383e-07, + 3.664754331111908e-07, + 2.3958273231983185e-07, + -1.4158431440591812e-06 + ], + "0.003": [ + -1.9101426005363464e-06, + 6.353948265314102e-07, + 1.5594996511936188e-06, + -8.973991498351097e-06 + ], + "0.01": [ + -6.851274520158768e-06, + 8.617062121629715e-07, + 6.175599992275238e-06, + -3.897189162671566e-05 + ] + }, + "hidden_norms_per_layer": [ + 10709.3916015625, + 183619.875, + 1852831.0, + 3034211.25, + 169794.0625 + ], + "bp_grad_norms_per_layer": [ + 1.2192158465040848e-05, + 2.159640871468582e-06, + 1.9386970961932093e-06, + 1.93888718058588e-06, + 1.940315996762365e-06 + ] + }, + "drift": { + "embed.weight": 97.51059845469358, + "embed.bias": 45.31500470139968, + "blocks.0.ln.weight": 2.126800775527954, + "blocks.0.w1.weight": 24.113425166766486, + "blocks.0.w1.bias": 25.534244327420822, + "blocks.0.w2.weight": 69.8748433766199, + "blocks.1.ln.weight": 1.5964641571044922, + "blocks.1.w1.weight": 35.519098992915914, + "blocks.1.w1.bias": 42.27561830539123, + "blocks.1.w2.weight": 61.05750225415427, + "blocks.2.ln.weight": 1.4540088176727295, + "blocks.2.w1.weight": 41.92037705190106, + "blocks.2.w1.bias": 47.8882125375433, + "blocks.2.w2.weight": 47.86373297818362, + "blocks.3.ln.weight": 1.6165372133255005, + "blocks.3.w1.weight": 47.10451321088829, + "blocks.3.w1.bias": 53.07025310766248, + "blocks.3.w2.weight": 48.00579573400754, + "out_ln.weight": 0.49529579281806946, + "out_head.weight": 4.173857948425521, + "out_head.bias": 3.4238911704789996 + } + } + }, + "config": { + "dataset": "cifar100", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/cifar100_d256_L4_s42", + "methods": [ + "bp", + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 100 + } +}
\ No newline at end of file |
