{ "3": { "dfa": { "log": { "train_loss": [ 2.080998458023071, 2.0535908667755125, 2.0456236054992676, 2.0437664754867555, 2.04373485496521, 2.0431359854125977, 2.0434441787338256, 2.0382570924377443, 2.038818662261963, 2.0345919523620606, 2.03406599155426, 2.031346089324951, 2.0293883434677125, 2.0278041764831545, 2.0296552677154542, 2.0259662225723267, 2.0258015427017213, 2.024105228805542, 2.0241383403778075, 2.0237019972991943, 2.021524270172119, 2.0192913208389283, 2.020055650939941, 2.0187213849639893, 2.0182762395858767, 2.018081063079834, 2.0169390340805053, 2.015762889480591, 2.014286817321777, 2.0149634075164795, 2.012851970252991, 2.0143834255218507, 2.012589658126831, 2.013470998764038, 2.0132155655670165, 2.0125345434570314, 2.014651682510376, 2.011008670730591, 2.010692717514038, 2.0098264505767824, 2.010699557571411, 2.010047173309326, 2.0120795148086548, 2.012862138290405, 2.010627545700073, 2.012053688697815, 2.012078428192139, 2.0087205919647215, 2.010501960144043, 2.0095251747131346, 2.0100318467712404, 2.009802308883667, 2.008675379104614, 2.009749626541138, 2.0081673904037474, 2.010975965423584, 2.0075539178466797, 2.007934888153076, 2.0076504850769044, 2.0063897485733033, 2.007999542160034, 2.0096467161560057, 2.0087811013031005, 2.0079173694229127, 2.005330057106018, 2.006340228881836, 2.008018601989746, 2.0075161946868896, 2.0061075159454345, 2.00557112739563, 2.0092006335449217, 2.005981811904907, 2.008798143310547, 2.006232444229126, 2.0086249324798584, 2.0055838273620608, 2.0056044164276123, 2.0061014500427246, 2.00520422416687, 2.0060690811538695, 2.0042829446411132, 2.007496082611084, 2.006376414794922, 2.007382208404541, 2.0068653521347044, 2.00715774230957, 2.0046533392715453, 2.0055563162994385, 2.0043802153778074, 2.00596639465332, 2.0056586725234986, 2.0065873177337648, 2.006924060974121, 2.007017402496338, 2.007137279701233, 2.007027236022949, 2.005679884109497, 2.00417349899292, 2.006064287567139, 2.0064190141296385 ], "train_acc": [ 0.2315, 0.2422, 0.242, 0.2424, 0.24744, 0.24618, 0.24638, 0.25122, 0.2481, 0.2553, 0.25512, 0.25802, 0.2577, 0.25796, 0.2582, 0.2618, 0.26004, 0.262, 0.25824, 0.26126, 0.26322, 0.26556, 0.26414, 0.26362, 0.26414, 0.2653, 0.26648, 0.26604, 0.26904, 0.26534, 0.26784, 0.26806, 0.2689, 0.26802, 0.26812, 0.26996, 0.26976, 0.26924, 0.27148, 0.26982, 0.2701, 0.27084, 0.27122, 0.27068, 0.2739, 0.26968, 0.27164, 0.27262, 0.27076, 0.2726, 0.27058, 0.26984, 0.27202, 0.27046, 0.2735, 0.27262, 0.27144, 0.27432, 0.2739, 0.27494, 0.27442, 0.2727, 0.27466, 0.2713, 0.27138, 0.27472, 0.27394, 0.27338, 0.27562, 0.274, 0.27062, 0.2747, 0.27102, 0.27396, 0.27284, 0.27616, 0.27526, 0.27456, 0.27508, 0.27278, 0.27454, 0.2754, 0.27318, 0.27526, 0.27438, 0.27674, 0.27516, 0.27372, 0.27594, 0.2748, 0.27798, 0.27314, 0.27486, 0.27464, 0.2744, 0.2761, 0.27524, 0.27572, 0.27546, 0.27596 ], "test_acc": [ 0.2643, 0.2485, 0.2666, 0.258, 0.2678, 0.2703, 0.276, 0.2618, 0.2717, 0.2773, 0.2889, 0.281, 0.2829, 0.2771, 0.2647, 0.2713, 0.29, 0.2779, 0.2855, 0.2833, 0.2932, 0.276, 0.2898, 0.2953, 0.2799, 0.2835, 0.286, 0.2849, 0.2838, 0.291, 0.2948, 0.2955, 0.2873, 0.2931, 0.2908, 0.2927, 0.2896, 0.2932, 0.2863, 0.2927, 0.2886, 0.2954, 0.2871, 0.2946, 0.2925, 0.2889, 0.3005, 0.2984, 0.2954, 0.2876, 0.2852, 0.2888, 0.2943, 0.2923, 0.2934, 0.2888, 0.2941, 0.2926, 0.287, 0.2969, 0.2969, 0.2895, 0.2982, 0.2961, 0.2972, 0.2998, 0.2986, 0.2932, 0.2877, 0.2875, 0.2914, 0.2958, 0.2935, 0.2963, 0.2987, 0.2948, 0.2952, 0.296, 0.2993, 0.2935, 0.2962, 0.2933, 0.2948, 0.2986, 0.291, 0.2968, 0.2948, 0.2976, 0.2946, 0.2958, 0.2968, 0.2977, 0.2977, 0.2966, 0.2962, 0.2963, 0.2963, 0.2966, 0.2968, 0.2968 ] }, "diagnostics": { "bp_cosine": [ 0.384052038192749, 0.00187331298366189, 0.0014918153174221516, -0.003990606404840946, 0.0011513899080455303, -0.0013353436952456832, -0.0003460634616203606, -0.0025712824426591396, 0.0021760533563792706, 0.0015363170532509685, 0.0023321444168686867, -0.0023729477543383837 ], "perturbation_rho": [ 0.008436945267021656, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -2.48197466135025e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.144595444202423e-06, -2.7939677238464355e-09, 3.725290298461914e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -3.5781413316726685e-06, -4.6566128730773926e-09, 3.725290298461914e-09, -2.7939677238464355e-09, -3.725290298461914e-09, -6.51925802230835e-09, 9.313225746154785e-10, 0.0, 0.0, 0.0, -3.725290298461914e-09, 0.0 ] }, "hidden_norms_per_layer": [ 40862.5703125, 302949600.0, 779490368.0, 866010048.0, 1434764928.0, 1708853376.0, 1753628672.0, 2062010112.0, 2322754048.0, 2426205952.0, 2646477312.0, 3046314752.0, 3080729344.0 ], "bp_grad_norms_per_layer": [ 3.3795413401094265e-07, 9.012455781665096e-10, 8.881588797748918e-10, 8.880864932336863e-10, 8.938522144674721e-10, 8.938976781003305e-10, 8.937018902699378e-10, 8.93527418721618e-10, 8.935119866215757e-10, 8.93440765814546e-10, 8.933446760117647e-10, 8.934304962515682e-10, 8.93500051724061e-10 ] }, "drift": { "embed.weight": 357.53469530895904, "embed.bias": 290.04318739609596, "blocks.0.ln.weight": 10.989575386047363, "blocks.0.w1.weight": 220.1012762362677, "blocks.0.w1.bias": 206.37217351266216, "blocks.0.w2.weight": 501.3829415210294, "blocks.1.ln.weight": 9.839688301086426, "blocks.1.w1.weight": 256.6554332372174, "blocks.1.w1.bias": 237.5977187566281, "blocks.1.w2.weight": 396.28129110774046, "blocks.2.ln.weight": 8.956626892089844, "blocks.2.w1.weight": 225.58790523471438, "blocks.2.w1.bias": 219.9504694961951, "blocks.2.w2.weight": 332.68534972274165, "blocks.3.ln.weight": 10.4323091506958, "blocks.3.w1.weight": 304.362127476672, "blocks.3.w1.bias": 271.4581804566994, "blocks.3.w2.weight": 456.776518831265, "blocks.4.ln.weight": 10.220683097839355, "blocks.4.w1.weight": 294.88770495280846, "blocks.4.w1.bias": 278.17483493032455, "blocks.4.w2.weight": 422.86722605618826, "blocks.5.ln.weight": 7.415699005126953, "blocks.5.w1.weight": 190.23919300974276, "blocks.5.w1.bias": 170.52475346607713, "blocks.5.w2.weight": 282.6076353329658, "blocks.6.ln.weight": 11.005321502685547, "blocks.6.w1.weight": 315.1699742985849, "blocks.6.w1.bias": 293.37584502861324, "blocks.6.w2.weight": 428.46065418838674, "blocks.7.ln.weight": 11.400951385498047, "blocks.7.w1.weight": 320.1547970124374, "blocks.7.w1.bias": 312.2252164433187, "blocks.7.w2.weight": 444.7674866393189, "blocks.8.ln.weight": 9.238995552062988, "blocks.8.w1.weight": 261.6975850751966, "blocks.8.w1.bias": 251.09895252390498, "blocks.8.w2.weight": 352.9133162081499, "blocks.9.ln.weight": 11.197455406188965, "blocks.9.w1.weight": 315.7224672836386, "blocks.9.w1.bias": 295.82606170712853, "blocks.9.w2.weight": 416.36578033635686, "blocks.10.ln.weight": 11.847606658935547, "blocks.10.w1.weight": 338.01615076254603, "blocks.10.w1.bias": 307.22711286489067, "blocks.10.w2.weight": 464.68687019974544, "blocks.11.ln.weight": 7.684996128082275, "blocks.11.w1.weight": 188.9801145292558, "blocks.11.w1.bias": 178.35247968031155, "blocks.11.w2.weight": 244.64524232865998, "out_ln.weight": 1.0227844715118408, "out_head.weight": 10.424635519375226, "out_head.bias": 0.7962212896591503 } }, "fa": { "log": { "train_loss": [ 2.1018029602050783, 2.0231987742614748, 1.9913426873779296, 1.9757863534164428, 1.9628748377227783, 1.949777193145752, 1.9388965420150757, 1.9255553958511353, 1.9167609970474244, 1.9067581841278076, 1.9039552599716187, 1.899418589744568, 1.8931139596176147, 1.8900751802825928, 1.8894958589935302, 1.8822405550384522, 1.8818315468597413, 1.8777127625274659, 1.8790236785125733, 1.8758525806045532, 1.8699211498641968, 1.8684503372573853, 1.868811384048462, 1.8628138626098634, 1.8617137921524047, 1.859757089614868, 1.8566949377059936, 1.8563865858459472, 1.8520149837493896, 1.852164205932617, 1.846489913673401, 1.847879118347168, 1.8489951482391358, 1.8469820216369628, 1.8453059420394897, 1.8414616915893556, 1.845604056930542, 1.8367319815063476, 1.838143812828064, 1.8364125064468384, 1.8365082810211182, 1.8345620361328125, 1.8362988974761962, 1.8378243299102783, 1.833498821182251, 1.8334047562408446, 1.8298064031600951, 1.828000364303589, 1.8265536352539062, 1.829135093307495, 1.8257994495391845, 1.8226896044158936, 1.826085818748474, 1.8257194399261474, 1.820882752685547, 1.823325060119629, 1.821622840309143, 1.8205207012939453, 1.8186096018218993, 1.8195034896469116, 1.8178193243026732, 1.8202132829284667, 1.8164496115112305, 1.8147546480941772, 1.8138668438720704, 1.8105954584121704, 1.8140293844604491, 1.8142269690704347, 1.8139710745239257, 1.812066497116089, 1.8160650396728515, 1.8103228116607666, 1.81037494846344, 1.8109107693481445, 1.8118848001480103, 1.80986087184906, 1.8117412914276123, 1.8095279247283935, 1.8082179739379882, 1.8077979961395263, 1.8045953066635132, 1.8087207033920287, 1.8068067630004883, 1.8097841464996338, 1.8086548376846314, 1.8075193279266357, 1.8061525051498413, 1.8061482022476196, 1.805157029685974, 1.806752130088806, 1.8043223245239257, 1.8059532889175416, 1.804686725730896, 1.8053256253051757, 1.8066633655166626, 1.805836711769104, 1.8080352004241944, 1.803317499961853, 1.801328492088318, 1.8052216162109376 ], "train_acc": [ 0.20742, 0.24158, 0.25614, 0.26952, 0.27686, 0.28706, 0.29562, 0.30176, 0.3048, 0.30964, 0.3102, 0.31448, 0.31506, 0.31792, 0.32218, 0.3222, 0.3216, 0.3241, 0.32336, 0.32284, 0.32752, 0.3269, 0.3251, 0.33148, 0.3297, 0.32996, 0.33296, 0.333, 0.3372, 0.33618, 0.336, 0.33676, 0.3361, 0.33558, 0.33656, 0.34134, 0.3399, 0.34096, 0.34498, 0.34478, 0.34308, 0.34372, 0.34374, 0.34298, 0.3446, 0.34562, 0.34566, 0.34838, 0.34956, 0.34546, 0.34762, 0.34824, 0.34838, 0.34946, 0.35068, 0.35008, 0.35006, 0.35236, 0.35148, 0.35128, 0.35232, 0.3504, 0.35356, 0.3535, 0.3542, 0.35762, 0.3522, 0.35422, 0.35474, 0.3524, 0.3533, 0.3531, 0.35642, 0.356, 0.35522, 0.35664, 0.35594, 0.35494, 0.3547, 0.35866, 0.35694, 0.35732, 0.35788, 0.35534, 0.35586, 0.35614, 0.35642, 0.3569, 0.35992, 0.35596, 0.35776, 0.35608, 0.35652, 0.35726, 0.35692, 0.35758, 0.35714, 0.35754, 0.35816, 0.35878 ], "test_acc": [ 0.2378, 0.2506, 0.2725, 0.2937, 0.3002, 0.3155, 0.3308, 0.3192, 0.3399, 0.3382, 0.3357, 0.3429, 0.3428, 0.3431, 0.3337, 0.3418, 0.3495, 0.3491, 0.3603, 0.357, 0.3506, 0.3612, 0.3593, 0.3643, 0.3621, 0.3646, 0.3621, 0.3668, 0.3625, 0.3621, 0.3598, 0.3715, 0.3627, 0.37, 0.373, 0.3567, 0.3681, 0.3703, 0.3744, 0.3688, 0.3656, 0.3763, 0.37, 0.3705, 0.3778, 0.3681, 0.3743, 0.3804, 0.3765, 0.374, 0.373, 0.3763, 0.3756, 0.3773, 0.3779, 0.3734, 0.3834, 0.3806, 0.3719, 0.3795, 0.3785, 0.3767, 0.3782, 0.3827, 0.3801, 0.3815, 0.3842, 0.3829, 0.38, 0.3814, 0.3821, 0.3831, 0.382, 0.3796, 0.3846, 0.3786, 0.3789, 0.382, 0.3786, 0.3818, 0.3831, 0.3849, 0.3807, 0.3828, 0.3799, 0.382, 0.3804, 0.3823, 0.3797, 0.3821, 0.3812, 0.3807, 0.3819, 0.3817, 0.3818, 0.3809, 0.3816, 0.3816, 0.3817, 0.3818 ] }, "diagnostics": { "bp_cosine": [ 0.027911242097616196, 0.0825929045677185, 0.0342608243227005, -0.01674751378595829, -0.02788889780640602, -0.001998391468077898, 0.007203143555670977, -0.022960849106311798, -0.001600538264028728, -0.02186085283756256, 0.013902194797992706, 0.99517422914505 ], "perturbation_rho": [ 0.024441849440336227, 0.023016899824142456, -0.07353583723306656, 0.014823662117123604, 0.003079652786254883, -0.01875249855220318, -0.01764325238764286, -0.009929117746651173, -0.04451639950275421, 0.0320318341255188, -0.0011818185448646545, 0.022136203944683075 ], "nudging": { "0.001": [ -7.490161806344986e-07, -2.367887645959854e-07, -8.963979780673981e-08, -9.546056389808655e-09, -3.026798367500305e-09, 2.7939677238464355e-08, 2.60770320892334e-08, 2.3283064365386963e-08, 1.210719347000122e-08, -1.3969838619232178e-08, 1.862645149230957e-08, -7.632188498973846e-07 ], "0.003": [ -2.018176019191742e-06, -6.172340363264084e-07, -1.916196197271347e-07, -3.3527612686157227e-08, -1.210719347000122e-08, -6.51925802230835e-08, 2.514570951461792e-08, 4.493631422519684e-08, -4.912726581096649e-08, 1.5366822481155396e-08, -1.4901161193847656e-08, -2.5206245481967926e-06 ], "0.01": [ -6.553716957569122e-06, -1.8514692783355713e-06, -4.6426430344581604e-07, 1.8603168427944183e-07, 1.6205012798309326e-07, -1.210719347000122e-08, -1.2363307178020477e-07, 2.6961788535118103e-07, 1.83936208486557e-08, 2.1792948246002197e-07, -8.521601557731628e-08, -9.013805538415909e-06 ] }, "hidden_norms_per_layer": [ 7627.2177734375, 77014.5703125, 261090.03125, 402920.15625, 531063.4375, 650439.0625, 771807.6875, 876618.25, 1137488.875, 1214998.0, 1291784.5, 1356458.875, 1186984.25 ], "bp_grad_norms_per_layer": [ 1.7493783161626197e-05, 1.0944853556793532e-06, 5.515285579349438e-07, 5.171301609152579e-07, 5.162664820090868e-07, 5.121610797687026e-07, 5.100455382489599e-07, 5.093034474157321e-07, 5.131421971782402e-07, 5.133904323884053e-07, 5.137007974553853e-07, 5.171222028366174e-07, 5.011079906580562e-07 ] }, "drift": { "embed.weight": 71.59970957169052, "embed.bias": 34.13643636527804, "blocks.0.ln.weight": 1.511795163154602, "blocks.0.w1.weight": 18.837866685893864, "blocks.0.w1.bias": 13.70267468651505, "blocks.0.w2.weight": 93.71863715934398, "blocks.1.ln.weight": 1.3081063032150269, "blocks.1.w1.weight": 21.240305602835985, "blocks.1.w1.bias": 13.685504606064915, "blocks.1.w2.weight": 61.028360088185984, "blocks.2.ln.weight": 1.0054956674575806, "blocks.2.w1.weight": 19.38818821685861, "blocks.2.w1.bias": 16.089163443737224, "blocks.2.w2.weight": 50.045867786081864, "blocks.3.ln.weight": 0.7472347021102905, "blocks.3.w1.weight": 19.199307011929896, "blocks.3.w1.bias": 18.432771215086387, "blocks.3.w2.weight": 37.33602068975751, "blocks.4.ln.weight": 0.6882285475730896, "blocks.4.w1.weight": 19.489052040551293, "blocks.4.w1.bias": 20.122343743742668, "blocks.4.w2.weight": 40.50107681410708, "blocks.5.ln.weight": 0.7229293584823608, "blocks.5.w1.weight": 19.290019148333055, "blocks.5.w1.bias": 19.20270861199211, "blocks.5.w2.weight": 44.78405827498682, "blocks.6.ln.weight": 0.7572810649871826, "blocks.6.w1.weight": 22.02089472340751, "blocks.6.w1.bias": 22.158527807844386, "blocks.6.w2.weight": 39.04536700764983, "blocks.7.ln.weight": 0.7923915386199951, "blocks.7.w1.weight": 22.987184790170787, "blocks.7.w1.bias": 25.461720259715808, "blocks.7.w2.weight": 43.420459766425545, "blocks.8.ln.weight": 0.7664017081260681, "blocks.8.w1.weight": 19.084502786198005, "blocks.8.w1.bias": 19.896472419541702, "blocks.8.w2.weight": 45.39367900417946, "blocks.9.ln.weight": 0.7352473735809326, "blocks.9.w1.weight": 18.514530575989, "blocks.9.w1.bias": 19.155701487630136, "blocks.9.w2.weight": 38.96532462321347, "blocks.10.ln.weight": 0.7539297342300415, "blocks.10.w1.weight": 18.499939513355947, "blocks.10.w1.bias": 18.297859410049362, "blocks.10.w2.weight": 33.573172219147224, "blocks.11.ln.weight": 0.7084934711456299, "blocks.11.w1.weight": 16.503202421262042, "blocks.11.w1.bias": 12.571542518226021, "blocks.11.w2.weight": 90.02901137589497, "out_ln.weight": 0.44491103291511536, "out_head.weight": 6.031580417677323, "out_head.bias": 0.5341898346582782 } } }, "config": { "dataset": "cifar10", "d_hidden": 256, "num_blocks": 12, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 3 ], "gpu": 0, "output_dir": "results/fa_dfa_d256_L12_seed3", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }