{ "42": { "bp": { "log": { "train_loss": [ 1.9159408319854736, 1.6833457696151732, 1.5935267736053467, 1.5389775912475585, 1.4867800998687744, 1.4524269732284545, 1.4178237664794922, 1.3897597776794433, 1.3664597565460206, 1.342870984840393, 1.3235610486221314, 1.301216788482666, 1.279724592475891, 1.2618738833999634, 1.2407353455352783, 1.22462412940979, 1.2109693797302246, 1.1892420639038086, 1.1723702849578856, 1.1557361126327514, 1.1423172385787963, 1.1261568475341797, 1.1062135691070556, 1.0966129437637329, 1.0756375621795655, 1.0581538507270813, 1.0487863679885865, 1.0285031553268433, 1.0112163684082032, 0.9978593858337402, 0.9784134501266479, 0.9645692346191406, 0.9500791883468628, 0.9311204533195495, 0.9137258143806457, 0.8955737284660339, 0.8760775566101074, 0.8636410433959961, 0.8472155108451843, 0.8257175942802429, 0.8081484350395203, 0.7949162258720398, 0.7682366105842591, 0.7535309395217895, 0.7374585538101196, 0.7163707330703736, 0.7002532124710082, 0.6810121598052978, 0.6590044124794007, 0.6416365943050385, 0.6245126323890686, 0.6053193593788146, 0.5843256318569183, 0.5672504850196839, 0.5574265190124512, 0.5282080096054077, 0.5124851553916931, 0.49809444856643675, 0.4815664218711853, 0.46325312936782836, 0.44530024614334107, 0.4232256102848053, 0.41155227093696595, 0.3951142164516449, 0.3779419419193268, 0.36394513979434967, 0.3495154238319397, 0.33435829617500307, 0.3247876634025574, 0.31244264134407046, 0.30034732496261596, 0.2886586371707916, 0.2739575230407715, 0.26273826862812044, 0.25702780318260193, 0.23921729731559754, 0.2356625511932373, 0.23087995275020598, 0.21462623807907105, 0.21162452461242676, 0.20137000153541565, 0.1957099277973175, 0.19024162811279297, 0.1820225635457039, 0.17860664487838745, 0.17204254170417785, 0.1648883514738083, 0.1611987146615982, 0.15891523240566255, 0.15874515238285064, 0.15378751336574553, 0.15460485486030578, 0.1495811799764633, 0.14360208065509797, 0.14562011506080627, 0.14506465085983275, 0.1431816494703293, 0.1397772234392166, 0.14342590034008026, 0.142473215675354 ], "train_acc": [ 0.31126, 0.39118, 0.41882, 0.44388, 0.4617, 0.4731, 0.48828, 0.49882, 0.50712, 0.51646, 0.5211, 0.53098, 0.53964, 0.54616, 0.55448, 0.55806, 0.56566, 0.57324, 0.57908, 0.58582, 0.58824, 0.59418, 0.60314, 0.60678, 0.61408, 0.62094, 0.62264, 0.63056, 0.63836, 0.64046, 0.64822, 0.65186, 0.65832, 0.66298, 0.67222, 0.67798, 0.686, 0.688, 0.695, 0.7014, 0.709, 0.71344, 0.7245, 0.72892, 0.73524, 0.7426, 0.74692, 0.75382, 0.76378, 0.76914, 0.77694, 0.78392, 0.78984, 0.79764, 0.79948, 0.81182, 0.81536, 0.82284, 0.82968, 0.83584, 0.84158, 0.8514, 0.85392, 0.86052, 0.86604, 0.87092, 0.87644, 0.88364, 0.88486, 0.88988, 0.89316, 0.89914, 0.9048, 0.90892, 0.90944, 0.91828, 0.9189, 0.92122, 0.92622, 0.92784, 0.93044, 0.9332, 0.93514, 0.93836, 0.93948, 0.94166, 0.94506, 0.9452, 0.94606, 0.94738, 0.9493, 0.94928, 0.94976, 0.95178, 0.9521, 0.95234, 0.95228, 0.9543, 0.95236, 0.9534 ], "test_acc": [ 0.3908, 0.433, 0.4419, 0.4858, 0.4871, 0.4878, 0.5141, 0.5211, 0.5188, 0.5279, 0.5296, 0.5402, 0.5415, 0.5584, 0.5559, 0.5648, 0.5531, 0.5686, 0.5685, 0.575, 0.5694, 0.5749, 0.5711, 0.585, 0.5778, 0.5875, 0.5827, 0.5876, 0.5868, 0.5947, 0.5903, 0.6001, 0.5963, 0.6013, 0.5943, 0.5994, 0.5879, 0.5925, 0.6006, 0.5978, 0.6007, 0.6034, 0.5914, 0.5958, 0.5959, 0.5959, 0.5928, 0.5961, 0.6013, 0.5978, 0.5974, 0.5998, 0.5919, 0.5936, 0.5958, 0.6019, 0.5972, 0.5927, 0.5998, 0.5945, 0.5942, 0.5984, 0.5904, 0.5907, 0.595, 0.5928, 0.5944, 0.5973, 0.5924, 0.5909, 0.5976, 0.5938, 0.5943, 0.5926, 0.5969, 0.5918, 0.5943, 0.5881, 0.5907, 0.5921, 0.5934, 0.5926, 0.5919, 0.5923, 0.5912, 0.5908, 0.5888, 0.5899, 0.5904, 0.5911, 0.5911, 0.5905, 0.5894, 0.5918, 0.5926, 0.5931, 0.5935, 0.5936, 0.5939, 0.594 ] }, "diagnostics": { "bp_cosine": [ 0.9423961043357849, 0.9423063397407532, 0.9428478479385376, 0.9422410726547241, 0.9424552917480469, 0.9417660236358643, 0.9408372640609741, 0.9404677152633667, 0.9403290748596191, 0.9396632313728333, 0.935971736907959, 0.9338305592536926 ], "perturbation_rho": [ 0.987454891204834, 0.9897942543029785, 0.990141749382019, 0.9901803731918335, 0.9920680522918701, 0.9906818866729736, 0.9903223514556885, 0.9926531910896301, 0.9914379119873047, 0.9897843599319458, 0.9882909059524536, 0.9869540929794312 ], "nudging": { "0.001": [ -0.002897711703553796, -0.002905686851590872, -0.0029487141873687506, -0.0030073150992393494, -0.002988070249557495, -0.0028954721055924892, -0.0027900305576622486, -0.002700705546885729, -0.0025893584825098515, -0.0024207504466176033, -0.002165877493098378, -0.00189895648509264 ], "0.003": [ -0.008684658445417881, -0.008708733133971691, -0.008837150409817696, -0.009012945927679539, -0.008955370634794235, -0.008678246289491653, -0.008362163789570332, -0.008094580844044685, -0.007761792279779911, -0.007257224526256323, -0.006493166089057922, -0.005693747662007809 ], "0.01": [ -0.028850272297859192, -0.028929298743605614, -0.029354672878980637, -0.029939891770482063, -0.029747068881988525, -0.028829604387283325, -0.027784891426563263, -0.026898572221398354, -0.025797637179493904, -0.024130169302225113, -0.02159387245774269, -0.018940377980470657 ] } }, "drift": { "embed.weight": 8.833701837291958, "embed.bias": 14.261815769395275, "blocks.0.ln.weight": 0.34404799666331826, "blocks.0.w1.weight": 4.175094808562947, "blocks.0.w1.bias": 6.98398106061982, "blocks.0.w2.weight": 10.592751719664884, "blocks.1.ln.weight": 0.2322510556310593, "blocks.1.w1.weight": 4.523413515316886, "blocks.1.w1.bias": 4.3749413052218085, "blocks.1.w2.weight": 11.940958034527862, "blocks.2.ln.weight": 0.2150404740407862, "blocks.2.w1.weight": 4.58583359520105, "blocks.2.w1.bias": 4.159787661269507, "blocks.2.w2.weight": 12.401201224911981, "blocks.3.ln.weight": 0.22107801019329978, "blocks.3.w1.weight": 4.586995215167557, "blocks.3.w1.bias": 3.881613437324734, "blocks.3.w2.weight": 12.64024804795375, "blocks.4.ln.weight": 0.23170407382172373, "blocks.4.w1.weight": 4.578125313924808, "blocks.4.w1.bias": 3.7932938751482683, "blocks.4.w2.weight": 12.963501907885533, "blocks.5.ln.weight": 0.23628225424614754, "blocks.5.w1.weight": 4.5240873092186416, "blocks.5.w1.bias": 3.803760854867017, "blocks.5.w2.weight": 12.912394584749915, "blocks.6.ln.weight": 0.2619501911907522, "blocks.6.w1.weight": 4.461384236716512, "blocks.6.w1.bias": 3.799496573870174, "blocks.6.w2.weight": 13.155197671866139, "blocks.7.ln.weight": 0.2657175505296468, "blocks.7.w1.weight": 4.422447215896801, "blocks.7.w1.bias": 3.725743197114046, "blocks.7.w2.weight": 13.149302405423146, "blocks.8.ln.weight": 0.28028080422594653, "blocks.8.w1.weight": 4.320993108213275, "blocks.8.w1.bias": 3.577600797368634, "blocks.8.w2.weight": 13.112473965027567, "blocks.9.ln.weight": 0.3122222575319159, "blocks.9.w1.weight": 4.3011661234952125, "blocks.9.w1.bias": 3.5701937101673704, "blocks.9.w2.weight": 13.20746990540504, "blocks.10.ln.weight": 0.2907587848995931, "blocks.10.w1.weight": 4.244185315341837, "blocks.10.w1.bias": 3.487530574891753, "blocks.10.w2.weight": 13.342063167376029, "blocks.11.ln.weight": 0.30672613980463925, "blocks.11.w1.weight": 4.1911870376224645, "blocks.11.w1.bias": 3.626239385452188, "blocks.11.w2.weight": 13.53569165604796, "out_ln.weight": 0.304987181878743, "out_head.weight": 3.659824943443211, "out_head.bias": 0.7848376848440143 } }, "dfa": { "log": { "train_loss": [ 2.060509294204712, 2.0283543349456785, 2.0286419232940673, 2.0282608281707764, 2.0229165492248535, 2.0251557587432862, 2.0200582264709475, 2.021266340560913, 2.0176746366119387, 2.0216268117523195, 2.016007042388916, 2.0150310187530516, 2.0130176863098144, 2.011090052871704, 2.0114055884552, 2.012881319503784, 2.0109381372070314, 2.011416566619873, 2.009194619445801, 2.008145341949463, 2.008374558181763, 2.009201191329956, 2.0073699200820925, 2.0068252397155764, 2.006670061340332, 2.006027181663513, 2.0085990719604494, 2.006233550338745, 2.007863084945679, 2.007588200149536, 2.0059480542755126, 2.0044747730255126, 2.006523677520752, 2.0035686435317994, 2.0047321628189088, 2.005557894821167, 2.003938685531616, 2.005093680458069, 2.0022387979507448, 2.004965279159546, 2.006689316253662, 2.0055594663238527, 2.004364362411499, 2.0020452467346193, 2.005489226150513, 2.003978981628418, 2.0023497142791746, 2.003284743270874, 2.0037755869293212, 2.001501432533264, 2.003944476890564, 2.0025060961914063, 2.002634817123413, 2.0017083084869385, 2.0028567737579346, 2.000872339820862, 2.003729987487793, 2.002261364898682, 2.0024312939453126, 2.0008276205444337, 2.001199483261108, 2.0006834197235106, 2.000615832366943, 1.9993626528930664, 2.0005247971343993, 1.9997058053588868, 1.999853487548828, 1.9997802280044557, 1.9991605996704103, 2.0015039880752563, 1.9991352321624756, 1.9994654761505126, 1.99805854221344, 1.9966946460723878, 1.9976105904388428, 1.9990063135528564, 1.995104397277832, 1.9979646807479858, 1.996112073097229, 1.999074932899475, 1.997551460647583, 1.9962433197784424, 1.997741110534668, 1.998971039352417, 1.9981346895599366, 1.9993204745864868, 1.9973036824798585, 1.9972220791625976, 1.9969999575042725, 1.9983418984222412, 1.9977535138702394, 1.9974792404174804, 1.9975066395568848, 1.9948017989349365, 1.9976891431427002, 1.9985219841003419, 1.9948620611190795, 1.995753077468872, 1.998552144088745, 1.9990386080932616 ], "train_acc": [ 0.23936, 0.25434, 0.25346, 0.25514, 0.25882, 0.25722, 0.25998, 0.25844, 0.262, 0.25976, 0.26256, 0.2639, 0.26116, 0.26558, 0.26594, 0.26562, 0.26654, 0.26378, 0.2653, 0.26746, 0.26592, 0.2681, 0.26896, 0.27006, 0.26992, 0.26862, 0.26736, 0.27126, 0.26738, 0.2694, 0.26836, 0.26744, 0.27024, 0.27184, 0.26816, 0.26806, 0.27192, 0.26898, 0.27294, 0.27124, 0.2707, 0.27056, 0.272, 0.27288, 0.27096, 0.27286, 0.27098, 0.27252, 0.26964, 0.27208, 0.27, 0.2737, 0.27368, 0.27134, 0.27342, 0.27386, 0.27258, 0.27398, 0.27468, 0.27518, 0.27328, 0.2752, 0.27404, 0.27526, 0.2754, 0.27588, 0.27358, 0.27472, 0.27548, 0.27356, 0.27508, 0.27656, 0.27638, 0.27784, 0.27648, 0.27606, 0.27718, 0.27632, 0.27822, 0.27514, 0.27692, 0.27566, 0.27648, 0.276, 0.27642, 0.27526, 0.27678, 0.2763, 0.27776, 0.27652, 0.27578, 0.27868, 0.27676, 0.27782, 0.27764, 0.27704, 0.27938, 0.27672, 0.2781, 0.2784 ], "test_acc": [ 0.2781, 0.2717, 0.2892, 0.2711, 0.2577, 0.2687, 0.2516, 0.281, 0.2759, 0.2822, 0.2529, 0.2933, 0.2908, 0.3048, 0.2739, 0.2751, 0.2888, 0.2869, 0.3078, 0.2855, 0.2884, 0.2932, 0.2955, 0.2952, 0.2919, 0.2886, 0.2871, 0.3017, 0.295, 0.3001, 0.2957, 0.2866, 0.2896, 0.3055, 0.2928, 0.3027, 0.2836, 0.2903, 0.2958, 0.2913, 0.2966, 0.287, 0.2877, 0.2879, 0.303, 0.3006, 0.2946, 0.2867, 0.2973, 0.2899, 0.2917, 0.3002, 0.2971, 0.2964, 0.3037, 0.2892, 0.3038, 0.2898, 0.2999, 0.3003, 0.3047, 0.2936, 0.2972, 0.2905, 0.3016, 0.2933, 0.295, 0.2998, 0.3, 0.3008, 0.3028, 0.3003, 0.303, 0.2946, 0.2915, 0.2974, 0.2901, 0.2978, 0.2991, 0.2973, 0.2948, 0.3032, 0.3049, 0.3017, 0.2999, 0.3019, 0.2958, 0.2981, 0.3009, 0.2968, 0.2987, 0.297, 0.2988, 0.2996, 0.3002, 0.3003, 0.3001, 0.3003, 0.3001, 0.3001 ] }, "diagnostics": { "bp_cosine": [ 0.3634233772754669, 0.001164254266768694, -0.0006461217999458313, -0.00019622840045485646, 0.0002198266884079203, -9.971270628739148e-06, 0.00014979815750848502, -0.0004021040804218501, -5.425223207566887e-05, -0.00024170493998099118, -0.00025007897056639194, -0.00018576104776002467 ], "perturbation_rho": [ 0.061064913868904114, 0.0, 0.0, 0.0, 0.00392885273322463, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -3.8743019104003906e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.1324882507324219e-06, 0.0, 2.7939677238464355e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -3.606081008911133e-06, 0.0, 1.3504177331924438e-08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] } }, "drift": { "embed.weight": 333.70584841410414, "embed.bias": 239.49966422804454, "blocks.0.ln.weight": 10.156513336148182, "blocks.0.w1.weight": 293.93859688585053, "blocks.0.w1.bias": 281.7468078045666, "blocks.0.w2.weight": 492.64207719718667, "blocks.1.ln.weight": 8.920722535237505, "blocks.1.w1.weight": 311.4826752480239, "blocks.1.w1.bias": 310.86370160689785, "blocks.1.w2.weight": 324.5405256645745, "blocks.2.ln.weight": 10.152850269187711, "blocks.2.w1.weight": 422.5618024966304, "blocks.2.w1.bias": 406.03916399589247, "blocks.2.w2.weight": 427.4195122419038, "blocks.3.ln.weight": 6.982139429700868, "blocks.3.w1.weight": 239.67203375670587, "blocks.3.w1.bias": 218.06238930657585, "blocks.3.w2.weight": 238.92558897030935, "blocks.4.ln.weight": 7.833071503056953, "blocks.4.w1.weight": 298.1966678874803, "blocks.4.w1.bias": 278.16504637194174, "blocks.4.w2.weight": 274.11280875965394, "blocks.5.ln.weight": 7.242266411414109, "blocks.5.w1.weight": 264.2525555458606, "blocks.5.w1.bias": 252.72325009085455, "blocks.5.w2.weight": 257.616366671581, "blocks.6.ln.weight": 7.548699630616584, "blocks.6.w1.weight": 262.2510067819824, "blocks.6.w1.bias": 251.81627023731494, "blocks.6.w2.weight": 273.41300895523614, "blocks.7.ln.weight": 8.476523067012732, "blocks.7.w1.weight": 318.7369678667611, "blocks.7.w1.bias": 299.5996411120576, "blocks.7.w2.weight": 294.5553970248432, "blocks.8.ln.weight": 10.089688663753533, "blocks.8.w1.weight": 404.9516419003623, "blocks.8.w1.bias": 379.7449486217603, "blocks.8.w2.weight": 384.6524371767172, "blocks.9.ln.weight": 10.376434921092248, "blocks.9.w1.weight": 410.9149275889754, "blocks.9.w1.bias": 383.0074711781066, "blocks.9.w2.weight": 392.8539842927831, "blocks.10.ln.weight": 6.445966095557191, "blocks.10.w1.weight": 233.37502830905152, "blocks.10.w1.bias": 219.30705311523053, "blocks.10.w2.weight": 224.7808320380166, "blocks.11.ln.weight": 9.439442353351934, "blocks.11.w1.weight": 374.5461893118647, "blocks.11.w1.bias": 354.2106427892852, "blocks.11.w2.weight": 349.272673385976, "out_ln.weight": 0.6481155342918145, "out_head.weight": 9.174388328815116, "out_head.bias": 0.47817510393040696 } }, "state_bridge": { "log": { "train_loss": [ 2.249122398071289, 2.143466188659668, 2.182890202178955, 2.316445587387085, 2.3062049280548096, 2.266785619735718, 2.2987561087799073, 2.2884853198242188, 2.240994506072998, 2.2790724418640136, 2.2708915201568605, 2.266933690185547, 2.2886832971954347, 2.2700843003845215, 2.1964657810211183, 2.129935463180542, 2.1168104545593263, 2.12433757270813, 2.113173648223877, 2.1130354350280762, 2.1059150744628905, 2.091750974731445, 2.092220969924927, 2.124610143814087, 2.096196698989868, 2.089525361709595, 2.0865603291320802, 2.0807934146118163, 2.069572374725342, 2.0693005324554443, 2.064417702713013, 2.061735754241943, 2.0726303718566896, 2.068593667602539, 2.0655730045318603, 2.0626395158386233, 2.063313564758301, 2.0622880627441407, 2.058299614639282, 2.059487857131958, 2.0631128742980955, 2.0610568396759033, 2.0551611611938476, 2.056872489852905, 2.0546858750915526, 2.056325934524536, 2.053202699737549, 2.0516857704162597, 2.0511376399230956, 2.052292654342651, 2.0525611149597167, 2.052803971786499, 2.0563543517684937, 2.058361290130615, 2.059238384399414, 2.060622958755493, 2.063846826324463, 2.0644858879852297, 2.0641055697631834, 2.062063186683655, 2.0649280325317383, 2.065730286026001, 2.0664522916412356, 2.066531411819458, 2.0671734712982177, 2.066738704376221, 2.06800027633667, 2.0698299375915528, 2.0699130378723143, 2.069541824951172, 2.069294273452759, 2.068808924255371, 2.071917738342285, 2.0731585116577147, 2.0724312242126466, 2.073472029876709, 2.0752377517700196, 2.0765309967041015, 2.0784705491638182, 2.079111976928711, 2.079522602157593, 2.080129363708496, 2.0800775938415526, 2.0806046531677245, 2.080093946685791, 2.082602798614502, 2.0823856858062744, 2.083605904006958, 2.082737918624878, 2.0829258354187012, 2.082134012680054, 2.081413818206787, 2.080659938735962, 2.079646938858032, 2.079785990867615, 2.079912822265625, 2.0787852781677247, 2.080009171295166, 2.0796959645080566, 2.07859284072876 ], "train_acc": [ 0.14508, 0.16856, 0.15632, 0.11096, 0.12388, 0.14108, 0.12374, 0.1273, 0.14434, 0.12372, 0.13196, 0.13698, 0.1278, 0.13406, 0.15046, 0.17556, 0.18282, 0.17838, 0.18174, 0.1771, 0.1835, 0.18812, 0.1935, 0.17326, 0.18206, 0.1833, 0.18656, 0.19114, 0.19432, 0.19874, 0.19688, 0.19564, 0.19196, 0.19548, 0.1934, 0.19826, 0.19794, 0.19896, 0.20276, 0.20258, 0.20152, 0.20098, 0.2025, 0.20058, 0.20388, 0.20206, 0.2039, 0.20444, 0.2054, 0.20728, 0.2042, 0.20478, 0.204, 0.1998, 0.20252, 0.2013, 0.1988, 0.2002, 0.20158, 0.2012, 0.20384, 0.20102, 0.1987, 0.20136, 0.19972, 0.20122, 0.19876, 0.19792, 0.20008, 0.20138, 0.1992, 0.19956, 0.20076, 0.19942, 0.20054, 0.20192, 0.20256, 0.2009, 0.1972, 0.20028, 0.19826, 0.1992, 0.19678, 0.19736, 0.19872, 0.20076, 0.20126, 0.20262, 0.20088, 0.20116, 0.2009, 0.20188, 0.20326, 0.20284, 0.20404, 0.20164, 0.20386, 0.20324, 0.20414, 0.2032 ], "test_acc": [ 0.1701, 0.1589, 0.0964, 0.0977, 0.147, 0.1388, 0.1311, 0.1208, 0.1018, 0.1576, 0.117, 0.1127, 0.1215, 0.1579, 0.1648, 0.1561, 0.179, 0.1723, 0.1962, 0.1791, 0.1863, 0.1757, 0.161, 0.166, 0.1768, 0.1795, 0.18, 0.1802, 0.1787, 0.1767, 0.1754, 0.1604, 0.1761, 0.1675, 0.1741, 0.171, 0.1697, 0.1797, 0.1836, 0.1869, 0.19, 0.1893, 0.1907, 0.1866, 0.1877, 0.1889, 0.1871, 0.1949, 0.1817, 0.1912, 0.1923, 0.1955, 0.1958, 0.1893, 0.1961, 0.1915, 0.1966, 0.2031, 0.1959, 0.1915, 0.1753, 0.1929, 0.18, 0.1823, 0.194, 0.1869, 0.1969, 0.1912, 0.1946, 0.1919, 0.1971, 0.1907, 0.2003, 0.1926, 0.1998, 0.1947, 0.1862, 0.1997, 0.1874, 0.1841, 0.188, 0.1869, 0.1828, 0.1856, 0.1888, 0.1734, 0.1826, 0.1813, 0.1816, 0.1868, 0.1879, 0.1846, 0.1837, 0.182, 0.1821, 0.1836, 0.1838, 0.1833, 0.1832, 0.1836 ], "state_pred_error": [ 0.3305018243932724, 0.3240715994644165, 0.2682553328800201, 0.13893559893369675, 0.07450400803923607, 0.05266491491317749, 0.035537137892246246, 0.08557363073348999, 0.0663624380338192, 0.05056835491657257, 0.057957575828433035, 0.03669406015276909, 0.044723540180921555, 0.05952853068828583, 0.06200094776391983, 0.034456856629252436, 0.02363166331708431, 0.030915076084136964, 0.027922455305457117, 0.022749129890203477, 0.01869435190498829, 0.016911904378533363, 0.012851448996663094, 0.009603057160079479, 0.0068074954861402515, 0.004831086874008178, 0.002716479171216488, 0.0017772294883430003, 0.0011674952478520572, 0.0009641216253489256, 0.000903967960383743, 0.0008178514664620161, 0.0009606654725596308, 0.0010464790955930948, 0.0009382549912855029, 0.0008025767210498452, 0.0006237311275862158, 0.0005590206385217607, 0.0006743966669589281, 0.0007392789867147803, 0.0007174553440324963, 0.0006993773563578725, 0.000645849712882191, 0.0005546821858268231, 0.00046942476788535716, 0.0003906826237775385, 0.0003712719864305109, 0.0003606485006958246, 0.0003457060167193413, 0.0003746068775840104, 0.00038963068067096173, 0.0003513397928327322, 0.00032962770885787906, 0.00033959761667996645, 0.0003122131848614663, 0.00028035666743293406, 0.00026064857746940106, 0.00022029355119913816, 0.00019001943845301867, 0.00020799835772719233, 0.0002275417461199686, 0.00020783223733305932, 0.00018264570890925825, 0.00015985633003059774, 0.0001389945726841688, 0.00011476213769754394, 8.967853816691787e-05, 7.122783363331109e-05, 5.970104366540909e-05, 5.121438584523275e-05, 4.536606192123145e-05, 4.0154456216841935e-05, 3.647202713880688e-05, 3.4129825913114475e-05, 3.2702885311446155e-05, 3.160392617806792e-05, 3.0352398289833216e-05, 2.940795918868389e-05, 2.8640556085156276e-05, 2.736381722963415e-05, 2.6395615809597075e-05, 2.5282455111155287e-05, 2.4516119782347232e-05, 2.388914132665377e-05, 2.2789849505061285e-05, 2.1843732089619152e-05, 2.0776926304679363e-05, 1.9760204966296442e-05, 1.8386752204969525e-05, 1.7638299430254845e-05, 1.702676533255726e-05, 1.6189092184067705e-05, 1.5407667033723554e-05, 1.4915904570952988e-05, 1.4520096725318581e-05, 1.3764947652525734e-05, 1.333884218824096e-05, 1.3029495921800845e-05, 1.262850838684244e-05, 1.2368245947291143e-05 ] }, "diagnostics": { "bp_cosine": [ 0.15691214799880981, 0.015022292733192444, 0.006593926809728146, 0.007205793634057045, 0.008038382977247238, 0.0067636389285326, 0.005863174330443144, 0.0026869114954024553, 0.00880957767367363, 0.009782599285244942, 0.00875927321612835, 0.015338878147304058 ], "perturbation_rho": [ 0.046312831342220306, 0.002848614938557148, -7.617553637828678e-05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -4.103407263755798e-06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.2268312275409698e-05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -4.0831975638866425e-05, 7.450580596923828e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 9.313225746154785e-10, 0.0, 0.0, 0.0, 0.0 ] } }, "drift": { "embed.weight": 20.26978490963512, "embed.bias": 97.32930339256669, "blocks.0.ln.weight": 1.9308135867617757, "blocks.0.w1.weight": 66.3483568365869, "blocks.0.w1.bias": 53.284724707801, "blocks.0.w2.weight": 177.08907259952375, "blocks.1.ln.weight": 3.057512831818983, "blocks.1.w1.weight": 170.34177401016777, "blocks.1.w1.bias": 213.60524387953882, "blocks.1.w2.weight": 200.26342063170046, "blocks.2.ln.weight": 2.5608747595416883, "blocks.2.w1.weight": 103.95319184812183, "blocks.2.w1.bias": 101.21405935076268, "blocks.2.w2.weight": 134.8362490743747, "blocks.3.ln.weight": 2.3109975543869266, "blocks.3.w1.weight": 116.99989433662596, "blocks.3.w1.bias": 120.91968382837668, "blocks.3.w2.weight": 142.44744178171467, "blocks.4.ln.weight": 2.718708135007822, "blocks.4.w1.weight": 124.26248150423525, "blocks.4.w1.bias": 121.48105264933947, "blocks.4.w2.weight": 118.7892683407888, "blocks.5.ln.weight": 1.8158878954501887, "blocks.5.w1.weight": 56.878036794490896, "blocks.5.w1.bias": 36.57930796279972, "blocks.5.w2.weight": 85.47839722655326, "blocks.6.ln.weight": 3.0875197025983447, "blocks.6.w1.weight": 100.99150638794737, "blocks.6.w1.bias": 97.42240055489651, "blocks.6.w2.weight": 87.13862478741176, "blocks.7.ln.weight": 7.772248541992971, "blocks.7.w1.weight": 297.4998489055548, "blocks.7.w1.bias": 282.6199479818741, "blocks.7.w2.weight": 193.40369417394206, "blocks.8.ln.weight": 3.0697438474661696, "blocks.8.w1.weight": 143.40991382362168, "blocks.8.w1.bias": 132.0178424400649, "blocks.8.w2.weight": 126.31745589603334, "blocks.9.ln.weight": 3.3171246104472094, "blocks.9.w1.weight": 150.22737087992024, "blocks.9.w1.bias": 147.1140425995551, "blocks.9.w2.weight": 118.0665737085708, "blocks.10.ln.weight": 6.064775829759772, "blocks.10.w1.weight": 281.65394416567705, "blocks.10.w1.bias": 267.43803892028814, "blocks.10.w2.weight": 206.89673602536328, "blocks.11.ln.weight": 2.0710718946854763, "blocks.11.w1.weight": 93.44069995553728, "blocks.11.w1.bias": 93.69984582471675, "blocks.11.w2.weight": 110.16073882917532, "out_ln.weight": 0.4517673564729089, "out_head.weight": 5.403719578492724, "out_head.bias": 2.04427795310877 } }, "credit_bridge": { "log": { "train_loss": [ 2.06320516204834, 2.0399101606750487, 2.033929338531494, 2.0309921591186524, 2.0298601413726804, 2.0217224433135987, 2.024232417259216, 2.019040475921631, 2.0207128286361695, 2.019753430519104, 2.016178896408081, 2.011948891983032, 2.0130044828796385, 2.0113372691345215, 2.012964423980713, 2.0107208766937257, 2.0117168256378175, 2.0097561017227172, 2.0089866023254395, 2.009570707740784, 2.011733226318359, 2.007577508773804, 2.0085436083602906, 2.0043470149230957, 2.0070890647888184, 2.0043670698547364, 2.0048324042129515, 2.0042362908935547, 2.0050302404403686, 2.004891293258667, 2.005185372543335, 2.003529516067505, 2.0045382270050047, 2.005508458251953, 2.00552710067749, 2.002495421791077, 1.9999042555999755, 1.998048825454712, 1.9961405738067628, 1.989240593185425, 1.9859777431488037, 1.9825943405532838, 1.9781343281555175, 1.9761270376968383, 1.9706906524658203, 1.9723773523712158, 1.9700259783172607, 1.9686059323883056, 1.9655450037384032, 1.965288708114624, 1.9665511059570313, 1.9662485723114014, 1.9659714967346191, 1.9650201892852783, 1.962706196937561, 1.9626981174468994, 1.962720913772583, 1.9627574170684814, 1.9608846031951905, 1.9610804913711548, 1.9616359865570068, 1.9621461741638184, 1.9603107889556886, 1.9571026586914062, 1.9596751629257203, 1.9583080463409424, 1.9566787594604491, 1.9575193979644776, 1.9559337323760986, 1.9559677182006836, 1.9548421646499634, 1.9558928606414796, 1.9595830995941161, 1.9542909908676147, 1.9583268686676025, 1.9573874398040771, 1.9573734212875367, 1.956038475189209, 1.9572998455047608, 1.95643936958313, 1.9555049303436278, 1.9551573079681397, 1.9559287934112548, 1.9554652740859986, 1.9546309524536132, 1.9547708898925782, 1.9570305030059814, 1.9546662924194336, 1.953575323562622, 1.9553636624526978, 1.954565380935669, 1.9541568119812012, 1.9543512627410888, 1.954592315673828, 1.9545559118652345, 1.9531384017562867, 1.9550698448944093, 1.955762207107544, 1.9552061297988892, 1.957028095779419 ], "train_acc": [ 0.23984, 0.24842, 0.2523, 0.25414, 0.25272, 0.25882, 0.257, 0.26044, 0.25976, 0.26, 0.26116, 0.2649, 0.26124, 0.2642, 0.26532, 0.26592, 0.26512, 0.26658, 0.26512, 0.2671, 0.2687, 0.26848, 0.26662, 0.26946, 0.26794, 0.26952, 0.26786, 0.26836, 0.26706, 0.27072, 0.26694, 0.26872, 0.2661, 0.26742, 0.26802, 0.26896, 0.26998, 0.27168, 0.2705, 0.27562, 0.27362, 0.27702, 0.27414, 0.2807, 0.28288, 0.2806, 0.28036, 0.28098, 0.28132, 0.28288, 0.28464, 0.28428, 0.28284, 0.28638, 0.28584, 0.28538, 0.28668, 0.28688, 0.28718, 0.2852, 0.28592, 0.28522, 0.28774, 0.29002, 0.28946, 0.28842, 0.28964, 0.29052, 0.29124, 0.29164, 0.29108, 0.29114, 0.28798, 0.28992, 0.28808, 0.29178, 0.28762, 0.28974, 0.29016, 0.28958, 0.29256, 0.29012, 0.29266, 0.29038, 0.2914, 0.2924, 0.2919, 0.2951, 0.2932, 0.29244, 0.29184, 0.2924, 0.29446, 0.2932, 0.29322, 0.29452, 0.29264, 0.29084, 0.29366, 0.2917 ], "test_acc": [ 0.2379, 0.2678, 0.2756, 0.2987, 0.2573, 0.2947, 0.2621, 0.2983, 0.2971, 0.2616, 0.278, 0.2983, 0.2803, 0.2915, 0.2714, 0.2835, 0.2837, 0.2794, 0.2915, 0.2982, 0.2854, 0.2997, 0.3019, 0.2841, 0.2873, 0.2874, 0.2676, 0.3023, 0.3033, 0.2965, 0.2888, 0.279, 0.3008, 0.2752, 0.2953, 0.3039, 0.3075, 0.3057, 0.2836, 0.2859, 0.303, 0.2871, 0.3052, 0.3119, 0.2982, 0.2954, 0.3026, 0.303, 0.3007, 0.3087, 0.3026, 0.301, 0.3082, 0.3071, 0.3137, 0.3006, 0.3102, 0.3033, 0.3079, 0.3136, 0.3092, 0.3083, 0.3181, 0.3098, 0.312, 0.312, 0.3052, 0.3092, 0.3124, 0.3069, 0.3038, 0.3079, 0.3117, 0.3054, 0.3065, 0.3056, 0.3086, 0.3103, 0.3038, 0.3132, 0.3157, 0.3131, 0.3092, 0.313, 0.3106, 0.3118, 0.3085, 0.3115, 0.3113, 0.3129, 0.3098, 0.3146, 0.3102, 0.3109, 0.3104, 0.3117, 0.3113, 0.3106, 0.3104, 0.3104 ], "value_loss": [ 0.4835468523311615, 0.17319115218162537, 0.12466768116235732, 0.1044780854511261, 0.11361225022792816, 0.09506864285826683, 0.08982749298095703, 0.06943095141410828, 0.06597960061311722, 0.0689908292388916, 0.05427408220410347, 0.048282792123556136, 0.04676814959049225, 0.04863041600465774, 0.0471925854742527, 0.043705004994869234, 0.0460531382226944, 0.03692107924818993, 0.03888409217596054, 0.03788371595621109, 0.03733079287290573, 0.0377624527490139, 0.036395574208498004, 0.03193316010415554, 0.03243833178460598, 0.027760677633285522, 0.029560993740558626, 0.029699042382240297, 0.02779862470269203, 0.02897036738872528, 0.025522839539051056, 0.02311282460749149, 0.020680676515102386, 0.023304677747488022, 0.022652746698856353, 0.019273730003237725, 0.018258913558125495, 0.02010319753885269, 0.01653825303465128, 0.02135470446884632, 0.018013720120489598, 0.016730768181085588, 0.01824077806353569, 0.013809284281134605, 0.01404231985926628, 0.016477530472278595, 0.01449635619878769, 0.013006495736837388, 0.013415186036229133, 0.011523299672305583, 0.01087947401329875, 0.0120885151720047, 0.011659734555482864, 0.009783919822871684, 0.009495561037063598, 0.01004114615738392, 0.009555040076076984, 0.009653655390739441, 0.009292597230225802, 0.009270159545093774, 0.008550122949182988, 0.00753715006917715, 0.007719495616853237, 0.006912159933894873, 0.006747392172813415, 0.007531150514781475, 0.006493680753260851, 0.006225158845484257, 0.006196837233901024, 0.006545155131220818, 0.005813424973487854, 0.0052813203772902485, 0.0056783805817365645, 0.005296767835021019, 0.005148515439927578, 0.004331958843171596, 0.00367335773833096, 0.003545896329060197, 0.0034597759203612802, 0.003181714376732707, 0.0032860505221784116, 0.002376726396679878, 0.002331429560147226, 0.002127379362359643, 0.0018355507389456033, 0.0019746782282367347, 0.0013750521056354046, 0.0016369795854389668, 0.0013883132124319672, 0.0014942838795110583, 0.0011334093083441258, 0.0013581191193312407, 0.0012651530192419886, 0.0013948661609459669, 0.00119701892176643, 0.0009705750445276499, 0.0009873379099927843, 0.0013789990733936428, 0.0015264763329923153, 0.0007223523693159222 ] }, "diagnostics": { "bp_cosine": [ 0.442160040140152, 0.011405838653445244, 0.021783415228128433, 0.02257826365530491, 0.022579727694392204, 0.022490674629807472, 0.022444019094109535, 0.02243717387318611, 0.02238454297184944, 0.021799881011247635, 0.021308548748493195, 0.021358368918299675 ], "perturbation_rho": [ -0.0024002324789762497, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -9.359791874885559e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -3.080349415540695e-06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -1.0516028851270676e-05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] } }, "drift": { "embed.weight": 185.7504766018605, "embed.bias": 113.97655387234977, "blocks.0.ln.weight": 8.006394857140304, "blocks.0.w1.weight": 201.9426375330318, "blocks.0.w1.bias": 163.53267733285352, "blocks.0.w2.weight": 338.84776840881347, "blocks.1.ln.weight": 6.295072957460427, "blocks.1.w1.weight": 219.06553999907572, "blocks.1.w1.bias": 226.32772829898, "blocks.1.w2.weight": 242.1925329344591, "blocks.2.ln.weight": 7.320912432081406, "blocks.2.w1.weight": 311.3035934820304, "blocks.2.w1.bias": 298.6852088590304, "blocks.2.w2.weight": 316.80472460197296, "blocks.3.ln.weight": 4.940329586675122, "blocks.3.w1.weight": 172.30509352305455, "blocks.3.w1.bias": 152.69976843471107, "blocks.3.w2.weight": 171.54613400302898, "blocks.4.ln.weight": 5.398528552340865, "blocks.4.w1.weight": 194.3066729117384, "blocks.4.w1.bias": 177.2111282722944, "blocks.4.w2.weight": 181.75464322675703, "blocks.5.ln.weight": 5.0186360723250045, "blocks.5.w1.weight": 177.28809608368013, "blocks.5.w1.bias": 166.1128575027424, "blocks.5.w2.weight": 177.87652026549083, "blocks.6.ln.weight": 5.11718383519975, "blocks.6.w1.weight": 175.68155404770292, "blocks.6.w1.bias": 165.18102396382997, "blocks.6.w2.weight": 188.26739446960036, "blocks.7.ln.weight": 5.749714981932067, "blocks.7.w1.weight": 211.62845167555633, "blocks.7.w1.bias": 194.987439334531, "blocks.7.w2.weight": 197.40821780414132, "blocks.8.ln.weight": 7.020310313763905, "blocks.8.w1.weight": 281.07720524059584, "blocks.8.w1.bias": 259.36087916311686, "blocks.8.w2.weight": 264.53573649142305, "blocks.9.ln.weight": 7.277383166194383, "blocks.9.w1.weight": 285.7959615127006, "blocks.9.w1.bias": 261.89392533705353, "blocks.9.w2.weight": 274.12202590162974, "blocks.10.ln.weight": 4.304915932630116, "blocks.10.w1.weight": 146.38313888426148, "blocks.10.w1.bias": 134.29068175155572, "blocks.10.w2.weight": 146.4223780813692, "blocks.11.ln.weight": 6.661402581393363, "blocks.11.w1.weight": 265.5729059266825, "blocks.11.w1.bias": 247.27216580071305, "blocks.11.w2.weight": 242.98119602092984, "out_ln.weight": 0.5446617517258924, "out_head.weight": 7.799632034433011, "out_head.bias": 1.2214285543387151 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 12, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 42 ], "gpu": 0, "output_dir": "results/cifar10", "num_classes": 10 } }