{ "123": { "bp": { "log": { "train_loss": [ 1.9175124251556397, 1.6847565829849243, 1.5875056425857543, 1.5320447119140626, 1.4794927943801879, 1.4405573056030274, 1.4091039984893798, 1.3804642078399658, 1.3562547276306152, 1.3386102033233642, 1.3113672603607178, 1.286414957962036, 1.2713352434539795, 1.2514976085662841, 1.2332095288848877, 1.2136467219924927, 1.2016698885345458, 1.1760129442214966, 1.1615581885910033, 1.1460976659965516, 1.1286324452972412, 1.1125253838348388, 1.0944270223999024, 1.0830238839530946, 1.0608218252563477, 1.0437702729034424, 1.034650561027527, 1.017014478340149, 0.9988842744445801, 0.9852388265800476, 0.9635365026664734, 0.9439176512908936, 0.9298832908248902, 0.9137922927856446, 0.895711201210022, 0.8814193804550171, 0.8632927577590942, 0.84351964012146, 0.827347836894989, 0.807900242767334, 0.7877964169311523, 0.7770450174331665, 0.7534891272926331, 0.7365407562255859, 0.7147518105125428, 0.6962322827911377, 0.6742078248596192, 0.6564239510726929, 0.6403258143234253, 0.6197586893653869, 0.6014538905525207, 0.583438274936676, 0.5667518968963623, 0.543176082239151, 0.5258174272155761, 0.5108640935707093, 0.4897696580505371, 0.47116634141922, 0.4534935041809082, 0.4354778845024109, 0.4233958884239197, 0.4017178301334381, 0.3859938202762604, 0.37423386340141296, 0.365246470451355, 0.3411486894798279, 0.32471628838539124, 0.31114961336135866, 0.29552998408317566, 0.28871005929946897, 0.27408093184471133, 0.26901549862384794, 0.2596221783256531, 0.24521093573570252, 0.2299592537355423, 0.22053928468227388, 0.21593001784324645, 0.1976856986284256, 0.19874527307510376, 0.19333338455200194, 0.18259587281227113, 0.17466963967323304, 0.1689953342151642, 0.16150579230308532, 0.15866700973510742, 0.15368373103141786, 0.1482925960588455, 0.145876254529953, 0.14030234585762025, 0.13952740331172944, 0.1361180233001709, 0.1323960340666771, 0.12677059319972991, 0.1287061265563965, 0.12679034420013427, 0.12853138402462005, 0.12579439376831056, 0.1280787334895134, 0.12339243181705475, 0.12544435278892518 ], "train_acc": [ 0.31434, 0.39008, 0.42376, 0.44654, 0.46472, 0.47872, 0.49158, 0.5009, 0.51142, 0.51944, 0.52706, 0.53622, 0.54168, 0.55052, 0.5568, 0.56322, 0.56372, 0.57526, 0.58298, 0.58918, 0.59476, 0.6007, 0.6078, 0.61058, 0.61816, 0.62692, 0.62922, 0.63428, 0.64188, 0.64736, 0.6547, 0.65824, 0.6673, 0.67046, 0.67872, 0.68352, 0.68988, 0.69742, 0.70294, 0.7099, 0.71534, 0.72286, 0.72898, 0.73446, 0.74268, 0.75076, 0.75844, 0.76398, 0.76912, 0.77878, 0.78504, 0.78992, 0.79944, 0.80564, 0.81262, 0.81906, 0.82502, 0.83208, 0.83826, 0.84468, 0.8507, 0.8589, 0.86356, 0.86656, 0.87174, 0.87936, 0.88406, 0.8908, 0.89792, 0.89858, 0.90396, 0.90662, 0.90894, 0.91456, 0.9191, 0.92516, 0.92578, 0.93306, 0.93206, 0.93384, 0.9388, 0.94064, 0.94322, 0.94482, 0.9463, 0.94904, 0.94962, 0.95136, 0.95286, 0.9532, 0.95498, 0.95586, 0.9589, 0.95728, 0.95824, 0.95676, 0.95896, 0.95834, 0.95978, 0.95964 ], "test_acc": [ 0.3978, 0.4369, 0.4561, 0.4846, 0.4943, 0.5129, 0.5144, 0.5192, 0.5235, 0.5332, 0.53, 0.5382, 0.5478, 0.5507, 0.5534, 0.5638, 0.5725, 0.5626, 0.572, 0.5735, 0.5778, 0.5778, 0.583, 0.5789, 0.5885, 0.589, 0.5849, 0.5957, 0.5916, 0.5872, 0.5864, 0.589, 0.599, 0.6012, 0.5912, 0.5967, 0.5973, 0.5923, 0.5983, 0.5947, 0.5966, 0.5996, 0.6007, 0.5935, 0.6005, 0.6016, 0.5972, 0.5976, 0.596, 0.5938, 0.5933, 0.598, 0.5987, 0.5998, 0.5914, 0.5916, 0.5988, 0.5984, 0.5936, 0.6002, 0.5917, 0.5921, 0.5944, 0.5968, 0.5925, 0.5974, 0.5946, 0.5979, 0.5923, 0.5956, 0.5968, 0.5956, 0.5974, 0.5934, 0.5943, 0.5954, 0.5982, 0.5923, 0.5921, 0.5937, 0.5937, 0.5941, 0.5921, 0.5957, 0.5953, 0.5939, 0.5939, 0.5965, 0.5952, 0.5957, 0.5951, 0.5976, 0.5967, 0.5968, 0.5974, 0.5965, 0.5973, 0.596, 0.5961, 0.5962 ] }, "diagnostics": { "bp_cosine": [ 0.9620110392570496, 0.9621291160583496, 0.9621908664703369, 0.9623005986213684, 0.9625044465065002, 0.9625605344772339, 0.9631243348121643, 0.9631022214889526, 0.9631184935569763, 0.9626430869102478, 0.9622764587402344, 0.9619318246841431 ], "perturbation_rho": [ 0.9879884719848633, 0.9869263172149658, 0.9891279935836792, 0.9888099431991577, 0.991609513759613, 0.9902887344360352, 0.9909973740577698, 0.9915982484817505, 0.9906468987464905, 0.9890569448471069, 0.9870684146881104, 0.9818294644355774 ], "nudging": { "0.001": [ -0.003427116898819804, -0.003351739142090082, -0.0033903690055012703, -0.003365215379744768, -0.0033891985658556223, -0.003362787188962102, -0.0032895321492105722, -0.0031716772355139256, -0.0029750647954642773, -0.002764828037470579, -0.0024368567392230034, -0.0021113622933626175 ], "0.003": [ -0.010271656326949596, -0.010045798495411873, -0.010160606354475021, -0.010086143389344215, -0.01015765406191349, -0.010078245773911476, -0.009858867153525352, -0.009506190195679665, -0.008917586877942085, -0.008288294076919556, -0.007305148057639599, -0.006330306641757488 ], "0.01": [ -0.03411904349923134, -0.033372972160577774, -0.033751748502254486, -0.03350646048784256, -0.0337451696395874, -0.03347958251833916, -0.03275400772690773, -0.03158621862530708, -0.029637902975082397, -0.02755369432270527, -0.024292215704917908, -0.02105848491191864 ] } }, "drift": { "embed.weight": 8.763637326480993, "embed.bias": 15.277378973045789, "blocks.0.ln.weight": 0.34908970813559786, "blocks.0.w1.weight": 4.164846741111791, "blocks.0.w1.bias": 6.735275454452179, "blocks.0.w2.weight": 10.512885267241659, "blocks.1.ln.weight": 0.2548678557191968, "blocks.1.w1.weight": 4.428344802990091, "blocks.1.w1.bias": 4.431127174572938, "blocks.1.w2.weight": 11.609675967743058, "blocks.2.ln.weight": 0.20993716494835368, "blocks.2.w1.weight": 4.563301300136555, "blocks.2.w1.bias": 4.053222361596439, "blocks.2.w2.weight": 12.283684374504883, "blocks.3.ln.weight": 0.22639993499269975, "blocks.3.w1.weight": 4.586109188420391, "blocks.3.w1.bias": 3.9811075138013527, "blocks.3.w2.weight": 12.651716892358182, "blocks.4.ln.weight": 0.23813753747592467, "blocks.4.w1.weight": 4.55512749423403, "blocks.4.w1.bias": 3.7036288780635465, "blocks.4.w2.weight": 12.900508521442045, "blocks.5.ln.weight": 0.24851322774648468, "blocks.5.w1.weight": 4.519407405633592, "blocks.5.w1.bias": 3.7828748042863825, "blocks.5.w2.weight": 12.877614228932648, "blocks.6.ln.weight": 0.24789524956961745, "blocks.6.w1.weight": 4.510086973031788, "blocks.6.w1.bias": 3.7520206765756337, "blocks.6.w2.weight": 13.18270185196777, "blocks.7.ln.weight": 0.27277168975906585, "blocks.7.w1.weight": 4.471720887903336, "blocks.7.w1.bias": 3.7457909142015353, "blocks.7.w2.weight": 13.30644187374482, "blocks.8.ln.weight": 0.29086480529883674, "blocks.8.w1.weight": 4.434570868617996, "blocks.8.w1.bias": 3.7342218578126882, "blocks.8.w2.weight": 13.49877934675731, "blocks.9.ln.weight": 0.2919660181755758, "blocks.9.w1.weight": 4.429555710823986, "blocks.9.w1.bias": 3.634447923096686, "blocks.9.w2.weight": 13.75719577660119, "blocks.10.ln.weight": 0.32005145624529063, "blocks.10.w1.weight": 4.353451334572149, "blocks.10.w1.bias": 3.4614471694540865, "blocks.10.w2.weight": 13.887069102514094, "blocks.11.ln.weight": 0.29895213239033414, "blocks.11.w1.weight": 4.374616657143753, "blocks.11.w1.bias": 3.645530912656648, "blocks.11.w2.weight": 14.561155498919536, "out_ln.weight": 0.283104664197929, "out_head.weight": 3.694886816637194, "out_head.bias": 1.105623778518022 } }, "dfa": { "log": { "train_loss": [ 2.0684899793243408, 2.0445925352478027, 2.03087772151947, 2.027939418258667, 2.0253660607528685, 2.0250345896148683, 2.022372142868042, 2.019951826019287, 2.017632607574463, 2.015866649131775, 2.017579344139099, 2.01485851020813, 2.012323605117798, 2.009420676612854, 2.0132182874298095, 2.007821100616455, 2.0097865366363528, 2.005040230484009, 2.004450204849243, 2.0059849935150145, 2.005384602432251, 2.001610414581299, 2.002629147567749, 2.0022453118896486, 1.9994831539154052, 1.9995977224349974, 2.0003068398284913, 2.0012258628082273, 1.9992249011611938, 1.9970151906967164, 1.9978694770812988, 1.997133782272339, 1.9935067112731935, 1.9952505539321899, 1.992918910446167, 1.9958944741058349, 1.9945134730529785, 1.993255687599182, 1.9926469972991943, 1.9950547982406617, 1.9904610315322877, 1.9907950922393798, 1.991843765411377, 1.9908243858337402, 1.9923807875823976, 1.9917906607055664, 1.992043903465271, 1.9904995797348022, 1.9916813136291505, 1.98937647026062, 1.9889434642791748, 1.9899712393188476, 1.9896988627624512, 1.9895934002304076, 1.9901937147521973, 1.9906840317535401, 1.9852267303466797, 1.989434090652466, 1.9889313174438477, 1.9886722135925292, 1.9877896743392944, 1.9861792268371583, 1.986029208984375, 1.9876557461547852, 1.985245605545044, 1.9858075296401978, 1.9867199410247802, 1.9870598261260985, 1.9854085816955567, 1.9867712688827515, 1.9855045788955688, 1.9881172052764893, 1.9837462771987915, 1.98582817527771, 1.9842846584320069, 1.9848911337280273, 1.9850436270904541, 1.9835600254821777, 1.9840570623779297, 1.9839281851196289, 1.984888575820923, 1.9857918256378173, 1.9845330112075805, 1.984420718612671, 1.9853396697998047, 1.9839463347625732, 1.9833207806396485, 1.9841535271453858, 1.9810106130218506, 1.9846471352386474, 1.9849586167144775, 1.984921664199829, 1.984304642715454, 1.9863978981781005, 1.9833829919052124, 1.984193635787964, 1.983270346107483, 1.9827691938018799, 1.9846319453430177, 1.9829401163101197 ], "train_acc": [ 0.2366, 0.24504, 0.25212, 0.25468, 0.25604, 0.2569, 0.25714, 0.2588, 0.25558, 0.2631, 0.2608, 0.26104, 0.26492, 0.26478, 0.26264, 0.26596, 0.26544, 0.267, 0.26848, 0.26756, 0.26702, 0.26954, 0.27278, 0.26886, 0.26902, 0.27146, 0.272, 0.2698, 0.2728, 0.27384, 0.2713, 0.27288, 0.27422, 0.2767, 0.2742, 0.2748, 0.27392, 0.27568, 0.27816, 0.27558, 0.27752, 0.27658, 0.27714, 0.277, 0.27766, 0.27532, 0.27622, 0.27806, 0.27688, 0.27908, 0.27896, 0.27908, 0.27972, 0.28032, 0.27848, 0.27914, 0.2816, 0.27856, 0.27972, 0.28028, 0.28068, 0.27928, 0.28124, 0.2814, 0.28118, 0.28066, 0.2815, 0.28218, 0.28352, 0.2822, 0.28114, 0.28234, 0.28204, 0.28104, 0.28, 0.2824, 0.28114, 0.28372, 0.282, 0.28204, 0.28208, 0.28162, 0.28212, 0.28526, 0.28178, 0.28234, 0.28358, 0.28328, 0.28346, 0.28396, 0.28374, 0.28334, 0.28204, 0.28406, 0.28382, 0.28466, 0.28292, 0.28436, 0.28206, 0.28276 ], "test_acc": [ 0.2589, 0.2617, 0.2631, 0.2816, 0.2556, 0.2607, 0.2876, 0.2818, 0.2763, 0.2847, 0.3005, 0.2738, 0.283, 0.2729, 0.2859, 0.2782, 0.3055, 0.2874, 0.2796, 0.3027, 0.2977, 0.3013, 0.2869, 0.2663, 0.2917, 0.2707, 0.2784, 0.3006, 0.2812, 0.2801, 0.2755, 0.2935, 0.3091, 0.3041, 0.2967, 0.3054, 0.3107, 0.2963, 0.2956, 0.2927, 0.2941, 0.2943, 0.2948, 0.3057, 0.3015, 0.3116, 0.2928, 0.301, 0.288, 0.296, 0.2909, 0.2957, 0.3145, 0.3124, 0.2994, 0.307, 0.3047, 0.3026, 0.2989, 0.2978, 0.3023, 0.2971, 0.3062, 0.3025, 0.2919, 0.309, 0.301, 0.2947, 0.3086, 0.2976, 0.3106, 0.3013, 0.3109, 0.3012, 0.3019, 0.2969, 0.3022, 0.3038, 0.3035, 0.3087, 0.2972, 0.2974, 0.2952, 0.3032, 0.3034, 0.3027, 0.3024, 0.3055, 0.3031, 0.3003, 0.3044, 0.3046, 0.3032, 0.3029, 0.303, 0.3028, 0.3038, 0.3032, 0.3035, 0.3034 ] }, "diagnostics": { "bp_cosine": [ 0.40911683440208435, 0.0002619648876134306, -0.00015980367606971413, 0.0005440536187961698, 0.0002772972220554948, 7.781770545989275e-05, -0.00020515912910923362, -0.00044000157504342496, -0.0008366729598492384, 0.00015155941946431994, 0.00032340025063604116, -0.00015023337618913502 ], "perturbation_rho": [ 0.0528201088309288, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -4.898756742477417e-07, 1.862645149230957e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, -1.862645149230957e-09, 0.0, 0.0, 0.0 ], "0.003": [ -1.2246891856193542e-06, 1.862645149230957e-09, -9.313225746154785e-10, 0.0, 0.0, 0.0, 0.0, 0.0, -1.862645149230957e-09, 0.0, 0.0, 0.0 ], "0.01": [ -4.1155144572257996e-06, -1.862645149230957e-09, -9.313225746154785e-10, 0.0, 0.0, 0.0, 0.0, 0.0, -2.7939677238464355e-09, 0.0, -9.313225746154785e-10, 0.0 ] } }, "drift": { "embed.weight": 323.8982252804048, "embed.bias": 232.81638531211948, "blocks.0.ln.weight": 10.852100889778994, "blocks.0.w1.weight": 272.36679039121384, "blocks.0.w1.bias": 238.87995630640614, "blocks.0.w2.weight": 445.2406120934057, "blocks.1.ln.weight": 9.73650143893558, "blocks.1.w1.weight": 390.9712215089673, "blocks.1.w1.bias": 374.17715191606453, "blocks.1.w2.weight": 403.2488589095519, "blocks.2.ln.weight": 6.710448026907898, "blocks.2.w1.weight": 227.28731670207446, "blocks.2.w1.bias": 202.7493867156122, "blocks.2.w2.weight": 223.99250691076898, "blocks.3.ln.weight": 7.215269500019514, "blocks.3.w1.weight": 231.09319791624182, "blocks.3.w1.bias": 206.9745974350102, "blocks.3.w2.weight": 238.74614111179253, "blocks.4.ln.weight": 9.257100922232066, "blocks.4.w1.weight": 374.01823924044805, "blocks.4.w1.bias": 343.71540244431617, "blocks.4.w2.weight": 350.8111852358107, "blocks.5.ln.weight": 6.914568252312619, "blocks.5.w1.weight": 266.9118711467473, "blocks.5.w1.bias": 256.9588103323234, "blocks.5.w2.weight": 254.31906752172955, "blocks.6.ln.weight": 8.82549425820829, "blocks.6.w1.weight": 354.28665902336076, "blocks.6.w1.bias": 332.44091471694884, "blocks.6.w2.weight": 326.29279154408147, "blocks.7.ln.weight": 10.262108389389345, "blocks.7.w1.weight": 411.01500781893094, "blocks.7.w1.bias": 383.25852137267697, "blocks.7.w2.weight": 398.26834704743106, "blocks.8.ln.weight": 9.486443170916516, "blocks.8.w1.weight": 379.7970569993528, "blocks.8.w1.bias": 353.44640446436694, "blocks.8.w2.weight": 354.75408312717866, "blocks.9.ln.weight": 7.225265383958218, "blocks.9.w1.weight": 280.98274227898526, "blocks.9.w1.bias": 264.21754537134655, "blocks.9.w2.weight": 250.42097452359232, "blocks.10.ln.weight": 9.12118778587681, "blocks.10.w1.weight": 363.4177719662398, "blocks.10.w1.bias": 333.2020904512465, "blocks.10.w2.weight": 343.55519901127, "blocks.11.ln.weight": 9.146084772655259, "blocks.11.w1.weight": 367.21625652465485, "blocks.11.w1.bias": 343.39432049385726, "blocks.11.w2.weight": 338.5639684764078, "out_ln.weight": 0.5993398286123665, "out_head.weight": 9.522011867407477, "out_head.bias": 0.44134062139959057 } }, "state_bridge": { "log": { "train_loss": [ 2.27535658454895, 2.2637348059844973, 2.23140262840271, 2.13100928276062, 2.1194422898101806, 2.113937710952759, 2.123109260482788, 2.123372416381836, 2.118385257644653, 2.123976169281006, 2.143634383087158, 2.15997088432312, 2.1503283737182617, 2.2361232402801514, 2.31340713142395, 2.312125205230713, 2.3117453997802735, 2.3094616239929198, 2.3084144255065917, 2.3107836222076417, 2.3105288831329345, 2.312015315246582, 2.311362181777954, 2.3104846384429933, 2.3100794078826903, 2.308620408859253, 2.2244751792907715, 2.1188239234924318, 2.099667515487671, 2.1012451152038576, 2.101906224517822, 2.1015794395446776, 2.102679093170166, 2.104404850845337, 2.105138458328247, 2.1025040253448486, 2.09926293258667, 2.0996690463256837, 2.0955256491851806, 2.0939024459075926, 2.0932679664611817, 2.0943772303771975, 2.087596756668091, 2.0909996266937254, 2.087642866668701, 2.089086704559326, 2.0858034885406496, 2.084843352355957, 2.081013270111084, 2.0763836125183106, 2.068111530685425, 2.0633422270965576, 2.059932788619995, 2.0572856521987917, 2.0567763134765626, 2.055301329345703, 2.0559660177230836, 2.0547456675720217, 2.0552883127593993, 2.052630202102661, 2.050533991241455, 2.0526472858428955, 2.051843546676636, 2.0524809063720704, 2.052277666931152, 2.049621379356384, 2.0498316369628906, 2.049651178665161, 2.0472222846221926, 2.0483968115997313, 2.04511710357666, 2.0473428889465333, 2.0471922763061525, 2.050198796348572, 2.0515007726287844, 2.051603550682068, 2.0523804613494874, 2.054355347518921, 2.055121799697876, 2.0543520391082764, 2.0561765496063233, 2.056192929840088, 2.054548904418945, 2.05620756149292, 2.055558791809082, 2.056474009552002, 2.055143079071045, 2.054688854446411, 2.0569355255126953, 2.0542632417297364, 2.054791463470459, 2.054189739532471, 2.0533234220123293, 2.0529643350982667, 2.053456902542114, 2.0533332372283937, 2.0545412349700927, 2.053972573928833, 2.0536360316467284, 2.053008867416382 ], "train_acc": [ 0.13698, 0.13998, 0.1447, 0.17058, 0.17036, 0.1725, 0.1677, 0.16766, 0.1698, 0.1709, 0.16482, 0.1638, 0.16334, 0.14304, 0.10524, 0.11206, 0.10998, 0.11288, 0.11528, 0.10822, 0.10712, 0.10462, 0.1037, 0.10238, 0.10366, 0.10334, 0.15168, 0.17212, 0.17798, 0.17688, 0.17846, 0.17562, 0.17644, 0.17718, 0.175, 0.17492, 0.1766, 0.17688, 0.17674, 0.18138, 0.18304, 0.17868, 0.18296, 0.18172, 0.18454, 0.18428, 0.18226, 0.18568, 0.18754, 0.19132, 0.2004, 0.20496, 0.207, 0.20808, 0.2054, 0.20596, 0.20646, 0.20616, 0.20466, 0.20608, 0.20848, 0.20616, 0.20746, 0.20588, 0.20528, 0.20778, 0.20856, 0.2078, 0.2101, 0.20888, 0.21296, 0.211, 0.20934, 0.20746, 0.20674, 0.20832, 0.20954, 0.20736, 0.20522, 0.20496, 0.20606, 0.20302, 0.20594, 0.20828, 0.2064, 0.20466, 0.20378, 0.20496, 0.20534, 0.20862, 0.20546, 0.20594, 0.20688, 0.20658, 0.20712, 0.20672, 0.20568, 0.20664, 0.20646, 0.20888 ], "test_acc": [ 0.1514, 0.1391, 0.1828, 0.1457, 0.1765, 0.186, 0.1602, 0.1723, 0.1754, 0.1714, 0.1724, 0.1634, 0.1615, 0.0959, 0.1252, 0.1087, 0.135, 0.1366, 0.1028, 0.1085, 0.1257, 0.114, 0.119, 0.1, 0.0848, 0.1194, 0.1607, 0.1795, 0.1859, 0.1635, 0.1571, 0.1682, 0.1748, 0.1717, 0.1789, 0.1658, 0.1673, 0.1783, 0.1799, 0.1761, 0.1812, 0.173, 0.1716, 0.164, 0.1657, 0.1769, 0.1728, 0.1726, 0.1801, 0.1758, 0.1873, 0.1862, 0.1948, 0.1935, 0.2009, 0.1933, 0.2102, 0.2094, 0.2153, 0.2097, 0.2054, 0.211, 0.2109, 0.1975, 0.2107, 0.2099, 0.2109, 0.202, 0.2055, 0.2103, 0.2068, 0.2068, 0.2085, 0.2085, 0.206, 0.203, 0.1998, 0.2021, 0.2092, 0.2039, 0.2034, 0.1976, 0.2064, 0.2098, 0.2078, 0.2045, 0.2078, 0.2055, 0.2068, 0.2065, 0.2075, 0.2084, 0.206, 0.2056, 0.2061, 0.2063, 0.2066, 0.2067, 0.2068, 0.2069 ], "state_pred_error": [ 0.3455641258764267, 0.1890164827811718, 0.06542741327524185, 0.15099643572807311, 0.15767600553512573, 0.14595494849205018, 0.09619720283508301, 0.05848943448066712, 0.04476255656838417, 0.03768930072784424, 0.034250264310240745, 0.02679455811023712, 0.024154067809581757, 0.020689564958810806, 0.015427032306194306, 0.01494347603648901, 0.012853515672385693, 0.00926094017356634, 0.00883663154706359, 0.00866620466351509, 0.008630412181615829, 0.009436789927184582, 0.010587773686945438, 0.006365314861536026, 0.0058888214336335655, 0.004059859301149845, 0.0059570299243927, 0.005231297912150622, 0.004334697146564722, 0.005451656972020865, 0.005537090619504452, 0.006261329069137574, 0.006663460256308317, 0.0068712751638889315, 0.006620877954363823, 0.0059924150297045705, 0.004774981212168932, 0.0035280540695041417, 0.003671990767121315, 0.0035207420617341997, 0.0030331813983619214, 0.0031412731628119943, 0.0028461132158339023, 0.002806654215082526, 0.0028670129170268776, 0.0030720302928984164, 0.0032383741122484207, 0.002952979260608554, 0.002582101986259222, 0.0024391376911848785, 0.002423995024561882, 0.002365549064427614, 0.002312273128144443, 0.0020981324925273656, 0.0018509870688617229, 0.001701984341070056, 0.001557768930643797, 0.001504055576622486, 0.0015004488579928876, 0.0016905955363065005, 0.001851444918513298, 0.002072783012315631, 0.0021090806840360164, 0.0020937418549507856, 0.001958419643007219, 0.0018501618901640177, 0.0017675739562511444, 0.001684609704464674, 0.0016207635071873664, 0.0015579476598650216, 0.0014976035876572132, 0.0014524117913842201, 0.0013800759248435498, 0.001322413182966411, 0.0012982203678414226, 0.0012594390138238667, 0.0012120740934088827, 0.0011591399506293237, 0.001117924986295402, 0.0010595228926092387, 0.0010102490696310997, 0.0009533731169998645, 0.0009156427671574056, 0.0008670865286141634, 0.0008243481399863959, 0.0007827390401065349, 0.0007445751608535648, 0.0007058267378434539, 0.0006572319846227765, 0.0006192173832282424, 0.0005905027001723647, 0.0005582181675359607, 0.0005225332551077009, 0.0004948109107278287, 0.0004635604086332023, 0.0004460584534611553, 0.00041995075650513175, 0.00039428566612303257, 0.0003732312531303614, 0.0003609425350651145 ] }, "diagnostics": { "bp_cosine": [ 0.13039325177669525, -0.0001226231688633561, -6.530806422233582e-05, 0.0008607044583186507, 0.00019595431513153017, 0.0003264691913500428, 0.0007734490791335702, 0.00040342434658668935, 0.0006691448506899178, 0.0006843262817710638, 0.0009011077927425504, 0.0007364039774984121 ], "perturbation_rho": [ 0.06105021387338638, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -8.485279977321625e-06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -2.5329645723104477e-05, 9.313225746154785e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -8.417712524533272e-05, -4.190951585769653e-09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] } }, "drift": { "embed.weight": 18.244614908467394, "embed.bias": 91.4065704680882, "blocks.0.ln.weight": 2.7002334851153766, "blocks.0.w1.weight": 134.61543991177393, "blocks.0.w1.bias": 122.71752984768428, "blocks.0.w2.weight": 276.02165008885817, "blocks.1.ln.weight": 6.996325721977635, "blocks.1.w1.weight": 316.6573873211569, "blocks.1.w1.bias": 288.7266985364082, "blocks.1.w2.weight": 232.96436903686606, "blocks.2.ln.weight": 3.005190384482946, "blocks.2.w1.weight": 113.28816941109099, "blocks.2.w1.bias": 102.79639141280903, "blocks.2.w2.weight": 154.79558550064107, "blocks.3.ln.weight": 3.854659793583277, "blocks.3.w1.weight": 136.45977626032953, "blocks.3.w1.bias": 125.02248154351406, "blocks.3.w2.weight": 160.12595576311708, "blocks.4.ln.weight": 5.321574474789146, "blocks.4.w1.weight": 200.03582097403066, "blocks.4.w1.bias": 185.1705216854366, "blocks.4.w2.weight": 197.8192680660012, "blocks.5.ln.weight": 3.689939791539998, "blocks.5.w1.weight": 121.91986650696485, "blocks.5.w1.bias": 112.80564875251632, "blocks.5.w2.weight": 175.23886752618034, "blocks.6.ln.weight": 5.257637367329094, "blocks.6.w1.weight": 159.5448554465857, "blocks.6.w1.bias": 148.9053783966513, "blocks.6.w2.weight": 146.5770282072606, "blocks.7.ln.weight": 4.684853931243148, "blocks.7.w1.weight": 133.95190141354294, "blocks.7.w1.bias": 120.52600626182299, "blocks.7.w2.weight": 137.015420718898, "blocks.8.ln.weight": 4.553687541635819, "blocks.8.w1.weight": 134.4598258206248, "blocks.8.w1.bias": 124.54115675222299, "blocks.8.w2.weight": 138.93702924685354, "blocks.9.ln.weight": 4.188852950738847, "blocks.9.w1.weight": 128.35707494719534, "blocks.9.w1.bias": 120.498165463794, "blocks.9.w2.weight": 149.134498305582, "blocks.10.ln.weight": 3.3037616990170426, "blocks.10.w1.weight": 108.25092049032806, "blocks.10.w1.bias": 101.78620102240454, "blocks.10.w2.weight": 127.47031512506157, "blocks.11.ln.weight": 1.6054786857904342, "blocks.11.w1.weight": 50.83956015087797, "blocks.11.w1.bias": 49.1835893514986, "blocks.11.w2.weight": 90.71530778227628, "out_ln.weight": 0.5849072301486865, "out_head.weight": 3.217267238682831, "out_head.bias": 0.8024946363335762 } }, "credit_bridge": { "log": { "train_loss": [ 2.07422056892395, 2.055305141906738, 2.0377359949493408, 2.0334118033599853, 2.034562978172302, 2.0315364552307127, 2.0276041582489013, 2.029994778060913, 2.025310488204956, 2.0206511740875244, 2.024435912742615, 2.017680696372986, 2.014923624572754, 2.015591604614258, 2.0193257177734374, 2.0126227207946776, 2.013033943634033, 2.0076499520111084, 2.0094668504333497, 2.0096006536865234, 2.0050730683135987, 2.006946638031006, 2.0071442542266844, 2.004831351776123, 2.0035909980010986, 2.004108156204224, 2.0006491820907595, 2.0016160436248778, 1.9999982108306884, 1.9992566723251344, 1.9979173023986816, 1.996204802093506, 1.9980539007568359, 1.995016636199951, 1.9975717867279053, 1.9963324966812135, 1.9947675510406495, 1.9942235395812988, 1.995222140235901, 1.9917342311096191, 1.9899134133148193, 1.988487755279541, 1.9872248657608031, 1.9865933574676513, 1.9852813260650635, 1.9867496614837648, 1.9831518542480469, 1.9813233506011962, 1.9796981923675536, 1.9797288468933105, 1.9774669593811036, 1.9774521997833252, 1.9714781398773193, 1.9715750045013427, 1.9715392060089112, 1.970840647201538, 1.9684521988296508, 1.9670102074813842, 1.9633512356948852, 1.9662449013900758, 1.9640194422149657, 1.9607671911239624, 1.9630818260955811, 1.9602737934112549, 1.960026322631836, 1.961152883758545, 1.9590496487426758, 1.9572670712280273, 1.9577932699966432, 1.957121894493103, 1.9570679434585572, 1.954615853881836, 1.9549290727996826, 1.9529239632415771, 1.9538047943115235, 1.9561965101623535, 1.9530966287994385, 1.9537969312286376, 1.9531251779174805, 1.9546874990463257, 1.9529049239730836, 1.9550184294891357, 1.9533232469940185, 1.9538247448730468, 1.9541607789611817, 1.954350821533203, 1.9529511869049072, 1.9544397570037841, 1.9555162839126587, 1.9529233142089844, 1.9550124865722656, 1.954115503501892, 1.9515360607910157, 1.9521209592056274, 1.9523113599014281, 1.9537422107696534, 1.953715394668579, 1.952323772354126, 1.9519077111434937, 1.9538698761367799 ], "train_acc": [ 0.2349, 0.23648, 0.24714, 0.25066, 0.24922, 0.2532, 0.25626, 0.25148, 0.2532, 0.26078, 0.25636, 0.2586, 0.26336, 0.26146, 0.25874, 0.26418, 0.2629, 0.26778, 0.26784, 0.26732, 0.26768, 0.26668, 0.2681, 0.26688, 0.26936, 0.26936, 0.2677, 0.2705, 0.2677, 0.2709, 0.27164, 0.27174, 0.27098, 0.27192, 0.27154, 0.26932, 0.27164, 0.26854, 0.26818, 0.27076, 0.26892, 0.26664, 0.27098, 0.2697, 0.2714, 0.2725, 0.27024, 0.27174, 0.27278, 0.26878, 0.27302, 0.27324, 0.27562, 0.2744, 0.27374, 0.2738, 0.27576, 0.27626, 0.2782, 0.27834, 0.27942, 0.27984, 0.28104, 0.27978, 0.28036, 0.281, 0.28012, 0.28318, 0.28276, 0.28262, 0.28174, 0.28244, 0.28384, 0.28378, 0.28154, 0.2809, 0.28316, 0.2827, 0.2864, 0.2831, 0.2849, 0.28526, 0.28446, 0.28448, 0.28456, 0.28378, 0.28358, 0.28354, 0.2834, 0.2829, 0.28564, 0.28302, 0.28616, 0.28478, 0.2849, 0.28396, 0.28816, 0.28346, 0.28456, 0.28572 ], "test_acc": [ 0.2422, 0.2524, 0.2511, 0.2709, 0.2522, 0.2695, 0.2654, 0.2622, 0.282, 0.2861, 0.259, 0.2868, 0.2668, 0.2736, 0.2902, 0.2962, 0.3035, 0.2747, 0.296, 0.2894, 0.2905, 0.2902, 0.3018, 0.2788, 0.2989, 0.2832, 0.3054, 0.2928, 0.2921, 0.2723, 0.29, 0.281, 0.2819, 0.2924, 0.3021, 0.291, 0.2721, 0.2887, 0.2827, 0.2766, 0.2938, 0.2976, 0.2883, 0.2888, 0.3015, 0.2923, 0.2893, 0.2859, 0.2876, 0.2915, 0.2857, 0.2848, 0.2936, 0.2842, 0.2815, 0.2766, 0.2905, 0.2933, 0.2846, 0.2876, 0.2872, 0.2876, 0.293, 0.2942, 0.2917, 0.2816, 0.2931, 0.2874, 0.2906, 0.2935, 0.2918, 0.2838, 0.2872, 0.29, 0.2891, 0.2893, 0.2908, 0.2873, 0.293, 0.292, 0.286, 0.286, 0.2872, 0.2867, 0.2876, 0.2865, 0.2841, 0.2826, 0.2844, 0.2853, 0.2866, 0.2887, 0.2856, 0.2867, 0.2882, 0.2895, 0.2885, 0.2885, 0.2885, 0.2885 ], "value_loss": [ 0.46219210285663603, 0.16240292426109315, 0.11675834127902984, 0.10173126588344573, 0.10192921797513962, 0.08491676461458206, 0.08081110213756561, 0.10098561144590378, 0.086660576441288, 0.07095537901163101, 0.07209414057731628, 0.06507166877388953, 0.05680496859550476, 0.051555730621814726, 0.05897924602746964, 0.0477625340873003, 0.050076086919903756, 0.04791341652750969, 0.043811181032657624, 0.048990424308776856, 0.041765395416021346, 0.04788978707790375, 0.038938788844347, 0.038173083332777025, 0.037605566675663, 0.03472667615830898, 0.029743025472164154, 0.03321148899495602, 0.031504894320964816, 0.028381420345902443, 0.02973802535891533, 0.025553143047094346, 0.028812745112776757, 0.026098545892238617, 0.02787227361112833, 0.022305913635492326, 0.02363199061870575, 0.021854550403952597, 0.02323986495792866, 0.018420420945882796, 0.018242734627723693, 0.019795424582660197, 0.01764130767583847, 0.01667629898786545, 0.016429091787040235, 0.015772414491176605, 0.014359855057001113, 0.012779874252080917, 0.012927391214668751, 0.014349255759716033, 0.013130034263134003, 0.013914088915586471, 0.010768152612149716, 0.012323264547288418, 0.012266730073690415, 0.012296598086953162, 0.011092334405183792, 0.008943616542220116, 0.009557433066666126, 0.008033960376381873, 0.008238149175047874, 0.0075173489648103714, 0.009243258455693721, 0.008397357228696346, 0.008250873034894466, 0.009054240943193436, 0.0061908810329437255, 0.007204210565388202, 0.006787694528698921, 0.006576583880782127, 0.0068760585397481915, 0.00587797952502966, 0.006058499993383884, 0.004864574173986912, 0.005336316513419152, 0.004476593678146601, 0.00504198596701026, 0.00414283695474267, 0.003692763058245182, 0.0036398935145139696, 0.0031052616691589355, 0.003147630747780204, 0.002547671852298081, 0.0023914932864904405, 0.0022162304655462504, 0.0017571020238101483, 0.0018844479297846555, 0.0015003561322391033, 0.001468994250819087, 0.0015521602664142846, 0.0010236410408467054, 0.000977659215182066, 0.001276740662381053, 0.0008685083091259003, 0.0012216014919430019, 0.001092172961011529, 0.0008087569988891483, 0.0009069699543341994, 0.0013558788930997253, 0.0006715716527029872 ] }, "diagnostics": { "bp_cosine": [ 0.37664300203323364, 0.00668198149651289, 0.02027757838368416, 0.02049040049314499, 0.020580384880304337, 0.020434698089957237, 0.020465239882469177, 0.021316751837730408, 0.021797576919198036, 0.021945470944046974, 0.021979298442602158, 0.021852022036910057 ], "perturbation_rho": [ 0.009359830990433693, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -9.862706065177917e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -2.905726432800293e-06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -9.72812995314598e-06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] } }, "drift": { "embed.weight": 179.58500900515028, "embed.bias": 134.71300218044718, "blocks.0.ln.weight": 9.192845521766614, "blocks.0.w1.weight": 201.0064270139136, "blocks.0.w1.bias": 136.56099913744478, "blocks.0.w2.weight": 299.7118104200996, "blocks.1.ln.weight": 6.775393287001583, "blocks.1.w1.weight": 298.99303772053656, "blocks.1.w1.bias": 288.6803183648879, "blocks.1.w2.weight": 299.96832262513726, "blocks.2.ln.weight": 4.442030759950682, "blocks.2.w1.weight": 156.3224513959878, "blocks.2.w1.bias": 134.77200050699193, "blocks.2.w2.weight": 164.77485249426002, "blocks.3.ln.weight": 4.854857462306176, "blocks.3.w1.weight": 165.45425459739124, "blocks.3.w1.bias": 143.7040311765167, "blocks.3.w2.weight": 178.2893036667054, "blocks.4.ln.weight": 6.433765762816246, "blocks.4.w1.weight": 262.9945171233052, "blocks.4.w1.bias": 237.2497554637253, "blocks.4.w2.weight": 247.70202715443386, "blocks.5.ln.weight": 4.669370190359616, "blocks.5.w1.weight": 179.65430058156437, "blocks.5.w1.bias": 167.17352257399838, "blocks.5.w2.weight": 176.56809805245783, "blocks.6.ln.weight": 5.836574580577738, "blocks.6.w1.weight": 236.71076201812485, "blocks.6.w1.bias": 216.59863578081908, "blocks.6.w2.weight": 222.1449202786447, "blocks.7.ln.weight": 7.017034323466784, "blocks.7.w1.weight": 283.45578137085835, "blocks.7.w1.bias": 258.2162159056869, "blocks.7.w2.weight": 275.54620177391195, "blocks.8.ln.weight": 6.320927520653432, "blocks.8.w1.weight": 252.95263320055057, "blocks.8.w1.bias": 230.26130735012416, "blocks.8.w2.weight": 239.07712197948655, "blocks.9.ln.weight": 4.771737132124388, "blocks.9.w1.weight": 184.2226928948631, "blocks.9.w1.bias": 168.12677483943122, "blocks.9.w2.weight": 169.7918496964596, "blocks.10.ln.weight": 6.193554347477001, "blocks.10.w1.weight": 248.40930737157998, "blocks.10.w1.bias": 221.7518821584096, "blocks.10.w2.weight": 238.1444968107213, "blocks.11.ln.weight": 5.976649802588373, "blocks.11.w1.weight": 240.99115354219526, "blocks.11.w1.bias": 220.01049332622438, "blocks.11.w2.weight": 226.72197924893874, "out_ln.weight": 0.47882108182026845, "out_head.weight": 7.4188430237353336, "out_head.bias": 1.3782394013786212 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 12, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 123 ], "gpu": 0, "output_dir": "results/cifar10_seed123", "num_classes": 10 } }