{ "bp": { "log": { "train_loss": [ 1.9181581103515626, 1.6830080932235718, 1.5920702320480347, 1.5328609270477296, 1.4799005626678468, 1.443107092781067, 1.4138772471618652, 1.3873612524032592, 1.3651276648712158, 1.3390819979095459, 1.3217692392349243, 1.305022211074829, 1.2817235651779175, 1.2682050260925293, 1.2521741982269288, 1.2378110882568358, 1.215573044204712, 1.2035384091949464, 1.1932872578430176, 1.1754147102737427, 1.1641269732284545, 1.1506621165275575, 1.1339097010803223, 1.1212864548492432, 1.1109269207000732, 1.0991801218032837, 1.085493840484619, 1.068724670715332, 1.0622537975883484, 1.0497802551078796, 1.0335843839645387, 1.0245532283782959, 1.0139307324409486, 1.003597820968628, 0.9886502099990845, 0.9805063750457763, 0.9631068154907226, 0.9566182117843628, 0.9359624940299988, 0.9330330731201172, 0.9160753777313232, 0.9056328008651734, 0.8898537806510926, 0.8787901188278199, 0.8694718393707276, 0.8506128107833862, 0.8468854373931884, 0.8328564296150207, 0.8235082776260376, 0.8091592510604858, 0.7912276449775696, 0.7819558120727539, 0.7648613720703125, 0.7557380415725709, 0.7431310074996949, 0.7325722367095947, 0.7191381365394592, 0.7073116994094849, 0.6935642263793945, 0.6829617013549805, 0.6721186479949951, 0.6607764552879334, 0.6520131350326538, 0.6347136948776245, 0.6286079556655884, 0.6146584116744995, 0.6037020747566223, 0.5897762714195252, 0.5843867614936828, 0.57075146068573, 0.5668514904212951, 0.5526476261138916, 0.5426406643104553, 0.5337510031700134, 0.524534646692276, 0.5152219123649597, 0.508841796541214, 0.5018864378547668, 0.49528331829071043, 0.4755337562465668, 0.47835412044525144, 0.47154994369506836, 0.4639086106681824, 0.4569279855918884, 0.45118384454727173, 0.4504211899662018, 0.44511490434646606, 0.44647758895874023, 0.4362948834133148, 0.43578986066818237, 0.42930271067619324, 0.4292936919593811, 0.42567773310661317, 0.4261182806301117, 0.4239413748073578, 0.42333943349838254, 0.42293740759849546, 0.4217962563323975, 0.4224112439918518, 0.41819300340652465 ], "train_acc": [ 0.3148, 0.3896, 0.4219, 0.4456, 0.4649, 0.47824, 0.48992, 0.49962, 0.50886, 0.51698, 0.5202, 0.52942, 0.5382, 0.5446, 0.55176, 0.5529, 0.56062, 0.56588, 0.57028, 0.577, 0.58132, 0.58658, 0.59166, 0.5987, 0.59994, 0.60574, 0.6103, 0.61766, 0.61624, 0.62304, 0.62624, 0.63198, 0.63774, 0.6413, 0.64644, 0.64766, 0.65282, 0.6553, 0.66614, 0.66296, 0.67122, 0.67416, 0.68156, 0.68518, 0.6881, 0.69356, 0.69534, 0.70084, 0.70508, 0.7084, 0.71508, 0.72034, 0.72434, 0.72938, 0.73464, 0.73592, 0.7404, 0.74552, 0.75048, 0.75408, 0.75802, 0.76272, 0.76562, 0.77362, 0.77548, 0.77904, 0.78336, 0.78934, 0.79158, 0.79514, 0.79768, 0.80414, 0.80546, 0.80986, 0.81272, 0.8163, 0.81728, 0.82112, 0.82318, 0.83366, 0.83042, 0.83306, 0.836, 0.83884, 0.84078, 0.83852, 0.84302, 0.8422, 0.84388, 0.84512, 0.84892, 0.85022, 0.84986, 0.85088, 0.85284, 0.8506, 0.85018, 0.85162, 0.85258, 0.85238 ], "test_acc": [ 0.3995, 0.428, 0.4626, 0.4828, 0.4996, 0.4961, 0.5122, 0.5214, 0.5273, 0.5318, 0.5434, 0.5431, 0.5502, 0.5495, 0.5558, 0.561, 0.5593, 0.5638, 0.5727, 0.5612, 0.5661, 0.5729, 0.5769, 0.5734, 0.5798, 0.5882, 0.5883, 0.5755, 0.5828, 0.5873, 0.597, 0.5833, 0.5976, 0.5915, 0.5937, 0.5918, 0.5933, 0.5934, 0.5907, 0.5972, 0.5938, 0.5974, 0.5929, 0.5938, 0.6001, 0.5933, 0.6036, 0.5987, 0.5999, 0.6037, 0.594, 0.5996, 0.598, 0.6017, 0.597, 0.6042, 0.6017, 0.5988, 0.6004, 0.6015, 0.5984, 0.6042, 0.6041, 0.6052, 0.5989, 0.605, 0.6022, 0.6055, 0.6057, 0.6064, 0.6051, 0.6055, 0.6057, 0.6056, 0.6008, 0.6045, 0.6039, 0.6033, 0.6037, 0.6022, 0.6002, 0.6018, 0.5997, 0.6029, 0.6038, 0.601, 0.6044, 0.6028, 0.603, 0.6031, 0.6026, 0.6029, 0.6016, 0.6033, 0.6014, 0.6027, 0.6025, 0.602, 0.6014, 0.6015 ] }, "diagnostics": { "bp_cosine": [ 0.9925569295883179, 0.9925950765609741, 0.9925851225852966, 0.9926368594169617, 0.992660403251648, 0.9924540519714355 ], "perturbation_rho": [ 0.9874800443649292, 0.9890985488891602, 0.991584300994873, 0.9924823641777039, 0.9907411336898804, 0.9890323877334595 ], "nudging": { "0.001": [ -0.0019930435810238123, -0.002028408693149686, -0.002009383402764797, -0.001996344421058893, -0.0018836274975910783, -0.001594579080119729 ], "0.003": [ -0.00597399240359664, -0.006079169921576977, -0.006022875662893057, -0.005983929615467787, -0.005646158009767532, -0.004780753515660763 ], "0.01": [ -0.01984817534685135, -0.020196668803691864, -0.020013831555843353, -0.019886385649442673, -0.018769418820738792, -0.015900740399956703 ] } }, "drift": { "embed.weight": 8.830199479874222, "embed.bias": 13.652383066527548, "blocks.0.ln.weight": 0.3209315667509576, "blocks.0.w1.weight": 4.304189279431552, "blocks.0.w1.bias": 6.874941583705022, "blocks.0.w2.weight": 11.040131085404404, "blocks.1.ln.weight": 0.19033462322360514, "blocks.1.w1.weight": 4.611319361803835, "blocks.1.w1.bias": 4.589828072495789, "blocks.1.w2.weight": 12.410841455300883, "blocks.2.ln.weight": 0.17767497411972724, "blocks.2.w1.weight": 4.66461449969762, "blocks.2.w1.bias": 4.221528366446113, "blocks.2.w2.weight": 13.02617784277652, "blocks.3.ln.weight": 0.18648530933637847, "blocks.3.w1.weight": 4.703468866414805, "blocks.3.w1.bias": 3.845782047024037, "blocks.3.w2.weight": 13.668238845356765, "blocks.4.ln.weight": 0.20878906370184375, "blocks.4.w1.weight": 4.6585385757744255, "blocks.4.w1.bias": 3.740256675221265, "blocks.4.w2.weight": 14.188102590431034, "blocks.5.ln.weight": 0.21537598403409916, "blocks.5.w1.weight": 4.700384882175978, "blocks.5.w1.bias": 3.7260920466734655, "blocks.5.w2.weight": 15.8432281824125, "out_ln.weight": 0.3676580083270373, "out_head.weight": 2.951732465896682, "out_head.bias": 1.3797369883266803 } }, "dfa": { "log": { "train_loss": [ 2.0429981646728517, 2.0311185948181154, 2.025969026145935, 2.0156248236846923, 2.012451182785034, 2.0101683282852174, 2.0090535586547853, 2.0049661489105226, 2.0042781643676757, 2.007534557952881, 2.005720973892212, 2.0033944567108155, 2.0026611005401613, 2.0042629623413086, 2.0030657132339478, 2.0019637285614014, 2.0002238693237304, 2.0020113787841796, 2.002593652191162, 1.999959507446289, 1.99915257938385, 1.996764479637146, 1.99686444190979, 1.9965196546936035, 1.9979205041503907, 1.9956562859344482, 1.9973748725128173, 1.9964571334075927, 1.9960263302993775, 1.9924271702575684, 1.992831787261963, 1.99499480758667, 1.9891729098892212, 1.9939897597503662, 1.9930099172210693, 1.993308459815979, 1.9917978497314452, 1.9914746307754516, 1.9900447463989257, 1.992962121963501, 1.9900524688720702, 1.9900013018798828, 1.990018187599182, 1.9914000466537476, 1.9891149829864503, 1.9894212562561036, 1.99083076171875, 1.9897665852355957, 1.98873883934021, 1.990058041343689, 1.987586608581543, 1.987379070777893, 1.9863710124206544, 1.988468872642517, 1.9863781386947632, 1.9846030602264404, 1.986063505783081, 1.9875353760147094, 1.9865796419525146, 1.9875003507995606, 1.9842604379272462, 1.9855676065444947, 1.9839949224472047, 1.985175651473999, 1.9853779614639282, 1.9842977197265625, 1.9852548834228516, 1.9850790433120729, 1.983184485321045, 1.9850950769805908, 1.9860374071502687, 1.985449473876953, 1.986313660736084, 1.9834488523864746, 1.9854728340911865, 1.9834792975616455, 1.9839858917999267, 1.983295297241211, 1.9832000505065919, 1.9842015452575683, 1.9817747521209716, 1.9825036289215088, 1.983466981277466, 1.9826897898864746, 1.9832522836303712, 1.9837559247589112, 1.9846134539031983, 1.980646923828125, 1.9809106316375733, 1.9838191221618653, 1.981862756576538, 1.9802230101013183, 1.9814140343475342, 1.9822363115692139, 1.982738264541626, 1.9809983926773072, 1.9829246353912353, 1.981134694480896, 1.9824947088241578, 1.9818510884094238 ], "train_acc": [ 0.25012, 0.2569, 0.25934, 0.26228, 0.26296, 0.26604, 0.2663, 0.26786, 0.26776, 0.26536, 0.26794, 0.2679, 0.27008, 0.26912, 0.27114, 0.27122, 0.27314, 0.27074, 0.26774, 0.26882, 0.2714, 0.27276, 0.27218, 0.2744, 0.27288, 0.27368, 0.27384, 0.27596, 0.27198, 0.27772, 0.27426, 0.27528, 0.27714, 0.2757, 0.27328, 0.27562, 0.27496, 0.27752, 0.27654, 0.27576, 0.27678, 0.2766, 0.27842, 0.2765, 0.28062, 0.2769, 0.27744, 0.27504, 0.27708, 0.2794, 0.27856, 0.27826, 0.28152, 0.2805, 0.27904, 0.28034, 0.28012, 0.27994, 0.27844, 0.27932, 0.28254, 0.28096, 0.28152, 0.2795, 0.28278, 0.28194, 0.28228, 0.28134, 0.28312, 0.28172, 0.2811, 0.28118, 0.2794, 0.28338, 0.2802, 0.2814, 0.28282, 0.28256, 0.2834, 0.28248, 0.28152, 0.28336, 0.28338, 0.28288, 0.28162, 0.28292, 0.28282, 0.2848, 0.28472, 0.28266, 0.28232, 0.2875, 0.28232, 0.28272, 0.28286, 0.28446, 0.28254, 0.28228, 0.28414, 0.28394 ], "test_acc": [ 0.2768, 0.2776, 0.2962, 0.2815, 0.2956, 0.2956, 0.2961, 0.2963, 0.3082, 0.2895, 0.2713, 0.2959, 0.299, 0.2984, 0.2889, 0.3083, 0.2967, 0.2921, 0.2979, 0.3049, 0.2897, 0.2956, 0.308, 0.2866, 0.2924, 0.2989, 0.2996, 0.3051, 0.2983, 0.3066, 0.2983, 0.3082, 0.3046, 0.2948, 0.3114, 0.2894, 0.3002, 0.298, 0.3016, 0.2936, 0.3076, 0.3011, 0.2884, 0.2918, 0.3046, 0.2889, 0.3154, 0.3042, 0.2921, 0.3109, 0.283, 0.3003, 0.2988, 0.3024, 0.2983, 0.295, 0.304, 0.3112, 0.3015, 0.3044, 0.314, 0.3058, 0.3094, 0.3042, 0.3112, 0.3133, 0.3064, 0.2975, 0.2975, 0.3004, 0.3054, 0.3134, 0.3093, 0.3082, 0.3084, 0.3096, 0.3041, 0.3089, 0.3033, 0.3073, 0.311, 0.3131, 0.3036, 0.3127, 0.3087, 0.3117, 0.3102, 0.3056, 0.3102, 0.3087, 0.3107, 0.3099, 0.3092, 0.3094, 0.3093, 0.3102, 0.3092, 0.31, 0.3098, 0.3098 ] }, "diagnostics": { "bp_cosine": [ 0.38683176040649414, 0.0029573289211839437, -0.0009689683793112636, -0.0011474918574094772, 0.0005293102003633976, -0.0015941932797431946 ], "perturbation_rho": [ -0.0035741720348596573, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -3.972090780735016e-07, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.2861564755439758e-06, -1.862645149230957e-09, 3.725290298461914e-09, 0.0, 0.0, -1.862645149230957e-09 ], "0.01": [ -4.382338374853134e-06, -4.6566128730773926e-09, 3.725290298461914e-09, 0.0, 9.313225746154785e-10, -1.862645149230957e-09 ] } }, "drift": { "embed.weight": 317.7495659655673, "embed.bias": 246.61272235367505, "blocks.0.ln.weight": 8.188531285985507, "blocks.0.w1.weight": 202.7185165753587, "blocks.0.w1.bias": 170.46943772700087, "blocks.0.w2.weight": 332.85691144395827, "blocks.1.ln.weight": 6.620851917635279, "blocks.1.w1.weight": 230.61620075220995, "blocks.1.w1.bias": 215.19134278855063, "blocks.1.w2.weight": 203.35112374907072, "blocks.2.ln.weight": 7.98453379220575, "blocks.2.w1.weight": 315.5497282597786, "blocks.2.w1.bias": 271.50424171303735, "blocks.2.w2.weight": 248.3335414952481, "blocks.3.ln.weight": 5.77177430564541, "blocks.3.w1.weight": 199.54069059972556, "blocks.3.w1.bias": 166.19848046359377, "blocks.3.w2.weight": 156.3431036649652, "blocks.4.ln.weight": 6.358256142081412, "blocks.4.w1.weight": 230.11944086882187, "blocks.4.w1.bias": 194.42511513927937, "blocks.4.w2.weight": 171.6648008658166, "blocks.5.ln.weight": 5.859230703676208, "blocks.5.w1.weight": 209.3533985279986, "blocks.5.w1.bias": 181.2514045255841, "blocks.5.w2.weight": 161.81010288736894, "out_ln.weight": 0.520622874797811, "out_head.weight": 8.076281865086848, "out_head.bias": 1.2313841339767553 } }, "credit_bridge": { "log": { "train_loss": [ 2.0568496820831297, 2.0357495067596436, 2.0265325052642824, 2.0255675648498537, 2.0211820729827883, 2.0130653564453125, 2.0164043712615967, 2.011985154876709, 2.0152608364868163, 2.0114740381622314, 2.0100359706878663, 2.0067753753662108, 2.0120022153091432, 2.009950690765381, 2.0081368783187865, 2.012003229904175, 2.0099324744415283, 2.010634113998413, 2.0069234494400026, 2.003235507774353, 2.0058242790985106, 2.0072046648406983, 2.00108302066803, 2.0016218561553956, 1.9978092765045166, 1.995793134841919, 1.994058724822998, 1.9918723776245117, 1.98977053981781, 1.989516119003296, 1.9898863918304444, 1.9870066958236694, 1.9896904999160767, 1.9879004209136963, 1.9867612840270996, 1.9895719361877442, 1.9847314866638184, 1.9836825936508178, 1.9799864123535156, 1.978990509414673, 1.97883055809021, 1.9726349740219116, 1.9712072018432618, 1.978619043121338, 1.9836511195373536, 1.9836528234100341, 1.9868938672256469, 1.993108935470581, 1.9985688564300537, 2.0061389767074584, 2.0023673818969727, 1.9980067819595337, 1.990028013458252, 1.9925069525146484, 1.9965549280548096, 2.0004678047943116, 2.0091910595321654, 2.0153573443603516, 2.0439902848815916, 2.087756749229431, 2.1218214894104004, 2.133594408798218, 2.1355165560913085, 2.1193470074462892, 2.070676408615112, 2.0247885906219483, 2.002980169754028, 2.001423611793518, 2.011682106933594, 2.0117178466796877, 2.0037788080596926, 1.9931315280914306, 1.986942767906189, 1.9871479096984863, 1.9841199736785888, 1.9854342544555663, 1.984901067276001, 1.9828116521835326, 1.987117846031189, 1.980504002685547, 1.9845846620178222, 1.9854082400131225, 1.9839192948150635, 1.9855693399429322, 1.9832484759521485, 1.9859395289611816, 1.9864675799942018, 1.98523220413208, 1.9856301559066774, 1.9843646090698241, 1.983153977355957, 1.984056966934204, 1.9850010103607179, 1.986421587867737, 1.9846718848037719, 1.9840921591186524, 1.9866302879333495, 1.9842277576065064, 1.9866961249160766, 1.9863304554748535 ], "train_acc": [ 0.24782, 0.25582, 0.25558, 0.25876, 0.2594, 0.26644, 0.26466, 0.2638, 0.26388, 0.26448, 0.26608, 0.26734, 0.26408, 0.26614, 0.26748, 0.26298, 0.2657, 0.26878, 0.26736, 0.27, 0.26918, 0.2684, 0.27234, 0.27186, 0.26998, 0.27096, 0.27406, 0.27414, 0.27628, 0.27624, 0.27302, 0.27606, 0.27518, 0.27628, 0.27844, 0.27712, 0.2805, 0.27752, 0.27616, 0.27868, 0.27654, 0.28048, 0.27978, 0.2762, 0.26926, 0.27272, 0.2737, 0.26804, 0.26878, 0.26534, 0.26856, 0.27126, 0.27694, 0.28054, 0.2827, 0.2824, 0.28504, 0.28396, 0.2755, 0.26492, 0.25088, 0.24706, 0.24506, 0.25206, 0.26578, 0.27702, 0.28328, 0.27956, 0.26926, 0.26452, 0.2656, 0.27034, 0.2789, 0.2823, 0.28274, 0.28074, 0.28288, 0.28368, 0.28134, 0.28298, 0.28284, 0.28366, 0.28172, 0.28472, 0.28516, 0.2844, 0.2836, 0.28454, 0.28676, 0.28268, 0.28488, 0.28714, 0.28404, 0.286, 0.28564, 0.28672, 0.28564, 0.28652, 0.2853, 0.28532 ], "test_acc": [ 0.2802, 0.284, 0.3008, 0.2741, 0.286, 0.2865, 0.2852, 0.2925, 0.286, 0.3018, 0.3012, 0.2835, 0.3037, 0.2877, 0.3014, 0.3066, 0.2908, 0.2958, 0.2946, 0.2903, 0.2807, 0.2935, 0.3134, 0.3113, 0.3034, 0.2931, 0.3001, 0.311, 0.3128, 0.3116, 0.3099, 0.2976, 0.2893, 0.291, 0.2988, 0.2959, 0.2992, 0.3119, 0.2906, 0.2967, 0.3031, 0.3076, 0.2874, 0.282, 0.289, 0.2638, 0.2745, 0.2872, 0.2764, 0.2711, 0.2732, 0.2744, 0.3014, 0.302, 0.2931, 0.3077, 0.2884, 0.2883, 0.2814, 0.2816, 0.2618, 0.2679, 0.2625, 0.269, 0.2844, 0.2972, 0.2945, 0.2752, 0.276, 0.2833, 0.2859, 0.2809, 0.3011, 0.2909, 0.3046, 0.3047, 0.2977, 0.3012, 0.3024, 0.2816, 0.3022, 0.2915, 0.2965, 0.3004, 0.3024, 0.299, 0.2977, 0.3026, 0.295, 0.3036, 0.2982, 0.3023, 0.2953, 0.3008, 0.3, 0.3001, 0.299, 0.2995, 0.2985, 0.2989 ], "value_loss": [ 0.5431940293550491, 0.19173510383605957, 0.12268259384393693, 0.10493469659805298, 0.10201048459529877, 0.0708414131128788, 0.06408844601988792, 0.0720686790394783, 0.06697397160291672, 0.06196294789075851, 0.05502780232191086, 0.04616951223134994, 0.05243575494527817, 0.04471795217871666, 0.044362507430315015, 0.045647807506322864, 0.04227230613827705, 0.04649371607661247, 0.037143924347162245, 0.03761421796441078, 0.0374193194770813, 0.03865032393813133, 0.03604385726451874, 0.0348061216533184, 0.034909065720438955, 0.03548428529679775, 0.03034081528186798, 0.030923059933185577, 0.03219221098482609, 0.028869735319614412, 0.02921472702085972, 0.025344824229478837, 0.03069723398923874, 0.023911022167205812, 0.02546191979944706, 0.0234756334400177, 0.021548947972655295, 0.024292344799041746, 0.021204249440431595, 0.023217988926172255, 0.032371759564876555, 0.027472765368819235, 0.03582359938144684, 0.040054642882347107, 0.0429941078042984, 0.04646095623970032, 0.05297355647087097, 0.07127084519863129, 0.0587913763999939, 0.0855120901298523, 0.5175958820724488, 2.393956252441406, 11.913925989227295, 21.20466460494995, 122.39695868041993, 517.7628999365235, 530.3028672167969, 404.2268926171875, 258.459100078125, 283.38131254882813, 102.50320305175781, 27.287051020507814, 12.905007503051758, 4.956491999969482, 1.5449322800445557, 0.5012244256973266, 0.26081433165550233, 0.14692765646934508, 0.10439578160524368, 0.07197002289533615, 0.05530310579776764, 0.04514324131727219, 0.031837492654323576, 0.024001008454561233, 0.019366809893846513, 0.01406323720932007, 0.010792444348335267, 0.008763177410960197, 0.007306897183656693, 0.009082207316458226, 0.005549766648113728, 0.005990845524594187, 0.004990600987970829, 0.00429255537956953, 0.005432345700562001, 0.003525814834535122, 0.004226339301913976, 0.003729854447096586, 0.004537549587935209, 0.0023256922054290773, 0.003219376254081726, 0.0022955145540088416, 0.00276749915830791, 0.003175384805947542, 0.0025999026219546795, 0.0021026480976492168, 0.0022611236164718864, 0.0022266844733059405, 0.002546760700196028, 0.0024256033681333065 ] }, "diagnostics": { "bp_cosine": [ 0.3041490912437439, 0.03387444466352463, 0.05120290070772171, 0.0619620680809021, 0.06251867115497589, 0.06249140202999115 ], "perturbation_rho": [ -0.005746336653828621, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -7.874332368373871e-07, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -2.527143806219101e-06, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -8.463859558105469e-06, 0.0, 0.0, 0.0, 0.0, 0.0 ] } }, "drift": { "embed.weight": 150.13851572417417, "embed.bias": 128.41508525356625, "blocks.0.ln.weight": 5.836368229603896, "blocks.0.w1.weight": 137.83692167652973, "blocks.0.w1.bias": 120.59820508387907, "blocks.0.w2.weight": 191.89941055268133, "blocks.1.ln.weight": 5.7364977300128475, "blocks.1.w1.weight": 223.49362295122356, "blocks.1.w1.bias": 194.26884532235184, "blocks.1.w2.weight": 197.19643675985097, "blocks.2.ln.weight": 5.407984956609397, "blocks.2.w1.weight": 224.96419292004586, "blocks.2.w1.bias": 183.18926393313106, "blocks.2.w2.weight": 163.77095460658097, "blocks.3.ln.weight": 3.788219163278833, "blocks.3.w1.weight": 178.78795349787814, "blocks.3.w1.bias": 158.67792032092242, "blocks.3.w2.weight": 127.01894259639586, "blocks.4.ln.weight": 3.65585411727934, "blocks.4.w1.weight": 138.57885809433404, "blocks.4.w1.bias": 99.2214242231741, "blocks.4.w2.weight": 101.99300788405023, "blocks.5.ln.weight": 3.409437674208733, "blocks.5.w1.weight": 110.32921272933086, "blocks.5.w1.bias": 71.51527802753176, "blocks.5.w2.weight": 83.53550127994924, "out_ln.weight": 0.3630675420960623, "out_head.weight": 5.826911511271652, "out_head.bias": 3.507322897493987 } } }