summaryrefslogtreecommitdiff
path: root/results/cifar10_seed456/results_cifar10.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/cifar10_seed456/results_cifar10.json')
-rw-r--r--results/cifar10_seed456/results_cifar10.json1985
1 files changed, 1985 insertions, 0 deletions
diff --git a/results/cifar10_seed456/results_cifar10.json b/results/cifar10_seed456/results_cifar10.json
new file mode 100644
index 0000000..06a3107
--- /dev/null
+++ b/results/cifar10_seed456/results_cifar10.json
@@ -0,0 +1,1985 @@
+{
+ "456": {
+ "bp": {
+ "log": {
+ "train_loss": [
+ 1.932577501449585,
+ 1.6900249602508546,
+ 1.6011367318725587,
+ 1.5466754390716553,
+ 1.4920579125213622,
+ 1.4546358205413819,
+ 1.4231391117858887,
+ 1.3938725402450562,
+ 1.3629425603866576,
+ 1.342505719642639,
+ 1.3237205046844482,
+ 1.300122989501953,
+ 1.2825427363967896,
+ 1.2623162283325196,
+ 1.2426594482040405,
+ 1.227365916481018,
+ 1.206711524925232,
+ 1.190613479347229,
+ 1.1721268761444092,
+ 1.1622920285797118,
+ 1.1426683759689331,
+ 1.1272672763824463,
+ 1.1123097320747375,
+ 1.095245484790802,
+ 1.0796047261238098,
+ 1.0664704471588136,
+ 1.0544639612579345,
+ 1.0334472966003418,
+ 1.0216301371002197,
+ 1.0061453499603272,
+ 0.9892120691299439,
+ 0.9690513248062134,
+ 0.9597649993705749,
+ 0.9393893640518188,
+ 0.9262461110305786,
+ 0.9142684574699402,
+ 0.8982764770317078,
+ 0.882060844745636,
+ 0.8589154948616028,
+ 0.8484143830871582,
+ 0.8298149911689758,
+ 0.8117531860733033,
+ 0.7923431532669067,
+ 0.7819426927185058,
+ 0.7630360532951355,
+ 0.7432640241622925,
+ 0.725852869091034,
+ 0.7111906971359253,
+ 0.6900048795890809,
+ 0.6697983954048157,
+ 0.6541705364608764,
+ 0.6370760979270935,
+ 0.6198028992843628,
+ 0.5972342865371704,
+ 0.5801713646697998,
+ 0.5637391392326355,
+ 0.5492425328063965,
+ 0.5351220473480225,
+ 0.517744523601532,
+ 0.4910259468269348,
+ 0.48044670740127565,
+ 0.4666313941383362,
+ 0.4454871296596527,
+ 0.4287984812068939,
+ 0.4167753814029694,
+ 0.4019090121555328,
+ 0.3892905419158936,
+ 0.3745353739929199,
+ 0.3589991714382172,
+ 0.34674671503067017,
+ 0.3343308783531189,
+ 0.32089566977500916,
+ 0.3101300811481476,
+ 0.2954042288208008,
+ 0.2848380702114105,
+ 0.2828438286781311,
+ 0.264346894235611,
+ 0.26094838644981383,
+ 0.25063199663162233,
+ 0.24315124837875365,
+ 0.2345473566555977,
+ 0.22507079369306565,
+ 0.2194176360464096,
+ 0.21162880234241485,
+ 0.20445122440338134,
+ 0.2012126348876953,
+ 0.19840873272895812,
+ 0.19022230600357057,
+ 0.1889617627120018,
+ 0.18509810159683227,
+ 0.18254041098594664,
+ 0.1836097541332245,
+ 0.17741597022533417,
+ 0.1746750330734253,
+ 0.17486595999717713,
+ 0.17480743077754973,
+ 0.17309590301036834,
+ 0.17227657488822937,
+ 0.1740615609550476,
+ 0.16915745746612548
+ ],
+ "train_acc": [
+ 0.30628,
+ 0.38592,
+ 0.42152,
+ 0.4394,
+ 0.45908,
+ 0.47766,
+ 0.48482,
+ 0.49718,
+ 0.51004,
+ 0.51544,
+ 0.52028,
+ 0.53156,
+ 0.53764,
+ 0.54346,
+ 0.55342,
+ 0.55874,
+ 0.56678,
+ 0.571,
+ 0.57738,
+ 0.57968,
+ 0.59098,
+ 0.59448,
+ 0.59972,
+ 0.60702,
+ 0.61296,
+ 0.61686,
+ 0.62066,
+ 0.629,
+ 0.63218,
+ 0.63706,
+ 0.6458,
+ 0.65254,
+ 0.6557,
+ 0.66064,
+ 0.66696,
+ 0.67284,
+ 0.67792,
+ 0.68442,
+ 0.6895,
+ 0.69484,
+ 0.69998,
+ 0.70706,
+ 0.71588,
+ 0.71756,
+ 0.72552,
+ 0.7343,
+ 0.74024,
+ 0.74394,
+ 0.75236,
+ 0.76022,
+ 0.76464,
+ 0.77054,
+ 0.7777,
+ 0.78372,
+ 0.79538,
+ 0.7972,
+ 0.80364,
+ 0.8092,
+ 0.81504,
+ 0.82654,
+ 0.82918,
+ 0.83316,
+ 0.84092,
+ 0.84854,
+ 0.85006,
+ 0.85778,
+ 0.8616,
+ 0.8676,
+ 0.87464,
+ 0.87672,
+ 0.88258,
+ 0.88796,
+ 0.89154,
+ 0.89712,
+ 0.90188,
+ 0.90184,
+ 0.90858,
+ 0.90758,
+ 0.9118,
+ 0.91542,
+ 0.9187,
+ 0.92286,
+ 0.9233,
+ 0.92722,
+ 0.93012,
+ 0.93172,
+ 0.93268,
+ 0.936,
+ 0.93634,
+ 0.9374,
+ 0.93696,
+ 0.93802,
+ 0.94054,
+ 0.94164,
+ 0.9409,
+ 0.9415,
+ 0.94154,
+ 0.94296,
+ 0.94158,
+ 0.94336
+ ],
+ "test_acc": [
+ 0.3915,
+ 0.4289,
+ 0.4595,
+ 0.4775,
+ 0.4915,
+ 0.4936,
+ 0.5132,
+ 0.5139,
+ 0.5291,
+ 0.5317,
+ 0.5407,
+ 0.5449,
+ 0.5481,
+ 0.5499,
+ 0.5545,
+ 0.5589,
+ 0.5696,
+ 0.5674,
+ 0.5737,
+ 0.5776,
+ 0.573,
+ 0.583,
+ 0.5773,
+ 0.572,
+ 0.5836,
+ 0.5774,
+ 0.5838,
+ 0.5796,
+ 0.5884,
+ 0.5942,
+ 0.5925,
+ 0.5927,
+ 0.5974,
+ 0.5934,
+ 0.5962,
+ 0.5972,
+ 0.5995,
+ 0.595,
+ 0.5921,
+ 0.5848,
+ 0.5907,
+ 0.5934,
+ 0.5935,
+ 0.5921,
+ 0.5969,
+ 0.5936,
+ 0.5961,
+ 0.5948,
+ 0.5992,
+ 0.5954,
+ 0.5978,
+ 0.5933,
+ 0.5934,
+ 0.5987,
+ 0.5987,
+ 0.591,
+ 0.5889,
+ 0.5924,
+ 0.5937,
+ 0.593,
+ 0.5925,
+ 0.5944,
+ 0.5938,
+ 0.5924,
+ 0.5946,
+ 0.5905,
+ 0.5928,
+ 0.5899,
+ 0.5891,
+ 0.587,
+ 0.5891,
+ 0.5846,
+ 0.5867,
+ 0.586,
+ 0.5865,
+ 0.585,
+ 0.5851,
+ 0.5824,
+ 0.5821,
+ 0.5855,
+ 0.5825,
+ 0.5861,
+ 0.5857,
+ 0.5869,
+ 0.5855,
+ 0.589,
+ 0.5887,
+ 0.5872,
+ 0.5863,
+ 0.5857,
+ 0.5865,
+ 0.5868,
+ 0.5867,
+ 0.5874,
+ 0.5872,
+ 0.5876,
+ 0.5869,
+ 0.5879,
+ 0.5871,
+ 0.587
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.9672282934188843,
+ 0.9684309363365173,
+ 0.9675205945968628,
+ 0.9669639468193054,
+ 0.9665698409080505,
+ 0.967890739440918,
+ 0.9664402008056641,
+ 0.9660602807998657,
+ 0.9652657508850098,
+ 0.9614400863647461,
+ 0.9602784514427185,
+ 0.9578725099563599
+ ],
+ "perturbation_rho": [
+ 0.9848342537879944,
+ 0.9891709685325623,
+ 0.9909648895263672,
+ 0.9893825054168701,
+ 0.9924193024635315,
+ 0.9927305579185486,
+ 0.9941403865814209,
+ 0.9934987425804138,
+ 0.9928717017173767,
+ 0.9915444254875183,
+ 0.9898866415023804,
+ 0.9873980283737183
+ ],
+ "nudging": {
+ "0.001": [
+ -0.0028492475394159555,
+ -0.0028252778574824333,
+ -0.0028643091209232807,
+ -0.0029328675009310246,
+ -0.002945749554783106,
+ -0.0029587389435619116,
+ -0.00288290623575449,
+ -0.0028087471146136522,
+ -0.0026325639337301254,
+ -0.002420567674562335,
+ -0.002228461904451251,
+ -0.0018789597088471055
+ ],
+ "0.003": [
+ -0.008540419861674309,
+ -0.008468939922749996,
+ -0.008585674688220024,
+ -0.008790891617536545,
+ -0.008829280734062195,
+ -0.008868295699357986,
+ -0.00864122249186039,
+ -0.008419105783104897,
+ -0.007891927845776081,
+ -0.007256433367729187,
+ -0.006680862978100777,
+ -0.0056340815499424934
+ ],
+ "0.01": [
+ -0.028379585593938828,
+ -0.028143716976046562,
+ -0.028530558571219444,
+ -0.02920939214527607,
+ -0.02933822199702263,
+ -0.029468875378370285,
+ -0.028714874759316444,
+ -0.027982797473669052,
+ -0.026236172765493393,
+ -0.024128224700689316,
+ -0.022218093276023865,
+ -0.018745578825473785
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 8.834297843591171,
+ "embed.bias": 15.413548194165312,
+ "blocks.0.ln.weight": 0.3280907780755125,
+ "blocks.0.w1.weight": 4.220952328018163,
+ "blocks.0.w1.bias": 6.7337611045609105,
+ "blocks.0.w2.weight": 10.671510043086428,
+ "blocks.1.ln.weight": 0.22467724575060716,
+ "blocks.1.w1.weight": 4.523437520518719,
+ "blocks.1.w1.bias": 4.4537544678846235,
+ "blocks.1.w2.weight": 11.922866714123732,
+ "blocks.2.ln.weight": 0.19572857698834295,
+ "blocks.2.w1.weight": 4.598553685356083,
+ "blocks.2.w1.bias": 4.125724114621679,
+ "blocks.2.w2.weight": 12.310215404426595,
+ "blocks.3.ln.weight": 0.21390126577946425,
+ "blocks.3.w1.weight": 4.584201339373962,
+ "blocks.3.w1.bias": 3.7580021741696004,
+ "blocks.3.w2.weight": 12.601184193203743,
+ "blocks.4.ln.weight": 0.24161530581374482,
+ "blocks.4.w1.weight": 4.518574188984943,
+ "blocks.4.w1.bias": 3.8030594737653343,
+ "blocks.4.w2.weight": 12.669272886895255,
+ "blocks.5.ln.weight": 0.25422945739387653,
+ "blocks.5.w1.weight": 4.461826473966918,
+ "blocks.5.w1.bias": 3.6451227277370744,
+ "blocks.5.w2.weight": 12.680759003338304,
+ "blocks.6.ln.weight": 0.25745358599301726,
+ "blocks.6.w1.weight": 4.47036651988774,
+ "blocks.6.w1.bias": 3.706163791416811,
+ "blocks.6.w2.weight": 13.119190581706045,
+ "blocks.7.ln.weight": 0.263116520949555,
+ "blocks.7.w1.weight": 4.434269376799208,
+ "blocks.7.w1.bias": 3.6960182135036708,
+ "blocks.7.w2.weight": 13.098144437096936,
+ "blocks.8.ln.weight": 0.27514230251440513,
+ "blocks.8.w1.weight": 4.344487791539744,
+ "blocks.8.w1.bias": 3.648654542354885,
+ "blocks.8.w2.weight": 13.035629633632155,
+ "blocks.9.ln.weight": 0.29172129249550904,
+ "blocks.9.w1.weight": 4.255456615430207,
+ "blocks.9.w1.bias": 3.6968063474376733,
+ "blocks.9.w2.weight": 13.086873727145367,
+ "blocks.10.ln.weight": 0.3000076159356563,
+ "blocks.10.w1.weight": 4.2734266858824945,
+ "blocks.10.w1.bias": 3.6213422959644603,
+ "blocks.10.w2.weight": 13.200754189456744,
+ "blocks.11.ln.weight": 0.2902311063472059,
+ "blocks.11.w1.weight": 4.144956242341598,
+ "blocks.11.w1.bias": 3.5713523930610735,
+ "blocks.11.w2.weight": 13.254643701043216,
+ "out_ln.weight": 0.3155177407468068,
+ "out_head.weight": 3.523856665191762,
+ "out_head.bias": 1.0793116101743525
+ }
+ },
+ "dfa": {
+ "log": {
+ "train_loss": [
+ 2.07058688041687,
+ 2.0397231711578367,
+ 2.040001149024963,
+ 2.036939584312439,
+ 2.035007101402283,
+ 2.0326563871002197,
+ 2.0309880726623537,
+ 2.028131689300537,
+ 2.0242818844223023,
+ 2.021325262145996,
+ 2.01944966506958,
+ 2.0185741081237794,
+ 2.0193587062072753,
+ 2.0140840717315673,
+ 2.01566628868103,
+ 2.0162557276153565,
+ 2.01352592338562,
+ 2.0122515713882447,
+ 2.007948448524475,
+ 2.0104500115966797,
+ 2.008844228897095,
+ 2.007831936798096,
+ 2.0087617783355713,
+ 2.0067150954437256,
+ 2.0060685678100585,
+ 2.0067182321548462,
+ 2.004691079711914,
+ 2.004318997192383,
+ 2.006708196105957,
+ 2.0059428287506105,
+ 2.002060938720703,
+ 2.0030168786239626,
+ 2.0013856718444822,
+ 2.001412846107483,
+ 2.0029963275909424,
+ 2.001156611251831,
+ 2.0020238697052,
+ 2.0013174156951905,
+ 2.001038536148071,
+ 1.9974690299224853,
+ 1.9983380174255372,
+ 2.00068127532959,
+ 2.002073029937744,
+ 1.9994858475494384,
+ 1.999331954574585,
+ 1.9974100791168212,
+ 1.9981875708389283,
+ 1.9986576483917236,
+ 1.9978187020492553,
+ 1.9974584699249267,
+ 1.9957377856063843,
+ 1.995005799217224,
+ 1.9989547797012328,
+ 1.997181711654663,
+ 1.995425957107544,
+ 1.9960723597717285,
+ 1.996761396522522,
+ 1.9958302701187134,
+ 1.9968557986450195,
+ 1.9969658164215087,
+ 1.9949297325134276,
+ 1.9950204270172118,
+ 1.9955382054901123,
+ 1.9956761499786377,
+ 1.9941519859313965,
+ 1.9952024503326415,
+ 1.995510894241333,
+ 1.9926798336791993,
+ 1.9947078677749635,
+ 1.9926326573181152,
+ 1.9923986828231812,
+ 1.993803144607544,
+ 1.9924064002227784,
+ 1.9935845022583008,
+ 1.993097350692749,
+ 1.9917376801300049,
+ 1.9939163592147826,
+ 1.9913390029144287,
+ 1.9931303585052491,
+ 1.992877590637207,
+ 1.9936017736434937,
+ 1.9915303264999389,
+ 1.9928937450408934,
+ 1.9911755990600586,
+ 1.9931563230133056,
+ 1.992949102935791,
+ 1.9930351052856445,
+ 1.9907214881134032,
+ 1.9905328282165526,
+ 1.9933595889282227,
+ 1.9914652145385743,
+ 1.99171005859375,
+ 1.9924902798080444,
+ 1.992575800704956,
+ 1.99016278049469,
+ 1.9921005247497559,
+ 1.9918115587615968,
+ 1.9918856573867798,
+ 1.988608092727661,
+ 1.9906916750717163
+ ],
+ "train_acc": [
+ 0.23438,
+ 0.24682,
+ 0.24856,
+ 0.24744,
+ 0.2493,
+ 0.25268,
+ 0.25096,
+ 0.25544,
+ 0.25558,
+ 0.25914,
+ 0.2613,
+ 0.2586,
+ 0.26004,
+ 0.26336,
+ 0.2627,
+ 0.26136,
+ 0.26178,
+ 0.26482,
+ 0.26748,
+ 0.26462,
+ 0.26374,
+ 0.26504,
+ 0.26682,
+ 0.26656,
+ 0.26808,
+ 0.26636,
+ 0.26534,
+ 0.26986,
+ 0.26678,
+ 0.26804,
+ 0.27068,
+ 0.27112,
+ 0.2728,
+ 0.27114,
+ 0.27098,
+ 0.27242,
+ 0.27134,
+ 0.269,
+ 0.27124,
+ 0.27356,
+ 0.27462,
+ 0.27154,
+ 0.27048,
+ 0.27332,
+ 0.27462,
+ 0.2742,
+ 0.2748,
+ 0.27136,
+ 0.27366,
+ 0.27372,
+ 0.2756,
+ 0.2745,
+ 0.27688,
+ 0.2753,
+ 0.2738,
+ 0.27568,
+ 0.27534,
+ 0.2752,
+ 0.2746,
+ 0.27426,
+ 0.2754,
+ 0.27652,
+ 0.27636,
+ 0.27514,
+ 0.27602,
+ 0.2772,
+ 0.27466,
+ 0.27792,
+ 0.27762,
+ 0.27772,
+ 0.2748,
+ 0.27744,
+ 0.27738,
+ 0.2778,
+ 0.27648,
+ 0.27882,
+ 0.27752,
+ 0.2773,
+ 0.27792,
+ 0.27792,
+ 0.27564,
+ 0.2783,
+ 0.2765,
+ 0.27966,
+ 0.27638,
+ 0.27776,
+ 0.27614,
+ 0.27868,
+ 0.27806,
+ 0.27834,
+ 0.27876,
+ 0.2785,
+ 0.27914,
+ 0.27822,
+ 0.27976,
+ 0.2771,
+ 0.2782,
+ 0.27906,
+ 0.27974,
+ 0.278
+ ],
+ "test_acc": [
+ 0.267,
+ 0.2833,
+ 0.2633,
+ 0.2623,
+ 0.2722,
+ 0.2805,
+ 0.2629,
+ 0.2946,
+ 0.2836,
+ 0.2778,
+ 0.2841,
+ 0.2871,
+ 0.2812,
+ 0.2675,
+ 0.2747,
+ 0.2994,
+ 0.2768,
+ 0.2969,
+ 0.2894,
+ 0.3029,
+ 0.2895,
+ 0.296,
+ 0.2693,
+ 0.2842,
+ 0.2805,
+ 0.2916,
+ 0.2823,
+ 0.2769,
+ 0.2952,
+ 0.2914,
+ 0.2952,
+ 0.2872,
+ 0.2933,
+ 0.2701,
+ 0.2877,
+ 0.2897,
+ 0.2824,
+ 0.2808,
+ 0.2978,
+ 0.2775,
+ 0.2873,
+ 0.2938,
+ 0.2942,
+ 0.2895,
+ 0.2924,
+ 0.2896,
+ 0.2957,
+ 0.2915,
+ 0.294,
+ 0.2914,
+ 0.2868,
+ 0.2964,
+ 0.2861,
+ 0.2952,
+ 0.2823,
+ 0.3038,
+ 0.2965,
+ 0.3008,
+ 0.2928,
+ 0.2991,
+ 0.2963,
+ 0.295,
+ 0.2983,
+ 0.2957,
+ 0.2997,
+ 0.2953,
+ 0.2891,
+ 0.2982,
+ 0.3011,
+ 0.2934,
+ 0.2948,
+ 0.305,
+ 0.2971,
+ 0.3022,
+ 0.2961,
+ 0.2952,
+ 0.3052,
+ 0.2981,
+ 0.2997,
+ 0.2923,
+ 0.2967,
+ 0.299,
+ 0.2967,
+ 0.2969,
+ 0.2986,
+ 0.2949,
+ 0.2994,
+ 0.2954,
+ 0.2994,
+ 0.2989,
+ 0.2964,
+ 0.2977,
+ 0.2943,
+ 0.2971,
+ 0.296,
+ 0.2965,
+ 0.296,
+ 0.2968,
+ 0.2968,
+ 0.2967
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.39808189868927,
+ -0.0005002215621061623,
+ -0.00010176157957175747,
+ -0.00011934398207813501,
+ -0.000299518636893481,
+ 0.0004310115473344922,
+ -0.0001575749192852527,
+ -0.00013478680921252817,
+ -0.00013778718130197376,
+ -0.0002350577706238255,
+ -7.549257134087384e-06,
+ -3.051616658922285e-05
+ ],
+ "perturbation_rho": [
+ 0.026208851486444473,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -3.781169652938843e-07,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.003": [
+ -9.867362678050995e-07,
+ 0.0,
+ -1.1175870895385742e-08,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ -1.862645149230957e-09,
+ 0.0
+ ],
+ "0.01": [
+ -3.6079436540603638e-06,
+ 0.0,
+ -1.30385160446167e-08,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ -1.862645149230957e-09,
+ 0.0
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 330.294227499211,
+ "embed.bias": 259.4924618202614,
+ "blocks.0.ln.weight": 10.952609998429608,
+ "blocks.0.w1.weight": 280.8978034197629,
+ "blocks.0.w1.bias": 260.7432178686956,
+ "blocks.0.w2.weight": 459.75981344197356,
+ "blocks.1.ln.weight": 8.338033915232403,
+ "blocks.1.w1.weight": 303.52507755893413,
+ "blocks.1.w1.bias": 305.583927901598,
+ "blocks.1.w2.weight": 333.8270370300826,
+ "blocks.2.ln.weight": 10.70947460327803,
+ "blocks.2.w1.weight": 423.89849941751544,
+ "blocks.2.w1.bias": 420.3062621668287,
+ "blocks.2.w2.weight": 429.4082983364606,
+ "blocks.3.ln.weight": 8.290240736902255,
+ "blocks.3.w1.weight": 317.09537244180814,
+ "blocks.3.w1.bias": 287.7440748790634,
+ "blocks.3.w2.weight": 298.4352829162209,
+ "blocks.4.ln.weight": 9.625651853706938,
+ "blocks.4.w1.weight": 380.24334326208,
+ "blocks.4.w1.bias": 350.1027945318976,
+ "blocks.4.w2.weight": 351.4361032986557,
+ "blocks.5.ln.weight": 9.64751089559273,
+ "blocks.5.w1.weight": 381.41558228811317,
+ "blocks.5.w1.bias": 348.41973459641565,
+ "blocks.5.w2.weight": 358.39732437217214,
+ "blocks.6.ln.weight": 9.747382743882953,
+ "blocks.6.w1.weight": 390.26899720474756,
+ "blocks.6.w1.bias": 371.3396255333559,
+ "blocks.6.w2.weight": 383.2513961535749,
+ "blocks.7.ln.weight": 8.825122691585458,
+ "blocks.7.w1.weight": 346.68999846263586,
+ "blocks.7.w1.bias": 322.5261718218226,
+ "blocks.7.w2.weight": 338.7459123423596,
+ "blocks.8.ln.weight": 8.098539333504899,
+ "blocks.8.w1.weight": 318.2267389133952,
+ "blocks.8.w1.bias": 297.59966764417567,
+ "blocks.8.w2.weight": 295.4097011432017,
+ "blocks.9.ln.weight": 7.141109927159286,
+ "blocks.9.w1.weight": 262.58513708371515,
+ "blocks.9.w1.bias": 251.1580247152912,
+ "blocks.9.w2.weight": 243.52122031424597,
+ "blocks.10.ln.weight": 10.631727490611157,
+ "blocks.10.w1.weight": 421.8663669312304,
+ "blocks.10.w1.bias": 393.793856832655,
+ "blocks.10.w2.weight": 426.1507190170269,
+ "blocks.11.ln.weight": 11.204882830494729,
+ "blocks.11.w1.weight": 446.3738461267888,
+ "blocks.11.w1.bias": 412.5154467592355,
+ "blocks.11.w2.weight": 426.65837546735577,
+ "out_ln.weight": 0.6667026319780115,
+ "out_head.weight": 9.48630928590299,
+ "out_head.bias": 0.44493816450857304
+ }
+ },
+ "state_bridge": {
+ "log": {
+ "train_loss": [
+ 2.3018941720581054,
+ 2.2664404193878176,
+ 2.241582181625366,
+ 2.2375785102844237,
+ 2.134529279785156,
+ 2.119604638824463,
+ 2.112871742706299,
+ 2.1424258409881594,
+ 2.158468070068359,
+ 2.143250986175537,
+ 2.1479166007995607,
+ 2.141409687652588,
+ 2.1494772535705566,
+ 2.1696451356506348,
+ 2.2107076875305176,
+ 2.216366109008789,
+ 2.2074287937927246,
+ 2.1900475843811034,
+ 2.1331632147216797,
+ 2.130491197357178,
+ 2.1317693274688723,
+ 2.1269900135040283,
+ 2.1228091914367675,
+ 2.099304881210327,
+ 2.085384643859863,
+ 2.085484384918213,
+ 2.087498538970947,
+ 2.0871505451202395,
+ 2.0823512071990966,
+ 2.0860876009368896,
+ 2.086019044647217,
+ 2.0951096993255613,
+ 2.0864567431259156,
+ 2.078469701538086,
+ 2.072162138824463,
+ 2.0764309199523927,
+ 2.0748440283203125,
+ 2.0789254627990723,
+ 2.0826576986694336,
+ 2.0871692906188963,
+ 2.086170325393677,
+ 2.084945154571533,
+ 2.0844455377197266,
+ 2.085197698135376,
+ 2.0900804764556886,
+ 2.082403769226074,
+ 2.082503260040283,
+ 2.0882599214935302,
+ 2.0945081477355956,
+ 2.0928621436309816,
+ 2.091693960571289,
+ 2.101140612335205,
+ 2.095073269882202,
+ 2.0920650315856935,
+ 2.091407716522217,
+ 2.092963116760254,
+ 2.102848686065674,
+ 2.10209814743042,
+ 2.100728988342285,
+ 2.1085473413085936,
+ 2.1115043045043946,
+ 2.1238191069030763,
+ 2.1308215964508057,
+ 2.1344855577087403,
+ 2.1272054124450683,
+ 2.1218687773132325,
+ 2.12194469039917,
+ 2.127710237426758,
+ 2.1268114820861816,
+ 2.1254331665039063,
+ 2.1245197431182863,
+ 2.125965220489502,
+ 2.12684192817688,
+ 2.1273793972015382,
+ 2.128570475311279,
+ 2.1321925525665284,
+ 2.13282696762085,
+ 2.1370943976593018,
+ 2.1397155253601072,
+ 2.143300206756592,
+ 2.1476288512420654,
+ 2.152116884613037,
+ 2.1553422878265383,
+ 2.154549729385376,
+ 2.155469595031738,
+ 2.155468685760498,
+ 2.15419854057312,
+ 2.1527544927978517,
+ 2.151362074584961,
+ 2.1510060634613035,
+ 2.1480546588134763,
+ 2.1468420223999023,
+ 2.1457022499084473,
+ 2.1455462963104246,
+ 2.144765656814575,
+ 2.146289216003418,
+ 2.142656379470825,
+ 2.1456896996307373,
+ 2.1448883264923095,
+ 2.144138221282959
+ ],
+ "train_acc": [
+ 0.13994,
+ 0.14018,
+ 0.1448,
+ 0.1448,
+ 0.16884,
+ 0.17316,
+ 0.1748,
+ 0.1631,
+ 0.15902,
+ 0.1599,
+ 0.15558,
+ 0.16126,
+ 0.16064,
+ 0.15736,
+ 0.1483,
+ 0.14638,
+ 0.15088,
+ 0.15526,
+ 0.16726,
+ 0.16864,
+ 0.1672,
+ 0.17562,
+ 0.1804,
+ 0.1857,
+ 0.19408,
+ 0.19066,
+ 0.1875,
+ 0.19146,
+ 0.19404,
+ 0.18652,
+ 0.1868,
+ 0.18316,
+ 0.1862,
+ 0.19086,
+ 0.19266,
+ 0.18878,
+ 0.19202,
+ 0.18684,
+ 0.18708,
+ 0.18076,
+ 0.18768,
+ 0.18408,
+ 0.18372,
+ 0.18428,
+ 0.18508,
+ 0.18442,
+ 0.1863,
+ 0.18434,
+ 0.18142,
+ 0.17946,
+ 0.18168,
+ 0.18058,
+ 0.1805,
+ 0.18198,
+ 0.18268,
+ 0.1812,
+ 0.17942,
+ 0.17946,
+ 0.18054,
+ 0.17744,
+ 0.17834,
+ 0.17516,
+ 0.17416,
+ 0.17206,
+ 0.17546,
+ 0.17682,
+ 0.17458,
+ 0.17444,
+ 0.1757,
+ 0.17654,
+ 0.1778,
+ 0.17268,
+ 0.1757,
+ 0.1751,
+ 0.17666,
+ 0.1775,
+ 0.17746,
+ 0.17622,
+ 0.17406,
+ 0.17472,
+ 0.17496,
+ 0.17596,
+ 0.17324,
+ 0.17394,
+ 0.17302,
+ 0.1713,
+ 0.17072,
+ 0.17288,
+ 0.1718,
+ 0.17242,
+ 0.1725,
+ 0.17408,
+ 0.1736,
+ 0.17198,
+ 0.17344,
+ 0.17254,
+ 0.17392,
+ 0.17376,
+ 0.17466,
+ 0.1739
+ ],
+ "test_acc": [
+ 0.0608,
+ 0.1367,
+ 0.1165,
+ 0.1638,
+ 0.1577,
+ 0.176,
+ 0.1529,
+ 0.136,
+ 0.1352,
+ 0.1245,
+ 0.1322,
+ 0.137,
+ 0.1201,
+ 0.1178,
+ 0.1187,
+ 0.1118,
+ 0.1187,
+ 0.1373,
+ 0.1421,
+ 0.1151,
+ 0.1412,
+ 0.1284,
+ 0.1374,
+ 0.1796,
+ 0.1927,
+ 0.1818,
+ 0.1859,
+ 0.1762,
+ 0.1865,
+ 0.1827,
+ 0.1708,
+ 0.1826,
+ 0.1859,
+ 0.191,
+ 0.1833,
+ 0.1858,
+ 0.1875,
+ 0.1902,
+ 0.1859,
+ 0.1872,
+ 0.1894,
+ 0.193,
+ 0.1882,
+ 0.1783,
+ 0.1792,
+ 0.179,
+ 0.1836,
+ 0.1618,
+ 0.1749,
+ 0.1881,
+ 0.1879,
+ 0.1757,
+ 0.1705,
+ 0.1868,
+ 0.1871,
+ 0.1811,
+ 0.1727,
+ 0.16,
+ 0.1799,
+ 0.1524,
+ 0.1648,
+ 0.1445,
+ 0.1739,
+ 0.1721,
+ 0.1828,
+ 0.1857,
+ 0.1719,
+ 0.1722,
+ 0.1716,
+ 0.1694,
+ 0.1512,
+ 0.1719,
+ 0.1704,
+ 0.1747,
+ 0.1718,
+ 0.1712,
+ 0.173,
+ 0.175,
+ 0.1733,
+ 0.1749,
+ 0.165,
+ 0.1672,
+ 0.1708,
+ 0.161,
+ 0.155,
+ 0.1605,
+ 0.1629,
+ 0.1598,
+ 0.1625,
+ 0.1628,
+ 0.1625,
+ 0.1609,
+ 0.1603,
+ 0.1616,
+ 0.1607,
+ 0.1644,
+ 0.1622,
+ 0.1621,
+ 0.1639,
+ 0.1637
+ ],
+ "state_pred_error": [
+ 0.4747012776184082,
+ 0.8295380383682252,
+ 0.21469590087890625,
+ 0.12448142728805542,
+ 0.08570515047073364,
+ 0.08470476587295532,
+ 0.12634123967647554,
+ 0.09733817555308343,
+ 0.0353814222663641,
+ 0.03443111445069313,
+ 0.03137257686555386,
+ 0.029351851464509963,
+ 0.03382749609231949,
+ 0.03600793175697327,
+ 0.028298149601221085,
+ 0.02450420175075531,
+ 0.025809087952375413,
+ 0.033925389347076416,
+ 0.039575903968811034,
+ 0.03546395682752133,
+ 0.03896381706476212,
+ 0.035592052783966065,
+ 0.020547916915416718,
+ 0.027013523270487786,
+ 0.024955789625644684,
+ 0.01776892081618309,
+ 0.010803042232394219,
+ 0.008741003857254981,
+ 0.009176803540587425,
+ 0.00826898938536644,
+ 0.007538356708586216,
+ 0.0065028233194351194,
+ 0.006696901108622551,
+ 0.006364495917409658,
+ 0.004348094679266215,
+ 0.0027382008469104767,
+ 0.001712799895554781,
+ 0.001062507140468806,
+ 0.0006733776653371752,
+ 0.0004975279747322202,
+ 0.0005460627448558807,
+ 0.0007091301748156548,
+ 0.0008156654949113727,
+ 0.0005741439528390766,
+ 0.0004632441856153309,
+ 0.0004077366246469319,
+ 0.00037149273524992167,
+ 0.00032670746902935206,
+ 0.0003252365568652749,
+ 0.0002759585575200617,
+ 0.00019474619667977095,
+ 0.00015623675198294222,
+ 0.00016898068460635842,
+ 0.00014236534488853067,
+ 0.00010944471210241317,
+ 8.656780364457518e-05,
+ 8.127526033436879e-05,
+ 7.092417092993855e-05,
+ 7.672614848706871e-05,
+ 6.656669022282586e-05,
+ 6.597209698753432e-05,
+ 6.993545684730634e-05,
+ 7.107698564883322e-05,
+ 7.049443874042482e-05,
+ 6.95053919684142e-05,
+ 6.41730681899935e-05,
+ 6.155454550869764e-05,
+ 6.015078729018569e-05,
+ 5.4422928835265336e-05,
+ 4.830317224375904e-05,
+ 4.409612072864547e-05,
+ 3.9640857164049524e-05,
+ 3.758983974112198e-05,
+ 3.4887928910320625e-05,
+ 3.156908231205307e-05,
+ 2.8848007169435732e-05,
+ 2.6238742939895017e-05,
+ 2.2889468831708655e-05,
+ 2.021120209712535e-05,
+ 1.8343317908002065e-05,
+ 1.5500704940350262e-05,
+ 1.386145944125019e-05,
+ 1.3288812919927295e-05,
+ 1.3635638843989e-05,
+ 1.4378732023760676e-05,
+ 1.5836126625945327e-05,
+ 1.6757641757139935e-05,
+ 1.6754487288417295e-05,
+ 1.670292949071154e-05,
+ 1.5964577784761785e-05,
+ 1.5669193891226315e-05,
+ 1.4928079603705555e-05,
+ 1.4118930798722432e-05,
+ 1.3290679465862922e-05,
+ 1.259699832968181e-05,
+ 1.169607178599108e-05,
+ 1.0905416535097175e-05,
+ 9.99030330684036e-06,
+ 9.378302599070595e-06,
+ 8.833123445947422e-06
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.07415470480918884,
+ 0.005267417058348656,
+ 0.006899588741362095,
+ 0.009260526858270168,
+ 0.014165668748319149,
+ 0.007070831023156643,
+ 0.003572859801352024,
+ 0.0013162376126274467,
+ 0.01693638414144516,
+ 0.011615054681897163,
+ 0.01297210343182087,
+ 0.019879184663295746
+ ],
+ "perturbation_rho": [
+ 0.06713278591632843,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -3.7383288145065308e-06,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.003": [
+ -1.1199153959751129e-05,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.01": [
+ -3.7682242691516876e-05,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 16.995931312362433,
+ "embed.bias": 107.50455214257622,
+ "blocks.0.ln.weight": 1.1747809607171977,
+ "blocks.0.w1.weight": 87.48144222271058,
+ "blocks.0.w1.bias": 108.71150020387606,
+ "blocks.0.w2.weight": 231.25407676027953,
+ "blocks.1.ln.weight": 2.5949076659471078,
+ "blocks.1.w1.weight": 171.7945773092806,
+ "blocks.1.w1.bias": 169.71996864021074,
+ "blocks.1.w2.weight": 213.0622571876725,
+ "blocks.2.ln.weight": 3.47458321612997,
+ "blocks.2.w1.weight": 89.72539771461543,
+ "blocks.2.w1.bias": 64.43223038220326,
+ "blocks.2.w2.weight": 130.15474280855415,
+ "blocks.3.ln.weight": 3.2490652039574544,
+ "blocks.3.w1.weight": 125.1742859456183,
+ "blocks.3.w1.bias": 103.82426516529186,
+ "blocks.3.w2.weight": 122.83893982946046,
+ "blocks.4.ln.weight": 3.143539271549031,
+ "blocks.4.w1.weight": 124.0384309768722,
+ "blocks.4.w1.bias": 100.70299850760337,
+ "blocks.4.w2.weight": 149.19128092745697,
+ "blocks.5.ln.weight": 3.8369736269462678,
+ "blocks.5.w1.weight": 70.0473609489046,
+ "blocks.5.w1.bias": 55.88760753160443,
+ "blocks.5.w2.weight": 86.95978496337405,
+ "blocks.6.ln.weight": 2.788527931096308,
+ "blocks.6.w1.weight": 68.53157012655858,
+ "blocks.6.w1.bias": 60.09690095738387,
+ "blocks.6.w2.weight": 89.81505023786389,
+ "blocks.7.ln.weight": 6.399420463964318,
+ "blocks.7.w1.weight": 211.5238472865523,
+ "blocks.7.w1.bias": 193.8907626146654,
+ "blocks.7.w2.weight": 198.88821232136138,
+ "blocks.8.ln.weight": 3.718593242696815,
+ "blocks.8.w1.weight": 131.87660631337303,
+ "blocks.8.w1.bias": 117.13821442329933,
+ "blocks.8.w2.weight": 175.03912755183418,
+ "blocks.9.ln.weight": 2.399620577204472,
+ "blocks.9.w1.weight": 62.45119981781294,
+ "blocks.9.w1.bias": 48.049978443761816,
+ "blocks.9.w2.weight": 88.05873456328695,
+ "blocks.10.ln.weight": 4.012307554325392,
+ "blocks.10.w1.weight": 150.00438163426782,
+ "blocks.10.w1.bias": 134.3950208692614,
+ "blocks.10.w2.weight": 137.82521611752918,
+ "blocks.11.ln.weight": 2.857283266360585,
+ "blocks.11.w1.weight": 108.3646369610001,
+ "blocks.11.w1.bias": 100.36750299157434,
+ "blocks.11.w2.weight": 117.58094348226459,
+ "out_ln.weight": 0.45424689776008886,
+ "out_head.weight": 5.496813200883646,
+ "out_head.bias": 3.0092640143628198
+ }
+ },
+ "credit_bridge": {
+ "log": {
+ "train_loss": [
+ 2.080038804626465,
+ 2.0486898488616943,
+ 2.046282894744873,
+ 2.046656800842285,
+ 2.039552648086548,
+ 2.0396751835632325,
+ 2.037381534881592,
+ 2.035384338226318,
+ 2.035809118041992,
+ 2.0331781942749023,
+ 2.0284877285385132,
+ 2.027495804901123,
+ 2.026125898208618,
+ 2.020480899810791,
+ 2.0207955992126463,
+ 2.0185290005874634,
+ 2.017150591125488,
+ 2.0164879455566407,
+ 2.0157563932037355,
+ 2.0127871045684813,
+ 2.0112040578460695,
+ 2.010815860519409,
+ 2.009171763458252,
+ 2.007995718460083,
+ 2.0075271183013914,
+ 2.006510923538208,
+ 2.003063318405151,
+ 2.004764850692749,
+ 2.0030145164489745,
+ 2.001830623397827,
+ 2.0015824402618407,
+ 2.0029561541748047,
+ 2.0005920767593386,
+ 1.9996838995361328,
+ 2.0028357711029052,
+ 2.0006233686065675,
+ 2.002561650390625,
+ 2.0042890097808836,
+ 2.0027454135513305,
+ 2.0027183213806152,
+ 2.0006818413543703,
+ 2.0015592734146117,
+ 1.9975921591949464,
+ 1.9961159555053711,
+ 1.9909970508575439,
+ 1.9920473384857178,
+ 1.9899114678192138,
+ 1.9886371549987794,
+ 1.9901284057998658,
+ 1.9869096327972413,
+ 1.9846498122406007,
+ 1.986077251586914,
+ 1.9829593098449707,
+ 1.9857685099792481,
+ 1.9820374918365478,
+ 1.9831326490783692,
+ 1.9809515007781981,
+ 1.9830830813980103,
+ 1.9793231730651855,
+ 1.9804900155639649,
+ 1.9807616325378419,
+ 1.9796239783096314,
+ 1.9790023094177247,
+ 1.976966079940796,
+ 1.978210344467163,
+ 1.9777095768737794,
+ 1.9761795248794556,
+ 1.9757038269042968,
+ 1.9747423070907593,
+ 1.9738406778717041,
+ 1.9735038549041748,
+ 1.97461932346344,
+ 1.9734378964233399,
+ 1.9701263136291505,
+ 1.9708808054351807,
+ 1.974146450958252,
+ 1.9722303295135497,
+ 1.9706154293823241,
+ 1.968834009361267,
+ 1.970496709022522,
+ 1.9716806288909912,
+ 1.9713043495941163,
+ 1.9710750988769532,
+ 1.9707429261016847,
+ 1.9708539364242554,
+ 1.9677796157455445,
+ 1.969852265663147,
+ 1.9710520673370362,
+ 1.970287728881836,
+ 1.9704584929656983,
+ 1.9702265856552124,
+ 1.9696108251571656,
+ 1.9689367693328856,
+ 1.9707266571044921,
+ 1.967924552001953,
+ 1.9694965203857422,
+ 1.9685778493881225,
+ 1.9698442002868652,
+ 1.9704585931015015,
+ 1.9684682028961182
+ ],
+ "train_acc": [
+ 0.23092,
+ 0.24236,
+ 0.24134,
+ 0.2427,
+ 0.24468,
+ 0.24838,
+ 0.25104,
+ 0.24966,
+ 0.24992,
+ 0.2533,
+ 0.25824,
+ 0.25604,
+ 0.25956,
+ 0.25866,
+ 0.25884,
+ 0.26064,
+ 0.26036,
+ 0.26042,
+ 0.26344,
+ 0.26316,
+ 0.26514,
+ 0.26496,
+ 0.26788,
+ 0.26702,
+ 0.26586,
+ 0.2673,
+ 0.27052,
+ 0.26806,
+ 0.26714,
+ 0.26944,
+ 0.26906,
+ 0.26936,
+ 0.27068,
+ 0.27078,
+ 0.26864,
+ 0.26786,
+ 0.26666,
+ 0.26666,
+ 0.26544,
+ 0.26578,
+ 0.26854,
+ 0.26384,
+ 0.26708,
+ 0.26708,
+ 0.2699,
+ 0.26658,
+ 0.2711,
+ 0.26876,
+ 0.26902,
+ 0.27082,
+ 0.27148,
+ 0.266,
+ 0.27216,
+ 0.26798,
+ 0.27106,
+ 0.26994,
+ 0.27048,
+ 0.26962,
+ 0.2742,
+ 0.27182,
+ 0.27056,
+ 0.27532,
+ 0.27016,
+ 0.2717,
+ 0.2714,
+ 0.27288,
+ 0.274,
+ 0.27434,
+ 0.27378,
+ 0.27492,
+ 0.27316,
+ 0.27746,
+ 0.27542,
+ 0.27628,
+ 0.27614,
+ 0.27594,
+ 0.27926,
+ 0.27974,
+ 0.28028,
+ 0.27698,
+ 0.27918,
+ 0.28146,
+ 0.27674,
+ 0.27706,
+ 0.2764,
+ 0.27804,
+ 0.27652,
+ 0.27794,
+ 0.27888,
+ 0.27896,
+ 0.27918,
+ 0.2798,
+ 0.27814,
+ 0.27842,
+ 0.2812,
+ 0.28084,
+ 0.27868,
+ 0.2795,
+ 0.27768,
+ 0.28226
+ ],
+ "test_acc": [
+ 0.258,
+ 0.2756,
+ 0.2609,
+ 0.2627,
+ 0.2583,
+ 0.2669,
+ 0.2661,
+ 0.2481,
+ 0.2517,
+ 0.278,
+ 0.2729,
+ 0.2822,
+ 0.2748,
+ 0.2742,
+ 0.2787,
+ 0.2778,
+ 0.2707,
+ 0.2794,
+ 0.2583,
+ 0.2854,
+ 0.2723,
+ 0.2857,
+ 0.2747,
+ 0.2855,
+ 0.2884,
+ 0.2972,
+ 0.3,
+ 0.2951,
+ 0.278,
+ 0.3009,
+ 0.2933,
+ 0.2909,
+ 0.2962,
+ 0.2866,
+ 0.2697,
+ 0.2857,
+ 0.2673,
+ 0.2944,
+ 0.2914,
+ 0.2886,
+ 0.2744,
+ 0.2794,
+ 0.286,
+ 0.2811,
+ 0.2905,
+ 0.2843,
+ 0.2743,
+ 0.2756,
+ 0.279,
+ 0.2945,
+ 0.2845,
+ 0.2711,
+ 0.2852,
+ 0.2824,
+ 0.2842,
+ 0.2934,
+ 0.2924,
+ 0.287,
+ 0.2801,
+ 0.2987,
+ 0.282,
+ 0.2911,
+ 0.2793,
+ 0.2753,
+ 0.2963,
+ 0.2823,
+ 0.2872,
+ 0.2971,
+ 0.2958,
+ 0.2753,
+ 0.285,
+ 0.2899,
+ 0.2999,
+ 0.2834,
+ 0.2931,
+ 0.2934,
+ 0.2869,
+ 0.2886,
+ 0.2916,
+ 0.2905,
+ 0.2822,
+ 0.2883,
+ 0.2927,
+ 0.3001,
+ 0.295,
+ 0.2954,
+ 0.2931,
+ 0.2848,
+ 0.2906,
+ 0.2907,
+ 0.291,
+ 0.2922,
+ 0.2929,
+ 0.2921,
+ 0.2908,
+ 0.2913,
+ 0.29,
+ 0.2895,
+ 0.2894,
+ 0.2893
+ ],
+ "value_loss": [
+ 0.4853640641069412,
+ 0.13146528634786606,
+ 0.10278774485111236,
+ 0.10451403197526932,
+ 0.09186984123706818,
+ 0.09725872883081436,
+ 0.08755186069607734,
+ 0.07744781212091446,
+ 0.08400812898874283,
+ 0.0792426191854477,
+ 0.07378534253954887,
+ 0.06448388241052627,
+ 0.06442826303482056,
+ 0.062765171585083,
+ 0.05268099952340126,
+ 0.046547150465250015,
+ 0.04977830931901932,
+ 0.046939543528556824,
+ 0.04594481763601303,
+ 0.04108059468030929,
+ 0.04083769999027252,
+ 0.04402205483198166,
+ 0.04000264639854431,
+ 0.03796569113850594,
+ 0.035944590538740155,
+ 0.03808709916114807,
+ 0.03455143286049366,
+ 0.038163829424381256,
+ 0.03331702991783619,
+ 0.033281468888521196,
+ 0.02748794436097145,
+ 0.030440516521930694,
+ 0.028207264231443405,
+ 0.02704140617221594,
+ 0.026097478928565978,
+ 0.025327355717718603,
+ 0.024099903733730315,
+ 0.027659756012558937,
+ 0.022987231121063233,
+ 0.020967545130252837,
+ 0.021579559311568738,
+ 0.020051995359063147,
+ 0.01838304534137249,
+ 0.02002642317146063,
+ 0.017698023419380187,
+ 0.018389571142196654,
+ 0.013522476999759675,
+ 0.01383736302614212,
+ 0.014502173573970795,
+ 0.016614098087251186,
+ 0.013939322325885297,
+ 0.014496620377600192,
+ 0.010598833594471216,
+ 0.012348202850222588,
+ 0.011290375513732433,
+ 0.009235630955398083,
+ 0.011637351908683776,
+ 0.00849102252393961,
+ 0.009930187560021878,
+ 0.0093223687428236,
+ 0.008464423409998418,
+ 0.007654866740107537,
+ 0.007954280150234699,
+ 0.00844777645289898,
+ 0.008321732766479253,
+ 0.007419437230825424,
+ 0.008567752386033535,
+ 0.007364120395183563,
+ 0.006373357061594725,
+ 0.00595162553101778,
+ 0.006675690564513207,
+ 0.0059091412272304295,
+ 0.0058950428107380866,
+ 0.005543788010179997,
+ 0.004646000351905823,
+ 0.004232099659517407,
+ 0.00391991232007742,
+ 0.003104630061686039,
+ 0.0029366533225774765,
+ 0.0028203235547989607,
+ 0.0027620538933947683,
+ 0.002386382454186678,
+ 0.0019722532033920287,
+ 0.001968352645486593,
+ 0.001672238507643342,
+ 0.0015232293362915515,
+ 0.0017160395857319236,
+ 0.0012631227846443653,
+ 0.0011414727784320711,
+ 0.0009458377653546632,
+ 0.0011035545341856778,
+ 0.0009393164394423365,
+ 0.001123441938534379,
+ 0.0008937438951432705,
+ 0.0009866366090252995,
+ 0.0011745557901449502,
+ 0.0006501818283647299,
+ 0.0009478944011032582,
+ 0.001031599847562611,
+ 0.0008783576951175928
+ ]
+ },
+ "diagnostics": {
+ "bp_cosine": [
+ 0.4526920020580292,
+ 0.006497844588011503,
+ 0.01631792262196541,
+ 0.01694033294916153,
+ 0.017034951597452164,
+ 0.01775282248854637,
+ 0.01775078848004341,
+ 0.017723549157381058,
+ 0.01778416708111763,
+ 0.01786961778998375,
+ 0.017997052520513535,
+ 0.017978299409151077
+ ],
+ "perturbation_rho": [
+ -0.054250095039606094,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "nudging": {
+ "0.001": [
+ -8.353963494300842e-07,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.003": [
+ -2.439599484205246e-06,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ],
+ "0.01": [
+ -7.801689207553864e-06,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0,
+ 0.0
+ ]
+ }
+ },
+ "drift": {
+ "embed.weight": 193.53208266596525,
+ "embed.bias": 115.78380404718655,
+ "blocks.0.ln.weight": 8.867635038294205,
+ "blocks.0.w1.weight": 196.51094816310516,
+ "blocks.0.w1.bias": 74.82582896315267,
+ "blocks.0.w2.weight": 317.40620630343955,
+ "blocks.1.ln.weight": 5.764116391727315,
+ "blocks.1.w1.weight": 210.05221683875882,
+ "blocks.1.w1.bias": 200.7126628347933,
+ "blocks.1.w2.weight": 235.05000374612118,
+ "blocks.2.ln.weight": 7.735844453849748,
+ "blocks.2.w1.weight": 328.46033970353545,
+ "blocks.2.w1.bias": 322.5548152476072,
+ "blocks.2.w2.weight": 334.35863169713303,
+ "blocks.3.ln.weight": 5.5455094513045,
+ "blocks.3.w1.weight": 213.2636693536328,
+ "blocks.3.w1.bias": 189.3065053401033,
+ "blocks.3.w2.weight": 201.9218429504037,
+ "blocks.4.ln.weight": 6.963102540839665,
+ "blocks.4.w1.weight": 281.1829353200361,
+ "blocks.4.w1.bias": 254.14827278048986,
+ "blocks.4.w2.weight": 252.72823154554072,
+ "blocks.5.ln.weight": 6.651053338270696,
+ "blocks.5.w1.weight": 265.808423173078,
+ "blocks.5.w1.bias": 237.94000901426764,
+ "blocks.5.w2.weight": 246.35312384551574,
+ "blocks.6.ln.weight": 6.796230689261986,
+ "blocks.6.w1.weight": 277.37913499866477,
+ "blocks.6.w1.bias": 258.5087504829616,
+ "blocks.6.w2.weight": 266.3321474533456,
+ "blocks.7.ln.weight": 6.190933150629552,
+ "blocks.7.w1.weight": 247.84752961611798,
+ "blocks.7.w1.bias": 225.69508996072392,
+ "blocks.7.w2.weight": 237.71747748473527,
+ "blocks.8.ln.weight": 5.572316870464946,
+ "blocks.8.w1.weight": 220.49723448227533,
+ "blocks.8.w1.bias": 201.84500185584645,
+ "blocks.8.w2.weight": 203.8926634145943,
+ "blocks.9.ln.weight": 4.956248620217523,
+ "blocks.9.w1.weight": 176.87866597616605,
+ "blocks.9.w1.bias": 165.25106759218716,
+ "blocks.9.w2.weight": 166.2448646005026,
+ "blocks.10.ln.weight": 7.452869833755125,
+ "blocks.10.w1.weight": 298.53765102170973,
+ "blocks.10.w1.bias": 273.411202411899,
+ "blocks.10.w2.weight": 295.16401679878913,
+ "blocks.11.ln.weight": 7.774196063602293,
+ "blocks.11.w1.weight": 313.80618162900083,
+ "blocks.11.w1.bias": 283.94177751762567,
+ "blocks.11.w2.weight": 294.8394911964541,
+ "out_ln.weight": 0.5766241941627794,
+ "out_head.weight": 8.360089920565844,
+ "out_head.bias": 1.5207819852306046
+ }
+ }
+ },
+ "config": {
+ "dataset": "cifar10",
+ "d_hidden": 512,
+ "num_blocks": 12,
+ "batch_size": 128,
+ "epochs": 100,
+ "lr": 0.001,
+ "lr_fb": 0.001,
+ "wd": 0.01,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0,
+ "seeds": [
+ 456
+ ],
+ "gpu": 0,
+ "output_dir": "results/cifar10_seed456",
+ "num_classes": 10
+ }
+} \ No newline at end of file