{ "42": { "bp": { "log": { "train_loss": [ 0.7028828698158264, 0.5331447437604269, 0.4640675885995229, 0.416527880080541, 0.3784152720451355 ], "train_acc": [ 0.73755, 0.8002166666666667, 0.8256666666666667, 0.8436666666666667, 0.8591833333333333 ], "test_acc": [ 0.7939, 0.8157, 0.8379, 0.8606, 0.8658 ] }, "diagnostics": { "bp_cosine": [ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0 ], "perturbation_rho": [ 0.9998708367347717, 0.9998407959938049, 0.9997469186782837, 0.9998122453689575, 0.9997262358665466, 0.9996491074562073, 0.9996585845947266, 0.9995328783988953 ], "nudging": { "0.001": [ -0.0019641336984932423, -0.00174636859446764, -0.00154352025128901, -0.0013810225063934922, -0.0012467722408473492, -0.0011190228397026658, -0.0010304137831553817, -0.0009783159475773573 ], "0.003": [ -0.005858615506440401, -0.005213461350649595, -0.004612031392753124, -0.004128905013203621, -0.0037290011532604694, -0.003348270896822214, -0.003083921270444989, -0.002928499598056078 ], "0.01": [ -0.019138235598802567, -0.017080917954444885, -0.015158241614699364, -0.013598069548606873, -0.01229821052402258, -0.01105712354183197, -0.010194781236350536, -0.009686501696705818 ] } }, "drift": { "embed.weight": 1.1395236897587921, "embed.bias": 0.6760135861021652, "blocks.0.ln.weight": 0.0347786583006382, "blocks.0.w1.weight": 0.8267150385727446, "blocks.0.w1.bias": 0.7665003752239994, "blocks.0.w2.weight": 2.522163826858937, "blocks.1.ln.weight": 0.0373835414648056, "blocks.1.w1.weight": 0.8094006579319112, "blocks.1.w1.bias": 0.7074648417912711, "blocks.1.w2.weight": 2.427488314293417, "blocks.2.ln.weight": 0.0362338162958622, "blocks.2.w1.weight": 0.7981608599321399, "blocks.2.w1.bias": 0.6653993627306621, "blocks.2.w2.weight": 2.3264717248101827, "blocks.3.ln.weight": 0.03489774093031883, "blocks.3.w1.weight": 0.8024856088475522, "blocks.3.w1.bias": 0.6243261101573547, "blocks.3.w2.weight": 2.2732641732905714, "blocks.4.ln.weight": 0.036862026900053024, "blocks.4.w1.weight": 0.7702369058900084, "blocks.4.w1.bias": 0.671902653164234, "blocks.4.w2.weight": 2.11229934068397, "blocks.5.ln.weight": 0.04049132019281387, "blocks.5.w1.weight": 0.74033776504041, "blocks.5.w1.bias": 0.6447910547850285, "blocks.5.w2.weight": 1.9146335569252138, "blocks.6.ln.weight": 0.03797098994255066, "blocks.6.w1.weight": 0.7241522377185389, "blocks.6.w1.bias": 0.6486550903936706, "blocks.6.w2.weight": 1.8210870137239685, "blocks.7.ln.weight": 0.03962903097271919, "blocks.7.w1.weight": 0.6992516513120532, "blocks.7.w1.bias": 0.7021825186584477, "blocks.7.w2.weight": 1.7902862835380957, "out_ln.weight": 0.026629405096173286, "out_head.weight": 0.5610428179907003, "out_head.bias": 0.24151687322978704 } }, "dfa": { "log": { "train_loss": [ 1.4100907169977823, 1.4334057479222615, 1.4326289967854817, 1.4254953683853149, 1.4169784986495972 ], "train_acc": [ 0.4805, 0.49806666666666666, 0.49725, 0.5031166666666667, 0.5098 ], "test_acc": [ 0.5175, 0.5282, 0.5025, 0.5027, 0.5338 ] }, "diagnostics": { "bp_cosine": [ 0.2141590267419815, 0.0797841027379036, 0.04707183688879013, 0.0032249214127659798, 0.024886084720492363, -0.0050605954602360725, 0.009758025407791138, 0.020020857453346252 ], "perturbation_rho": [ 0.07338915765285492, -0.004745986312627792, 0.018682830035686493, 0.031185101717710495, -0.02063235454261303, 0.0006608979310840368, 0.0, 0.04759033024311066 ], "nudging": { "0.001": [ -3.5976991057395935e-06, 2.3283064365386963e-09, -9.313225746154785e-10, -9.313225746154785e-09, 4.656612873077393e-10, -3.725290298461914e-09, 1.3969838619232178e-09, 9.313225746154785e-10 ], "0.003": [ -1.0745832696557045e-05, 2.3283064365386963e-09, 1.6298145055770874e-09, -2.3283064365386963e-09, 6.752088665962219e-09, 1.0244548320770264e-08, -4.6566128730773926e-09, 0.0 ], "0.01": [ -3.5760458558797836e-05, -9.313225746154785e-10, 1.3271346688270569e-08, -1.0244548320770264e-08, -8.381903171539307e-09, 4.1443854570388794e-08, 8.847564458847046e-09, 1.30385160446167e-08 ] } }, "drift": { "embed.weight": 34.15137184586086, "embed.bias": 25.886722942466992, "blocks.0.ln.weight": 2.2413852214813232, "blocks.0.w1.weight": 42.91370684219911, "blocks.0.w1.bias": 42.38937429728957, "blocks.0.w2.weight": 115.11173260217275, "blocks.1.ln.weight": 2.0233230590820312, "blocks.1.w1.weight": 36.64772802731374, "blocks.1.w1.bias": 34.57367344043412, "blocks.1.w2.weight": 84.1198032305499, "blocks.2.ln.weight": 1.9000216722488403, "blocks.2.w1.weight": 33.172328512058, "blocks.2.w1.bias": 31.908254113444393, "blocks.2.w2.weight": 78.32752075434591, "blocks.3.ln.weight": 1.9099335670471191, "blocks.3.w1.weight": 36.73019631908303, "blocks.3.w1.bias": 32.60666919280332, "blocks.3.w2.weight": 83.75068434979308, "blocks.4.ln.weight": 1.891120195388794, "blocks.4.w1.weight": 35.27032832987592, "blocks.4.w1.bias": 38.017692746712825, "blocks.4.w2.weight": 80.26417466790754, "blocks.5.ln.weight": 2.0106024742126465, "blocks.5.w1.weight": 42.09808335703852, "blocks.5.w1.bias": 43.15100280108635, "blocks.5.w2.weight": 94.64753309078039, "blocks.6.ln.weight": 1.8941009044647217, "blocks.6.w1.weight": 38.94163125135345, "blocks.6.w1.bias": 38.10426587138794, "blocks.6.w2.weight": 84.40488806201412, "blocks.7.ln.weight": 1.9035111665725708, "blocks.7.w1.weight": 38.65051912560395, "blocks.7.w1.bias": 40.760402959190415, "blocks.7.w2.weight": 81.97372863530312, "out_ln.weight": 0.39740806818008423, "out_head.weight": 3.609484615833081, "out_head.bias": 0.8344298895862311 } }, "state_bridge": { "log": { "train_loss": [ 1.7336509002049765, 1.5851847206751506, 1.8742321704864502, 1.8100628153483074, 1.5580067304611207 ], "train_acc": [ 0.32705, 0.3616333333333333, 0.2679166666666667, 0.31853333333333333, 0.4080166666666667 ], "test_acc": [ 0.4036, 0.4047, 0.3046, 0.4005, 0.4651 ], "state_pred_error": [ 5076234.573784879, 343992182.36586666, 517900685.38026667, 557639895.7226666, 383439664.5205333 ] }, "diagnostics": { "bp_cosine": [ 0.35149621963500977, 0.27368226647377014, 0.045176729559898376, 0.04587914049625397, 0.06403794139623642, 0.06599076837301254, 0.10026843845844269, 0.11267217993736267 ], "perturbation_rho": [ 0.37996596097946167, 0.0075237625278532505, -0.017497196793556213, 0.001783197745680809, 0.026772135868668556, 0.011043311096727848, 0.0037202914245426655, 0.008577261120080948 ], "nudging": { "0.001": [ -7.0138368755579e-05, -1.0319054126739502e-06, -6.495974957942963e-08, -4.190951585769653e-09, -3.3993273973464966e-08, -2.2584572434425354e-08, -6.123445928096771e-08, -4.1443854570388794e-08 ], "0.003": [ -0.00021021789871156216, -3.0745286494493484e-06, -1.0547228157520294e-07, -4.866160452365875e-08, -8.591450750827789e-08, -6.938353180885315e-08, -1.1292286217212677e-07, -9.825453162193298e-08 ], "0.01": [ -0.0006983885541558266, -1.027202233672142e-05, -3.688037395477295e-07, -1.073349267244339e-07, -2.153683453798294e-07, -2.0815059542655945e-07, -2.6938505470752716e-07, -3.08966264128685e-07 ] } }, "drift": { "embed.weight": 4.244627827603776, "embed.bias": 2.284214237417933, "blocks.0.ln.weight": 0.7376585006713867, "blocks.0.w1.weight": 10.052587254542228, "blocks.0.w1.bias": 12.863219234970343, "blocks.0.w2.weight": 32.7856072339516, "blocks.1.ln.weight": 0.8459606170654297, "blocks.1.w1.weight": 17.10440998330836, "blocks.1.w1.bias": 22.587196662115986, "blocks.1.w2.weight": 48.94107595877311, "blocks.2.ln.weight": 0.5776991248130798, "blocks.2.w1.weight": 12.17296546064332, "blocks.2.w1.bias": 14.464613959802604, "blocks.2.w2.weight": 33.58238884289355, "blocks.3.ln.weight": 0.6916943788528442, "blocks.3.w1.weight": 11.021146543598332, "blocks.3.w1.bias": 11.779720628235973, "blocks.3.w2.weight": 25.18170826322489, "blocks.4.ln.weight": 0.5363020300865173, "blocks.4.w1.weight": 8.488676390390957, "blocks.4.w1.bias": 11.968348972417077, "blocks.4.w2.weight": 23.562556821259157, "blocks.5.ln.weight": 0.749293863773346, "blocks.5.w1.weight": 13.199470836216618, "blocks.5.w1.bias": 17.384581140704626, "blocks.5.w2.weight": 36.38642209120496, "blocks.6.ln.weight": 0.45835214853286743, "blocks.6.w1.weight": 10.662863447362852, "blocks.6.w1.bias": 15.855775302559838, "blocks.6.w2.weight": 28.70293410646866, "blocks.7.ln.weight": 0.4122738838195801, "blocks.7.w1.weight": 7.193545064718527, "blocks.7.w1.bias": 7.340520731384394, "blocks.7.w2.weight": 22.53669113456487, "out_ln.weight": 0.06885236501693726, "out_head.weight": 1.473306835980063, "out_head.bias": 1.5084479134035678 } }, "credit_bridge": { "log": { "train_loss": [ 2.0466531958262126, 2.2737758037567137, 2.280587441889445, 2.25820095837911, 2.270971960576375 ], "train_acc": [ 0.22976666666666667, 0.13306666666666667, 0.13921666666666666, 0.15853333333333333, 0.15521666666666667 ], "test_acc": [ 0.1866, 0.101, 0.1455, 0.1616, 0.0958 ], "value_loss": [ 1.105676996310552, 0.06329173700014751, 0.02014747195293506, 0.01469622576336066, 0.0050645585257560015 ] }, "diagnostics": { "bp_cosine": [ -0.04117349535226822, 0.006370606832206249, 0.03125208616256714, -0.015287259593605995, -0.04197325184941292, -0.021368175745010376, 0.009605868719518185, 0.029422588646411896 ], "perturbation_rho": [ -0.09283949434757233, -0.030718784779310226, 0.00206748116761446, 0.0, -0.0060626850463449955, -0.015737878158688545, 0.02677903138101101, -0.040315717458724976 ], "nudging": { "0.001": [ 3.939494490623474e-06, -1.4901161193847656e-08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ 1.1788681149482727e-05, -3.725290298461914e-09, 1.862645149230957e-09, 0.0, 0.0, -1.862645149230957e-09, 1.862645149230957e-09, 0.0 ], "0.01": [ 3.923662006855011e-05, 2.60770320892334e-08, 7.450580596923828e-09, -1.862645149230957e-09, 1.862645149230957e-09, 1.862645149230957e-09, 1.862645149230957e-09, 5.587935447692871e-09 ] } }, "drift": { "embed.weight": 5.5176286267072285, "embed.bias": 5.84115130180781, "blocks.0.ln.weight": 0.7516779899597168, "blocks.0.w1.weight": 13.130250396475844, "blocks.0.w1.bias": 16.418874968953887, "blocks.0.w2.weight": 35.524006089100524, "blocks.1.ln.weight": 1.0247337818145752, "blocks.1.w1.weight": 24.629494668532566, "blocks.1.w1.bias": 31.389502706524333, "blocks.1.w2.weight": 66.32116257377548, "blocks.2.ln.weight": 1.0405563116073608, "blocks.2.w1.weight": 19.820545045709153, "blocks.2.w1.bias": 21.04420170821489, "blocks.2.w2.weight": 47.599865577930004, "blocks.3.ln.weight": 0.698647677898407, "blocks.3.w1.weight": 11.782448138509505, "blocks.3.w1.bias": 11.300932589985935, "blocks.3.w2.weight": 29.52897326429494, "blocks.4.ln.weight": 0.7269545197486877, "blocks.4.w1.weight": 12.151248949786332, "blocks.4.w1.bias": 11.545512427875654, "blocks.4.w2.weight": 31.11028303079019, "blocks.5.ln.weight": 0.7007301449775696, "blocks.5.w1.weight": 10.093534441471926, "blocks.5.w1.bias": 8.779689334059729, "blocks.5.w2.weight": 24.2612493038314, "blocks.6.ln.weight": 0.7457646727561951, "blocks.6.w1.weight": 9.34015610077582, "blocks.6.w1.bias": 7.819986138941612, "blocks.6.w2.weight": 24.326245888357803, "blocks.7.ln.weight": 0.7317199110984802, "blocks.7.w1.weight": 10.73492434511088, "blocks.7.w1.bias": 9.150645079981764, "blocks.7.w2.weight": 27.11222424242763, "out_ln.weight": 0.07713422179222107, "out_head.weight": 1.4131541672079744, "out_head.bias": 0.7976411656775528 } } }, "config": { "dataset": "fashionmnist", "d_hidden": 256, "num_blocks": 8, "batch_size": 128, "epochs": 5, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 42 ], "gpu": 0, "output_dir": "results/smoke_test", "num_classes": 10 } }