diff options
Diffstat (limited to 'results/smoke_test/results_fashionmnist.json')
| -rw-r--r-- | results/smoke_test/results_fashionmnist.json | 511 |
1 files changed, 511 insertions, 0 deletions
diff --git a/results/smoke_test/results_fashionmnist.json b/results/smoke_test/results_fashionmnist.json new file mode 100644 index 0000000..8fd82c0 --- /dev/null +++ b/results/smoke_test/results_fashionmnist.json @@ -0,0 +1,511 @@ +{ + "42": { + "bp": { + "log": { + "train_loss": [ + 0.7028828698158264, + 0.5331447437604269, + 0.4640675885995229, + 0.416527880080541, + 0.3784152720451355 + ], + "train_acc": [ + 0.73755, + 0.8002166666666667, + 0.8256666666666667, + 0.8436666666666667, + 0.8591833333333333 + ], + "test_acc": [ + 0.7939, + 0.8157, + 0.8379, + 0.8606, + 0.8658 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.9998708367347717, + 0.9998407959938049, + 0.9997469186782837, + 0.9998122453689575, + 0.9997262358665466, + 0.9996491074562073, + 0.9996585845947266, + 0.9995328783988953 + ], + "nudging": { + "0.001": [ + -0.0019641336984932423, + -0.00174636859446764, + -0.00154352025128901, + -0.0013810225063934922, + -0.0012467722408473492, + -0.0011190228397026658, + -0.0010304137831553817, + -0.0009783159475773573 + ], + "0.003": [ + -0.005858615506440401, + -0.005213461350649595, + -0.004612031392753124, + -0.004128905013203621, + -0.0037290011532604694, + -0.003348270896822214, + -0.003083921270444989, + -0.002928499598056078 + ], + "0.01": [ + -0.019138235598802567, + -0.017080917954444885, + -0.015158241614699364, + -0.013598069548606873, + -0.01229821052402258, + -0.01105712354183197, + -0.010194781236350536, + -0.009686501696705818 + ] + } + }, + "drift": { + "embed.weight": 1.1395236897587921, + "embed.bias": 0.6760135861021652, + "blocks.0.ln.weight": 0.0347786583006382, + "blocks.0.w1.weight": 0.8267150385727446, + "blocks.0.w1.bias": 0.7665003752239994, + "blocks.0.w2.weight": 2.522163826858937, + "blocks.1.ln.weight": 0.0373835414648056, + "blocks.1.w1.weight": 0.8094006579319112, + "blocks.1.w1.bias": 0.7074648417912711, + "blocks.1.w2.weight": 2.427488314293417, + "blocks.2.ln.weight": 0.0362338162958622, + "blocks.2.w1.weight": 0.7981608599321399, + "blocks.2.w1.bias": 0.6653993627306621, + "blocks.2.w2.weight": 2.3264717248101827, + "blocks.3.ln.weight": 0.03489774093031883, + "blocks.3.w1.weight": 0.8024856088475522, + "blocks.3.w1.bias": 0.6243261101573547, + "blocks.3.w2.weight": 2.2732641732905714, + "blocks.4.ln.weight": 0.036862026900053024, + "blocks.4.w1.weight": 0.7702369058900084, + "blocks.4.w1.bias": 0.671902653164234, + "blocks.4.w2.weight": 2.11229934068397, + "blocks.5.ln.weight": 0.04049132019281387, + "blocks.5.w1.weight": 0.74033776504041, + "blocks.5.w1.bias": 0.6447910547850285, + "blocks.5.w2.weight": 1.9146335569252138, + "blocks.6.ln.weight": 0.03797098994255066, + "blocks.6.w1.weight": 0.7241522377185389, + "blocks.6.w1.bias": 0.6486550903936706, + "blocks.6.w2.weight": 1.8210870137239685, + "blocks.7.ln.weight": 0.03962903097271919, + "blocks.7.w1.weight": 0.6992516513120532, + "blocks.7.w1.bias": 0.7021825186584477, + "blocks.7.w2.weight": 1.7902862835380957, + "out_ln.weight": 0.026629405096173286, + "out_head.weight": 0.5610428179907003, + "out_head.bias": 0.24151687322978704 + } + }, + "dfa": { + "log": { + "train_loss": [ + 1.4100907169977823, + 1.4334057479222615, + 1.4326289967854817, + 1.4254953683853149, + 1.4169784986495972 + ], + "train_acc": [ + 0.4805, + 0.49806666666666666, + 0.49725, + 0.5031166666666667, + 0.5098 + ], + "test_acc": [ + 0.5175, + 0.5282, + 0.5025, + 0.5027, + 0.5338 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.2141590267419815, + 0.0797841027379036, + 0.04707183688879013, + 0.0032249214127659798, + 0.024886084720492363, + -0.0050605954602360725, + 0.009758025407791138, + 0.020020857453346252 + ], + "perturbation_rho": [ + 0.07338915765285492, + -0.004745986312627792, + 0.018682830035686493, + 0.031185101717710495, + -0.02063235454261303, + 0.0006608979310840368, + 0.0, + 0.04759033024311066 + ], + "nudging": { + "0.001": [ + -3.5976991057395935e-06, + 2.3283064365386963e-09, + -9.313225746154785e-10, + -9.313225746154785e-09, + 4.656612873077393e-10, + -3.725290298461914e-09, + 1.3969838619232178e-09, + 9.313225746154785e-10 + ], + "0.003": [ + -1.0745832696557045e-05, + 2.3283064365386963e-09, + 1.6298145055770874e-09, + -2.3283064365386963e-09, + 6.752088665962219e-09, + 1.0244548320770264e-08, + -4.6566128730773926e-09, + 0.0 + ], + "0.01": [ + -3.5760458558797836e-05, + -9.313225746154785e-10, + 1.3271346688270569e-08, + -1.0244548320770264e-08, + -8.381903171539307e-09, + 4.1443854570388794e-08, + 8.847564458847046e-09, + 1.30385160446167e-08 + ] + } + }, + "drift": { + "embed.weight": 34.15137184586086, + "embed.bias": 25.886722942466992, + "blocks.0.ln.weight": 2.2413852214813232, + "blocks.0.w1.weight": 42.91370684219911, + "blocks.0.w1.bias": 42.38937429728957, + "blocks.0.w2.weight": 115.11173260217275, + "blocks.1.ln.weight": 2.0233230590820312, + "blocks.1.w1.weight": 36.64772802731374, + "blocks.1.w1.bias": 34.57367344043412, + "blocks.1.w2.weight": 84.1198032305499, + "blocks.2.ln.weight": 1.9000216722488403, + "blocks.2.w1.weight": 33.172328512058, + "blocks.2.w1.bias": 31.908254113444393, + "blocks.2.w2.weight": 78.32752075434591, + "blocks.3.ln.weight": 1.9099335670471191, + "blocks.3.w1.weight": 36.73019631908303, + "blocks.3.w1.bias": 32.60666919280332, + "blocks.3.w2.weight": 83.75068434979308, + "blocks.4.ln.weight": 1.891120195388794, + "blocks.4.w1.weight": 35.27032832987592, + "blocks.4.w1.bias": 38.017692746712825, + "blocks.4.w2.weight": 80.26417466790754, + "blocks.5.ln.weight": 2.0106024742126465, + "blocks.5.w1.weight": 42.09808335703852, + "blocks.5.w1.bias": 43.15100280108635, + "blocks.5.w2.weight": 94.64753309078039, + "blocks.6.ln.weight": 1.8941009044647217, + "blocks.6.w1.weight": 38.94163125135345, + "blocks.6.w1.bias": 38.10426587138794, + "blocks.6.w2.weight": 84.40488806201412, + "blocks.7.ln.weight": 1.9035111665725708, + "blocks.7.w1.weight": 38.65051912560395, + "blocks.7.w1.bias": 40.760402959190415, + "blocks.7.w2.weight": 81.97372863530312, + "out_ln.weight": 0.39740806818008423, + "out_head.weight": 3.609484615833081, + "out_head.bias": 0.8344298895862311 + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7336509002049765, + 1.5851847206751506, + 1.8742321704864502, + 1.8100628153483074, + 1.5580067304611207 + ], + "train_acc": [ + 0.32705, + 0.3616333333333333, + 0.2679166666666667, + 0.31853333333333333, + 0.4080166666666667 + ], + "test_acc": [ + 0.4036, + 0.4047, + 0.3046, + 0.4005, + 0.4651 + ], + "state_pred_error": [ + 5076234.573784879, + 343992182.36586666, + 517900685.38026667, + 557639895.7226666, + 383439664.5205333 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.35149621963500977, + 0.27368226647377014, + 0.045176729559898376, + 0.04587914049625397, + 0.06403794139623642, + 0.06599076837301254, + 0.10026843845844269, + 0.11267217993736267 + ], + "perturbation_rho": [ + 0.37996596097946167, + 0.0075237625278532505, + -0.017497196793556213, + 0.001783197745680809, + 0.026772135868668556, + 0.011043311096727848, + 0.0037202914245426655, + 0.008577261120080948 + ], + "nudging": { + "0.001": [ + -7.0138368755579e-05, + -1.0319054126739502e-06, + -6.495974957942963e-08, + -4.190951585769653e-09, + -3.3993273973464966e-08, + -2.2584572434425354e-08, + -6.123445928096771e-08, + -4.1443854570388794e-08 + ], + "0.003": [ + -0.00021021789871156216, + -3.0745286494493484e-06, + -1.0547228157520294e-07, + -4.866160452365875e-08, + -8.591450750827789e-08, + -6.938353180885315e-08, + -1.1292286217212677e-07, + -9.825453162193298e-08 + ], + "0.01": [ + -0.0006983885541558266, + -1.027202233672142e-05, + -3.688037395477295e-07, + -1.073349267244339e-07, + -2.153683453798294e-07, + -2.0815059542655945e-07, + -2.6938505470752716e-07, + -3.08966264128685e-07 + ] + } + }, + "drift": { + "embed.weight": 4.244627827603776, + "embed.bias": 2.284214237417933, + "blocks.0.ln.weight": 0.7376585006713867, + "blocks.0.w1.weight": 10.052587254542228, + "blocks.0.w1.bias": 12.863219234970343, + "blocks.0.w2.weight": 32.7856072339516, + "blocks.1.ln.weight": 0.8459606170654297, + "blocks.1.w1.weight": 17.10440998330836, + "blocks.1.w1.bias": 22.587196662115986, + "blocks.1.w2.weight": 48.94107595877311, + "blocks.2.ln.weight": 0.5776991248130798, + "blocks.2.w1.weight": 12.17296546064332, + "blocks.2.w1.bias": 14.464613959802604, + "blocks.2.w2.weight": 33.58238884289355, + "blocks.3.ln.weight": 0.6916943788528442, + "blocks.3.w1.weight": 11.021146543598332, + "blocks.3.w1.bias": 11.779720628235973, + "blocks.3.w2.weight": 25.18170826322489, + "blocks.4.ln.weight": 0.5363020300865173, + "blocks.4.w1.weight": 8.488676390390957, + "blocks.4.w1.bias": 11.968348972417077, + "blocks.4.w2.weight": 23.562556821259157, + "blocks.5.ln.weight": 0.749293863773346, + "blocks.5.w1.weight": 13.199470836216618, + "blocks.5.w1.bias": 17.384581140704626, + "blocks.5.w2.weight": 36.38642209120496, + "blocks.6.ln.weight": 0.45835214853286743, + "blocks.6.w1.weight": 10.662863447362852, + "blocks.6.w1.bias": 15.855775302559838, + "blocks.6.w2.weight": 28.70293410646866, + "blocks.7.ln.weight": 0.4122738838195801, + "blocks.7.w1.weight": 7.193545064718527, + "blocks.7.w1.bias": 7.340520731384394, + "blocks.7.w2.weight": 22.53669113456487, + "out_ln.weight": 0.06885236501693726, + "out_head.weight": 1.473306835980063, + "out_head.bias": 1.5084479134035678 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0466531958262126, + 2.2737758037567137, + 2.280587441889445, + 2.25820095837911, + 2.270971960576375 + ], + "train_acc": [ + 0.22976666666666667, + 0.13306666666666667, + 0.13921666666666666, + 0.15853333333333333, + 0.15521666666666667 + ], + "test_acc": [ + 0.1866, + 0.101, + 0.1455, + 0.1616, + 0.0958 + ], + "value_loss": [ + 1.105676996310552, + 0.06329173700014751, + 0.02014747195293506, + 0.01469622576336066, + 0.0050645585257560015 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.04117349535226822, + 0.006370606832206249, + 0.03125208616256714, + -0.015287259593605995, + -0.04197325184941292, + -0.021368175745010376, + 0.009605868719518185, + 0.029422588646411896 + ], + "perturbation_rho": [ + -0.09283949434757233, + -0.030718784779310226, + 0.00206748116761446, + 0.0, + -0.0060626850463449955, + -0.015737878158688545, + 0.02677903138101101, + -0.040315717458724976 + ], + "nudging": { + "0.001": [ + 3.939494490623474e-06, + -1.4901161193847656e-08, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + 1.1788681149482727e-05, + -3.725290298461914e-09, + 1.862645149230957e-09, + 0.0, + 0.0, + -1.862645149230957e-09, + 1.862645149230957e-09, + 0.0 + ], + "0.01": [ + 3.923662006855011e-05, + 2.60770320892334e-08, + 7.450580596923828e-09, + -1.862645149230957e-09, + 1.862645149230957e-09, + 1.862645149230957e-09, + 1.862645149230957e-09, + 5.587935447692871e-09 + ] + } + }, + "drift": { + "embed.weight": 5.5176286267072285, + "embed.bias": 5.84115130180781, + "blocks.0.ln.weight": 0.7516779899597168, + "blocks.0.w1.weight": 13.130250396475844, + "blocks.0.w1.bias": 16.418874968953887, + "blocks.0.w2.weight": 35.524006089100524, + "blocks.1.ln.weight": 1.0247337818145752, + "blocks.1.w1.weight": 24.629494668532566, + "blocks.1.w1.bias": 31.389502706524333, + "blocks.1.w2.weight": 66.32116257377548, + "blocks.2.ln.weight": 1.0405563116073608, + "blocks.2.w1.weight": 19.820545045709153, + "blocks.2.w1.bias": 21.04420170821489, + "blocks.2.w2.weight": 47.599865577930004, + "blocks.3.ln.weight": 0.698647677898407, + "blocks.3.w1.weight": 11.782448138509505, + "blocks.3.w1.bias": 11.300932589985935, + "blocks.3.w2.weight": 29.52897326429494, + "blocks.4.ln.weight": 0.7269545197486877, + "blocks.4.w1.weight": 12.151248949786332, + "blocks.4.w1.bias": 11.545512427875654, + "blocks.4.w2.weight": 31.11028303079019, + "blocks.5.ln.weight": 0.7007301449775696, + "blocks.5.w1.weight": 10.093534441471926, + "blocks.5.w1.bias": 8.779689334059729, + "blocks.5.w2.weight": 24.2612493038314, + "blocks.6.ln.weight": 0.7457646727561951, + "blocks.6.w1.weight": 9.34015610077582, + "blocks.6.w1.bias": 7.819986138941612, + "blocks.6.w2.weight": 24.326245888357803, + "blocks.7.ln.weight": 0.7317199110984802, + "blocks.7.w1.weight": 10.73492434511088, + "blocks.7.w1.bias": 9.150645079981764, + "blocks.7.w2.weight": 27.11222424242763, + "out_ln.weight": 0.07713422179222107, + "out_head.weight": 1.4131541672079744, + "out_head.bias": 0.7976411656775528 + } + } + }, + "config": { + "dataset": "fashionmnist", + "d_hidden": 256, + "num_blocks": 8, + "batch_size": 128, + "epochs": 5, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/smoke_test", + "num_classes": 10 + } +}
\ No newline at end of file |
