diff options
Diffstat (limited to 'results/synth_ladder_v2_lo/summary.json')
| -rw-r--r-- | results/synth_ladder_v2_lo/summary.json | 3590 |
1 files changed, 3590 insertions, 0 deletions
diff --git a/results/synth_ladder_v2_lo/summary.json b/results/synth_ladder_v2_lo/summary.json new file mode 100644 index 0000000..4e13fce --- /dev/null +++ b/results/synth_ladder_v2_lo/summary.json @@ -0,0 +1,3590 @@ +{ + "a0.0_L2_s42": { + "bp": { + "test_acc": 0.9185, + "mean_bp_cosine": 0.8935370743274689, + "mean_rho": 0.9999973475933075, + "mean_nudge_001": -0.016880770213901997, + "mean_nudge_003": -0.046150531619787216, + "mean_nudge_01": -0.11240250617265701, + "bp_cosine_per_layer": [ + 0.9016435146331787, + 0.885430634021759 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999956488609314 + ], + "nudge_per_layer": [ + -0.1530623733997345, + -0.07174263894557953 + ] + }, + "dfa": { + "test_acc": 0.842, + "mean_bp_cosine": 0.030407493002712727, + "mean_rho": 0.008977552875876427, + "mean_nudge_001": -0.00023997636890271679, + "mean_nudge_003": -0.0006689573347102851, + "mean_nudge_01": -0.0016241300618276, + "bp_cosine_per_layer": [ + -0.003507068380713463, + 0.06432205438613892 + ], + "rho_per_layer": [ + 0.009520611725747585, + 0.008434494026005268 + ], + "nudge_per_layer": [ + -0.0012172441929578781, + -0.002031015930697322 + ] + }, + "state_bridge": { + "test_acc": 0.825, + "mean_bp_cosine": 0.666242927312851, + "mean_rho": 0.5969350039958954, + "mean_nudge_001": -0.015545505564659834, + "mean_nudge_003": -0.04490915546193719, + "mean_nudge_01": -0.13079415168613195, + "bp_cosine_per_layer": [ + 0.9153801202774048, + 0.4171057343482971 + ], + "rho_per_layer": [ + 0.8286964893341064, + 0.3651735186576843 + ], + "nudge_per_layer": [ + -0.23136131465435028, + -0.030226988717913628 + ], + "state_pred_error_per_layer": [ + 438.86456298828125, + 353.2518310546875 + ], + "mean_state_pred_error": 396.0581970214844 + }, + "credit_bridge": { + "test_acc": 0.6675, + "mean_bp_cosine": 0.16703729704022408, + "mean_rho": 0.26396652311086655, + "mean_nudge_001": -0.00457099755294621, + "mean_nudge_003": -0.013636467512696981, + "mean_nudge_01": -0.04456503316760063, + "bp_cosine_per_layer": [ + 0.1011175885796547, + 0.23295700550079346 + ], + "rho_per_layer": [ + 0.19994769990444183, + 0.32798534631729126 + ], + "nudge_per_layer": [ + -0.07033564895391464, + -0.01879441738128662 + ], + "final_value_loss": 0.5091902822494507, + "final_term_loss": 0.2335890076160431, + "final_bridge_loss": 0.035112081968784334, + "final_tgrad_loss": 0.2404891884803772 + } + }, + "a0.0_L2_s123": { + "bp": { + "test_acc": 0.9205, + "mean_bp_cosine": 0.8566932380199432, + "mean_rho": 0.9999960958957672, + "mean_nudge_001": -0.015286394860595465, + "mean_nudge_003": -0.04188752360641956, + "mean_nudge_01": -0.10229892283678055, + "bp_cosine_per_layer": [ + 0.8634263277053833, + 0.8499601483345032 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999933838844299 + ], + "nudge_per_layer": [ + -0.13922545313835144, + -0.06537239253520966 + ] + }, + "dfa": { + "test_acc": 0.841, + "mean_bp_cosine": 0.08572041988372803, + "mean_rho": 0.10125503316521645, + "mean_nudge_001": -0.001035464447340928, + "mean_nudge_003": -0.0030792844481766224, + "mean_nudge_01": -0.009957430185750127, + "bp_cosine_per_layer": [ + 0.048809632658958435, + 0.12263120710849762 + ], + "rho_per_layer": [ + 0.09689537435770035, + 0.10561469197273254 + ], + "nudge_per_layer": [ + -0.015226385556161404, + -0.00468847481533885 + ] + }, + "state_bridge": { + "test_acc": 0.822, + "mean_bp_cosine": 0.7052022516727448, + "mean_rho": 0.608213409781456, + "mean_nudge_001": -0.014205678016878664, + "mean_nudge_003": -0.04078014753758907, + "mean_nudge_01": -0.11634222697466612, + "bp_cosine_per_layer": [ + 0.9309895038604736, + 0.47941499948501587 + ], + "rho_per_layer": [ + 0.8439192175865173, + 0.37250760197639465 + ], + "nudge_per_layer": [ + -0.2068808674812317, + -0.025803586468100548 + ], + "state_pred_error_per_layer": [ + 436.0709533691406, + 352.44915771484375 + ], + "mean_state_pred_error": 394.2600555419922 + }, + "credit_bridge": { + "test_acc": 0.664, + "mean_bp_cosine": 0.14723356813192368, + "mean_rho": 0.27719707787036896, + "mean_nudge_001": -0.0040612792945466936, + "mean_nudge_003": -0.012125232955440879, + "mean_nudge_01": -0.03972679190337658, + "bp_cosine_per_layer": [ + 0.08253486454486847, + 0.21193227171897888 + ], + "rho_per_layer": [ + 0.16999724507331848, + 0.38439691066741943 + ], + "nudge_per_layer": [ + -0.06126694008708, + -0.018186643719673157 + ], + "final_value_loss": 0.6019191103935242, + "final_term_loss": 0.28414561631679536, + "final_bridge_loss": 0.04602321577072144, + "final_tgrad_loss": 0.27175028200149537 + } + }, + "a0.0_L2_s456": { + "bp": { + "test_acc": 0.9295, + "mean_bp_cosine": 0.870507538318634, + "mean_rho": 0.9999973773956299, + "mean_nudge_001": -0.014503923710435629, + "mean_nudge_003": -0.039223295636475086, + "mean_nudge_01": -0.09240655042231083, + "bp_cosine_per_layer": [ + 0.8826531171798706, + 0.8583619594573975 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999959468841553 + ], + "nudge_per_layer": [ + -0.12340263277292252, + -0.06141046807169914 + ] + }, + "dfa": { + "test_acc": 0.8485, + "mean_bp_cosine": 0.051622094586491585, + "mean_rho": 0.014518704265356064, + "mean_nudge_001": -0.00044165633153170347, + "mean_nudge_003": -0.0013033851282671094, + "mean_nudge_01": -0.0040968600660562515, + "bp_cosine_per_layer": [ + 0.016239378601312637, + 0.08700481057167053 + ], + "rho_per_layer": [ + -0.0633457601070404, + 0.09238316863775253 + ], + "nudge_per_layer": [ + -0.004778302274644375, + -0.003415417857468128 + ] + }, + "state_bridge": { + "test_acc": 0.8285, + "mean_bp_cosine": 0.7213762998580933, + "mean_rho": 0.644424170255661, + "mean_nudge_001": -0.014933469472452998, + "mean_nudge_003": -0.042839838191866875, + "mean_nudge_01": -0.12188584543764591, + "bp_cosine_per_layer": [ + 0.9387110471725464, + 0.5040415525436401 + ], + "rho_per_layer": [ + 0.7997298240661621, + 0.4891185164451599 + ], + "nudge_per_layer": [ + -0.21233828365802765, + -0.031433407217264175 + ], + "state_pred_error_per_layer": [ + 387.8657531738281, + 319.336669921875 + ], + "mean_state_pred_error": 353.60121154785156 + }, + "credit_bridge": { + "test_acc": 0.7115, + "mean_bp_cosine": 0.16614358872175217, + "mean_rho": 0.25560564547777176, + "mean_nudge_001": -0.0032864182721823454, + "mean_nudge_003": -0.009816689416766167, + "mean_nudge_01": -0.03221969399601221, + "bp_cosine_per_layer": [ + 0.08927787840366364, + 0.2430092990398407 + ], + "rho_per_layer": [ + 0.16060538589954376, + 0.35060590505599976 + ], + "nudge_per_layer": [ + -0.047705113887786865, + -0.016734274104237556 + ], + "final_value_loss": 0.31588549439907077, + "final_term_loss": 0.09000624770522117, + "final_bridge_loss": 0.023082720217108728, + "final_tgrad_loss": 0.20279652795791625 + } + }, + "a0.0_L4_s42": { + "bp": { + "test_acc": 0.925, + "mean_bp_cosine": 0.8320528566837311, + "mean_rho": 0.9999772906303406, + "mean_nudge_001": -0.009003315295558423, + "mean_nudge_003": -0.024674441665410995, + "mean_nudge_01": -0.06179796298965812, + "bp_cosine_per_layer": [ + 0.8599773645401001, + 0.8422204256057739, + 0.8250665664672852, + 0.8009470701217651 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999953508377075, + 0.9999807476997375, + 0.9999338984489441 + ], + "nudge_per_layer": [ + -0.12188813835382462, + -0.07056954503059387, + -0.034971628338098526, + -0.019762540236115456 + ] + }, + "dfa": { + "test_acc": 0.856, + "mean_bp_cosine": 0.10417622653767467, + "mean_rho": 0.09206205606460571, + "mean_nudge_001": -0.00045079714618623257, + "mean_nudge_003": -0.0013433840940706432, + "mean_nudge_01": -0.004383910913020372, + "bp_cosine_per_layer": [ + 0.004014266654849052, + 0.16519895195960999, + 0.13244280219078064, + 0.11504888534545898 + ], + "rho_per_layer": [ + 0.042726192623376846, + 0.18379396200180054, + 0.108277827501297, + 0.03345024213194847 + ], + "nudge_per_layer": [ + -0.005573366768658161, + -0.005793239921331406, + -0.003338021691888571, + -0.002831015270203352 + ] + }, + "state_bridge": { + "test_acc": 0.7615, + "mean_bp_cosine": 0.38204737193882465, + "mean_rho": 0.3213508538901806, + "mean_nudge_001": -0.006838726330897771, + "mean_nudge_003": -0.01991741475649178, + "mean_nudge_01": -0.059746103768702596, + "bp_cosine_per_layer": [ + 0.8646283149719238, + 0.4090673327445984, + 0.1404263973236084, + 0.114067442715168 + ], + "rho_per_layer": [ + 0.7375176548957825, + 0.33617356419563293, + 0.14259827136993408, + 0.06911392509937286 + ], + "nudge_per_layer": [ + -0.218303382396698, + -0.013712376356124878, + -0.003879058640450239, + -0.0030895976815372705 + ], + "state_pred_error_per_layer": [ + 6951.521484375, + 6099.5322265625, + 5877.8310546875, + 3832.076416015625 + ], + "mean_state_pred_error": 5690.240295410156 + }, + "credit_bridge": { + "test_acc": 0.6585, + "mean_bp_cosine": 0.10922159999608994, + "mean_rho": 0.21513587795197964, + "mean_nudge_001": -0.00137018840177916, + "mean_nudge_003": -0.004100472666323185, + "mean_nudge_01": -0.013550454750657082, + "bp_cosine_per_layer": [ + 0.049023956060409546, + 0.11911389231681824, + 0.12341275811195374, + 0.14533579349517822 + ], + "rho_per_layer": [ + 0.09633419662714005, + 0.23598268628120422, + 0.24357257783412933, + 0.28465405106544495 + ], + "nudge_per_layer": [ + -0.026128236204385757, + -0.008897590450942516, + -0.009167088195681572, + -0.01000890415161848 + ], + "final_value_loss": 0.5270826056480408, + "final_term_loss": 0.22659661755561827, + "final_bridge_loss": 0.04233165686130524, + "final_tgrad_loss": 0.25815433073043825 + } + }, + "a0.0_L4_s123": { + "bp": { + "test_acc": 0.926, + "mean_bp_cosine": 0.7713210135698318, + "mean_rho": 0.9999768882989883, + "mean_nudge_001": -0.010334675083868206, + "mean_nudge_003": -0.028318932512775064, + "mean_nudge_01": -0.06953301187604666, + "bp_cosine_per_layer": [ + 0.808335542678833, + 0.780368447303772, + 0.7579712271690369, + 0.7386088371276855 + ], + "rho_per_layer": [ + 0.9999986886978149, + 0.999996542930603, + 0.9999827146530151, + 0.9999296069145203 + ], + "nudge_per_layer": [ + -0.13544964790344238, + -0.08136264234781265, + -0.039826083928346634, + -0.02149367332458496 + ] + }, + "dfa": { + "test_acc": 0.8375, + "mean_bp_cosine": 0.1401939271017909, + "mean_rho": 0.11219900287687778, + "mean_nudge_001": -0.000286264817987103, + "mean_nudge_003": -0.0008422381652053446, + "mean_nudge_01": -0.0026496590580791235, + "bp_cosine_per_layer": [ + -0.028116505593061447, + 0.29581546783447266, + 0.170908123254776, + 0.12216862291097641 + ], + "rho_per_layer": [ + -0.07312458753585815, + 0.3015226125717163, + 0.09657395631074905, + 0.12382403016090393 + ], + "nudge_per_layer": [ + 0.0038727924693375826, + -0.007415304891765118, + -0.0039948043413460255, + -0.0030613194685429335 + ] + }, + "state_bridge": { + "test_acc": 0.788, + "mean_bp_cosine": 0.3973395489156246, + "mean_rho": 0.36834993585944176, + "mean_nudge_001": -0.006569715158548206, + "mean_nudge_003": -0.019017601298401132, + "mean_nudge_01": -0.055994155758526176, + "bp_cosine_per_layer": [ + 0.8812471032142639, + 0.4430118799209595, + 0.14485391974449158, + 0.12024529278278351 + ], + "rho_per_layer": [ + 0.803270697593689, + 0.4108988642692566, + 0.12428833544254303, + 0.13494184613227844 + ], + "nudge_per_layer": [ + -0.20551547408103943, + -0.01310029998421669, + -0.0029572518542408943, + -0.0024035971146076918 + ], + "state_pred_error_per_layer": [ + 6307.859375, + 4221.2177734375, + 3825.8369140625, + 3284.16064453125 + ], + "mean_state_pred_error": 4409.7686767578125 + }, + "credit_bridge": { + "test_acc": 0.7305, + "mean_bp_cosine": 0.10989296156913042, + "mean_rho": 0.18325010500848293, + "mean_nudge_001": -0.0012505464837886393, + "mean_nudge_003": -0.00373545300681144, + "mean_nudge_01": -0.012258320581167936, + "bp_cosine_per_layer": [ + 0.03434538468718529, + 0.12379913777112961, + 0.1433446854352951, + 0.13808263838291168 + ], + "rho_per_layer": [ + 0.03924814611673355, + 0.21971622109413147, + 0.26409071683883667, + 0.20994533598423004 + ], + "nudge_per_layer": [ + -0.020018436014652252, + -0.00925234891474247, + -0.010285570286214352, + -0.009476927109062672 + ], + "final_value_loss": 0.454630423784256, + "final_term_loss": 0.185297670173645, + "final_bridge_loss": 0.03432008520960808, + "final_tgrad_loss": 0.2350126650452614 + } + }, + "a0.0_L4_s456": { + "bp": { + "test_acc": 0.9285, + "mean_bp_cosine": 0.7884698659181595, + "mean_rho": 0.999981090426445, + "mean_nudge_001": -0.01117145799798891, + "mean_nudge_003": -0.030768739874474704, + "mean_nudge_01": -0.07730476558208466, + "bp_cosine_per_layer": [ + 0.8268355131149292, + 0.7960893511772156, + 0.7726784944534302, + 0.758276104927063 + ], + "rho_per_layer": [ + 0.9999993443489075, + 0.999996542930603, + 0.999983549118042, + 0.9999449253082275 + ], + "nudge_per_layer": [ + -0.15056422352790833, + -0.08916378021240234, + -0.04451071470975876, + -0.024980343878269196 + ] + }, + "dfa": { + "test_acc": 0.8655, + "mean_bp_cosine": 0.06126724602654576, + "mean_rho": 0.09146236767992377, + "mean_nudge_001": -0.00023738171148579568, + "mean_nudge_003": -0.0006991284317336977, + "mean_nudge_01": -0.0021681145881302655, + "bp_cosine_per_layer": [ + -0.012256121262907982, + 0.07949584722518921, + 0.0787847638130188, + 0.09904449433088303 + ], + "rho_per_layer": [ + -0.003950485959649086, + 0.06165219843387604, + 0.14469987154006958, + 0.16344788670539856 + ], + "nudge_per_layer": [ + 0.002696676878258586, + -0.005506287328898907, + -0.0027312645688652992, + -0.003131583333015442 + ] + }, + "state_bridge": { + "test_acc": 0.7455, + "mean_bp_cosine": 0.4014641270041466, + "mean_rho": 0.3732803575694561, + "mean_nudge_001": -0.007542004925198853, + "mean_nudge_003": -0.022030926978914067, + "mean_nudge_01": -0.06684440147364512, + "bp_cosine_per_layer": [ + 0.8436356782913208, + 0.46039146184921265, + 0.16277557611465454, + 0.13905379176139832 + ], + "rho_per_layer": [ + 0.7277628183364868, + 0.48849108815193176, + 0.1771586537361145, + 0.09970887005329132 + ], + "nudge_per_layer": [ + -0.2401106357574463, + -0.018598388880491257, + -0.004775169305503368, + -0.0038934119511395693 + ], + "state_pred_error_per_layer": [ + 3442.556884765625, + 2195.27490234375, + 2035.546875, + 2293.3291015625 + ], + "mean_state_pred_error": 2491.6769409179688 + }, + "credit_bridge": { + "test_acc": 0.644, + "mean_bp_cosine": 0.1536249229684472, + "mean_rho": 0.26861424930393696, + "mean_nudge_001": -0.0018619927868712693, + "mean_nudge_003": -0.005573431379161775, + "mean_nudge_01": -0.018431853968650103, + "bp_cosine_per_layer": [ + 0.053475264459848404, + 0.17959368228912354, + 0.19590041041374207, + 0.18553033471107483 + ], + "rho_per_layer": [ + 0.04320300370454788, + 0.30398592352867126, + 0.35316282510757446, + 0.3741052448749542 + ], + "nudge_per_layer": [ + -0.027841825038194656, + -0.015361151657998562, + -0.015351004898548126, + -0.015173434279859066 + ], + "final_value_loss": 0.7469501955509186, + "final_term_loss": 0.4142983556270599, + "final_bridge_loss": 0.05541581681370735, + "final_tgrad_loss": 0.2772360302686691 + } + }, + "a0.0_L8_s42": { + "bp": { + "test_acc": 0.906, + "mean_bp_cosine": 0.8584278598427773, + "mean_rho": 0.9999460652470589, + "mean_nudge_001": -0.008581212867284194, + "mean_nudge_003": -0.02450006199069321, + "mean_nudge_01": -0.06902276305481791, + "bp_cosine_per_layer": [ + 0.8854324817657471, + 0.8737501502037048, + 0.8630377054214478, + 0.8562113046646118, + 0.8509326577186584, + 0.8481521606445312, + 0.84560626745224, + 0.8443001508712769 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999963045120239, + 0.9999881386756897, + 0.9999630451202393, + 0.9999364614486694, + 0.9999151825904846, + 0.9998926520347595, + 0.9998775720596313 + ], + "nudge_per_layer": [ + -0.21767401695251465, + -0.12408202886581421, + -0.06762672960758209, + -0.04208396375179291, + -0.031123068183660507, + -0.025745777413249016, + -0.022784877568483353, + -0.021061642095446587 + ] + }, + "dfa": { + "test_acc": 0.8325, + "mean_bp_cosine": 0.0621855678036809, + "mean_rho": 0.08102096850052476, + "mean_nudge_001": 7.459322478098329e-05, + "mean_nudge_003": 0.00026162770882365294, + "mean_nudge_01": 0.0013351911620702595, + "bp_cosine_per_layer": [ + -0.02968163788318634, + 0.08609121292829514, + 0.09377065300941467, + 0.10205866396427155, + 0.08807726949453354, + 0.053033627569675446, + 0.056919872760772705, + 0.04721488058567047 + ], + "rho_per_layer": [ + -0.09032663702964783, + 0.17043988406658173, + 0.18389353156089783, + 0.16770029067993164, + 0.1504741907119751, + 0.05179755389690399, + 0.050898581743240356, + -0.03670964762568474 + ], + "nudge_per_layer": [ + 0.028243789449334145, + -0.00520662497729063, + -0.0028999613132327795, + -0.002869710559025407, + -0.0023996694944798946, + -0.0015899656573310494, + -0.0014181910082697868, + -0.0011781371431425214 + ] + }, + "state_bridge": { + "test_acc": 0.726, + "mean_bp_cosine": 0.26912851445376873, + "mean_rho": 0.2629122715443373, + "mean_nudge_001": -0.0034038230442092754, + "mean_nudge_003": -0.010012732280301861, + "mean_nudge_01": -0.0311450962908566, + "bp_cosine_per_layer": [ + 0.8151727914810181, + 0.4042307734489441, + 0.16176781058311462, + 0.1698867678642273, + 0.14891386032104492, + 0.1726662963628769, + 0.1322125643491745, + 0.14817725121974945 + ], + "rho_per_layer": [ + 0.7261759042739868, + 0.36915943026542664, + 0.17840053141117096, + 0.16105638444423676, + 0.14931628108024597, + 0.15696927905082703, + 0.17820878326892853, + 0.1840115785598755 + ], + "nudge_per_layer": [ + -0.21425020694732666, + -0.011446774937212467, + -0.004181142896413803, + -0.004114024806767702, + -0.0038589704781770706, + -0.00422251783311367, + -0.003358659567311406, + -0.003728472860530019 + ], + "state_pred_error_per_layer": [ + 7398.20849609375, + 5242.7607421875, + 3768.9609375, + 3258.12548828125, + 3060.2021484375, + 2786.609619140625, + 3211.44921875, + 2939.81005859375 + ], + "mean_state_pred_error": 3958.265838623047 + }, + "credit_bridge": { + "test_acc": 0.64, + "mean_bp_cosine": 0.09559969999827445, + "mean_rho": 0.20091960858553648, + "mean_nudge_001": -0.0007423463721352164, + "mean_nudge_003": -0.0022244660067372024, + "mean_nudge_01": -0.007368246268015355, + "bp_cosine_per_layer": [ + 0.010387556627392769, + 0.06787668168544769, + 0.11108389496803284, + 0.11367877572774887, + 0.11491300165653229, + 0.1093105673789978, + 0.11488444358110428, + 0.12266267836093903 + ], + "rho_per_layer": [ + 0.0504305437207222, + 0.11780044436454773, + 0.23789767920970917, + 0.24238067865371704, + 0.22429296374320984, + 0.25153419375419617, + 0.25647929310798645, + 0.22654107213020325 + ], + "nudge_per_layer": [ + -0.003928218502551317, + -0.0057389335706830025, + -0.007835019379854202, + -0.008116443641483784, + -0.0081653306260705, + -0.00813683308660984, + -0.008312376216053963, + -0.00871281512081623 + ], + "final_value_loss": 0.6615465266227722, + "final_term_loss": 0.43013124598264696, + "final_bridge_loss": 0.0357342723429203, + "final_tgrad_loss": 0.19568100452423096 + } + }, + "a0.0_L8_s123": { + "bp": { + "test_acc": 0.913, + "mean_bp_cosine": 0.8645070418715477, + "mean_rho": 0.999944381415844, + "mean_nudge_001": -0.007505885470891371, + "mean_nudge_003": -0.021483065967913717, + "mean_nudge_01": -0.06040166970342398, + "bp_cosine_per_layer": [ + 0.9087610840797424, + 0.8890509605407715, + 0.8756387233734131, + 0.860000729560852, + 0.8513467311859131, + 0.8465403914451599, + 0.8431664705276489, + 0.8415512442588806 + ], + "rho_per_layer": [ + 0.9999994039535522, + 0.9999971389770508, + 0.9999857544898987, + 0.9999687671661377, + 0.9999316930770874, + 0.9999115467071533, + 0.9998936653137207, + 0.9998670816421509 + ], + "nudge_per_layer": [ + -0.19297254085540771, + -0.10940254479646683, + -0.05867426097393036, + -0.03609157353639603, + -0.026526644825935364, + -0.02192458137869835, + -0.019491419196128845, + -0.01812979206442833 + ] + }, + "dfa": { + "test_acc": 0.849, + "mean_bp_cosine": 0.07409168453887105, + "mean_rho": 0.0943274952005595, + "mean_nudge_001": -6.366873094520997e-06, + "mean_nudge_003": -1.1956191883655265e-05, + "mean_nudge_01": 5.2888659411109984e-05, + "bp_cosine_per_layer": [ + -0.02848462387919426, + 0.15189720690250397, + 0.09141203761100769, + 0.07272940874099731, + 0.09136377274990082, + 0.0857112780213356, + 0.044680722057819366, + 0.0834236741065979 + ], + "rho_per_layer": [ + 0.03057212010025978, + 0.16072696447372437, + 0.13512857258319855, + 0.0885201245546341, + 0.1377822607755661, + 0.04239961504936218, + 0.0035119224339723587, + 0.15597838163375854 + ], + "nudge_per_layer": [ + 0.015482441522181034, + -0.004561400040984154, + -0.0020816801115870476, + -0.0015152986161410809, + -0.0019329312490299344, + -0.002064004773274064, + -0.001068722689524293, + -0.0018352947663515806 + ] + }, + "state_bridge": { + "test_acc": 0.7725, + "mean_bp_cosine": 0.2933046016842127, + "mean_rho": 0.25743963569402695, + "mean_nudge_001": -0.0033750918046280276, + "mean_nudge_003": -0.009846233486314304, + "mean_nudge_01": -0.02971906404127367, + "bp_cosine_per_layer": [ + 0.8679102659225464, + 0.46438825130462646, + 0.22033852338790894, + 0.1893446445465088, + 0.16738475859165192, + 0.14945879578590393, + 0.1267041563987732, + 0.16090741753578186 + ], + "rho_per_layer": [ + 0.6897462606430054, + 0.42848390340805054, + 0.19369670748710632, + 0.19582855701446533, + 0.14048044383525848, + 0.12853404879570007, + 0.09809397161006927, + 0.18465319275856018 + ], + "nudge_per_layer": [ + -0.2050759196281433, + -0.01248687319457531, + -0.004478689283132553, + -0.003817938268184662, + -0.00330835347995162, + -0.002980519086122513, + -0.002494834130629897, + -0.003109385259449482 + ], + "state_pred_error_per_layer": [ + 7121.279296875, + 6133.4482421875, + 3940.991943359375, + 2496.587646484375, + 2560.85595703125, + 2498.587890625, + 3539.93115234375, + 2449.22607421875 + ], + "mean_state_pred_error": 3842.613525390625 + }, + "credit_bridge": { + "test_acc": 0.656, + "mean_bp_cosine": 0.092392878344981, + "mean_rho": 0.17488694936037064, + "mean_nudge_001": -0.0007325447659241036, + "mean_nudge_003": -0.002192195039242506, + "mean_nudge_01": -0.0072501768881920725, + "bp_cosine_per_layer": [ + 0.001700198045000434, + 0.04125010222196579, + 0.1112770289182663, + 0.11907510459423065, + 0.11768756806850433, + 0.11733907461166382, + 0.11329221725463867, + 0.117521733045578 + ], + "rho_per_layer": [ + 0.043069981038570404, + 0.1044735386967659, + 0.23828034102916718, + 0.18111932277679443, + 0.19782572984695435, + 0.1971191018819809, + 0.20729684829711914, + 0.2299107313156128 + ], + "nudge_per_layer": [ + -0.006082434207201004, + -0.003400696674361825, + -0.007903593592345715, + -0.008138573728501797, + -0.008289994671940804, + -0.007994470186531544, + -0.00807441771030426, + -0.008117234334349632 + ], + "final_value_loss": 0.5009399848937989, + "final_term_loss": 0.26505257573127744, + "final_bridge_loss": 0.027039055764675142, + "final_tgrad_loss": 0.20884835484027864 + } + }, + "a0.0_L8_s456": { + "bp": { + "test_acc": 0.8965, + "mean_bp_cosine": 0.8864798843860626, + "mean_rho": 0.9999493733048439, + "mean_nudge_001": -0.007212058277218603, + "mean_nudge_003": -0.02048966591246426, + "mean_nudge_01": -0.05707334354519844, + "bp_cosine_per_layer": [ + 0.9283311367034912, + 0.9162832498550415, + 0.8925424814224243, + 0.8799441456794739, + 0.8746041655540466, + 0.8698863983154297, + 0.8666130304336548, + 0.863634467124939 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.9999967217445374, + 0.9999891519546509, + 0.9999651908874512, + 0.9999410510063171, + 0.9999043941497803, + 0.9998966455459595, + 0.9999027252197266 + ], + "nudge_per_layer": [ + -0.17811693251132965, + -0.10346511751413345, + -0.05678309500217438, + -0.035222865641117096, + -0.025761041790246964, + -0.021198198199272156, + -0.01872769370675087, + -0.017311803996562958 + ] + }, + "dfa": { + "test_acc": 0.833, + "mean_bp_cosine": 0.10069436486810446, + "mean_rho": 0.11729028820991516, + "mean_nudge_001": -0.00045204991511127446, + "mean_nudge_003": -0.0013379494193941355, + "mean_nudge_01": -0.004276915889931843, + "bp_cosine_per_layer": [ + 0.020978286862373352, + 0.16464680433273315, + 0.15073026716709137, + 0.08116275072097778, + 0.08070477098226547, + 0.0867747962474823, + 0.10854049026966095, + 0.11201675236225128 + ], + "rho_per_layer": [ + 0.032643549144268036, + 0.2071959227323532, + 0.2057623416185379, + 0.09326457977294922, + 0.06205561012029648, + 0.1389445811510086, + 0.11340519785881042, + 0.08505052328109741 + ], + "nudge_per_layer": [ + -0.012655803002417088, + -0.005697320215404034, + -0.004094945732504129, + -0.0018561023753136396, + -0.0020380420610308647, + -0.0022426587529480457, + -0.002856952603906393, + -0.0027735023759305477 + ] + }, + "state_bridge": { + "test_acc": 0.7495, + "mean_bp_cosine": 0.246165806427598, + "mean_rho": 0.20948901865631342, + "mean_nudge_001": -0.0035059251604252495, + "mean_nudge_003": -0.010245608449622523, + "mean_nudge_01": -0.03114599542459473, + "bp_cosine_per_layer": [ + 0.8467778563499451, + 0.3549606502056122, + 0.1711018681526184, + 0.12375819683074951, + 0.1153455525636673, + 0.12219913303852081, + 0.12895643711090088, + 0.10622675716876984 + ], + "rho_per_layer": [ + 0.7416437268257141, + 0.2796669900417328, + 0.14060860872268677, + 0.09820520132780075, + 0.10454020649194717, + 0.08740514516830444, + 0.10375625640153885, + 0.12008601427078247 + ], + "nudge_per_layer": [ + -0.2212277054786682, + -0.010068328119814396, + -0.00393392750993371, + -0.002955838106572628, + -0.0027290289290249348, + -0.0028208147268742323, + -0.002979037119075656, + -0.002453283406794071 + ], + "state_pred_error_per_layer": [ + 10942.7939453125, + 10293.740234375, + 7482.4482421875, + 5008.9619140625, + 4863.818359375, + 4492.451171875, + 3565.2744140625, + 3837.47998046875 + ], + "mean_state_pred_error": 6310.871032714844 + }, + "credit_bridge": { + "test_acc": 0.617, + "mean_bp_cosine": 0.09351247036829591, + "mean_rho": 0.15350601403042674, + "mean_nudge_001": -0.0010894104561884888, + "mean_nudge_003": -0.0032592675706837326, + "mean_nudge_01": -0.010775732051115483, + "bp_cosine_per_layer": [ + 0.03283574804663658, + 0.05836774408817291, + 0.11590129137039185, + 0.10100162029266357, + 0.1079024076461792, + 0.10276803374290466, + 0.11581481993198395, + 0.11350809782743454 + ], + "rho_per_layer": [ + 0.06095704063773155, + 0.13836193084716797, + 0.1803440898656845, + 0.1439131498336792, + 0.14064353704452515, + 0.15858328342437744, + 0.22606094181537628, + 0.17918413877487183 + ], + "nudge_per_layer": [ + -0.023668643087148666, + -0.006166210863739252, + -0.009575091302394867, + -0.00891521479934454, + -0.00932026281952858, + -0.008899858221411705, + -0.009868312627077103, + -0.009792262688279152 + ], + "final_value_loss": 1.2871107803344726, + "final_term_loss": 0.9274139808654785, + "final_bridge_loss": 0.0815536917924881, + "final_tgrad_loss": 0.2781431001186371 + } + }, + "a0.0_L12_s42": { + "bp": { + "test_acc": 0.9135, + "mean_bp_cosine": 0.8262566576401392, + "mean_rho": 0.9998530795176824, + "mean_nudge_001": -0.005460524485291292, + "mean_nudge_003": -0.015294013021048158, + "mean_nudge_01": -0.04075813665986061, + "bp_cosine_per_layer": [ + 0.8936765193939209, + 0.875713586807251, + 0.8523612022399902, + 0.835299551486969, + 0.8243429064750671, + 0.8148068189620972, + 0.809612512588501, + 0.8055970668792725, + 0.8028815984725952, + 0.8011909127235413, + 0.8001247644424438, + 0.799472451210022 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.999997615814209, + 0.9999872446060181, + 0.9999661445617676, + 0.9999244213104248, + 0.9998762011528015, + 0.9998204708099365, + 0.9997811317443848, + 0.9997683167457581, + 0.9997478723526001, + 0.9997052550315857, + 0.9996634721755981 + ], + "nudge_per_layer": [ + -0.15880361199378967, + -0.10216463357210159, + -0.058997806161642075, + -0.0368044376373291, + -0.02622675709426403, + -0.02074911817908287, + -0.017529264092445374, + -0.015481802634894848, + -0.014148212037980556, + -0.013247357681393623, + -0.012655021622776985, + -0.012289617210626602 + ] + }, + "dfa": { + "test_acc": 0.8405, + "mean_bp_cosine": 0.06366231696059306, + "mean_rho": 0.0974447913467884, + "mean_nudge_001": -0.00019441865091115082, + "mean_nudge_003": -0.0005761026429051223, + "mean_nudge_01": -0.001826463839582478, + "bp_cosine_per_layer": [ + 0.022819485515356064, + 0.10611869394779205, + 0.08763782680034637, + 0.06361521780490875, + 0.08818645775318146, + 0.07573625445365906, + 0.07574683427810669, + 0.025106821209192276, + 0.029594242572784424, + 0.09018446505069733, + 0.04191981628537178, + 0.05728168785572052 + ], + "rho_per_layer": [ + -0.0498071163892746, + 0.18554872274398804, + 0.19663047790527344, + 0.14150168001651764, + 0.06663499772548676, + 0.12039551883935928, + 0.12434913218021393, + 0.05157296732068062, + 0.09405694901943207, + 0.07376686483621597, + 0.061272408813238144, + 0.10341489315032959 + ], + "nudge_per_layer": [ + 0.000284646637737751, + -0.005279931705445051, + -0.002400151453912258, + -0.0017087131273001432, + -0.0019207102013751864, + -0.0020927595905959606, + -0.0017691099783405662, + -0.0008208724320866168, + -0.0012333606136962771, + -0.0026537002995610237, + -0.0007275568204931915, + -0.0015953464899212122 + ] + }, + "state_bridge": { + "test_acc": 0.675, + "mean_bp_cosine": 0.16806975565850735, + "mean_rho": 0.14302178906897703, + "mean_nudge_001": -0.0021900876042006225, + "mean_nudge_003": -0.006470390944741666, + "mean_nudge_01": -0.020386384644856054, + "bp_cosine_per_layer": [ + 0.7431880235671997, + 0.2796655595302582, + 0.13151727616786957, + 0.09881292283535004, + 0.0924338698387146, + 0.10159576684236526, + 0.09764175117015839, + 0.09642879664897919, + 0.09804226458072662, + 0.09603762626647949, + 0.09261822700500488, + 0.08885498344898224 + ], + "rho_per_layer": [ + 0.611870527267456, + 0.24307268857955933, + 0.10120554268360138, + 0.09459854662418365, + 0.09521515667438507, + 0.07265714555978775, + 0.07570740580558777, + 0.0650622695684433, + 0.07738275825977325, + 0.11346932500600815, + 0.08958262950181961, + 0.07643747329711914 + ], + "nudge_per_layer": [ + -0.20912763476371765, + -0.00893338117748499, + -0.0035844063386321068, + -0.0027289288118481636, + -0.0024399380199611187, + -0.0026743747293949127, + -0.0025294050574302673, + -0.002557961270213127, + -0.0026802942156791687, + -0.002547960262745619, + -0.002460954710841179, + -0.0023713763803243637 + ], + "state_pred_error_per_layer": [ + 20223.798828125, + 14219.4013671875, + 11048.2333984375, + 10263.419921875, + 8570.201171875, + 7224.33740234375, + 7281.2197265625, + 8034.87548828125, + 6686.9033203125, + 6885.98291015625, + 6667.048828125, + 6627.78125 + ], + "mean_state_pred_error": 9477.766967773438 + }, + "credit_bridge": { + "test_acc": 0.6635, + "mean_bp_cosine": 0.07870348079207663, + "mean_rho": 0.1263093726399044, + "mean_nudge_001": -0.000519128576949394, + "mean_nudge_003": -0.0015524110640399158, + "mean_nudge_01": -0.005132454059397181, + "bp_cosine_per_layer": [ + 9.498395957052708e-05, + 0.029415149241685867, + 0.062070880085229874, + 0.07393385469913483, + 0.07970248907804489, + 0.08624569326639175, + 0.10002343356609344, + 0.10488344728946686, + 0.10920242965221405, + 0.10451158881187439, + 0.09929930418729782, + 0.09505851566791534 + ], + "rho_per_layer": [ + 0.025425152853131294, + 0.0574759915471077, + 0.13417154550552368, + 0.10034967213869095, + 0.17468321323394775, + 0.17164339125156403, + 0.15925100445747375, + 0.08668951690196991, + 0.1521437168121338, + 0.14672580361366272, + 0.1825145184993744, + 0.12463894486427307 + ], + "nudge_per_layer": [ + 0.001420565415173769, + -0.0026360084302723408, + -0.00476992130279541, + -0.005131378769874573, + -0.005615689791738987, + -0.006001932080835104, + -0.006417973432689905, + -0.006630052346736193, + -0.006984136067330837, + -0.0066003259271383286, + -0.00623705331236124, + -0.005985542666167021 + ], + "final_value_loss": 0.9863593735218048, + "final_term_loss": 0.7168336891174316, + "final_bridge_loss": 0.05245816183909774, + "final_tgrad_loss": 0.21706753172874452 + } + }, + "a0.0_L12_s123": { + "bp": { + "test_acc": 0.9145, + "mean_bp_cosine": 0.7868696798880895, + "mean_rho": 0.9998756001393, + "mean_nudge_001": -0.005259950548255195, + "mean_nudge_003": -0.014897353908357521, + "mean_nudge_01": -0.04119087569415569, + "bp_cosine_per_layer": [ + 0.832116425037384, + 0.8141677379608154, + 0.8023761510848999, + 0.7934653759002686, + 0.7857377529144287, + 0.7797414064407349, + 0.7767306566238403, + 0.7744640111923218, + 0.7725205421447754, + 0.7711977958679199, + 0.7703278064727783, + 0.7695904970169067 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999972581863403, + 0.9999898672103882, + 0.999970555305481, + 0.9999305009841919, + 0.9999109506607056, + 0.9998676180839539, + 0.999832808971405, + 0.9997924566268921, + 0.9997202754020691, + 0.9997268319129944, + 0.9997689127922058 + ], + "nudge_per_layer": [ + -0.17892791330814362, + -0.10439710319042206, + -0.05659153312444687, + -0.034265220165252686, + -0.02416030317544937, + -0.01895919442176819, + -0.015955276787281036, + -0.01404004916548729, + -0.01277724839746952, + -0.011922692880034447, + -0.011335920542478561, + -0.010958053171634674 + ] + }, + "dfa": { + "test_acc": 0.841, + "mean_bp_cosine": 0.10045036673545837, + "mean_rho": 0.06510928040370345, + "mean_nudge_001": -0.000200933368432743, + "mean_nudge_003": -0.000600688594810587, + "mean_nudge_01": -0.001976225830730982, + "bp_cosine_per_layer": [ + 0.009534038603305817, + 0.2771005630493164, + 0.12846891582012177, + 0.12727834284305573, + 0.09264838695526123, + 0.08494879305362701, + 0.1454543173313141, + 0.07647830247879028, + 0.055110231041908264, + 0.08491981029510498, + 0.054209403693675995, + 0.06925329566001892 + ], + "rho_per_layer": [ + -0.030354971066117287, + 0.19958093762397766, + 0.10430362075567245, + 0.06749340891838074, + 0.08917459845542908, + 0.06985980272293091, + 0.08990536630153656, + -0.0003178045153617859, + -0.05352415516972542, + 0.12398940324783325, + 0.05844062566757202, + 0.06276053190231323 + ], + "nudge_per_layer": [ + 0.0008368014823645353, + -0.00641840323805809, + -0.0027151124086230993, + -0.002792379120364785, + -0.0018645611125975847, + -0.0017843465320765972, + -0.002957880962640047, + -0.0012784524587914348, + -0.0007560949889011681, + -0.0015581869520246983, + -0.0010259757982566953, + -0.0014001178788021207 + ] + }, + "state_bridge": { + "test_acc": 0.675, + "mean_bp_cosine": 0.21027903320888677, + "mean_rho": 0.16716737858951092, + "mean_nudge_001": -0.002424063318661259, + "mean_nudge_003": -0.007164865601225756, + "mean_nudge_01": -0.02264038595603779, + "bp_cosine_per_layer": [ + 0.7589784860610962, + 0.34465640783309937, + 0.20695620775222778, + 0.15412747859954834, + 0.14041899144649506, + 0.152847021818161, + 0.1464981734752655, + 0.13855373859405518, + 0.13026131689548492, + 0.11798880249261856, + 0.11249798536300659, + 0.11956378817558289 + ], + "rho_per_layer": [ + 0.6762608289718628, + 0.29351934790611267, + 0.15623700618743896, + 0.07772233337163925, + 0.09808109700679779, + 0.14218339323997498, + 0.09985582530498505, + 0.07779418677091599, + 0.10923020541667938, + 0.10118008404970169, + 0.08211226016283035, + 0.09183197468519211 + ], + "nudge_per_layer": [ + -0.22324970364570618, + -0.01123635284602642, + -0.0056420015171170235, + -0.0040974924340844154, + -0.0037027131766080856, + -0.003983458504080772, + -0.0038626876194030046, + -0.0036268262192606926, + -0.003363188588991761, + -0.0030670221894979477, + -0.0028224957641214132, + -0.0030306889675557613 + ], + "state_pred_error_per_layer": [ + 10215.58203125, + 8926.0654296875, + 5285.6044921875, + 5192.0830078125, + 4575.35791015625, + 4063.82666015625, + 4966.6884765625, + 5378.6435546875, + 4702.37890625, + 4026.143310546875, + 3985.35595703125, + 3780.156494140625 + ], + "mean_state_pred_error": 5424.8238525390625 + }, + "credit_bridge": { + "test_acc": 0.721, + "mean_bp_cosine": 0.020079606105961528, + "mean_rho": 0.0501531979146724, + "mean_nudge_001": -0.00015450727914867457, + "mean_nudge_003": -0.0004599024711448389, + "mean_nudge_01": -0.001498352525231894, + "bp_cosine_per_layer": [ + -0.0035465662367641926, + -0.001160490675829351, + 0.00486466521397233, + 0.012821277603507042, + 0.012568866834044456, + 0.019143100827932358, + 0.022381767630577087, + 0.024246837943792343, + 0.027966029942035675, + 0.03333558514714241, + 0.04247187077999115, + 0.04586232826113701 + ], + "rho_per_layer": [ + 0.01447216235101223, + -0.01648387312889099, + 0.027175014838576317, + 0.03045208379626274, + 0.05211577191948891, + -0.0074118818156421185, + 0.0508866012096405, + 0.01983593963086605, + 0.03707783669233322, + 0.12354743480682373, + 0.16596439480781555, + 0.10420688986778259 + ], + "nudge_per_layer": [ + 0.002342540305107832, + -0.0004765552293974906, + -0.0007624666905030608, + -0.0012423819862306118, + -0.0012568822130560875, + -0.0016762344166636467, + -0.0018269497668370605, + -0.0020500137470662594, + -0.0022837575525045395, + -0.0026187507901340723, + -0.0029940432868897915, + -0.0031347349286079407 + ], + "final_value_loss": 0.37253577736616134, + "final_term_loss": 0.18445234730243684, + "final_bridge_loss": 0.0251624245762825, + "final_tgrad_loss": 0.16292100727558137 + } + }, + "a0.0_L12_s456": { + "bp": { + "test_acc": 0.9115, + "mean_bp_cosine": 0.7958964506785074, + "mean_rho": 0.9998697290817896, + "mean_nudge_001": -0.0046546936306792, + "mean_nudge_003": -0.013125322526320815, + "mean_nudge_01": -0.03561708889901638, + "bp_cosine_per_layer": [ + 0.841245174407959, + 0.830803632736206, + 0.8195754885673523, + 0.8066799640655518, + 0.7983194589614868, + 0.7908304929733276, + 0.7860588431358337, + 0.7811387777328491, + 0.7771316170692444, + 0.7744728326797485, + 0.7727954983711243, + 0.7717056274414062 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.9999973177909851, + 0.9999889731407166, + 0.9999734163284302, + 0.9999427795410156, + 0.9998763799667358, + 0.9998629093170166, + 0.9998323321342468, + 0.9997599720954895, + 0.9997479319572449, + 0.9997410774230957, + 0.9997145533561707 + ], + "nudge_per_layer": [ + -0.1470111906528473, + -0.09042022377252579, + -0.050197783857584, + -0.030754856765270233, + -0.021816428750753403, + -0.017199307680130005, + -0.014493460766971111, + -0.012762569822371006, + -0.01160583458840847, + -0.010828070342540741, + -0.010316012427210808, + -0.00999932736158371 + ] + }, + "dfa": { + "test_acc": 0.8275, + "mean_bp_cosine": 0.109907116740942, + "mean_rho": 0.10316232999321073, + "mean_nudge_001": -0.00034242031688336283, + "mean_nudge_003": -0.001020948082441464, + "mean_nudge_01": -0.0033549320845243833, + "bp_cosine_per_layer": [ + 0.0384417325258255, + 0.27492010593414307, + 0.17608770728111267, + 0.12729278206825256, + 0.09575799107551575, + 0.13158489763736725, + 0.07343505322933197, + 0.08012130856513977, + 0.08938327431678772, + 0.09414967149496078, + 0.06517850607633591, + 0.07253237068653107 + ], + "rho_per_layer": [ + -0.00336202559992671, + 0.18004602193832397, + 0.18598641455173492, + 0.15388232469558716, + 0.058810293674468994, + 0.14123386144638062, + 0.05320374667644501, + 0.10196533054113388, + 0.09802494943141937, + 0.10918877273797989, + 0.09344048798084259, + 0.0655277818441391 + ], + "nudge_per_layer": [ + -0.010087584145367146, + -0.006617182400077581, + -0.004152917303144932, + -0.0031182561069726944, + -0.0022262579295784235, + -0.0028664623387157917, + -0.0016081882640719414, + -0.0017378728371113539, + -0.0020772137213498354, + -0.002457245485857129, + -0.0015545324422419071, + -0.0017554720398038626 + ] + }, + "state_bridge": { + "test_acc": 0.684, + "mean_bp_cosine": 0.21628577137986818, + "mean_rho": 0.17074896084765592, + "mean_nudge_001": -0.0019644595328524397, + "mean_nudge_003": -0.0058011185271122185, + "mean_nudge_01": -0.018295541075834382, + "bp_cosine_per_layer": [ + 0.7363088726997375, + 0.32443851232528687, + 0.21702790260314941, + 0.21007081866264343, + 0.16975754499435425, + 0.1722516119480133, + 0.16474759578704834, + 0.12138545513153076, + 0.1178494393825531, + 0.13036376237869263, + 0.11493153870105743, + 0.1162962019443512 + ], + "rho_per_layer": [ + 0.6429969072341919, + 0.2531689405441284, + 0.22036504745483398, + 0.17542049288749695, + 0.15819020569324493, + 0.14438438415527344, + 0.07042165100574493, + 0.11963094770908356, + 0.1070300042629242, + 0.07622774690389633, + 0.035559043288230896, + 0.045592159032821655 + ], + "nudge_per_layer": [ + -0.1725819855928421, + -0.009430286474525928, + -0.0054127369076013565, + -0.005186344031244516, + -0.004062540829181671, + -0.0039931111969053745, + -0.003901706077158451, + -0.003083862829953432, + -0.002966922242194414, + -0.0033692335709929466, + -0.002796228276565671, + -0.002761534880846739 + ], + "state_pred_error_per_layer": [ + 8107.484375, + 6015.64697265625, + 3272.651123046875, + 3025.219970703125, + 3498.379150390625, + 2962.442626953125, + 2732.457275390625, + 3394.069091796875, + 3050.444091796875, + 3397.53271484375, + 3068.22607421875, + 3145.807373046875 + ], + "mean_state_pred_error": 3805.8634033203125 + }, + "credit_bridge": { + "test_acc": 0.669, + "mean_bp_cosine": 0.048155296875241525, + "mean_rho": 0.07334851861620943, + "mean_nudge_001": -0.00035685058537637815, + "mean_nudge_003": -0.0010696607399343823, + "mean_nudge_01": -0.0035326933624067656, + "bp_cosine_per_layer": [ + 0.0015124600613489747, + 0.020085982978343964, + 0.03127610310912132, + 0.03517032414674759, + 0.042219605296850204, + 0.05027471110224724, + 0.05683741718530655, + 0.057938531041145325, + 0.06581299006938934, + 0.06761687994003296, + 0.07107532024383545, + 0.07804323732852936 + ], + "rho_per_layer": [ + 0.03147998824715614, + -0.015333062037825584, + 0.020876668393611908, + 0.07304719090461731, + 0.0599740669131279, + 0.08874240517616272, + 0.05341971293091774, + 0.07721589505672455, + 0.08801877498626709, + 0.10527393221855164, + 0.16833831369876862, + 0.1291283369064331 + ], + "nudge_per_layer": [ + -0.004048495087772608, + -0.0012588155223056674, + -0.0019918864127248526, + -0.002725755563005805, + -0.0028244066052138805, + -0.003425109200179577, + -0.0036919033154845238, + -0.003999053034931421, + -0.0042928787879645824, + -0.004538967739790678, + -0.004742524586617947, + -0.004852524492889643 + ], + "final_value_loss": 0.8257113872528076, + "final_term_loss": 0.5509136886596679, + "final_bridge_loss": 0.049323998257517813, + "final_tgrad_loss": 0.22547370266914368 + } + }, + "a0.25_L2_s42": { + "bp": { + "test_acc": 0.908, + "mean_bp_cosine": 0.8980661034584045, + "mean_rho": 0.9999964535236359, + "mean_nudge_001": -0.01618960639461875, + "mean_nudge_003": -0.04483883548527956, + "mean_nudge_01": -0.11487101018428802, + "bp_cosine_per_layer": [ + 0.9068200588226318, + 0.8893121480941772 + ], + "rho_per_layer": [ + 0.9999985098838806, + 0.9999943971633911 + ], + "nudge_per_layer": [ + -0.15680165588855743, + -0.07294036448001862 + ] + }, + "dfa": { + "test_acc": 0.847, + "mean_bp_cosine": 0.026606750674545765, + "mean_rho": -0.0022891219705343246, + "mean_nudge_001": -2.3714659619145095e-05, + "mean_nudge_003": -1.6182020772248507e-05, + "mean_nudge_01": 0.0005980018759146333, + "bp_cosine_per_layer": [ + -0.008382977917790413, + 0.06159647926688194 + ], + "rho_per_layer": [ + -0.022914212197065353, + 0.018335968255996704 + ], + "nudge_per_layer": [ + 0.0033093439415097237, + -0.002113340189680457 + ] + }, + "state_bridge": { + "test_acc": 0.827, + "mean_bp_cosine": 0.6775506436824799, + "mean_rho": 0.6271905303001404, + "mean_nudge_001": -0.015066297259181738, + "mean_nudge_003": -0.04329914692789316, + "mean_nudge_01": -0.12377128005027771, + "bp_cosine_per_layer": [ + 0.9188902378082275, + 0.4362110495567322 + ], + "rho_per_layer": [ + 0.8401009440422058, + 0.41428011655807495 + ], + "nudge_per_layer": [ + -0.21947401762008667, + -0.02806854248046875 + ], + "state_pred_error_per_layer": [ + 753.1610107421875, + 333.87890625 + ], + "mean_state_pred_error": 543.5199584960938 + }, + "credit_bridge": { + "test_acc": 0.6455, + "mean_bp_cosine": 0.15288914740085602, + "mean_rho": 0.2540942281484604, + "mean_nudge_001": -0.003834493225440383, + "mean_nudge_003": -0.011456333566457033, + "mean_nudge_01": -0.03762407600879669, + "bp_cosine_per_layer": [ + 0.07500731945037842, + 0.23077097535133362 + ], + "rho_per_layer": [ + 0.12894567847251892, + 0.37924277782440186 + ], + "nudge_per_layer": [ + -0.05425257235765457, + -0.020995579659938812 + ], + "final_value_loss": 0.5630231554031372, + "final_term_loss": 0.2533654543399811, + "final_bridge_loss": 0.03314736911058426, + "final_tgrad_loss": 0.27651033034324646 + } + }, + "a0.25_L2_s123": { + "bp": { + "test_acc": 0.92, + "mean_bp_cosine": 0.8535160422325134, + "mean_rho": 0.9999972283840179, + "mean_nudge_001": -0.01451590727083385, + "mean_nudge_003": -0.03988213837146759, + "mean_nudge_01": -0.09831684827804565, + "bp_cosine_per_layer": [ + 0.8569881916046143, + 0.8500438928604126 + ], + "rho_per_layer": [ + 0.9999989867210388, + 0.9999954700469971 + ], + "nudge_per_layer": [ + -0.13159069418907166, + -0.06504300236701965 + ] + }, + "dfa": { + "test_acc": 0.853, + "mean_bp_cosine": 0.0877363346517086, + "mean_rho": 0.0626654140651226, + "mean_nudge_001": -0.0009488673531450331, + "mean_nudge_003": -0.0028224033303558826, + "mean_nudge_01": -0.009134252090007067, + "bp_cosine_per_layer": [ + 0.05345926433801651, + 0.1220134049654007 + ], + "rho_per_layer": [ + 0.09254007041454315, + 0.03279075771570206 + ], + "nudge_per_layer": [ + -0.0142319705337286, + -0.004036533646285534 + ] + }, + "state_bridge": { + "test_acc": 0.834, + "mean_bp_cosine": 0.6950189173221588, + "mean_rho": 0.5849489569664001, + "mean_nudge_001": -0.012975628254935145, + "mean_nudge_003": -0.03723907680250704, + "mean_nudge_01": -0.10619704332202673, + "bp_cosine_per_layer": [ + 0.9177796840667725, + 0.47225815057754517 + ], + "rho_per_layer": [ + 0.7912815809249878, + 0.3786163330078125 + ], + "nudge_per_layer": [ + -0.187799870967865, + -0.02459421567618847 + ], + "state_pred_error_per_layer": [ + 654.3871459960938, + 278.6759338378906 + ], + "mean_state_pred_error": 466.5315399169922 + }, + "credit_bridge": { + "test_acc": 0.638, + "mean_bp_cosine": 0.18947000801563263, + "mean_rho": 0.3388983681797981, + "mean_nudge_001": -0.004155236994847655, + "mean_nudge_003": -0.012411902891471982, + "mean_nudge_01": -0.04074052348732948, + "bp_cosine_per_layer": [ + 0.09752383828163147, + 0.2814161777496338 + ], + "rho_per_layer": [ + 0.2172888070344925, + 0.46050792932510376 + ], + "nudge_per_layer": [ + -0.05797416716814041, + -0.023506879806518555 + ], + "final_value_loss": 0.6248516966819763, + "final_term_loss": 0.2734043194293976, + "final_bridge_loss": 0.04374015842676163, + "final_tgrad_loss": 0.3077072183132172 + } + }, + "a0.25_L2_s456": { + "bp": { + "test_acc": 0.914, + "mean_bp_cosine": 0.8777631521224976, + "mean_rho": 0.9999973177909851, + "mean_nudge_001": -0.017619559541344643, + "mean_nudge_003": -0.04847448691725731, + "mean_nudge_01": -0.1200898252427578, + "bp_cosine_per_layer": [ + 0.8855119943618774, + 0.8700143098831177 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999958276748657 + ], + "nudge_per_layer": [ + -0.16111940145492554, + -0.07906024903059006 + ] + }, + "dfa": { + "test_acc": 0.842, + "mean_bp_cosine": 0.049672482535243034, + "mean_rho": 0.03196176886558533, + "mean_nudge_001": -0.0005511407216545194, + "mean_nudge_003": -0.0016261094715446234, + "mean_nudge_01": -0.0050985191483050585, + "bp_cosine_per_layer": [ + 0.015632983297109604, + 0.08371198177337646 + ], + "rho_per_layer": [ + -0.06864285469055176, + 0.1325663924217224 + ], + "nudge_per_layer": [ + -0.006782663054764271, + -0.003414375241845846 + ] + }, + "state_bridge": { + "test_acc": 0.817, + "mean_bp_cosine": 0.7210330367088318, + "mean_rho": 0.6920621693134308, + "mean_nudge_001": -0.01618554489687085, + "mean_nudge_003": -0.04673728672787547, + "mean_nudge_01": -0.13591178134083748, + "bp_cosine_per_layer": [ + 0.9367842674255371, + 0.5052818059921265 + ], + "rho_per_layer": [ + 0.846778392791748, + 0.5373459458351135 + ], + "nudge_per_layer": [ + -0.23458413779735565, + -0.037239424884319305 + ], + "state_pred_error_per_layer": [ + 626.5816650390625, + 277.74237060546875 + ], + "mean_state_pred_error": 452.1620178222656 + }, + "credit_bridge": { + "test_acc": 0.6685, + "mean_bp_cosine": 0.21126148104667664, + "mean_rho": 0.3547997772693634, + "mean_nudge_001": -0.004930314142256975, + "mean_nudge_003": -0.014735064469277859, + "mean_nudge_01": -0.048451079055666924, + "bp_cosine_per_layer": [ + 0.13380715250968933, + 0.28871580958366394 + ], + "rho_per_layer": [ + 0.2647465467453003, + 0.4448530077934265 + ], + "nudge_per_layer": [ + -0.07276535779237747, + -0.024136800318956375 + ], + "final_value_loss": 0.4186974630832672, + "final_term_loss": 0.13192469900846482, + "final_bridge_loss": 0.02328252377510071, + "final_tgrad_loss": 0.2634902417182922 + } + }, + "a0.25_L4_s42": { + "bp": { + "test_acc": 0.911, + "mean_bp_cosine": 0.841001495718956, + "mean_rho": 0.9999824017286301, + "mean_nudge_001": -0.012893156963400543, + "mean_nudge_003": -0.035831862362101674, + "mean_nudge_01": -0.09177740290760994, + "bp_cosine_per_layer": [ + 0.868922770023346, + 0.8429951667785645, + 0.8289605379104614, + 0.8231275081634521 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999972581863403, + 0.9999882578849792, + 0.9999451637268066 + ], + "nudge_per_layer": [ + -0.17674864828586578, + -0.10683682560920715, + -0.05415143817663193, + -0.029372699558734894 + ] + }, + "dfa": { + "test_acc": 0.8515, + "mean_bp_cosine": 0.0922011851798743, + "mean_rho": 0.09930456057190895, + "mean_nudge_001": -0.0006074781995266676, + "mean_nudge_003": -0.001813438575481996, + "mean_nudge_01": -0.005950940365437418, + "bp_cosine_per_layer": [ + 0.006489354185760021, + 0.12851163744926453, + 0.11991241574287415, + 0.11389133334159851 + ], + "rho_per_layer": [ + 0.029786743223667145, + 0.18639126420021057, + 0.11502038687467575, + 0.06601984798908234 + ], + "nudge_per_layer": [ + -0.01056693121790886, + -0.006519604474306107, + -0.003515135496854782, + -0.003202090272679925 + ] + }, + "state_bridge": { + "test_acc": 0.738, + "mean_bp_cosine": 0.3966497778892517, + "mean_rho": 0.33668526262044907, + "mean_nudge_001": -0.006818186957389116, + "mean_nudge_003": -0.020020907453726977, + "mean_nudge_01": -0.0618970247451216, + "bp_cosine_per_layer": [ + 0.8448630571365356, + 0.4407959580421448, + 0.15707260370254517, + 0.14386749267578125 + ], + "rho_per_layer": [ + 0.7033247947692871, + 0.34020179510116577, + 0.13395404815673828, + 0.1692604124546051 + ], + "nudge_per_layer": [ + -0.2203540802001953, + -0.01797248050570488, + -0.004883656278252602, + -0.004377881996333599 + ], + "state_pred_error_per_layer": [ + 3192.55322265625, + 2613.6337890625, + 1881.11669921875, + 2102.51953125 + ], + "mean_state_pred_error": 2447.455810546875 + }, + "credit_bridge": { + "test_acc": 0.662, + "mean_bp_cosine": 0.1593644004315138, + "mean_rho": 0.2909943610429764, + "mean_nudge_001": -0.0019232924096286297, + "mean_nudge_003": -0.005755707039497793, + "mean_nudge_01": -0.019015976693481207, + "bp_cosine_per_layer": [ + 0.07093458622694016, + 0.19623729586601257, + 0.18378585577011108, + 0.18649986386299133 + ], + "rho_per_layer": [ + 0.14815130829811096, + 0.336488276720047, + 0.35506749153137207, + 0.3242703676223755 + ], + "nudge_per_layer": [ + -0.033366985619068146, + -0.015239425003528595, + -0.013842864893376827, + -0.01361463125795126 + ], + "final_value_loss": 0.5039997359514237, + "final_term_loss": 0.20441836426854135, + "final_bridge_loss": 0.03893857387006283, + "final_tgrad_loss": 0.26064279942512514 + } + }, + "a0.25_L4_s123": { + "bp": { + "test_acc": 0.917, + "mean_bp_cosine": 0.7935318648815155, + "mean_rho": 0.9999762326478958, + "mean_nudge_001": -0.01081152242841199, + "mean_nudge_003": -0.029669071780517697, + "mean_nudge_01": -0.0743116931989789, + "bp_cosine_per_layer": [ + 0.8279672861099243, + 0.8114954233169556, + 0.7863935232162476, + 0.7482712268829346 + ], + "rho_per_layer": [ + 0.9999987483024597, + 0.9999956488609314, + 0.999983012676239, + 0.9999275207519531 + ], + "nudge_per_layer": [ + -0.14138484001159668, + -0.08725307881832123, + -0.04476301744580269, + -0.023845836520195007 + ] + }, + "dfa": { + "test_acc": 0.824, + "mean_bp_cosine": 0.1441014357842505, + "mean_rho": 0.14396781660616398, + "mean_nudge_001": -0.0003178600236424245, + "mean_nudge_003": -0.0009397821850143373, + "mean_nudge_01": -0.0029927556752227247, + "bp_cosine_per_layer": [ + -0.030194921419024467, + 0.3003618121147156, + 0.18209302425384521, + 0.12414582818746567 + ], + "rho_per_layer": [ + -0.038011275231838226, + 0.29912513494491577, + 0.1735759675502777, + 0.14118143916130066 + ], + "nudge_per_layer": [ + 0.005076530389487743, + -0.00841662660241127, + -0.005011391825973988, + -0.0036195346619933844 + ] + }, + "state_bridge": { + "test_acc": 0.733, + "mean_bp_cosine": 0.3913041353225708, + "mean_rho": 0.3523585610091686, + "mean_nudge_001": -0.0061569800454890355, + "mean_nudge_003": -0.01808436232386157, + "mean_nudge_01": -0.055880151805467904, + "bp_cosine_per_layer": [ + 0.821143627166748, + 0.36722686886787415, + 0.20176959037780762, + 0.1750764548778534 + ], + "rho_per_layer": [ + 0.6905952095985413, + 0.36183467507362366, + 0.19890159368515015, + 0.15810276567935944 + ], + "nudge_per_layer": [ + -0.1973220407962799, + -0.013631552457809448, + -0.0068134344182908535, + -0.0057535795494914055 + ], + "state_pred_error_per_layer": [ + 3017.568359375, + 2069.30517578125, + 2103.28662109375, + 1370.3270263671875 + ], + "mean_state_pred_error": 2140.121795654297 + }, + "credit_bridge": { + "test_acc": 0.7085, + "mean_bp_cosine": 0.11074696853756905, + "mean_rho": 0.20390365412458777, + "mean_nudge_001": -0.0010930995340459049, + "mean_nudge_003": -0.0032710169325582683, + "mean_nudge_01": -0.010791003005579114, + "bp_cosine_per_layer": [ + 0.021101564168930054, + 0.1092284768819809, + 0.14931762218475342, + 0.16334021091461182 + ], + "rho_per_layer": [ + 0.026919251307845116, + 0.23688018321990967, + 0.28421375155448914, + 0.2676014304161072 + ], + "nudge_per_layer": [ + -0.008425744250416756, + -0.009595570154488087, + -0.012630455195903778, + -0.012512242421507835 + ], + "final_value_loss": 0.44552071504592894, + "final_term_loss": 0.1639193995475769, + "final_bridge_loss": 0.022096455523371698, + "final_tgrad_loss": 0.2595048580646515 + } + }, + "a0.25_L4_s456": { + "bp": { + "test_acc": 0.9185, + "mean_bp_cosine": 0.7816510498523712, + "mean_rho": 0.9999814331531525, + "mean_nudge_001": -0.01180829742224887, + "mean_nudge_003": -0.032709411811083555, + "mean_nudge_01": -0.08326426614075899, + "bp_cosine_per_layer": [ + 0.8029586672782898, + 0.7900986075401306, + 0.7753629684448242, + 0.7581839561462402 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999964237213135, + 0.999983549118042, + 0.9999468326568604 + ], + "nudge_per_layer": [ + -0.15638579428195953, + -0.09745092689990997, + -0.05102477967739105, + -0.028195563703775406 + ] + }, + "dfa": { + "test_acc": 0.8515, + "mean_bp_cosine": 0.06627230579033494, + "mean_rho": 0.10299420775845647, + "mean_nudge_001": -0.000254730271990411, + "mean_nudge_003": -0.0007513021846534684, + "mean_nudge_01": -0.0023495194036513567, + "bp_cosine_per_layer": [ + -0.014162426814436913, + 0.0798005759716034, + 0.09311279654502869, + 0.10633827745914459 + ], + "rho_per_layer": [ + 0.041398823261260986, + 0.02247910387814045, + 0.1714327037334442, + 0.17666620016098022 + ], + "nudge_per_layer": [ + 0.002492401283234358, + -0.005343085154891014, + -0.0033098761923611164, + -0.003237517550587654 + ] + }, + "state_bridge": { + "test_acc": 0.7085, + "mean_bp_cosine": 0.37615348026156425, + "mean_rho": 0.3445914164185524, + "mean_nudge_001": -0.00598156735941302, + "mean_nudge_003": -0.017677294556051493, + "mean_nudge_01": -0.055878938641399145, + "bp_cosine_per_layer": [ + 0.8312708735466003, + 0.37615716457366943, + 0.14436809718608856, + 0.15281778573989868 + ], + "rho_per_layer": [ + 0.7588610649108887, + 0.34236449003219604, + 0.14024245738983154, + 0.13689765334129333 + ], + "nudge_per_layer": [ + -0.19714727997779846, + -0.01597677543759346, + -0.004914070479571819, + -0.005477628670632839 + ], + "state_pred_error_per_layer": [ + 2233.37158203125, + 1546.82080078125, + 996.9107666015625, + 942.33251953125 + ], + "mean_state_pred_error": 1429.8589172363281 + }, + "credit_bridge": { + "test_acc": 0.6185, + "mean_bp_cosine": 0.1528007835149765, + "mean_rho": 0.2638061139732599, + "mean_nudge_001": -0.0015675137401558459, + "mean_nudge_003": -0.004692548653110862, + "mean_nudge_01": -0.015524385962635279, + "bp_cosine_per_layer": [ + 0.048861026763916016, + 0.17950567603111267, + 0.17905107140541077, + 0.20378535985946655 + ], + "rho_per_layer": [ + 0.07314518839120865, + 0.3309200406074524, + 0.2789418697357178, + 0.3722173571586609 + ], + "nudge_per_layer": [ + -0.017692390829324722, + -0.014619983732700348, + -0.014469930902123451, + -0.015315238386392593 + ], + "final_value_loss": 0.64283842253685, + "final_term_loss": 0.27786159224510193, + "final_bridge_loss": 0.049283357608318326, + "final_tgrad_loss": 0.31569347660541536 + } + }, + "a0.25_L8_s42": { + "bp": { + "test_acc": 0.8955, + "mean_bp_cosine": 0.8411818519234657, + "mean_rho": 0.999948225915432, + "mean_nudge_001": -0.008358085062354803, + "mean_nudge_003": -0.023856630141381174, + "mean_nudge_01": -0.06703015509992838, + "bp_cosine_per_layer": [ + 0.8706932663917542, + 0.8596300482749939, + 0.8512309789657593, + 0.842391848564148, + 0.8334972858428955, + 0.8275372385978699, + 0.823634147644043, + 0.8208400011062622 + ], + "rho_per_layer": [ + 0.9999992847442627, + 0.9999973773956299, + 0.9999889731407166, + 0.9999737739562988, + 0.999952495098114, + 0.9999229311943054, + 0.9998778104782104, + 0.999873161315918 + ], + "nudge_per_layer": [ + -0.19971789419651031, + -0.12236367166042328, + -0.07083894312381744, + -0.044348303228616714, + -0.031799670308828354, + -0.02545534446835518, + -0.02191336825489998, + -0.01980404555797577 + ] + }, + "dfa": { + "test_acc": 0.835, + "mean_bp_cosine": 0.06675009592436254, + "mean_rho": 0.0799849673639983, + "mean_nudge_001": -6.642583684879355e-06, + "mean_nudge_003": -9.95869777398184e-06, + "mean_nudge_01": 0.00010420403850730509, + "bp_cosine_per_layer": [ + -0.029614916071295738, + 0.08655504137277603, + 0.09347832202911377, + 0.10665939003229141, + 0.10298001766204834, + 0.055703092366456985, + 0.06406168639659882, + 0.054178133606910706 + ], + "rho_per_layer": [ + -0.10576558113098145, + 0.13653026521205902, + 0.13744692504405975, + 0.169493168592453, + 0.1142939031124115, + 0.09325758367776871, + 0.1042378693819046, + -0.00961439497768879 + ], + "nudge_per_layer": [ + 0.021624702960252762, + -0.006033358629792929, + -0.003085250034928322, + -0.0032903538085520267, + -0.0030274176970124245, + -0.0016871094703674316, + -0.0020643905736505985, + -0.0016031904378905892 + ] + }, + "state_bridge": { + "test_acc": 0.7705, + "mean_bp_cosine": 0.2720195781439543, + "mean_rho": 0.24409680720418692, + "mean_nudge_001": -0.0037333294421841856, + "mean_nudge_003": -0.01090175670105964, + "mean_nudge_01": -0.03293398043024354, + "bp_cosine_per_layer": [ + 0.8497925996780396, + 0.4692588150501251, + 0.1727459728717804, + 0.1467132717370987, + 0.13944602012634277, + 0.1262509524822235, + 0.13373470306396484, + 0.13821429014205933 + ], + "rho_per_layer": [ + 0.7623768448829651, + 0.4223487377166748, + 0.18194836378097534, + 0.12129966914653778, + 0.11680327355861664, + 0.15588274598121643, + 0.1260674148797989, + 0.06604740768671036 + ], + "nudge_per_layer": [ + -0.23203837871551514, + -0.013907128013670444, + -0.0036564678885042667, + -0.0029728016816079617, + -0.0027978671714663506, + -0.0026036568451672792, + -0.002694307826459408, + -0.0028012352995574474 + ], + "state_pred_error_per_layer": [ + 10530.408203125, + 8501.392578125, + 5819.005859375, + 4775.642578125, + 4112.55224609375, + 3853.83984375, + 4342.64697265625, + 3851.865478515625 + ], + "mean_state_pred_error": 5723.419219970703 + }, + "credit_bridge": { + "test_acc": 0.616, + "mean_bp_cosine": 0.11742978217080235, + "mean_rho": 0.20278298296034336, + "mean_nudge_001": -0.000763369575906836, + "mean_nudge_003": -0.0022864671773277223, + "mean_nudge_01": -0.007572929258458316, + "bp_cosine_per_layer": [ + 0.0006081201136112213, + 0.13602128624916077, + 0.1264307200908661, + 0.13147516548633575, + 0.14721693098545074, + 0.1274956315755844, + 0.13849349319934845, + 0.1316969096660614 + ], + "rho_per_layer": [ + 0.0121258944272995, + 0.21904222667217255, + 0.23992177844047546, + 0.23384322226047516, + 0.24397125840187073, + 0.24230614304542542, + 0.23810306191444397, + 0.1929502785205841 + ], + "nudge_per_layer": [ + 0.0015163691714406013, + -0.009462166577577591, + -0.008223006501793861, + -0.008610539138317108, + -0.009565019980072975, + -0.00855704490095377, + -0.008995135314762592, + -0.008686890825629234 + ], + "final_value_loss": 0.5891867377281189, + "final_term_loss": 0.3338063308954239, + "final_bridge_loss": 0.026477533173561097, + "final_tgrad_loss": 0.2289028725862503 + } + }, + "a0.25_L8_s123": { + "bp": { + "test_acc": 0.896, + "mean_bp_cosine": 0.8579939901828766, + "mean_rho": 0.9999475553631783, + "mean_nudge_001": -0.008832237246679142, + "mean_nudge_003": -0.02530999999726191, + "mean_nudge_01": -0.07218505791388452, + "bp_cosine_per_layer": [ + 0.8995364308357239, + 0.8806806802749634, + 0.8653636574745178, + 0.852218508720398, + 0.8451849222183228, + 0.8416627645492554, + 0.8401176333427429, + 0.8391873240470886 + ], + "rho_per_layer": [ + 0.9999992251396179, + 0.9999973773956299, + 0.9999878406524658, + 0.9999729990959167, + 0.9999438524246216, + 0.9999128580093384, + 0.9999063611030579, + 0.9998599290847778 + ], + "nudge_per_layer": [ + -0.2192329615354538, + -0.13158643245697021, + -0.07524827122688293, + -0.04681030660867691, + -0.03351406753063202, + -0.026811176910996437, + -0.02318240888416767, + -0.02109483815729618 + ] + }, + "dfa": { + "test_acc": 0.833, + "mean_bp_cosine": 0.07527017407119274, + "mean_rho": 0.08970394870266318, + "mean_nudge_001": -3.044791992579121e-05, + "mean_nudge_003": -8.396412886213511e-05, + "mean_nudge_01": -0.00019736881949938834, + "bp_cosine_per_layer": [ + -0.030230171978473663, + 0.1515132635831833, + 0.08784028142690659, + 0.07231537997722626, + 0.09554086625576019, + 0.09082843363285065, + 0.05412551760673523, + 0.0802278220653534 + ], + "rho_per_layer": [ + 0.04074572026729584, + 0.1662997603416443, + 0.08309999853372574, + 0.07389070093631744, + 0.14882703125476837, + 0.04519672691822052, + 0.0252661295235157, + 0.13430552184581757 + ], + "nudge_per_layer": [ + 0.013973418623209, + -0.0047885943204164505, + -0.0020089128520339727, + -0.0015227446565404534, + -0.002120924647897482, + -0.0020366935059428215, + -0.001262089004740119, + -0.0018124101916328073 + ] + }, + "state_bridge": { + "test_acc": 0.753, + "mean_bp_cosine": 0.26880230009555817, + "mean_rho": 0.23677901271730661, + "mean_nudge_001": -0.0032272498192469357, + "mean_nudge_003": -0.009375294612254947, + "mean_nudge_01": -0.027950568503001705, + "bp_cosine_per_layer": [ + 0.8559742569923401, + 0.48324936628341675, + 0.20313377678394318, + 0.15002062916755676, + 0.13207414746284485, + 0.11473802477121353, + 0.10703189671039581, + 0.10419630259275436 + ], + "rho_per_layer": [ + 0.712527871131897, + 0.4307812452316284, + 0.20181137323379517, + 0.13881561160087585, + 0.15075963735580444, + 0.09288278967142105, + 0.0890430212020874, + 0.0776105523109436 + ], + "nudge_per_layer": [ + -0.19413721561431885, + -0.013532894663512707, + -0.004060069564729929, + -0.0029658200219273567, + -0.00256463885307312, + -0.0022291922941803932, + -0.00204793200828135, + -0.002066785003989935 + ], + "state_pred_error_per_layer": [ + 8381.830078125, + 6536.470703125, + 4195.43359375, + 3240.16162109375, + 3085.78857421875, + 3078.50390625, + 3156.81787109375, + 3267.9345703125 + ], + "mean_state_pred_error": 4367.867614746094 + }, + "credit_bridge": { + "test_acc": 0.651, + "mean_bp_cosine": 0.131322234403342, + "mean_rho": 0.19494653795845807, + "mean_nudge_001": -0.0009437191256438382, + "mean_nudge_003": -0.002826296287821606, + "mean_nudge_01": -0.009364197961986065, + "bp_cosine_per_layer": [ + 0.021486874669790268, + 0.13597777485847473, + 0.14020901918411255, + 0.16125136613845825, + 0.15609152615070343, + 0.1541982889175415, + 0.14447104930877686, + 0.13689197599887848 + ], + "rho_per_layer": [ + 0.021052071824669838, + 0.17873916029930115, + 0.25896143913269043, + 0.18253415822982788, + 0.20761561393737793, + 0.24419330060482025, + 0.21560567617416382, + 0.25087088346481323 + ], + "nudge_per_layer": [ + -0.006693178787827492, + -0.009655885398387909, + -0.009345939382910728, + -0.010369300842285156, + -0.010154420509934425, + -0.010046296752989292, + -0.009472687728703022, + -0.009175874292850494 + ], + "final_value_loss": 0.41045001599788666, + "final_term_loss": 0.17502211028933526, + "final_bridge_loss": 0.01536440534889698, + "final_tgrad_loss": 0.2200635038137436 + } + }, + "a0.25_L8_s456": { + "bp": { + "test_acc": 0.8915, + "mean_bp_cosine": 0.8808343783020973, + "mean_rho": 0.9999449253082275, + "mean_nudge_001": -0.00886416298453696, + "mean_nudge_003": -0.025221005314961076, + "mean_nudge_01": -0.07025118661113083, + "bp_cosine_per_layer": [ + 0.9125592708587646, + 0.9000785946846008, + 0.8909372687339783, + 0.8829550743103027, + 0.8725745677947998, + 0.8661020994186401, + 0.8620940446853638, + 0.8593741059303284 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999973177909851, + 0.9999907612800598, + 0.9999756813049316, + 0.9999436140060425, + 0.9999102354049683, + 0.9998818635940552, + 0.9998610019683838 + ], + "nudge_per_layer": [ + -0.20531992614269257, + -0.12906500697135925, + -0.07575342804193497, + -0.04753156006336212, + -0.033830925822257996, + -0.02684028074145317, + -0.02297976426780224, + -0.020688600838184357 + ] + }, + "dfa": { + "test_acc": 0.8165, + "mean_bp_cosine": 0.1053345538675785, + "mean_rho": 0.1329206523951143, + "mean_nudge_001": -0.0005203891905694036, + "mean_nudge_003": -0.0015467511984752491, + "mean_nudge_01": -0.0049866703047882766, + "bp_cosine_per_layer": [ + 0.023487910628318787, + 0.16097302734851837, + 0.15321409702301025, + 0.08171598613262177, + 0.09132305532693863, + 0.0943714827299118, + 0.12134475260972977, + 0.11624611914157867 + ], + "rho_per_layer": [ + 0.006953349336981773, + 0.2090909481048584, + 0.23601846396923065, + 0.09328415989875793, + 0.10916170477867126, + 0.12872634828090668, + 0.15839380025863647, + 0.12173644453287125 + ], + "nudge_per_layer": [ + -0.013351024128496647, + -0.0065501369535923, + -0.004914519842714071, + -0.002402292797341943, + -0.002674146555364132, + -0.0028969072736799717, + -0.0036479653790593147, + -0.0034563695080578327 + ] + }, + "state_bridge": { + "test_acc": 0.765, + "mean_bp_cosine": 0.24095587618649006, + "mean_rho": 0.20889087952673435, + "mean_nudge_001": -0.0035492044535203604, + "mean_nudge_003": -0.01036601059968234, + "mean_nudge_01": -0.03139855920744594, + "bp_cosine_per_layer": [ + 0.8715300559997559, + 0.44268321990966797, + 0.14538408815860748, + 0.1153520941734314, + 0.09680549800395966, + 0.08768410980701447, + 0.08654746413230896, + 0.08166047930717468 + ], + "rho_per_layer": [ + 0.7710200548171997, + 0.4253605008125305, + 0.09275925159454346, + 0.09712537378072739, + 0.11123719066381454, + 0.028249293565750122, + 0.05002531409263611, + 0.09535005688667297 + ], + "nudge_per_layer": [ + -0.22555799782276154, + -0.012845459394156933, + -0.003021553158760071, + -0.0024172987323254347, + -0.002025863155722618, + -0.0018953735707327724, + -0.0018195084994658828, + -0.0016054193256422877 + ], + "state_pred_error_per_layer": [ + 7857.92041015625, + 7327.2666015625, + 4158.3056640625, + 3231.240234375, + 3079.712890625, + 2843.65966796875, + 3014.824951171875, + 2904.82080078125 + ], + "mean_state_pred_error": 4302.218902587891 + }, + "credit_bridge": { + "test_acc": 0.6845, + "mean_bp_cosine": 0.08619831164833158, + "mean_rho": 0.20396122278179973, + "mean_nudge_001": -0.0008905812101147603, + "mean_nudge_003": -0.0026642234588507563, + "mean_nudge_01": -0.008798376395134255, + "bp_cosine_per_layer": [ + -0.005484581924974918, + 0.03739434853196144, + 0.0736197978258133, + 0.10366753488779068, + 0.11266068369150162, + 0.12653732299804688, + 0.11692580580711365, + 0.12426558136940002 + ], + "rho_per_layer": [ + -0.0015162499621510506, + 0.12250564247369766, + 0.22542724013328552, + 0.204342320561409, + 0.2217923402786255, + 0.28867796063423157, + 0.33211782574653625, + 0.23834270238876343 + ], + "nudge_per_layer": [ + 0.0002549269702285528, + -0.006913396995514631, + -0.008808376267552376, + -0.010325662791728973, + -0.010591026395559311, + -0.011654841713607311, + -0.010967787355184555, + -0.011380846612155437 + ], + "final_value_loss": 0.966836922454834, + "final_term_loss": 0.6684003219604492, + "final_bridge_loss": 0.09051647346019745, + "final_tgrad_loss": 0.20792012577056884 + } + }, + "a0.25_L12_s42": { + "bp": { + "test_acc": 0.897, + "mean_bp_cosine": 0.826698362827301, + "mean_rho": 0.9998699675003687, + "mean_nudge_001": -0.006519351474707946, + "mean_nudge_003": -0.0185935211678346, + "mean_nudge_01": -0.05259064872128268, + "bp_cosine_per_layer": [ + 0.8824102282524109, + 0.865839958190918, + 0.8526839017868042, + 0.839972198009491, + 0.826134204864502, + 0.8190910220146179, + 0.8134430646896362, + 0.8095068335533142, + 0.8061133027076721, + 0.8034266233444214, + 0.8016149997711182, + 0.8001440167427063 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999975562095642, + 0.9999887347221375, + 0.9999736547470093, + 0.9999515414237976, + 0.9999052882194519, + 0.9998592138290405, + 0.999845027923584, + 0.99979567527771, + 0.9997392892837524, + 0.999713659286499, + 0.9996709227561951 + ], + "nudge_per_layer": [ + -0.21559840440750122, + -0.13125374913215637, + -0.0758625715970993, + -0.04728776216506958, + -0.03328181058168411, + -0.025909576565027237, + -0.021545151248574257, + -0.01875336468219757, + -0.016917269676923752, + -0.015656160190701485, + -0.014799138531088829, + -0.01422282587736845 + ] + }, + "dfa": { + "test_acc": 0.8165, + "mean_bp_cosine": 0.06692749153201778, + "mean_rho": 0.09511666395701468, + "mean_nudge_001": -0.0003660954941248444, + "mean_nudge_003": -0.0010870555027698476, + "mean_nudge_01": -0.003503491034886489, + "bp_cosine_per_layer": [ + 0.02035588026046753, + 0.09721152484416962, + 0.10017214715480804, + 0.06879279017448425, + 0.0898706465959549, + 0.0775061622262001, + 0.0738426148891449, + 0.022470442578196526, + 0.03698011115193367, + 0.09759337455034256, + 0.05344103276729584, + 0.06489317119121552 + ], + "rho_per_layer": [ + -0.041805852204561234, + 0.14336195588111877, + 0.21263040602207184, + 0.15326815843582153, + 0.04533267021179199, + 0.07981619238853455, + 0.08665720373392105, + 0.004602088592946529, + 0.0780038833618164, + 0.11769488453865051, + 0.1415681391954422, + 0.12027023732662201 + ], + "nudge_per_layer": [ + -0.007749770302325487, + -0.008321389555931091, + -0.003876405069604516, + -0.0026999912224709988, + -0.0026630363427102566, + -0.0033310302533209324, + -0.0026011697482317686, + -0.0011158722918480635, + -0.0018408913165330887, + -0.0036767907440662384, + -0.0019704087171703577, + -0.0021951368544250727 + ] + }, + "state_bridge": { + "test_acc": 0.687, + "mean_bp_cosine": 0.1969081535935402, + "mean_rho": 0.18958334562679133, + "mean_nudge_001": -0.0026059118196523436, + "mean_nudge_003": -0.007709211970601852, + "mean_nudge_01": -0.02444164449116215, + "bp_cosine_per_layer": [ + 0.7618155479431152, + 0.3189862072467804, + 0.20356883108615875, + 0.1471748650074005, + 0.14541830122470856, + 0.13144558668136597, + 0.11054451763629913, + 0.12045299261808395, + 0.11467338353395462, + 0.1017053946852684, + 0.10614258050918579, + 0.10096963495016098 + ], + "rho_per_layer": [ + 0.6406711339950562, + 0.31470298767089844, + 0.1861359179019928, + 0.17725443840026855, + 0.11286133527755737, + 0.1387007087469101, + 0.07976903766393661, + 0.11419158428907394, + 0.13525697588920593, + 0.13865813612937927, + 0.10792528837919235, + 0.1288726031780243 + ], + "nudge_per_layer": [ + -0.24276113510131836, + -0.011681582778692245, + -0.006372842937707901, + -0.004580066539347172, + -0.004361784551292658, + -0.004005158320069313, + -0.0033329487778246403, + -0.003609130624681711, + -0.003437052248045802, + -0.003070915350690484, + -0.0031537071336060762, + -0.0029334095306694508 + ], + "state_pred_error_per_layer": [ + 13069.6103515625, + 12902.267578125, + 5325.7177734375, + 4598.6796875, + 4871.38818359375, + 4525.17333984375, + 4230.712890625, + 4117.212890625, + 3694.05078125, + 3737.547607421875, + 3966.26025390625, + 4157.70654296875 + ], + "mean_state_pred_error": 5766.360656738281 + }, + "credit_bridge": { + "test_acc": 0.6145, + "mean_bp_cosine": 0.07906571677691925, + "mean_rho": 0.138323282978187, + "mean_nudge_001": -0.000623912480174719, + "mean_nudge_003": -0.0018697016639634967, + "mean_nudge_01": -0.006201692313576738, + "bp_cosine_per_layer": [ + -0.00034100248012691736, + 0.04912012815475464, + 0.07342620939016342, + 0.08266763389110565, + 0.08488726615905762, + 0.08897420018911362, + 0.09187051653862, + 0.09561659395694733, + 0.09157264232635498, + 0.0947732925415039, + 0.09517554938793182, + 0.10104557126760483 + ], + "rho_per_layer": [ + 0.03049650974571705, + 0.10809889435768127, + 0.08979646861553192, + 0.17959633469581604, + 0.1275440901517868, + 0.17255432903766632, + 0.16415373980998993, + 0.11534757167100906, + 0.17073199152946472, + 0.15983673930168152, + 0.15877583622932434, + 0.18294689059257507 + ], + "nudge_per_layer": [ + -0.003660556860268116, + -0.004647519439458847, + -0.005617665126919746, + -0.006360755302011967, + -0.006202561780810356, + -0.006613034754991531, + -0.006794797722250223, + -0.006956290453672409, + -0.006790010258555412, + -0.006838815752416849, + -0.006875438615679741, + -0.007062861695885658 + ], + "final_value_loss": 0.5342490439891815, + "final_term_loss": 0.2775654150247574, + "final_bridge_loss": 0.01819542294666171, + "final_tgrad_loss": 0.2384882021665573 + } + }, + "a0.25_L12_s123": { + "bp": { + "test_acc": 0.902, + "mean_bp_cosine": 0.7854474087556204, + "mean_rho": 0.9998569438854853, + "mean_nudge_001": -0.005986864319614445, + "mean_nudge_003": -0.01699222985189408, + "mean_nudge_01": -0.04738136318822702, + "bp_cosine_per_layer": [ + 0.8318638801574707, + 0.8205357789993286, + 0.8115277886390686, + 0.8032979965209961, + 0.7886118292808533, + 0.7801527976989746, + 0.7755030393600464, + 0.769822359085083, + 0.7656118869781494, + 0.7624454498291016, + 0.7592873573303223, + 0.7567087411880493 + ], + "rho_per_layer": [ + 0.9999992251396179, + 0.9999969005584717, + 0.9999886155128479, + 0.9999699592590332, + 0.9999390244483948, + 0.9998932480812073, + 0.9998554587364197, + 0.9998190999031067, + 0.9997619986534119, + 0.9997045397758484, + 0.9997037649154663, + 0.9996514916419983 + ], + "nudge_per_layer": [ + -0.19001588225364685, + -0.1191760003566742, + -0.0696173831820488, + -0.04359997808933258, + -0.030619269236922264, + -0.023702502250671387, + -0.019644131883978844, + -0.01702706888318062, + -0.015273808501660824, + -0.014067228883504868, + -0.01321301981806755, + -0.012620084919035435 + ] + }, + "dfa": { + "test_acc": 0.8475, + "mean_bp_cosine": 0.08017303561791778, + "mean_rho": 0.06949969536314408, + "mean_nudge_001": -0.00017117233619501349, + "mean_nudge_003": -0.0005107432225486264, + "mean_nudge_01": -0.0016712878035226215, + "bp_cosine_per_layer": [ + 0.007017737254500389, + 0.1750856339931488, + 0.09811605513095856, + 0.09870222210884094, + 0.06923168152570724, + 0.07072796672582626, + 0.1299426257610321, + 0.06372487545013428, + 0.05202930420637131, + 0.07090489566326141, + 0.04892899468541145, + 0.07766443490982056 + ], + "rho_per_layer": [ + -0.05082311853766441, + 0.15127798914909363, + 0.10723739117383957, + 0.1141807958483696, + 0.10590988397598267, + 0.05159565061330795, + 0.11685939878225327, + 0.06997300684452057, + 0.00848393514752388, + 0.09840574860572815, + 0.04575839638710022, + 0.015137266367673874 + ], + "nudge_per_layer": [ + -9.43206250667572e-05, + -0.004689650610089302, + -0.0020264536142349243, + -0.0020407852716743946, + -0.0012656663311645389, + -0.0012923413887619972, + -0.0026080894749611616, + -0.0013762509915977716, + -0.0008721412159502506, + -0.0014046088326722383, + -0.0009981195908039808, + -0.0013870256952941418 + ] + }, + "state_bridge": { + "test_acc": 0.653, + "mean_bp_cosine": 0.212141719336311, + "mean_rho": 0.16903599786261717, + "mean_nudge_001": -0.002121228181446592, + "mean_nudge_003": -0.006256894756612989, + "mean_nudge_01": -0.019624086019272607, + "bp_cosine_per_layer": [ + 0.7411977648735046, + 0.3599514067173004, + 0.24466437101364136, + 0.18324854969978333, + 0.1438049077987671, + 0.1288401186466217, + 0.12390943616628647, + 0.11832019686698914, + 0.1285572201013565, + 0.12467152625322342, + 0.12941977381706238, + 0.11911536008119583 + ], + "rho_per_layer": [ + 0.637965977191925, + 0.3033628761768341, + 0.22177954018115997, + 0.1946793794631958, + 0.08981841057538986, + 0.07293770462274551, + 0.06646254658699036, + 0.08072252571582794, + 0.1001453697681427, + 0.10873826593160629, + 0.08548736572265625, + 0.06633201241493225 + ], + "nudge_per_layer": [ + -0.19135718047618866, + -0.010539980605244637, + -0.006164146587252617, + -0.004623022396117449, + -0.003351652529090643, + -0.002855603815987706, + -0.002745934296399355, + -0.0025949627161026, + -0.002952038776129484, + -0.002784580923616886, + -0.002810355508700013, + -0.0027095736004412174 + ], + "state_pred_error_per_layer": [ + 11398.169921875, + 8994.236328125, + 6843.07958984375, + 5338.4423828125, + 5392.61279296875, + 5254.96435546875, + 5057.08544921875, + 3968.3759765625, + 3609.97021484375, + 3456.01708984375, + 3801.56005859375, + 3800.938232421875 + ], + "mean_state_pred_error": 5576.287699381511 + }, + "credit_bridge": { + "test_acc": 0.6165, + "mean_bp_cosine": 0.062155287557592, + "mean_rho": 0.1365320294474562, + "mean_nudge_001": -0.0005568450481708472, + "mean_nudge_003": -0.001666992757236585, + "mean_nudge_01": -0.005523480668974419, + "bp_cosine_per_layer": [ + 0.022855455055832863, + 0.05216163024306297, + 0.06243491545319557, + 0.06105152890086174, + 0.04914259910583496, + 0.0686616599559784, + 0.07184358686208725, + 0.06793813407421112, + 0.07173632830381393, + 0.07284142076969147, + 0.07256414741277695, + 0.07263204455375671 + ], + "rho_per_layer": [ + 0.035705771297216415, + 0.06484436988830566, + 0.15210987627506256, + 0.16708198189735413, + 0.14389753341674805, + 0.17870034277439117, + 0.1870872974395752, + 0.1476944386959076, + 0.15697413682937622, + 0.11093902587890625, + 0.14925891160964966, + 0.1440906673669815 + ], + "nudge_per_layer": [ + -0.010396174155175686, + -0.0040237451903522015, + -0.004916047677397728, + -0.004709047265350819, + -0.003890307154506445, + -0.005256335251033306, + -0.00541608827188611, + -0.005244302563369274, + -0.005511538591235876, + -0.005561722908169031, + -0.005636853165924549, + -0.0057196058332920074 + ], + "final_value_loss": 0.7472030250549316, + "final_term_loss": 0.48659993648529054, + "final_bridge_loss": 0.02176231173723936, + "final_tgrad_loss": 0.23884078254699706 + } + }, + "a0.25_L12_s456": { + "bp": { + "test_acc": 0.899, + "mean_bp_cosine": 0.7671962430079778, + "mean_rho": 0.9998593876759211, + "mean_nudge_001": -0.004748132584306101, + "mean_nudge_003": -0.013334368025728812, + "mean_nudge_01": -0.03616663611804446, + "bp_cosine_per_layer": [ + 0.8408721685409546, + 0.8110387921333313, + 0.7906323671340942, + 0.7719681262969971, + 0.7599710822105408, + 0.7539124488830566, + 0.7502779364585876, + 0.7483201026916504, + 0.7469743490219116, + 0.7455896139144897, + 0.7440224885940552, + 0.7427754402160645 + ], + "rho_per_layer": [ + 0.9999985694885254, + 0.9999968409538269, + 0.9999892711639404, + 0.9999746680259705, + 0.9999452233314514, + 0.9998985528945923, + 0.999815821647644, + 0.9998071789741516, + 0.9997591972351074, + 0.9997697472572327, + 0.9996993541717529, + 0.9996582269668579 + ], + "nudge_per_layer": [ + -0.1375543624162674, + -0.0896252989768982, + -0.05422336980700493, + -0.034489020705223083, + -0.024439619854092598, + -0.019029833376407623, + -0.015829749405384064, + -0.013777680695056915, + -0.012396320700645447, + -0.011455517262220383, + -0.01080663874745369, + -0.01037222146987915 + ] + }, + "dfa": { + "test_acc": 0.8205, + "mean_bp_cosine": 0.11264437561233838, + "mean_rho": 0.10325007668385904, + "mean_nudge_001": -0.0003942390236867747, + "mean_nudge_003": -0.001173070602817461, + "mean_nudge_01": -0.003865133059055855, + "bp_cosine_per_layer": [ + 0.03703948110342026, + 0.2760871648788452, + 0.18428769707679749, + 0.1331849992275238, + 0.09719057381153107, + 0.1258918195962906, + 0.0748991146683693, + 0.08436713367700577, + 0.09110807627439499, + 0.10076140612363815, + 0.06335102021694183, + 0.08356402069330215 + ], + "rho_per_layer": [ + 0.048133689910173416, + 0.19754433631896973, + 0.16992174088954926, + 0.13566580414772034, + 0.05106702446937561, + 0.13118207454681396, + 0.057789772748947144, + 0.09156530350446701, + 0.05846566706895828, + 0.07805749773979187, + 0.11393842101097107, + 0.10566958785057068 + ], + "nudge_per_layer": [ + -0.010506195947527885, + -0.007814407348632812, + -0.005055932328104973, + -0.003603969234973192, + -0.0024205115623772144, + -0.0030835624784231186, + -0.0020989018958061934, + -0.002160410862416029, + -0.0025065483059734106, + -0.0029421483632177114, + -0.0018882867880165577, + -0.0023007215932011604 + ] + }, + "state_bridge": { + "test_acc": 0.645, + "mean_bp_cosine": 0.17685540641347566, + "mean_rho": 0.14925638431062302, + "mean_nudge_001": -0.001906786697266701, + "mean_nudge_003": -0.005651665274247837, + "mean_nudge_01": -0.018038961667722713, + "bp_cosine_per_layer": [ + 0.7252062559127808, + 0.29899632930755615, + 0.17116883397102356, + 0.13035137951374054, + 0.11515486240386963, + 0.09652335941791534, + 0.0831163302063942, + 0.08587749302387238, + 0.1138496845960617, + 0.09370164573192596, + 0.10970423370599747, + 0.09861446917057037 + ], + "rho_per_layer": [ + 0.5776556730270386, + 0.24244043231010437, + 0.15723995864391327, + 0.11212021112442017, + 0.13527166843414307, + 0.09345141798257828, + 0.05218992009758949, + 0.09958191215991974, + 0.09601333737373352, + 0.05242425203323364, + 0.08741243183612823, + 0.08527539670467377 + ], + "nudge_per_layer": [ + -0.1766481101512909, + -0.00916180107742548, + -0.004768161568790674, + -0.00345130218192935, + -0.0031899111345410347, + -0.002747050253674388, + -0.002392321825027466, + -0.0024352066684514284, + -0.0032566720619797707, + -0.0024684183299541473, + -0.003083357820287347, + -0.0028652269393205643 + ], + "state_pred_error_per_layer": [ + 14567.1396484375, + 8843.26171875, + 5969.56787109375, + 5045.4873046875, + 4699.3388671875, + 4805.94287109375, + 4535.58935546875, + 4793.4423828125, + 4549.9345703125, + 4690.251953125, + 4812.1875, + 4947.22509765625 + ], + "mean_state_pred_error": 6021.614095052083 + }, + "credit_bridge": { + "test_acc": 0.5665, + "mean_bp_cosine": 0.0795192973067363, + "mean_rho": 0.11809263161073129, + "mean_nudge_001": -0.0007323032235338663, + "mean_nudge_003": -0.002197402771950389, + "mean_nudge_01": -0.007294998116170366, + "bp_cosine_per_layer": [ + 0.0279831662774086, + 0.034206733107566833, + 0.06341560930013657, + 0.0695083886384964, + 0.09047738462686539, + 0.09644618630409241, + 0.1011449545621872, + 0.09714356064796448, + 0.09739723801612854, + 0.09588810801506042, + 0.09328337758779526, + 0.08733686059713364 + ], + "rho_per_layer": [ + -0.01078212633728981, + 0.08389643579721451, + 0.09591226279735565, + 0.09822964668273926, + 0.15539337694644928, + 0.077084481716156, + 0.18135306239128113, + 0.13923753798007965, + 0.15523496270179749, + 0.1566530466079712, + 0.16011789441108704, + 0.12478099763393402 + ], + "nudge_per_layer": [ + -0.014675050042569637, + -0.0035726604983210564, + -0.005193591117858887, + -0.005878218449652195, + -0.007073326967656612, + -0.007276617921888828, + -0.0072667524218559265, + -0.007385652512311935, + -0.00723686721175909, + -0.007413622923195362, + -0.0073149921372532845, + -0.007252625189721584 + ], + "final_value_loss": 0.8463798692464829, + "final_term_loss": 0.5014169258773327, + "final_bridge_loss": 0.03549532132707536, + "final_tgrad_loss": 0.3094676312446594 + } + } +}
\ No newline at end of file |
