diff options
Diffstat (limited to 'results/vector_audit_full/audit_results.json')
| -rw-r--r-- | results/vector_audit_full/audit_results.json | 1346 |
1 files changed, 1346 insertions, 0 deletions
diff --git a/results/vector_audit_full/audit_results.json b/results/vector_audit_full/audit_results.json new file mode 100644 index 0000000..06a244b --- /dev/null +++ b/results/vector_audit_full/audit_results.json @@ -0,0 +1,1346 @@ +[ + { + "method": "dfa", + "L": 4, + "seed": 42, + "mean_gamma": 0.012759206583723426, + "mean_rho": 0.010203135898336768, + "mean_nudge": -0.00013293450319906697, + "per_layer_gamma": [ + -0.005139289423823357, + 0.008053570054471493, + 0.024840975180268288, + 0.02328157052397728 + ], + "per_layer_rho": [ + -0.004372224677354097, + 0.0029046176932752132, + 0.0310027077794075, + 0.011277442798018456 + ], + "per_layer_nudge": [ + 0.0003250446170568466, + -0.0001853172725532204, + -0.00036372727481648326, + -0.00030773808248341084 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 42, + "mean_gamma": 0.2243543565273285, + "mean_rho": 0.20948006212711334, + "mean_nudge": -0.007398057030513883, + "per_layer_gamma": [ + 0.23697319626808167, + 0.13470041751861572, + 0.186288982629776, + 0.3394548296928406 + ], + "per_layer_rho": [ + 0.2484399378299713, + 0.1292348951101303, + 0.18184946477413177, + 0.27839595079421997 + ], + "per_layer_nudge": [ + -0.008707698434591293, + -0.004232201725244522, + -0.00588453933596611, + -0.010767788626253605 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 42, + "mean_gamma": 0.846664547920227, + "mean_rho": 0.9511756896972656, + "mean_nudge": -0.025688248220831156, + "per_layer_gamma": [ + 0.743350088596344, + 0.8330336809158325, + 0.8981793522834778, + 0.9120950698852539 + ], + "per_layer_rho": [ + 0.8806748390197754, + 0.9658336639404297, + 0.9759747982025146, + 0.9822194576263428 + ], + "per_layer_nudge": [ + -0.0588495098054409, + -0.01651737093925476, + -0.013681922107934952, + -0.013704190030694008 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 42, + "mean_gamma": 0.8704017400741577, + "mean_rho": 0.9432401657104492, + "mean_nudge": -0.028888660948723555, + "per_layer_gamma": [ + 0.7826259136199951, + 0.877338171005249, + 0.9058365821838379, + 0.9158062934875488 + ], + "per_layer_rho": [ + 0.8731295466423035, + 0.9544992446899414, + 0.9707695245742798, + 0.9745623469352722 + ], + "per_layer_nudge": [ + -0.059486024081707, + -0.01946994476020336, + -0.018279198557138443, + -0.018319476395845413 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 42, + "mean_gamma": 0.0513513587648049, + "mean_rho": 0.0681416861480102, + "mean_nudge": -0.0007606418039358687, + "per_layer_gamma": [ + -0.09132926911115646, + -0.013022630475461483, + 0.0033656186424195766, + 0.30639171600341797 + ], + "per_layer_rho": [ + -0.047784049063920975, + -0.0063863289542496204, + 0.01414431817829609, + 0.3125928044319153 + ], + "per_layer_nudge": [ + 0.006318309810012579, + 0.0002974363451357931, + -0.00020490401948336512, + -0.009453409351408482 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 42, + "mean_gamma": 0.954873263835907, + "mean_rho": 0.9708771407604218, + "mean_nudge": -0.027431895025074482, + "per_layer_gamma": [ + 0.9027864336967468, + 0.9722906351089478, + 0.9725323915481567, + 0.9718835949897766 + ], + "per_layer_rho": [ + 0.9104452133178711, + 0.9908294677734375, + 0.991165280342102, + 0.9910686016082764 + ], + "per_layer_nudge": [ + -0.04417877644300461, + -0.022297389805316925, + -0.021837987005710602, + -0.021413426846265793 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 42, + "mean_gamma": 0.8315763473510742, + "mean_rho": 0.9426839649677277, + "mean_nudge": -0.02414578991010785, + "per_layer_gamma": [ + 0.7389893531799316, + 0.8383945226669312, + 0.8796361684799194, + 0.8692853450775146 + ], + "per_layer_rho": [ + 0.8755806684494019, + 0.9449398517608643, + 0.9726759195327759, + 0.9775394201278687 + ], + "per_layer_nudge": [ + -0.055945657193660736, + -0.01551580149680376, + -0.012561880983412266, + -0.012559819966554642 + ] + }, + { + "method": "dfa", + "L": 4, + "seed": 123, + "mean_gamma": 0.0021313047036528587, + "mean_rho": 0.00923872203566134, + "mean_nudge": 0.000226999055826127, + "per_layer_gamma": [ + -0.013840198516845703, + 0.020386721938848495, + -0.0008580549620091915, + 0.002836750354617834 + ], + "per_layer_rho": [ + -0.012609685771167278, + 0.019667847082018852, + -0.009115943685173988, + 0.03901267051696777 + ], + "per_layer_nudge": [ + 0.0012924917973577976, + -0.0003459132567513734, + 3.6447577258513775e-06, + -4.222707502776757e-05 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 123, + "mean_gamma": 0.4006684720516205, + "mean_rho": 0.3810938075184822, + "mean_nudge": -0.016430767253041267, + "per_layer_gamma": [ + 0.39850419759750366, + 0.4013897776603699, + 0.4055132269859314, + 0.397266685962677 + ], + "per_layer_rho": [ + 0.3824196457862854, + 0.4083380699157715, + 0.37734755873680115, + 0.3562699556350708 + ], + "per_layer_nudge": [ + -0.016568617895245552, + -0.016357120126485825, + -0.01656804233789444, + -0.016229288652539253 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 123, + "mean_gamma": 0.8960145115852356, + "mean_rho": 0.9537482112646103, + "mean_nudge": -0.02881092019379139, + "per_layer_gamma": [ + 0.8080605864524841, + 0.8870053887367249, + 0.9341694116592407, + 0.9548226594924927 + ], + "per_layer_rho": [ + 0.8955597877502441, + 0.9675844311714172, + 0.9722031354904175, + 0.9796454906463623 + ], + "per_layer_nudge": [ + -0.0648956224322319, + -0.01859605871140957, + -0.01589030772447586, + -0.015861691907048225 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 123, + "mean_gamma": 0.9169906079769135, + "mean_rho": 0.9518635720014572, + "mean_nudge": -0.030037105083465576, + "per_layer_gamma": [ + 0.813483715057373, + 0.9396308064460754, + 0.9553613662719727, + 0.9594865441322327 + ], + "per_layer_rho": [ + 0.8809271454811096, + 0.9691250324249268, + 0.9771296977996826, + 0.9802724123001099 + ], + "per_layer_nudge": [ + -0.06450991332530975, + -0.018834944814443588, + -0.018407035619020462, + -0.0183965265750885 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 123, + "mean_gamma": -0.03672784520313144, + "mean_rho": -0.000436956062912941, + "mean_nudge": 0.0007004090439295396, + "per_layer_gamma": [ + -0.012967733666300774, + -0.18309307098388672, + -0.33163735270500183, + 0.3807867765426636 + ], + "per_layer_rho": [ + 0.05609207600355148, + -0.16973736882209778, + -0.34432661533355713, + 0.45622408390045166 + ], + "per_layer_nudge": [ + 0.0007166759460233152, + 0.004922591149806976, + 0.009576696902513504, + -0.012414327822625637 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 123, + "mean_gamma": 0.9524389505386353, + "mean_rho": 0.9689934253692627, + "mean_nudge": -0.02997258398681879, + "per_layer_gamma": [ + 0.8996936082839966, + 0.9695490598678589, + 0.9714151620864868, + 0.9690979719161987 + ], + "per_layer_rho": [ + 0.9063906073570251, + 0.9897294640541077, + 0.9902646541595459, + 0.9895889759063721 + ], + "per_layer_nudge": [ + -0.048146918416023254, + -0.024354536086320877, + -0.023889556527137756, + -0.023499324917793274 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 123, + "mean_gamma": 0.8988931030035019, + "mean_rho": 0.9505570530891418, + "mean_nudge": -0.02708751056343317, + "per_layer_gamma": [ + 0.8175626397132874, + 0.9190162420272827, + 0.9264382719993591, + 0.9325552582740784 + ], + "per_layer_rho": [ + 0.8918192386627197, + 0.9622496366500854, + 0.9709856510162354, + 0.9771736860275269 + ], + "per_layer_nudge": [ + -0.05964129418134689, + -0.017833322286605835, + -0.015457207337021828, + -0.015418218448758125 + ] + }, + { + "method": "dfa", + "L": 4, + "seed": 456, + "mean_gamma": 0.016278030583634973, + "mean_rho": 0.019018374383449554, + "mean_nudge": -0.001155311170805362, + "per_layer_gamma": [ + 0.034280914813280106, + 0.018388552591204643, + 0.004948894493281841, + 0.0074937604367733 + ], + "per_layer_rho": [ + 0.026491232216358185, + 0.0305374376475811, + -0.001606430858373642, + 0.020651258528232574 + ], + "per_layer_nudge": [ + -0.004200353287160397, + -0.0002525914169382304, + -7.005853694863617e-05, + -9.824144217418507e-05 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 456, + "mean_gamma": 0.40844712406396866, + "mean_rho": 0.4075355716049671, + "mean_nudge": -0.011171038961037993, + "per_layer_gamma": [ + 0.261852890253067, + 0.41412365436553955, + 0.4508002996444702, + 0.5070116519927979 + ], + "per_layer_rho": [ + 0.2299479991197586, + 0.4202876687049866, + 0.4645801782608032, + 0.5153264403343201 + ], + "per_layer_nudge": [ + -0.009456473402678967, + -0.01063506305217743, + -0.011527800001204014, + -0.013064819388091564 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 456, + "mean_gamma": 0.9677009582519531, + "mean_rho": 0.9615653902292252, + "mean_nudge": -0.02802830934524536, + "per_layer_gamma": [ + 0.90372633934021, + 0.9808875918388367, + 0.9896383285522461, + 0.9965515732765198 + ], + "per_layer_rho": [ + 0.9064497947692871, + 0.9720321297645569, + 0.980293869972229, + 0.9874857664108276 + ], + "per_layer_nudge": [ + -0.04350632429122925, + -0.0233478881418705, + -0.02268034964799881, + -0.02257867529988289 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 456, + "mean_gamma": 0.7236898243427277, + "mean_rho": 0.8553760200738907, + "mean_nudge": -0.02606209833174944, + "per_layer_gamma": [ + 0.6436039209365845, + 0.6319636106491089, + 0.7965036630630493, + 0.822688102722168 + ], + "per_layer_rho": [ + 0.7970162630081177, + 0.7741899490356445, + 0.916257917881012, + 0.9340399503707886 + ], + "per_layer_nudge": [ + -0.05365825071930885, + -0.015726309269666672, + -0.017313942313194275, + -0.017549891024827957 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 456, + "mean_gamma": -0.12004246190190315, + "mean_rho": -0.09116240590810776, + "mean_nudge": 0.003779993741773069, + "per_layer_gamma": [ + -0.18761609494686127, + -0.4131208062171936, + -0.33985134959220886, + 0.4604184031486511 + ], + "per_layer_rho": [ + -0.08593425154685974, + -0.4190409183502197, + -0.3457789421081543, + 0.48610448837280273 + ], + "per_layer_nudge": [ + 0.007614006754010916, + 0.010954373516142368, + 0.009015142917633057, + -0.012463548220694065 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 456, + "mean_gamma": 0.9375280737876892, + "mean_rho": 0.9757244437932968, + "mean_nudge": -0.02518668444827199, + "per_layer_gamma": [ + 0.9148672819137573, + 0.9444636106491089, + 0.946875810623169, + 0.9439055919647217 + ], + "per_layer_rho": [ + 0.9372595548629761, + 0.9872512817382812, + 0.9900106191635132, + 0.9883763194084167 + ], + "per_layer_nudge": [ + -0.04899398609995842, + -0.018192578107118607, + -0.017080236226320267, + -0.016479937359690666 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 456, + "mean_gamma": 0.9691873788833618, + "mean_rho": 0.9595922082662582, + "mean_nudge": -0.026451716665178537, + "per_layer_gamma": [ + 0.906065821647644, + 0.9809720516204834, + 0.992091178894043, + 0.9976204633712769 + ], + "per_layer_rho": [ + 0.9050431251525879, + 0.9693447351455688, + 0.9793726205825806, + 0.9846083521842957 + ], + "per_layer_nudge": [ + -0.04136938229203224, + -0.02186034619808197, + -0.021370645612478256, + -0.02120649255812168 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 42, + "mean_gamma": 0.09906564746052027, + "mean_rho": 0.09740300523117185, + "mean_nudge": -0.002161820186302066, + "per_layer_gamma": [ + 0.01413647085428238, + 0.28074702620506287, + 0.11767441779375076, + 0.054444827139377594, + 0.14474442601203918, + 0.06295441836118698, + 0.07057145237922668, + 0.04725214093923569 + ], + "per_layer_rho": [ + 0.02532106265425682, + 0.23610877990722656, + 0.12464869767427444, + 0.07118558138608932, + 0.1357075721025467, + 0.06361411511898041, + 0.08849744498729706, + 0.03414078801870346 + ], + "per_layer_nudge": [ + -0.0018329978920519352, + -0.0055640568025410175, + -0.002374582923948765, + -0.0012062718160450459, + -0.00274146581068635, + -0.0013790605589747429, + -0.0014756014570593834, + -0.0007205242291092873 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 42, + "mean_gamma": 0.30624711513519287, + "mean_rho": 0.3206122815608978, + "mean_nudge": -0.009207659168168902, + "per_layer_gamma": [ + 0.16885146498680115, + 0.3251064419746399, + 0.292763888835907, + 0.3125339150428772, + 0.3227536380290985, + 0.33606037497520447, + 0.3436194658279419, + 0.3482877314090729 + ], + "per_layer_rho": [ + 0.15158507227897644, + 0.2908586263656616, + 0.29920056462287903, + 0.34763777256011963, + 0.3629569113254547, + 0.35797882080078125, + 0.38447317481040955, + 0.3702073097229004 + ], + "per_layer_nudge": [ + -0.005164027214050293, + -0.00964929535984993, + -0.00890397373586893, + -0.009508647955954075, + -0.009753547608852386, + -0.010073650628328323, + -0.010293008759617805, + -0.010315122082829475 + ] + }, + { + "method": "vec_eT_M4", + "L": 8, + "seed": 42, + "mean_gamma": 0.9610838517546654, + "mean_rho": 0.9551834538578987, + "mean_nudge": -0.02005277667194605, + "per_layer_gamma": [ + 0.8267648220062256, + 0.9711159467697144, + 0.9782320261001587, + 0.9792516827583313, + 0.9823880195617676, + 0.9807887077331543, + 0.9809024333953857, + 0.9892271757125854 + ], + "per_layer_rho": [ + 0.8289316892623901, + 0.9607423543930054, + 0.9680945873260498, + 0.970350980758667, + 0.9744545221328735, + 0.9756993055343628, + 0.9772317409515381, + 0.985962450504303 + ], + "per_layer_nudge": [ + -0.03688318282365799, + -0.017963383346796036, + -0.017710430547595024, + -0.017620962113142014, + -0.017566435039043427, + -0.017552118748426437, + -0.017480310052633286, + -0.017645390704274178 + ] + }, + { + "method": "vec_eT_M8", + "L": 8, + "seed": 42, + "mean_gamma": 0.9476289451122284, + "mean_rho": 0.952806644141674, + "mean_nudge": -0.021474516252055764, + "per_layer_gamma": [ + 0.7826216220855713, + 0.9704389572143555, + 0.9734323024749756, + 0.9753161072731018, + 0.9732745885848999, + 0.9694249033927917, + 0.9685238599777222, + 0.9679992198944092 + ], + "per_layer_rho": [ + 0.8156931400299072, + 0.965274453163147, + 0.9699603319168091, + 0.970566987991333, + 0.9739295244216919, + 0.9735742211341858, + 0.9758409261703491, + 0.9776135683059692 + ], + "per_layer_nudge": [ + -0.042923636734485626, + -0.018625982105731964, + -0.01854044198989868, + -0.018480297178030014, + -0.01844090223312378, + -0.018325258046388626, + -0.018257396295666695, + -0.018202215433120728 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 8, + "seed": 42, + "mean_gamma": -0.019792123697698116, + "mean_rho": 0.01533439988270402, + "mean_nudge": 0.0001886758691398427, + "per_layer_gamma": [ + 0.2983958125114441, + 0.2871808111667633, + -0.6762481927871704, + -0.09076518565416336, + -0.4631124436855316, + -0.5284497141838074, + 0.10263068974018097, + 0.9120312333106995 + ], + "per_layer_rho": [ + 0.436443030834198, + 0.31577497720718384, + -0.6712953448295593, + -0.038358043879270554, + -0.4568558931350708, + -0.533319890499115, + 0.1618560254573822, + 0.9084303379058838 + ], + "per_layer_nudge": [ + -0.00789229478687048, + -0.007670246995985508, + 0.016546625643968582, + 0.0017870900919660926, + 0.010900387540459633, + 0.012512469664216042, + -0.0028577707707881927, + -0.021816853433847427 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 8, + "seed": 42, + "mean_gamma": 0.9694314822554588, + "mean_rho": 0.9782926589250565, + "mean_nudge": -0.020679548615589738, + "per_layer_gamma": [ + 0.9044460654258728, + 0.9779231548309326, + 0.9797878861427307, + 0.9809790849685669, + 0.9813997149467468, + 0.9814468622207642, + 0.979229211807251, + 0.9702398777008057 + ], + "per_layer_rho": [ + 0.9102598428726196, + 0.9878777265548706, + 0.9896679520606995, + 0.9906449317932129, + 0.9906293153762817, + 0.9896650314331055, + 0.98812335729599, + 0.9794731140136719 + ], + "per_layer_nudge": [ + -0.04101525992155075, + -0.019054662436246872, + -0.018692705780267715, + -0.018473587930202484, + -0.01803751476109028, + -0.01748315989971161, + -0.016935309395194054, + -0.01574418880045414 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 8, + "seed": 42, + "mean_gamma": 0.961296834051609, + "mean_rho": 0.9601987227797508, + "mean_nudge": -0.020286154001951218, + "per_layer_gamma": [ + 0.8300719857215881, + 0.975559413433075, + 0.9798641204833984, + 0.9784993529319763, + 0.9792141318321228, + 0.9826849102973938, + 0.9828553199768066, + 0.9816254377365112 + ], + "per_layer_rho": [ + 0.8414288759231567, + 0.9681671261787415, + 0.9723494052886963, + 0.9737668037414551, + 0.9768325686454773, + 0.9811946749687195, + 0.9829471111297607, + 0.9849032163619995 + ], + "per_layer_nudge": [ + -0.03684248775243759, + -0.01817578822374344, + -0.018080510199069977, + -0.017905343323946, + -0.017797425389289856, + -0.017846036702394485, + -0.017828192561864853, + -0.01781344786286354 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 123, + "mean_gamma": 0.0418074403423816, + "mean_rho": 0.043065165635198355, + "mean_nudge": -0.000943926574109355, + "per_layer_gamma": [ + 0.008853738196194172, + 0.060307569801807404, + 0.04014270007610321, + 0.046701639890670776, + 0.04881899803876877, + 0.07526923716068268, + 0.012093071825802326, + 0.04227256774902344 + ], + "per_layer_rho": [ + -0.00892745889723301, + 0.05283857136964798, + 0.04637228325009346, + 0.05245576798915863, + 0.05450460687279701, + 0.07646007835865021, + 0.02843533270061016, + 0.042382143437862396 + ], + "per_layer_nudge": [ + -0.0022439619060605764, + -0.0013329577632248402, + -0.0005934120854362845, + -0.0006395552773028612, + -0.0007643825374543667, + -0.001089449506253004, + -0.00021647402900271118, + -0.0006712194881401956 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 123, + "mean_gamma": 0.2247180617414415, + "mean_rho": 0.26628467813134193, + "mean_nudge": -0.007505320216296241, + "per_layer_gamma": [ + 0.04518688842654228, + 0.17972084879875183, + 0.21200382709503174, + 0.24014034867286682, + 0.276295006275177, + 0.28583356738090515, + 0.2899315357208252, + 0.2686324715614319 + ], + "per_layer_rho": [ + 0.14380130171775818, + 0.22897371649742126, + 0.23557049036026, + 0.26198533177375793, + 0.3003377914428711, + 0.32919156551361084, + 0.3204420208930969, + 0.30997520685195923 + ], + "per_layer_nudge": [ + -0.0017040509264916182, + -0.006164136342704296, + -0.006984173320233822, + -0.008167261257767677, + -0.00930502824485302, + -0.009475477039813995, + -0.009366653859615326, + -0.008875780738890171 + ] + }, + { + "method": "vec_eT_M4", + "L": 8, + "seed": 123, + "mean_gamma": 0.9508489817380905, + "mean_rho": 0.9518037140369415, + "mean_nudge": -0.02076399209909141, + "per_layer_gamma": [ + 0.8060562014579773, + 0.9650354385375977, + 0.9726169109344482, + 0.973420262336731, + 0.9732815027236938, + 0.9745521545410156, + 0.9734596610069275, + 0.968369722366333 + ], + "per_layer_rho": [ + 0.8418968915939331, + 0.9559968113899231, + 0.962238073348999, + 0.9662503600120544, + 0.9685378670692444, + 0.9712143540382385, + 0.9724422097206116, + 0.9758531451225281 + ], + "per_layer_nudge": [ + -0.0521555095911026, + -0.016341347247362137, + -0.01634775847196579, + -0.01629696600139141, + -0.016271617263555527, + -0.016253814101219177, + -0.01619817316532135, + -0.016246750950813293 + ] + }, + { + "method": "vec_eT_M8", + "L": 8, + "seed": 123, + "mean_gamma": 0.9676685556769371, + "mean_rho": 0.9591586142778397, + "mean_nudge": -0.019975336268544197, + "per_layer_gamma": [ + 0.8518213033676147, + 0.9811072945594788, + 0.9843889474868774, + 0.983165442943573, + 0.9847903251647949, + 0.9829460382461548, + 0.9856388568878174, + 0.9874902367591858 + ], + "per_layer_rho": [ + 0.8631762266159058, + 0.9645696878433228, + 0.9685958027839661, + 0.9701895713806152, + 0.9725322127342224, + 0.9733850955963135, + 0.9789502024650574, + 0.9818701148033142 + ], + "per_layer_nudge": [ + -0.04242108017206192, + -0.017025835812091827, + -0.016797807067632675, + -0.016749639064073563, + -0.016767453402280807, + -0.01670318841934204, + -0.016672292724251747, + -0.016665393486618996 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 8, + "seed": 123, + "mean_gamma": -0.11373000172898173, + "mean_rho": -0.1359611451625824, + "mean_nudge": 0.004932066862238571, + "per_layer_gamma": [ + -0.056351568549871445, + -0.44720304012298584, + -0.6338962316513062, + -0.408905029296875, + -0.37608587741851807, + -0.18018096685409546, + 0.33276063203811646, + 0.8600220680236816 + ], + "per_layer_rho": [ + 0.044625282287597656, + -0.4992668628692627, + -0.6965052485466003, + -0.46216896176338196, + -0.42366287112236023, + -0.23159649968147278, + 0.2991888225078583, + 0.8816971778869629 + ], + "per_layer_nudge": [ + 0.003119478700682521, + 0.016028771176934242, + 0.022319095209240913, + 0.01471712812781334, + 0.013586362823843956, + 0.007011811248958111, + -0.010123632848262787, + -0.027202479541301727 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 8, + "seed": 123, + "mean_gamma": 0.8755882158875465, + "mean_rho": 0.9470387101173401, + "mean_nudge": -0.01607380306813866, + "per_layer_gamma": [ + 0.8875797986984253, + 0.9009760618209839, + 0.8808510899543762, + 0.8799238204956055, + 0.8797831535339355, + 0.8745893239974976, + 0.861487865447998, + 0.8395146131515503 + ], + "per_layer_rho": [ + 0.9190670847892761, + 0.9546182751655579, + 0.9534507393836975, + 0.9524415731430054, + 0.9578260183334351, + 0.9576990008354187, + 0.9501173496246338, + 0.9310896396636963 + ], + "per_layer_nudge": [ + -0.051533639430999756, + -0.015572542324662209, + -0.012057723477482796, + -0.011056014336645603, + -0.010354170575737953, + -0.009953269734978676, + -0.009345149621367455, + -0.008717915043234825 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 8, + "seed": 123, + "mean_gamma": 0.9602480605244637, + "mean_rho": 0.9577522128820419, + "mean_nudge": -0.020163135835900903, + "per_layer_gamma": [ + 0.8212144374847412, + 0.9718189239501953, + 0.9794400930404663, + 0.9788751602172852, + 0.9804568886756897, + 0.9820123910903931, + 0.9819177389144897, + 0.9862488508224487 + ], + "per_layer_rho": [ + 0.8539210557937622, + 0.9595734477043152, + 0.968142032623291, + 0.9713950753211975, + 0.9739673137664795, + 0.9758511781692505, + 0.9757622480392456, + 0.983405351638794 + ], + "per_layer_nudge": [ + -0.048084814101457596, + -0.016458425670862198, + -0.01623723655939102, + -0.016196511685848236, + -0.016157593578100204, + -0.016071485355496407, + -0.015993185341358185, + -0.016105834394693375 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 456, + "mean_gamma": 0.11447641160339117, + "mean_rho": 0.11044186353683472, + "mean_nudge": -0.0029411360155791044, + "per_layer_gamma": [ + 0.051631297916173935, + 0.2667747735977173, + 0.1608148217201233, + 0.05039509758353233, + 0.09734607487916946, + 0.1104668602347374, + 0.10407236963510513, + 0.07430999726057053 + ], + "per_layer_rho": [ + 0.0571255087852478, + 0.24121275544166565, + 0.1396293193101883, + 0.03282786160707474, + 0.0832589864730835, + 0.12599189579486847, + 0.10961247235536575, + 0.09387610852718353 + ], + "per_layer_nudge": [ + -0.004148983396589756, + -0.006073276046663523, + -0.0035690395161509514, + -0.0011961309937760234, + -0.0020613158121705055, + -0.002379970159381628, + -0.00227751350030303, + -0.0018228586995974183 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 456, + "mean_gamma": 0.2596400445327163, + "mean_rho": 0.29122191295027733, + "mean_nudge": -0.009376821690239012, + "per_layer_gamma": [ + 0.09049498289823532, + 0.2076151967048645, + 0.28473690152168274, + 0.29515770077705383, + 0.31399405002593994, + 0.29933249950408936, + 0.2904508113861084, + 0.2953382134437561 + ], + "per_layer_rho": [ + 0.10262437164783478, + 0.23574362695217133, + 0.32356733083724976, + 0.3371298313140869, + 0.3557179868221283, + 0.34890225529670715, + 0.31407758593559265, + 0.31201231479644775 + ], + "per_layer_nudge": [ + -0.003384523093700409, + -0.007686353288590908, + -0.010352302342653275, + -0.010613547638058662, + -0.011347497813403606, + -0.010740532539784908, + -0.010370716452598572, + -0.010519100353121758 + ] + }, + { + "method": "vec_eT_M4", + "L": 8, + "seed": 456, + "mean_gamma": 0.9574749916791916, + "mean_rho": 0.9430182427167892, + "mean_nudge": -0.025299219880253077, + "per_layer_gamma": [ + 0.8182810544967651, + 0.9655625820159912, + 0.9788223505020142, + 0.9715414047241211, + 0.9763141870498657, + 0.9819262623786926, + 0.9831951260566711, + 0.9841569662094116 + ], + "per_layer_rho": [ + 0.8498371243476868, + 0.9464435577392578, + 0.9519747495651245, + 0.9531487822532654, + 0.9558645486831665, + 0.9587409496307373, + 0.9619686007499695, + 0.9661676287651062 + ], + "per_layer_nudge": [ + -0.04676084965467453, + -0.022278331220149994, + -0.022243071347475052, + -0.022241756319999695, + -0.022209325805306435, + -0.022194838151335716, + -0.02222602069377899, + -0.0222395658493042 + ] + }, + { + "method": "vec_eT_M8", + "L": 8, + "seed": 456, + "mean_gamma": 0.8017567023634911, + "mean_rho": 0.8739266619086266, + "mean_nudge": -0.0273550299461931, + "per_layer_gamma": [ + 0.5685268640518188, + 0.8541168570518494, + 0.8301878571510315, + 0.8351892232894897, + 0.8266328573226929, + 0.8315808773040771, + 0.8355091214179993, + 0.8323099613189697 + ], + "per_layer_rho": [ + 0.6454399824142456, + 0.8863531947135925, + 0.893866240978241, + 0.90782630443573, + 0.9073142409324646, + 0.9110382795333862, + 0.9168291091918945, + 0.922745943069458 + ], + "per_layer_nudge": [ + -0.059318192303180695, + -0.022695917636156082, + -0.022645555436611176, + -0.022771799936890602, + -0.02274298295378685, + -0.022797273471951485, + -0.022850075736641884, + -0.02301844209432602 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 8, + "seed": 456, + "mean_gamma": 0.5487924553453922, + "mean_rho": 0.5787655711174011, + "mean_nudge": -0.01472583191934973, + "per_layer_gamma": [ + 0.4987947940826416, + 0.6894677877426147, + 0.5756305456161499, + 0.5317898392677307, + 0.4938901960849762, + 0.48660987615585327, + 0.4679740071296692, + 0.6461825966835022 + ], + "per_layer_rho": [ + 0.5681551694869995, + 0.6849030256271362, + 0.5905652046203613, + 0.5603526830673218, + 0.529013991355896, + 0.5252480506896973, + 0.505163311958313, + 0.6667231321334839 + ], + "per_layer_nudge": [ + -0.013360938057303429, + -0.018475033342838287, + -0.015427734702825546, + -0.0143125606700778, + -0.013382941484451294, + -0.013140549883246422, + -0.012608321383595467, + -0.017098575830459595 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 8, + "seed": 456, + "mean_gamma": 0.9719733148813248, + "mean_rho": 0.9774252474308014, + "mean_nudge": -0.021229598904028535, + "per_layer_gamma": [ + 0.8793158531188965, + 0.9842267632484436, + 0.9851877689361572, + 0.9860390424728394, + 0.9860944747924805, + 0.9856378436088562, + 0.9863163232803345, + 0.9829684495925903 + ], + "per_layer_rho": [ + 0.8756503462791443, + 0.9914530515670776, + 0.9921013712882996, + 0.9924013614654541, + 0.9925580024719238, + 0.992135763168335, + 0.9925041198730469, + 0.9905979633331299 + ], + "per_layer_nudge": [ + -0.039753369987010956, + -0.019631527364253998, + -0.019158396869897842, + -0.01886080764234066, + -0.018597319722175598, + -0.01827744022011757, + -0.017960023134946823, + -0.017597906291484833 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 8, + "seed": 456, + "mean_gamma": 0.968105711042881, + "mean_rho": 0.9448694735765457, + "mean_nudge": -0.02237516944296658, + "per_layer_gamma": [ + 0.8237834572792053, + 0.981438159942627, + 0.984513521194458, + 0.9858155846595764, + 0.9882583618164062, + 0.9903416633605957, + 0.9931073784828186, + 0.9975875616073608 + ], + "per_layer_rho": [ + 0.8182570934295654, + 0.9534345269203186, + 0.956415593624115, + 0.9588236808776855, + 0.9621551036834717, + 0.9646933674812317, + 0.9697130918502808, + 0.975463330745697 + ], + "per_layer_nudge": [ + -0.040218278765678406, + -0.01982394978404045, + -0.019831635057926178, + -0.019780701026320457, + -0.01978381723165512, + -0.019830182194709778, + -0.019829627126455307, + -0.019903164356946945 + ] + } +]
\ No newline at end of file |
