diff options
Diffstat (limited to 'results/snapshot_no_outln_v1/snapshot_noLN_s123.json')
| -rw-r--r-- | results/snapshot_no_outln_v1/snapshot_noLN_s123.json | 4766 |
1 files changed, 4766 insertions, 0 deletions
diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s123.json b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json new file mode 100644 index 0000000..f3f6392 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005465824506245553, + 0.0005437708459794521, + 0.0005393712199293077, + 0.0005331890424713492, + 0.0005310169071890414 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1015625, + "loss_eval": 2.3754236698150635, + "epoch": 0 + }, + { + "hidden_norms": [ + 40.83987808227539, + 37.75401306152344, + 36.1661376953125, + 34.91564178466797, + 34.55687713623047 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012231437722221017, + 0.00012846711615566164, + 0.00013815351121593267, + 0.00015655385504942387, + 0.0002070761693175882 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.435546875, + "loss_eval": 1.5918896198272705, + "epoch": 1 + }, + { + "hidden_norms": [ + 54.60358810424805, + 49.46598434448242, + 46.75371170043945, + 44.21198272705078, + 42.52875900268555 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010624218703014776, + 0.00011056899529648945, + 0.0001174700737465173, + 0.00012732982577290386, + 0.00015480577712878585 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4755859375, + "loss_eval": 1.464656114578247, + "epoch": 2 + }, + { + "hidden_norms": [ + 65.05919647216797, + 58.81830596923828, + 54.65021896362305, + 50.87609100341797, + 48.61247253417969 + ], + "bp_grad_per_sample_l2_med": [ + 9.24510313780047e-05, + 9.810000483412296e-05, + 0.00010529180872254074, + 0.00011547923350008205, + 0.00013095361646264791 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.509765625, + "loss_eval": 1.4144818782806396, + "epoch": 3 + }, + { + "hidden_norms": [ + 71.89185333251953, + 63.81675338745117, + 58.61539077758789, + 53.633819580078125, + 50.85374450683594 + ], + "bp_grad_per_sample_l2_med": [ + 9.624486119719222e-05, + 0.00010101673979079351, + 0.00010665278387023136, + 0.00011629729851847515, + 0.0001258883421542123 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5009765625, + "loss_eval": 1.4042909145355225, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.86115264892578, + 68.96236419677734, + 62.764793395996094, + 56.297122955322266, + 51.927825927734375 + ], + "bp_grad_per_sample_l2_med": [ + 8.636285201646388e-05, + 9.12561226869002e-05, + 9.721348760649562e-05, + 0.0001029788691084832, + 0.00010866572119994089 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5048828125, + "loss_eval": 1.362424373626709, + "epoch": 5 + }, + { + "hidden_norms": [ + 86.97894287109375, + 76.51913452148438, + 68.91358947753906, + 61.691619873046875, + 55.97148132324219 + ], + "bp_grad_per_sample_l2_med": [ + 8.555527165299281e-05, + 9.211624274030328e-05, + 9.770254109753296e-05, + 0.00010545850091148168, + 0.00011015798372682184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4990234375, + "loss_eval": 1.4210331439971924, + "epoch": 6 + }, + { + "hidden_norms": [ + 91.98681640625, + 80.48826599121094, + 72.19147491455078, + 63.2117919921875, + 57.618526458740234 + ], + "bp_grad_per_sample_l2_med": [ + 8.108472684398293e-05, + 8.69045325089246e-05, + 9.184813097817823e-05, + 9.785865404410288e-05, + 0.00010359002772020176 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.50390625, + "loss_eval": 1.395978569984436, + "epoch": 7 + }, + { + "hidden_norms": [ + 97.7012939453125, + 84.81765747070312, + 75.55701446533203, + 65.7588119506836, + 58.28969955444336 + ], + "bp_grad_per_sample_l2_med": [ + 8.22104630060494e-05, + 8.808301208773628e-05, + 9.288280853070319e-05, + 0.0001000006013782695, + 0.00010321019362891093 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.525390625, + "loss_eval": 1.3341916799545288, + "epoch": 8 + }, + { + "hidden_norms": [ + 102.29643249511719, + 88.3180923461914, + 78.02013397216797, + 67.14125061035156, + 59.45139694213867 + ], + "bp_grad_per_sample_l2_med": [ + 8.297000749735162e-05, + 8.909840107662603e-05, + 9.493192192167044e-05, + 0.00010043827933259308, + 0.00010197651863563806 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5166015625, + "loss_eval": 1.3378056287765503, + "epoch": 9 + }, + { + "hidden_norms": [ + 107.60400390625, + 93.19139862060547, + 81.3952407836914, + 70.16273498535156, + 61.15400314331055 + ], + "bp_grad_per_sample_l2_med": [ + 7.625297439517453e-05, + 8.249503298429772e-05, + 8.778223127592355e-05, + 9.526272333459929e-05, + 9.708418656373397e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.54296875, + "loss_eval": 1.3057411909103394, + "epoch": 10 + }, + { + "hidden_norms": [ + 111.52012634277344, + 95.61714935302734, + 83.3553695678711, + 70.52283477783203, + 61.52479553222656 + ], + "bp_grad_per_sample_l2_med": [ + 7.589814777020365e-05, + 8.213706314563751e-05, + 8.74441975611262e-05, + 9.462270099902526e-05, + 9.573540592100471e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5400390625, + "loss_eval": 1.2877662181854248, + "epoch": 11 + }, + { + "hidden_norms": [ + 116.06771850585938, + 99.79177856445312, + 86.30980682373047, + 72.20254516601562, + 62.78416442871094 + ], + "bp_grad_per_sample_l2_med": [ + 7.193555939011276e-05, + 7.673310028621927e-05, + 8.175434049917385e-05, + 8.827414421830326e-05, + 9.135493019130081e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5478515625, + "loss_eval": 1.2685296535491943, + "epoch": 12 + }, + { + "hidden_norms": [ + 119.3271484375, + 102.65406799316406, + 88.69587707519531, + 74.90689849853516, + 63.780494689941406 + ], + "bp_grad_per_sample_l2_med": [ + 7.618113158969209e-05, + 8.220612653531134e-05, + 8.806472760625184e-05, + 9.463543392485008e-05, + 9.703192336019129e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.54296875, + "loss_eval": 1.276496410369873, + "epoch": 13 + }, + { + "hidden_norms": [ + 123.31849670410156, + 105.7769775390625, + 90.95068359375, + 76.97051239013672, + 64.97062683105469 + ], + "bp_grad_per_sample_l2_med": [ + 7.194027421064675e-05, + 7.883367652539164e-05, + 8.381865336559713e-05, + 9.018390846904367e-05, + 8.924194844439626e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.552734375, + "loss_eval": 1.2604155540466309, + "epoch": 14 + }, + { + "hidden_norms": [ + 127.73625946044922, + 109.2970199584961, + 94.82887268066406, + 79.42200469970703, + 66.68120574951172 + ], + "bp_grad_per_sample_l2_med": [ + 7.26957805454731e-05, + 7.816226570867002e-05, + 8.386534318560734e-05, + 9.044967737281695e-05, + 9.091151150641963e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.2421667575836182, + "epoch": 15 + }, + { + "hidden_norms": [ + 129.39227294921875, + 110.16195678710938, + 95.65125274658203, + 79.63654327392578, + 66.4422836303711 + ], + "bp_grad_per_sample_l2_med": [ + 7.170928438426927e-05, + 7.703503069933504e-05, + 8.211386011680588e-05, + 8.873116166796535e-05, + 9.066827624337748e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2539770603179932, + "epoch": 16 + }, + { + "hidden_norms": [ + 132.24916076660156, + 113.025634765625, + 96.19522857666016, + 80.5164566040039, + 67.23816680908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.194816862465814e-05, + 7.835567521397024e-05, + 8.341929060406983e-05, + 8.761802746448666e-05, + 8.926806913223118e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5732421875, + "loss_eval": 1.2596629858016968, + "epoch": 17 + }, + { + "hidden_norms": [ + 136.37730407714844, + 116.11273956298828, + 98.82146453857422, + 81.83920288085938, + 67.72627258300781 + ], + "bp_grad_per_sample_l2_med": [ + 7.331569941015914e-05, + 7.95917512732558e-05, + 8.647916547488421e-05, + 9.198131010634825e-05, + 9.28269510040991e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53515625, + "loss_eval": 1.2714436054229736, + "epoch": 18 + }, + { + "hidden_norms": [ + 137.7354736328125, + 119.1905288696289, + 102.62776184082031, + 84.3735580444336, + 69.55421447753906 + ], + "bp_grad_per_sample_l2_med": [ + 7.105377881089225e-05, + 7.70094629842788e-05, + 8.26972391223535e-05, + 8.802180673228577e-05, + 8.82365129655227e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5498046875, + "loss_eval": 1.25264310836792, + "epoch": 19 + }, + { + "hidden_norms": [ + 139.01124572753906, + 119.05533599853516, + 101.28179168701172, + 83.50191497802734, + 68.7996826171875 + ], + "bp_grad_per_sample_l2_med": [ + 7.610249303979799e-05, + 8.31697034300305e-05, + 8.997280383482575e-05, + 9.514019620837644e-05, + 9.370686893817037e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.517578125, + "loss_eval": 1.2884626388549805, + "epoch": 20 + }, + { + "hidden_norms": [ + 142.8061981201172, + 121.41246795654297, + 104.47654724121094, + 86.13514709472656, + 70.62234497070312 + ], + "bp_grad_per_sample_l2_med": [ + 7.287831977009773e-05, + 7.990973244886845e-05, + 8.473258640151471e-05, + 9.054663678398356e-05, + 9.23949119169265e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5498046875, + "loss_eval": 1.2458946704864502, + "epoch": 21 + }, + { + "hidden_norms": [ + 145.03463745117188, + 124.42599487304688, + 105.64387512207031, + 87.60891723632812, + 71.11911010742188 + ], + "bp_grad_per_sample_l2_med": [ + 6.878219573991373e-05, + 7.463164365617558e-05, + 7.942628144519404e-05, + 8.418951620114967e-05, + 8.709819667274132e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5654296875, + "loss_eval": 1.2031928300857544, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.368896484375, + 124.08200073242188, + 106.14088439941406, + 87.3053970336914, + 70.22563171386719 + ], + "bp_grad_per_sample_l2_med": [ + 6.987902452237904e-05, + 7.564797124359757e-05, + 8.058137609623373e-05, + 8.513103239238262e-05, + 8.664488268550485e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5830078125, + "loss_eval": 1.2048817873001099, + "epoch": 23 + }, + { + "hidden_norms": [ + 149.82542419433594, + 127.8211898803711, + 109.31559753417969, + 88.96003723144531, + 71.56672668457031 + ], + "bp_grad_per_sample_l2_med": [ + 7.123420073185116e-05, + 7.683804142288864e-05, + 8.418370271101594e-05, + 8.922854613047093e-05, + 8.777298353379592e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5654296875, + "loss_eval": 1.2408947944641113, + "epoch": 24 + }, + { + "hidden_norms": [ + 151.1898193359375, + 128.61166381835938, + 110.0819320678711, + 89.33537292480469, + 70.91573333740234 + ], + "bp_grad_per_sample_l2_med": [ + 7.046251994324848e-05, + 7.593455666210502e-05, + 8.183503086911514e-05, + 8.78809587447904e-05, + 8.738410542719066e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5849609375, + "loss_eval": 1.2345162630081177, + "epoch": 25 + }, + { + "hidden_norms": [ + 153.0899200439453, + 130.6381072998047, + 110.78546905517578, + 90.43073272705078, + 72.28581237792969 + ], + "bp_grad_per_sample_l2_med": [ + 7.224789442261681e-05, + 7.864048529881984e-05, + 8.493732457282022e-05, + 9.218508785124868e-05, + 9.127514931606129e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.548828125, + "loss_eval": 1.234302282333374, + "epoch": 26 + }, + { + "hidden_norms": [ + 156.78964233398438, + 132.35365295410156, + 114.26016998291016, + 93.03483581542969, + 73.8830337524414 + ], + "bp_grad_per_sample_l2_med": [ + 7.004363578744233e-05, + 7.51781408325769e-05, + 8.189951768144965e-05, + 8.64862377056852e-05, + 8.457603689748794e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.226435661315918, + "epoch": 27 + }, + { + "hidden_norms": [ + 154.7094268798828, + 132.68295288085938, + 112.78950500488281, + 91.68452453613281, + 72.69532012939453 + ], + "bp_grad_per_sample_l2_med": [ + 6.871543155284598e-05, + 7.408537931041792e-05, + 7.912247383501381e-05, + 8.584219176555052e-05, + 8.712658018339425e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.186962604522705, + "epoch": 28 + }, + { + "hidden_norms": [ + 156.5343475341797, + 133.95303344726562, + 113.44208526611328, + 91.55599212646484, + 72.66578674316406 + ], + "bp_grad_per_sample_l2_med": [ + 6.697547360090539e-05, + 7.314077083719894e-05, + 7.949489372549579e-05, + 8.466470171697438e-05, + 8.366732799913734e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.1845954656600952, + "epoch": 29 + }, + { + "hidden_norms": [ + 158.63601684570312, + 134.8338165283203, + 115.27066802978516, + 93.78146362304688, + 72.8468017578125 + ], + "bp_grad_per_sample_l2_med": [ + 6.742558616679162e-05, + 7.408189412672073e-05, + 7.9598423326388e-05, + 8.415436604991555e-05, + 8.754149166634306e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.208282470703125, + "epoch": 30 + }, + { + "hidden_norms": [ + 158.21023559570312, + 136.07545471191406, + 116.15364837646484, + 93.98001098632812, + 73.68004608154297 + ], + "bp_grad_per_sample_l2_med": [ + 7.207741873571649e-05, + 7.860636833356693e-05, + 8.520736446371302e-05, + 9.168307587970048e-05, + 8.956313104135916e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.2018094062805176, + "epoch": 31 + }, + { + "hidden_norms": [ + 160.46771240234375, + 136.1265411376953, + 116.0124282836914, + 93.3584976196289, + 73.7890396118164 + ], + "bp_grad_per_sample_l2_med": [ + 7.191704207798466e-05, + 7.717879634583369e-05, + 8.299856563098729e-05, + 8.967710164142773e-05, + 8.699094178155065e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1889103651046753, + "epoch": 32 + }, + { + "hidden_norms": [ + 160.90545654296875, + 137.0214080810547, + 115.83223724365234, + 94.28914642333984, + 73.96448516845703 + ], + "bp_grad_per_sample_l2_med": [ + 7.10546228219755e-05, + 7.790922973072156e-05, + 8.321165660163388e-05, + 8.87274945853278e-05, + 8.640237501822412e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1516971588134766, + "epoch": 33 + }, + { + "hidden_norms": [ + 163.9844207763672, + 138.9420166015625, + 118.25187683105469, + 94.9247817993164, + 73.99342346191406 + ], + "bp_grad_per_sample_l2_med": [ + 7.05249622114934e-05, + 7.705103053012863e-05, + 8.39303684188053e-05, + 8.84484761627391e-05, + 8.569705096306279e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1713684797286987, + "epoch": 34 + }, + { + "hidden_norms": [ + 162.2567596435547, + 139.536376953125, + 118.07953643798828, + 96.10607147216797, + 75.22054290771484 + ], + "bp_grad_per_sample_l2_med": [ + 6.98907533660531e-05, + 7.564698171336204e-05, + 8.246934885391966e-05, + 8.673300180817023e-05, + 8.65447727846913e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1986680030822754, + "epoch": 35 + }, + { + "hidden_norms": [ + 163.85494995117188, + 140.6683807373047, + 120.20167541503906, + 96.79766845703125, + 74.6565933227539 + ], + "bp_grad_per_sample_l2_med": [ + 6.933045369805768e-05, + 7.555640331702307e-05, + 8.187161438399926e-05, + 8.634777623228729e-05, + 8.516138041159138e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58203125, + "loss_eval": 1.17092764377594, + "epoch": 36 + }, + { + "hidden_norms": [ + 163.91464233398438, + 141.8627166748047, + 120.35345458984375, + 96.861083984375, + 74.91275024414062 + ], + "bp_grad_per_sample_l2_med": [ + 6.821981514804065e-05, + 7.462653593393043e-05, + 7.9863122664392e-05, + 8.513165812473744e-05, + 8.408474968746305e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1603121757507324, + "epoch": 37 + }, + { + "hidden_norms": [ + 166.6566162109375, + 142.48072814941406, + 120.16492462158203, + 96.4870376586914, + 75.0911636352539 + ], + "bp_grad_per_sample_l2_med": [ + 6.862134614493698e-05, + 7.509759598178789e-05, + 8.221028838306665e-05, + 8.709747635293752e-05, + 8.625433838460594e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.163398027420044, + "epoch": 38 + }, + { + "hidden_norms": [ + 165.2766571044922, + 140.6273193359375, + 119.01939392089844, + 96.45698547363281, + 74.86931610107422 + ], + "bp_grad_per_sample_l2_med": [ + 6.741421384504065e-05, + 7.467559044016525e-05, + 8.113843068713322e-05, + 8.498551324009895e-05, + 8.365403482457623e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1174335479736328, + "epoch": 39 + }, + { + "hidden_norms": [ + 166.8720703125, + 141.94195556640625, + 119.73834228515625, + 96.83306884765625, + 75.50749206542969 + ], + "bp_grad_per_sample_l2_med": [ + 6.83375183143653e-05, + 7.506174733862281e-05, + 8.1863887317013e-05, + 8.717682067072019e-05, + 8.521847485098988e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.128427267074585, + "epoch": 40 + }, + { + "hidden_norms": [ + 166.10345458984375, + 140.8309783935547, + 119.59312438964844, + 96.5144271850586, + 75.01549530029297 + ], + "bp_grad_per_sample_l2_med": [ + 7.117655331967399e-05, + 7.808134250808507e-05, + 8.549879566999152e-05, + 9.121275070356205e-05, + 8.961764251580462e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1407405138015747, + "epoch": 41 + }, + { + "hidden_norms": [ + 168.5572052001953, + 144.19313049316406, + 121.29338836669922, + 98.18904113769531, + 75.74433898925781 + ], + "bp_grad_per_sample_l2_med": [ + 7.024689693935215e-05, + 7.835906581021845e-05, + 8.28477568575181e-05, + 8.988843183033168e-05, + 9.142952330876142e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.188612699508667, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.82464599609375, + 142.2963104248047, + 120.96216583251953, + 98.01409149169922, + 76.0032730102539 + ], + "bp_grad_per_sample_l2_med": [ + 7.296045077964664e-05, + 7.839543832233176e-05, + 8.31817596917972e-05, + 9.021619916893542e-05, + 8.68452261784114e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1675610542297363, + "epoch": 43 + }, + { + "hidden_norms": [ + 168.66015625, + 143.3383026123047, + 121.46915435791016, + 97.43902587890625, + 75.26473236083984 + ], + "bp_grad_per_sample_l2_med": [ + 7.207799353636801e-05, + 8.018259541131556e-05, + 8.563740993849933e-05, + 9.22580948099494e-05, + 9.03013497008942e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1672401428222656, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.55662536621094, + 142.82704162597656, + 120.73102569580078, + 96.30245971679688, + 74.20568084716797 + ], + "bp_grad_per_sample_l2_med": [ + 7.172006007749587e-05, + 7.97949469415471e-05, + 8.564699237467721e-05, + 9.092836262425408e-05, + 9.031151421368122e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1739519834518433, + "epoch": 45 + }, + { + "hidden_norms": [ + 169.05859375, + 143.376953125, + 122.22779083251953, + 98.1865234375, + 75.46460723876953 + ], + "bp_grad_per_sample_l2_med": [ + 7.164492853917181e-05, + 8.059864194365218e-05, + 8.811463339952752e-05, + 9.420064452569932e-05, + 9.068247891264036e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1654919385910034, + "epoch": 46 + }, + { + "hidden_norms": [ + 167.85174560546875, + 143.98324584960938, + 121.09931945800781, + 97.61621856689453, + 75.3441390991211 + ], + "bp_grad_per_sample_l2_med": [ + 7.121654198272154e-05, + 7.876066229073331e-05, + 8.58678831718862e-05, + 9.374372893944383e-05, + 8.886006980901584e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6015625, + "loss_eval": 1.1619040966033936, + "epoch": 47 + }, + { + "hidden_norms": [ + 169.16136169433594, + 144.1681671142578, + 121.65021514892578, + 97.65489959716797, + 75.40325927734375 + ], + "bp_grad_per_sample_l2_med": [ + 7.085441029630601e-05, + 7.872789865359664e-05, + 8.54654426802881e-05, + 9.159239561995491e-05, + 8.735150913707912e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1553215980529785, + "epoch": 48 + }, + { + "hidden_norms": [ + 170.07469177246094, + 144.21502685546875, + 122.42488098144531, + 97.60433959960938, + 75.30228424072266 + ], + "bp_grad_per_sample_l2_med": [ + 7.460799679392949e-05, + 8.310206612804905e-05, + 8.914316276786849e-05, + 9.709167352411896e-05, + 9.34089912334457e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5947265625, + "loss_eval": 1.1511603593826294, + "epoch": 49 + }, + { + "hidden_norms": [ + 169.58541870117188, + 143.38230895996094, + 121.96705627441406, + 97.77040100097656, + 74.732177734375 + ], + "bp_grad_per_sample_l2_med": [ + 7.605904102092609e-05, + 8.306169183924794e-05, + 9.093777771340683e-05, + 9.604891965864226e-05, + 9.101478644879535e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.583984375, + "loss_eval": 1.150202751159668, + "epoch": 50 + }, + { + "hidden_norms": [ + 169.28955078125, + 143.6193084716797, + 122.43891906738281, + 97.91162109375, + 75.27656555175781 + ], + "bp_grad_per_sample_l2_med": [ + 7.325071055674925e-05, + 8.037279621930793e-05, + 8.85110639501363e-05, + 9.169802797259763e-05, + 8.926681766752154e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.1172325611114502, + "epoch": 51 + }, + { + "hidden_norms": [ + 170.01052856445312, + 143.45779418945312, + 122.65426635742188, + 98.24798583984375, + 75.68919372558594 + ], + "bp_grad_per_sample_l2_med": [ + 7.252323121065274e-05, + 8.011860336409882e-05, + 8.620596781838685e-05, + 9.34487470658496e-05, + 9.04093321878463e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1147592067718506, + "epoch": 52 + }, + { + "hidden_norms": [ + 168.67430114746094, + 143.25802612304688, + 119.88789367675781, + 96.92530822753906, + 74.42180633544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.410924445139244e-05, + 8.137265831464902e-05, + 8.864435949362814e-05, + 9.472777310293168e-05, + 9.015527029987425e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.625, + "loss_eval": 1.1209393739700317, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.25973510742188, + 142.8248291015625, + 120.75433349609375, + 96.85049438476562, + 74.96371459960938 + ], + "bp_grad_per_sample_l2_med": [ + 7.351540989475325e-05, + 8.063198038144037e-05, + 8.647661161376163e-05, + 9.411892096977681e-05, + 9.352037159260362e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1025673151016235, + "epoch": 54 + }, + { + "hidden_norms": [ + 170.8097381591797, + 143.562744140625, + 121.1410903930664, + 97.70262145996094, + 75.55540466308594 + ], + "bp_grad_per_sample_l2_med": [ + 7.382583135040477e-05, + 8.104312291834503e-05, + 8.895712380763143e-05, + 9.191031131194904e-05, + 8.924967551138252e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1013734340667725, + "epoch": 55 + }, + { + "hidden_norms": [ + 169.41827392578125, + 143.60491943359375, + 119.79347229003906, + 96.5761947631836, + 74.94788360595703 + ], + "bp_grad_per_sample_l2_med": [ + 7.506331166950986e-05, + 8.308376709464937e-05, + 9.05599954421632e-05, + 9.552844858262688e-05, + 9.322594269178808e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1202704906463623, + "epoch": 56 + }, + { + "hidden_norms": [ + 169.0540008544922, + 144.03970336914062, + 121.87033081054688, + 98.80317687988281, + 76.42084503173828 + ], + "bp_grad_per_sample_l2_med": [ + 7.446128438459709e-05, + 8.153915405273438e-05, + 8.840708323987201e-05, + 9.388235048390925e-05, + 9.186066017718986e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.1205706596374512, + "epoch": 57 + }, + { + "hidden_norms": [ + 168.36595153808594, + 141.80178833007812, + 120.2418212890625, + 96.8748779296875, + 75.01248168945312 + ], + "bp_grad_per_sample_l2_med": [ + 7.731275400146842e-05, + 8.405288099311292e-05, + 9.186116949422285e-05, + 9.942329052137211e-05, + 9.51286856434308e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1108977794647217, + "epoch": 58 + }, + { + "hidden_norms": [ + 169.39569091796875, + 142.4537353515625, + 120.81804656982422, + 97.19158172607422, + 75.20236206054688 + ], + "bp_grad_per_sample_l2_med": [ + 7.883378566475585e-05, + 8.777670154813677e-05, + 9.416328248335049e-05, + 0.00010057339386548847, + 9.685986879048869e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1141078472137451, + "epoch": 59 + }, + { + "hidden_norms": [ + 169.97256469726562, + 143.7432098388672, + 121.0943832397461, + 97.53318786621094, + 75.44910430908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.617164374096319e-05, + 8.471525507047772e-05, + 9.014597890200093e-05, + 9.796666563488543e-05, + 9.110565588343889e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0869580507278442, + "epoch": 60 + }, + { + "hidden_norms": [ + 168.3030242919922, + 142.93931579589844, + 120.8933334350586, + 97.99317932128906, + 75.29071044921875 + ], + "bp_grad_per_sample_l2_med": [ + 7.692870713071898e-05, + 8.63347522681579e-05, + 9.28592708078213e-05, + 9.994371794164181e-05, + 9.114396380027756e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6357421875, + "loss_eval": 1.102014183998108, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.24777221679688, + 142.03550720214844, + 120.25982666015625, + 97.82561492919922, + 75.54430389404297 + ], + "bp_grad_per_sample_l2_med": [ + 7.734074461041018e-05, + 8.487069862894714e-05, + 9.25088970689103e-05, + 9.827558096731082e-05, + 9.154371218755841e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.0736993551254272, + "epoch": 62 + }, + { + "hidden_norms": [ + 168.08807373046875, + 142.24661254882812, + 119.9559555053711, + 96.72630310058594, + 74.6895523071289 + ], + "bp_grad_per_sample_l2_med": [ + 8.049221651162952e-05, + 8.925019210437313e-05, + 9.64810824370943e-05, + 0.00010555233166087419, + 9.567404049448669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.0822858810424805, + "epoch": 63 + }, + { + "hidden_norms": [ + 167.2539825439453, + 141.55946350097656, + 119.37681579589844, + 97.13011169433594, + 75.02286529541016 + ], + "bp_grad_per_sample_l2_med": [ + 7.919344352558255e-05, + 8.567116310587153e-05, + 9.377488458994776e-05, + 9.892786329146475e-05, + 9.566175140207633e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.1096018552780151, + "epoch": 64 + }, + { + "hidden_norms": [ + 168.11643981933594, + 142.01052856445312, + 119.23418426513672, + 96.38211059570312, + 75.08849334716797 + ], + "bp_grad_per_sample_l2_med": [ + 7.787172216922045e-05, + 8.574797539040446e-05, + 9.008680353872478e-05, + 9.943459735950455e-05, + 9.4872091722209e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.1080338954925537, + "epoch": 65 + }, + { + "hidden_norms": [ + 168.09153747558594, + 141.83984375, + 120.16891479492188, + 97.12582397460938, + 74.98177337646484 + ], + "bp_grad_per_sample_l2_med": [ + 7.894716691225767e-05, + 8.66493719513528e-05, + 9.518097795080394e-05, + 0.00010154353367397562, + 9.530662646284327e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1069355010986328, + "epoch": 66 + }, + { + "hidden_norms": [ + 167.35382080078125, + 142.33642578125, + 120.0411148071289, + 96.53257751464844, + 75.0328598022461 + ], + "bp_grad_per_sample_l2_med": [ + 7.973265019245446e-05, + 8.856245403876528e-05, + 9.601243800716475e-05, + 0.00010215263318968937, + 9.676075569586828e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.100548505783081, + "epoch": 67 + }, + { + "hidden_norms": [ + 167.418701171875, + 140.93800354003906, + 119.4802017211914, + 96.3717269897461, + 74.67574310302734 + ], + "bp_grad_per_sample_l2_med": [ + 8.022025576792657e-05, + 8.782520308159292e-05, + 9.638317715143785e-05, + 0.0001046421384671703, + 9.856691031018272e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1227837800979614, + "epoch": 68 + }, + { + "hidden_norms": [ + 166.9136962890625, + 140.45266723632812, + 119.06848907470703, + 95.9060287475586, + 74.79631042480469 + ], + "bp_grad_per_sample_l2_med": [ + 7.995362102519721e-05, + 8.583935414208099e-05, + 9.508246148470789e-05, + 0.00010096231562783942, + 9.634289017412812e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1006299257278442, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.4694366455078, + 139.69601440429688, + 117.53054809570312, + 95.05348205566406, + 74.65673065185547 + ], + "bp_grad_per_sample_l2_med": [ + 7.79753245296888e-05, + 8.487935701850802e-05, + 9.169900295091793e-05, + 9.879520075628534e-05, + 9.398034308105707e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.0988688468933105, + "epoch": 70 + }, + { + "hidden_norms": [ + 165.3974609375, + 139.54141235351562, + 117.3493881225586, + 94.9970474243164, + 74.31880187988281 + ], + "bp_grad_per_sample_l2_med": [ + 7.893131260061637e-05, + 8.71433803695254e-05, + 9.492320532444865e-05, + 0.00010128845315193757, + 9.578587196301669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6484375, + "loss_eval": 1.0860004425048828, + "epoch": 71 + }, + { + "hidden_norms": [ + 165.16651916503906, + 138.63233947753906, + 117.15692138671875, + 94.41555786132812, + 74.16561889648438 + ], + "bp_grad_per_sample_l2_med": [ + 8.611902012489736e-05, + 9.412867802893743e-05, + 0.0001005554513540119, + 0.00010507499246159568, + 0.00010004997602663934 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.0985480546951294, + "epoch": 72 + }, + { + "hidden_norms": [ + 166.48802185058594, + 139.67433166503906, + 117.13744354248047, + 94.41883087158203, + 74.25392150878906 + ], + "bp_grad_per_sample_l2_med": [ + 8.272679406218231e-05, + 9.101553587242961e-05, + 9.994471474783495e-05, + 0.00010372102406108752, + 9.65072977123782e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1026251316070557, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.66531372070312, + 138.62359619140625, + 117.72949981689453, + 95.40411376953125, + 74.5541763305664 + ], + "bp_grad_per_sample_l2_med": [ + 8.516917296219617e-05, + 9.385120938532054e-05, + 0.00010402742918813601, + 0.00010775420378195122, + 0.00010169474262511358 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6298828125, + "loss_eval": 1.1083872318267822, + "epoch": 74 + }, + { + "hidden_norms": [ + 164.67889404296875, + 138.3468017578125, + 116.61951446533203, + 93.94100952148438, + 74.09746551513672 + ], + "bp_grad_per_sample_l2_med": [ + 8.641117165097967e-05, + 9.53027411014773e-05, + 0.0001029834384098649, + 0.0001086485426640138, + 0.0001005055892164819 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.1155339479446411, + "epoch": 75 + }, + { + "hidden_norms": [ + 164.2607421875, + 138.0647735595703, + 116.18480682373047, + 93.95038604736328, + 73.88935089111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.567768963985145e-05, + 9.307480650022626e-05, + 9.939757728716359e-05, + 0.00010579575609881431, + 9.849719936028123e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.1126312017440796, + "epoch": 76 + }, + { + "hidden_norms": [ + 163.9792938232422, + 137.88185119628906, + 116.34628295898438, + 93.93537139892578, + 73.83805084228516 + ], + "bp_grad_per_sample_l2_med": [ + 8.795045869192109e-05, + 9.678495553089306e-05, + 0.00010362159082433209, + 0.0001105417322833091, + 0.00010525066318223253 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.110876202583313, + "epoch": 77 + }, + { + "hidden_norms": [ + 164.1384735107422, + 137.82691955566406, + 115.94445037841797, + 94.01095581054688, + 73.68436431884766 + ], + "bp_grad_per_sample_l2_med": [ + 8.610311488155276e-05, + 9.507987851975486e-05, + 0.00010208813182543963, + 0.00010807226499309763, + 0.00010176940850215033 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1176977157592773, + "epoch": 78 + }, + { + "hidden_norms": [ + 163.91049194335938, + 136.9142608642578, + 115.37925720214844, + 93.2219009399414, + 73.2654800415039 + ], + "bp_grad_per_sample_l2_med": [ + 8.745997183723375e-05, + 9.566589869791642e-05, + 0.00010251311323372647, + 0.00011129804624943063, + 0.0001056971013895236 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1140623092651367, + "epoch": 79 + }, + { + "hidden_norms": [ + 163.40182495117188, + 137.21026611328125, + 115.46720123291016, + 93.46426391601562, + 73.12786102294922 + ], + "bp_grad_per_sample_l2_med": [ + 8.96864221431315e-05, + 9.8639284260571e-05, + 0.0001043426527758129, + 0.00010869379184441641, + 0.00010685920278774574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.1114736795425415, + "epoch": 80 + }, + { + "hidden_norms": [ + 163.22100830078125, + 136.5157012939453, + 115.2002944946289, + 93.15667724609375, + 73.07371520996094 + ], + "bp_grad_per_sample_l2_med": [ + 8.870210876921192e-05, + 9.846940520219505e-05, + 0.0001080361835192889, + 0.0001128382355091162, + 0.00010244990698993206 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1125456094741821, + "epoch": 81 + }, + { + "hidden_norms": [ + 163.21449279785156, + 136.63999938964844, + 114.51496124267578, + 92.76043701171875, + 73.22138214111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.551862265449017e-05, + 9.3683076556772e-05, + 0.00010453341383254156, + 0.00010722207662183791, + 0.00010129058500751853 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.0996887683868408, + "epoch": 82 + }, + { + "hidden_norms": [ + 162.75770568847656, + 136.49710083007812, + 114.6112060546875, + 92.87682342529297, + 73.25039672851562 + ], + "bp_grad_per_sample_l2_med": [ + 8.870910096447915e-05, + 9.74184149526991e-05, + 0.00010446018859511241, + 0.00011418589565437287, + 0.00010412647679913789 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1063097715377808, + "epoch": 83 + }, + { + "hidden_norms": [ + 163.11697387695312, + 136.4162139892578, + 114.9229507446289, + 93.17060089111328, + 73.40281677246094 + ], + "bp_grad_per_sample_l2_med": [ + 8.790192077867687e-05, + 9.763163689058274e-05, + 0.00010599731467664242, + 0.00011016600910807028, + 0.00010507069964660332 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1009955406188965, + "epoch": 84 + }, + { + "hidden_norms": [ + 162.4318389892578, + 136.2643280029297, + 114.47940826416016, + 92.43824005126953, + 72.75123596191406 + ], + "bp_grad_per_sample_l2_med": [ + 8.680798055138439e-05, + 9.524248889647424e-05, + 0.00010346775525249541, + 0.00010771532106446102, + 0.00010157373617403209 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.106760025024414, + "epoch": 85 + }, + { + "hidden_norms": [ + 162.55992126464844, + 136.00660705566406, + 114.44908142089844, + 92.65226745605469, + 73.14122772216797 + ], + "bp_grad_per_sample_l2_med": [ + 8.55888138175942e-05, + 9.422176663065329e-05, + 0.00010130204464076087, + 0.0001082807284547016, + 0.00010286335600540042 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1080232858657837, + "epoch": 86 + }, + { + "hidden_norms": [ + 162.33607482910156, + 136.22657775878906, + 114.64276885986328, + 92.26687622070312, + 72.99312591552734 + ], + "bp_grad_per_sample_l2_med": [ + 9.005892934510484e-05, + 9.746963041834533e-05, + 0.00010383747576270252, + 0.00010905141971306875, + 0.00010293527157045901 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.0989083051681519, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.69874572753906, + 135.9654998779297, + 113.88583374023438, + 91.72888946533203, + 72.5824966430664 + ], + "bp_grad_per_sample_l2_med": [ + 9.02136744116433e-05, + 9.903020691126585e-05, + 0.0001059234855347313, + 0.00011399909999454394, + 0.00010543780081206933 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1039698123931885, + "epoch": 88 + }, + { + "hidden_norms": [ + 162.3827362060547, + 136.0760498046875, + 114.07840728759766, + 91.95870971679688, + 72.59473419189453 + ], + "bp_grad_per_sample_l2_med": [ + 9.043919999385253e-05, + 9.950586536433548e-05, + 0.00010800046584336087, + 0.00011628754145931453, + 0.00010360861051594839 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1007411479949951, + "epoch": 89 + }, + { + "hidden_norms": [ + 161.50054931640625, + 135.7166748046875, + 113.83382415771484, + 91.96630096435547, + 72.61833953857422 + ], + "bp_grad_per_sample_l2_med": [ + 9.075389243662357e-05, + 9.988105011871085e-05, + 0.00010788880899781361, + 0.00011431374150561169, + 0.00010596351057756692 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.64453125, + "loss_eval": 1.0992103815078735, + "epoch": 90 + }, + { + "hidden_norms": [ + 161.48770141601562, + 135.71417236328125, + 114.12840270996094, + 91.98160552978516, + 72.64606475830078 + ], + "bp_grad_per_sample_l2_med": [ + 9.050803782884032e-05, + 9.805837908061221e-05, + 0.00010800142626976594, + 0.00011649157386273146, + 0.00010660875705070794 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.1021543741226196, + "epoch": 91 + }, + { + "hidden_norms": [ + 162.0372314453125, + 135.4561767578125, + 114.00292205810547, + 91.83483123779297, + 72.68809509277344 + ], + "bp_grad_per_sample_l2_med": [ + 8.82204039953649e-05, + 9.769284224603325e-05, + 0.00010632916382746771, + 0.00011439422814873978, + 0.00010489066335139796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1001535654067993, + "epoch": 92 + }, + { + "hidden_norms": [ + 161.88534545898438, + 135.54629516601562, + 113.90684509277344, + 91.81143188476562, + 72.64588165283203 + ], + "bp_grad_per_sample_l2_med": [ + 9.120439790422097e-05, + 9.779920219443738e-05, + 0.00010798833682201803, + 0.00011447365250205621, + 0.00010797424329211935 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.0961315631866455, + "epoch": 93 + }, + { + "hidden_norms": [ + 162.06427001953125, + 135.49281311035156, + 113.69275665283203, + 91.76304626464844, + 72.4867935180664 + ], + "bp_grad_per_sample_l2_med": [ + 9.100054739974439e-05, + 9.935065463650972e-05, + 0.00010879126784857363, + 0.00011589765199460089, + 0.00010837834270205349 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.097299337387085, + "epoch": 94 + }, + { + "hidden_norms": [ + 162.06063842773438, + 135.57981872558594, + 113.76399230957031, + 91.94515991210938, + 72.56278991699219 + ], + "bp_grad_per_sample_l2_med": [ + 9.139141184277833e-05, + 9.897649579215795e-05, + 0.00010867504897760227, + 0.0001159063758677803, + 0.00010943930828943849 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6376953125, + "loss_eval": 1.0986907482147217, + "epoch": 95 + }, + { + "hidden_norms": [ + 161.8842315673828, + 135.4130859375, + 113.66045379638672, + 91.80276489257812, + 72.58989715576172 + ], + "bp_grad_per_sample_l2_med": [ + 9.080857125809416e-05, + 0.00010123007814399898, + 0.00010883246432058513, + 0.00011908033775398508, + 0.00010963032400468364 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0988240242004395, + "epoch": 96 + }, + { + "hidden_norms": [ + 161.86744689941406, + 135.38331604003906, + 113.66378784179688, + 91.70223236083984, + 72.4896240234375 + ], + "bp_grad_per_sample_l2_med": [ + 9.091695392271504e-05, + 0.00010080484207719564, + 0.00010940106585621834, + 0.00011762498616008088, + 0.00010917771578533575 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0987744331359863, + "epoch": 97 + }, + { + "hidden_norms": [ + 161.89633178710938, + 135.33140563964844, + 113.67347717285156, + 91.68895721435547, + 72.49469757080078 + ], + "bp_grad_per_sample_l2_med": [ + 9.099576709559187e-05, + 0.00010038664186140522, + 0.0001086170959752053, + 0.00011788319534389302, + 0.00010914496670011431 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0990701913833618, + "epoch": 98 + }, + { + "hidden_norms": [ + 161.9002227783203, + 135.33474731445312, + 113.68601989746094, + 91.69290924072266, + 72.48957061767578 + ], + "bp_grad_per_sample_l2_med": [ + 9.096309076994658e-05, + 0.00010059915803140029, + 0.00010838409070856869, + 0.00011784962407546118, + 0.00010893247235799208 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.098876953125, + "epoch": 99 + }, + { + "hidden_norms": [ + 161.8989715576172, + 135.33889770507812, + 113.69281768798828, + 91.6856689453125, + 72.48480224609375 + ], + "bp_grad_per_sample_l2_med": [ + 9.085259807761759e-05, + 0.00010061707871500403, + 0.00010823038610396907, + 0.00011745247320504859, + 0.00010919221676886082 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0987944602966309, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005465824506245553, + 0.0005437708459794521, + 0.0005393712199293077, + 0.0005331890424713492, + 0.0005310169071890414 + ], + "gamma_dfa": 0.007568402143078856, + "gamma_dfa_per_layer": [ + 0.002326551591977477, + 0.0009101498289965093, + -0.013218702748417854, + 0.04025560989975929 + ], + "acc_eval": 0.1015625, + "loss_eval": 2.3754236698150635, + "epoch": 0 + }, + { + "hidden_norms": [ + 536.5761108398438, + 845.265625, + 979.7896118164062, + 1192.0323486328125, + 1230.83935546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006465085316449404, + 0.0006462159799411893, + 0.0006460825679823756, + 0.0006459451396949589, + 0.0006460213917307556 + ], + "gamma_dfa": 0.013024769607000053, + "gamma_dfa_per_layer": [ + 0.035579413175582886, + -0.0025600260123610497, + -0.0014369464479386806, + 0.020516637712717056 + ], + "acc_eval": 0.212890625, + "loss_eval": 8.137651443481445, + "epoch": 1 + }, + { + "hidden_norms": [ + 886.7508544921875, + 1871.2640380859375, + 2198.631591796875, + 2689.22412109375, + 2904.254150390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007187994197010994, + 0.0007172312471084297, + 0.0007172476034611464, + 0.0007177897496148944, + 0.000717311049811542 + ], + "gamma_dfa": 0.004487544531002641, + "gamma_dfa_per_layer": [ + 0.04744107276201248, + -0.011962954886257648, + -0.02088175155222416, + 0.003353811800479889 + ], + "acc_eval": 0.203125, + "loss_eval": 16.637451171875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1117.1649169921875, + 3064.644775390625, + 3849.060546875, + 4987.09130859375, + 5690.720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000734492321498692, + 0.0007317167473956943, + 0.0007317643612623215, + 0.0007318624993786216, + 0.0007319750147871673 + ], + "gamma_dfa": 0.0065072893630713224, + "gamma_dfa_per_layer": [ + 0.0597357451915741, + -0.0063293795101344585, + -0.033218011260032654, + 0.0058408030308783054 + ], + "acc_eval": 0.224609375, + "loss_eval": 29.753459930419922, + "epoch": 3 + }, + { + "hidden_norms": [ + 1279.7017822265625, + 4015.093017578125, + 5594.23828125, + 7459.69091796875, + 8727.64453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007434640428982675, + 0.0007419881876558065, + 0.0007416673470288515, + 0.000741377065423876, + 0.0007413675775751472 + ], + "gamma_dfa": 0.0072651703376322985, + "gamma_dfa_per_layer": [ + 0.07467889785766602, + -0.02277005836367607, + -0.009787362068891525, + -0.013060796074569225 + ], + "acc_eval": 0.1640625, + "loss_eval": 54.22368621826172, + "epoch": 4 + }, + { + "hidden_norms": [ + 1399.06787109375, + 4862.35302734375, + 9250.7666015625, + 10789.8828125, + 12902.6591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007491935975849628, + 0.0007442779606208205, + 0.0007423132774420083, + 0.0007422835915349424, + 0.0007422153139486909 + ], + "gamma_dfa": -0.005301014054566622, + "gamma_dfa_per_layer": [ + 0.06516245007514954, + -0.03411812335252762, + -0.034175027161836624, + -0.01807335577905178 + ], + "acc_eval": 0.2080078125, + "loss_eval": 62.78772735595703, + "epoch": 5 + }, + { + "hidden_norms": [ + 1478.1070556640625, + 5865.33935546875, + 15407.5283203125, + 16717.609375, + 19284.30078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000746070989407599, + 0.0007320672739297152, + 0.0007320406148210168, + 0.0007324790931306779, + 0.0007322196033783257 + ], + "gamma_dfa": -0.0043716938234865665, + "gamma_dfa_per_layer": [ + 0.0889529138803482, + -0.03475068882107735, + -0.06096648424863815, + -0.010722516104578972 + ], + "acc_eval": 0.21875, + "loss_eval": 84.72342681884766, + "epoch": 6 + }, + { + "hidden_norms": [ + 1569.764892578125, + 7991.109375, + 22041.46484375, + 23657.2890625, + 27372.69140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007371728424914181, + 0.0007328476058319211, + 0.0007317248382605612, + 0.0007321859593503177, + 0.0007314819958992302 + ], + "gamma_dfa": -0.006586531409993768, + "gamma_dfa_per_layer": [ + 0.08020298182964325, + -0.038106564432382584, + -0.05412164330482483, + -0.014320899732410908 + ], + "acc_eval": 0.21484375, + "loss_eval": 87.40310668945312, + "epoch": 7 + }, + { + "hidden_norms": [ + 1649.8133544921875, + 12248.005859375, + 30825.916015625, + 32827.55078125, + 38153.3828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007630810141563416, + 0.0007434195140376687, + 0.0007433100836351514, + 0.0007435025763697922, + 0.0007434298167936504 + ], + "gamma_dfa": -0.0035092607140541077, + "gamma_dfa_per_layer": [ + 0.1012866348028183, + -0.029570601880550385, + -0.04660683125257492, + -0.039146244525909424 + ], + "acc_eval": 0.1708984375, + "loss_eval": 157.51614379882812, + "epoch": 8 + }, + { + "hidden_norms": [ + 1712.73193359375, + 20302.939453125, + 43360.37109375, + 46000.90234375, + 53154.84765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007849909015931189, + 0.0007540763472206891, + 0.0007541946833953261, + 0.0007542177918367088, + 0.0007542550447396934 + ], + "gamma_dfa": 0.006478439085185528, + "gamma_dfa_per_layer": [ + 0.1487787812948227, + -0.03583626449108124, + -0.0212298221886158, + -0.06579893827438354 + ], + "acc_eval": 0.138671875, + "loss_eval": 512.7744750976562, + "epoch": 9 + }, + { + "hidden_norms": [ + 1763.957763671875, + 29818.015625, + 57092.5546875, + 60514.234375, + 69695.1015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00080581457586959, + 0.0007400442264042795, + 0.0007398677407763898, + 0.0007363590411841869, + 0.0007358043803833425 + ], + "gamma_dfa": -0.003822646103799343, + "gamma_dfa_per_layer": [ + 0.1044168770313263, + -0.0318819060921669, + -0.054846249520778656, + -0.03297930583357811 + ], + "acc_eval": 0.203125, + "loss_eval": 288.6083984375, + "epoch": 10 + }, + { + "hidden_norms": [ + 1841.6363525390625, + 43646.69921875, + 76665.53125, + 80991.453125, + 91946.4765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008064995636232197, + 0.0007405033684335649, + 0.0007410499965772033, + 0.0007410682155750692, + 0.0007410107646137476 + ], + "gamma_dfa": -0.005903353448957205, + "gamma_dfa_per_layer": [ + 0.15344271063804626, + -0.06077828258275986, + -0.0893951952457428, + -0.02688264660537243 + ], + "acc_eval": 0.1630859375, + "loss_eval": 462.175537109375, + "epoch": 11 + }, + { + "hidden_norms": [ + 1938.4581298828125, + 63804.453125, + 101178.828125, + 106970.6171875, + 119676.0390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008472055778838694, + 0.0007312041707336903, + 0.0007307010819204152, + 0.0007308369968086481, + 0.000730738160200417 + ], + "gamma_dfa": 0.015948185697197914, + "gamma_dfa_per_layer": [ + 0.19398558139801025, + -0.05326637625694275, + -0.057601772248744965, + -0.019324690103530884 + ], + "acc_eval": 0.1572265625, + "loss_eval": 481.7687072753906, + "epoch": 12 + }, + { + "hidden_norms": [ + 2059.50390625, + 86267.453125, + 127668.078125, + 134690.953125, + 148832.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008536268142051995, + 0.0007572658942081034, + 0.0007572331232950091, + 0.0007572534959763288, + 0.0007572824251838028 + ], + "gamma_dfa": 0.007115887477993965, + "gamma_dfa_per_layer": [ + 0.19894848763942719, + -0.06199394166469574, + -0.04606857895851135, + -0.06242241710424423 + ], + "acc_eval": 0.162109375, + "loss_eval": 442.7697448730469, + "epoch": 13 + }, + { + "hidden_norms": [ + 2162.650390625, + 111971.2421875, + 158544.5, + 167081.546875, + 183230.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009137325105257332, + 0.0007456843741238117, + 0.0007456432213075459, + 0.0007455914164893329, + 0.0007455993909388781 + ], + "gamma_dfa": 0.008699490688741207, + "gamma_dfa_per_layer": [ + 0.22433382272720337, + -0.07114191353321075, + -0.07720339298248291, + -0.041190553456544876 + ], + "acc_eval": 0.16796875, + "loss_eval": 631.255859375, + "epoch": 14 + }, + { + "hidden_norms": [ + 2287.1767578125, + 140028.015625, + 188737.5625, + 197952.296875, + 214414.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000864461821038276, + 0.0007380775641649961, + 0.0007383264601230621, + 0.000738749688025564, + 0.0007389392121694982 + ], + "gamma_dfa": 0.01581217348575592, + "gamma_dfa_per_layer": [ + 0.21350334584712982, + -0.05864371731877327, + -0.039877790957689285, + -0.051733143627643585 + ], + "acc_eval": 0.1806640625, + "loss_eval": 720.0626220703125, + "epoch": 15 + }, + { + "hidden_norms": [ + 2390.364013671875, + 180786.796875, + 233030.703125, + 243522.09375, + 260648.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010889085242524743, + 0.0007420245674438775, + 0.0007420974434353411, + 0.0007420690963044763, + 0.0007420206675305963 + ], + "gamma_dfa": 0.01692677615210414, + "gamma_dfa_per_layer": [ + 0.22792349755764008, + -0.06613948941230774, + -0.0679212138056755, + -0.026155689731240273 + ], + "acc_eval": 0.1904296875, + "loss_eval": 1348.43115234375, + "epoch": 16 + }, + { + "hidden_norms": [ + 2525.60009765625, + 226341.015625, + 282575.21875, + 294521.5, + 313155.65625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010620173998177052, + 0.0007694299565628171, + 0.0007695311214774847, + 0.0007694744854234159, + 0.000769737409427762 + ], + "gamma_dfa": 0.012939120642840862, + "gamma_dfa_per_layer": [ + 0.24798060953617096, + -0.07888300716876984, + -0.03452270105481148, + -0.0828184187412262 + ], + "acc_eval": 0.1572265625, + "loss_eval": 1277.5867919921875, + "epoch": 17 + }, + { + "hidden_norms": [ + 2738.423828125, + 284434.5625, + 346282.90625, + 359909.125, + 379330.46875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009644942474551499, + 0.0007429496035911143, + 0.0007425086805596948, + 0.0007422671769745648, + 0.0007426248048432171 + ], + "gamma_dfa": 0.02641105931252241, + "gamma_dfa_per_layer": [ + 0.2637922763824463, + -0.06210581958293915, + -0.05640384927392006, + -0.039638370275497437 + ], + "acc_eval": 0.220703125, + "loss_eval": 802.8688354492188, + "epoch": 18 + }, + { + "hidden_norms": [ + 2890.100830078125, + 346858.71875, + 414202.09375, + 429987.3125, + 451374.3125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010854159481823444, + 0.0007560763042420149, + 0.0007561030797660351, + 0.0007562912651337683, + 0.0007561809034086764 + ], + "gamma_dfa": -0.006043614819645882, + "gamma_dfa_per_layer": [ + 0.18550744652748108, + -0.07387037575244904, + -0.0915735587477684, + -0.04423797130584717 + ], + "acc_eval": 0.0927734375, + "loss_eval": 2067.48974609375, + "epoch": 19 + }, + { + "hidden_norms": [ + 3048.9677734375, + 416326.4375, + 488715.9375, + 506779.0, + 528907.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001142722088843584, + 0.0007379497401416302, + 0.0007378923473879695, + 0.0007379662129096687, + 0.0007378893787972629 + ], + "gamma_dfa": 0.020490088500082493, + "gamma_dfa_per_layer": [ + 0.21813809871673584, + -0.053681232035160065, + -0.04219571128487587, + -0.040300801396369934 + ], + "acc_eval": 0.2294921875, + "loss_eval": 1929.7166748046875, + "epoch": 20 + }, + { + "hidden_norms": [ + 3216.734619140625, + 499057.0, + 577401.1875, + 597297.0, + 620542.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014556541573256254, + 0.0007413470884785056, + 0.0007413764833472669, + 0.0007412104168906808, + 0.0007420589681714773 + ], + "gamma_dfa": 0.03948488784953952, + "gamma_dfa_per_layer": [ + 0.27680304646492004, + -0.05157003924250603, + -0.039460550993680954, + -0.02783290483057499 + ], + "acc_eval": 0.1474609375, + "loss_eval": 2699.9052734375, + "epoch": 21 + }, + { + "hidden_norms": [ + 3342.216064453125, + 584495.625, + 665696.625, + 687533.1875, + 710813.9375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001884044730104506, + 0.0007584495469927788, + 0.0007583577535115182, + 0.0007583281840197742, + 0.0007583273691125214 + ], + "gamma_dfa": 0.004080784507095814, + "gamma_dfa_per_layer": [ + 0.1770291030406952, + -0.056366197764873505, + -0.057933274656534195, + -0.046406492590904236 + ], + "acc_eval": 0.2373046875, + "loss_eval": 1742.9925537109375, + "epoch": 22 + }, + { + "hidden_norms": [ + 3566.038818359375, + 674756.3125, + 760463.3125, + 784571.125, + 808618.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.001965342788025737, + 0.0007340435404330492, + 0.0007341310847550631, + 0.0007343373727053404, + 0.0007337987190112472 + ], + "gamma_dfa": 0.030578704085201025, + "gamma_dfa_per_layer": [ + 0.24771088361740112, + -0.05749209225177765, + -0.04569869861006737, + -0.022205276414752007 + ], + "acc_eval": 0.1611328125, + "loss_eval": 2397.3916015625, + "epoch": 23 + }, + { + "hidden_norms": [ + 3779.54296875, + 786509.5, + 877152.1875, + 903987.8125, + 928449.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016364307375624776, + 0.0007935749599710107, + 0.000793365528807044, + 0.0007934189052321017, + 0.0007935216999612749 + ], + "gamma_dfa": 0.01740677817724645, + "gamma_dfa_per_layer": [ + 0.2701166570186615, + -0.0851234570145607, + 0.004913746379315853, + -0.12027983367443085 + ], + "acc_eval": 0.12109375, + "loss_eval": 4908.0458984375, + "epoch": 24 + }, + { + "hidden_norms": [ + 3969.119873046875, + 900145.9375, + 993945.75, + 1023047.9375, + 1047156.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012235429603606462, + 0.0007582573452964425, + 0.0007582195685245097, + 0.000758210604544729, + 0.0007582050748169422 + ], + "gamma_dfa": -0.005556041374802589, + "gamma_dfa_per_layer": [ + 0.2166597992181778, + -0.09299580752849579, + -0.09515514969825745, + -0.05073300749063492 + ], + "acc_eval": 0.1728515625, + "loss_eval": 3738.029541015625, + "epoch": 25 + }, + { + "hidden_norms": [ + 4167.24169921875, + 1027096.125, + 1126300.25, + 1158199.625, + 1183064.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015538743464276195, + 0.0007320540607906878, + 0.0007321767043322325, + 0.0007325086044147611, + 0.0007322292076423764 + ], + "gamma_dfa": 0.013890675269067287, + "gamma_dfa_per_layer": [ + 0.25793927907943726, + -0.09288333356380463, + -0.07571414113044739, + -0.03377910330891609 + ], + "acc_eval": 0.10546875, + "loss_eval": 6202.408203125, + "epoch": 26 + }, + { + "hidden_norms": [ + 4332.73046875, + 1157313.5, + 1261637.875, + 1297158.5, + 1323617.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015948566142469645, + 0.0007783056935295463, + 0.00077825813787058, + 0.0007782406755723059, + 0.0007781987660564482 + ], + "gamma_dfa": 0.02306488621979952, + "gamma_dfa_per_layer": [ + 0.2585013508796692, + -0.07491485029459, + -0.058371271938085556, + -0.03295568376779556 + ], + "acc_eval": 0.208984375, + "loss_eval": 4646.37451171875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4508.3486328125, + 1310938.125, + 1421261.875, + 1460382.75, + 1487384.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001599438488483429, + 0.0007645513396710157, + 0.0007644708384759724, + 0.00076470518251881, + 0.0007645483710803092 + ], + "gamma_dfa": 0.017900947481393814, + "gamma_dfa_per_layer": [ + 0.24153774976730347, + -0.06473007053136826, + -0.06562119722366333, + -0.039582692086696625 + ], + "acc_eval": 0.173828125, + "loss_eval": 5292.640625, + "epoch": 28 + }, + { + "hidden_norms": [ + 4729.70556640625, + 1458380.25, + 1572980.125, + 1615003.0, + 1642261.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014249716186895967, + 0.0007341640302911401, + 0.00073421117849648, + 0.0007345581543631852, + 0.0007344211917370558 + ], + "gamma_dfa": 0.03120402991771698, + "gamma_dfa_per_layer": [ + 0.2725849747657776, + -0.07284568250179291, + -0.05128118395805359, + -0.02364198863506317 + ], + "acc_eval": 0.17578125, + "loss_eval": 4871.27001953125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4886.33984375, + 1617197.25, + 1735577.625, + 1780813.375, + 1808887.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018187292153015733, + 0.0007682304712943733, + 0.0007675564847886562, + 0.0007677674293518066, + 0.0007678233087062836 + ], + "gamma_dfa": 0.017138252966105938, + "gamma_dfa_per_layer": [ + 0.2494080811738968, + -0.08018361777067184, + -0.027287419885396957, + -0.07338403165340424 + ], + "acc_eval": 0.193359375, + "loss_eval": 3960.6728515625, + "epoch": 30 + }, + { + "hidden_norms": [ + 5119.7841796875, + 1765219.5, + 1886735.375, + 1934213.125, + 1961976.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022127064876258373, + 0.000754481996409595, + 0.0007539362413808703, + 0.0007542265811935067, + 0.0007539446814917028 + ], + "gamma_dfa": 0.0332237659022212, + "gamma_dfa_per_layer": [ + 0.30639636516571045, + -0.08304375410079956, + -0.06092921271920204, + -0.029528334736824036 + ], + "acc_eval": 0.193359375, + "loss_eval": 4306.7734375, + "epoch": 31 + }, + { + "hidden_norms": [ + 5354.88720703125, + 1941186.125, + 2066860.125, + 2117348.25, + 2144884.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013304626336321235, + 0.0007719467394053936, + 0.0007719435379840434, + 0.0007721700239926577, + 0.0007720825960859656 + ], + "gamma_dfa": 0.01764332875609398, + "gamma_dfa_per_layer": [ + 0.2670303285121918, + -0.07338991016149521, + -0.05201137810945511, + -0.07105572521686554 + ], + "acc_eval": 0.1845703125, + "loss_eval": 4018.3662109375, + "epoch": 32 + }, + { + "hidden_norms": [ + 5519.78759765625, + 2116056.25, + 2246081.5, + 2300078.25, + 2327378.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016995095647871494, + 0.0007534062024205923, + 0.0007532716845162213, + 0.0007533822790719569, + 0.0007532139425165951 + ], + "gamma_dfa": 0.021287068724632263, + "gamma_dfa_per_layer": [ + 0.2717400789260864, + -0.08038187026977539, + -0.05876553803682327, + -0.04744439572095871 + ], + "acc_eval": 0.216796875, + "loss_eval": 6509.134765625, + "epoch": 33 + }, + { + "hidden_norms": [ + 5700.9130859375, + 2317603.75, + 2452612.5, + 2509779.5, + 2537064.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001880816649645567, + 0.0007947525009512901, + 0.0007945421966724098, + 0.0007944482495076954, + 0.0007949797436594963 + ], + "gamma_dfa": 0.02851281687617302, + "gamma_dfa_per_layer": [ + 0.2822743058204651, + -0.08248982578516006, + -0.05187612026929855, + -0.03385709226131439 + ], + "acc_eval": 0.1337890625, + "loss_eval": 8231.9248046875, + "epoch": 34 + }, + { + "hidden_norms": [ + 5855.8310546875, + 2515524.75, + 2653569.0, + 2713748.5, + 2740903.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018560283351689577, + 0.0007757823332212865, + 0.0007757038110867143, + 0.0007756180129945278, + 0.0007759004947729409 + ], + "gamma_dfa": 0.018099953944329172, + "gamma_dfa_per_layer": [ + 0.2729976773262024, + -0.08800812810659409, + -0.002550901612266898, + -0.11003883183002472 + ], + "acc_eval": 0.150390625, + "loss_eval": 7247.7216796875, + "epoch": 35 + }, + { + "hidden_norms": [ + 6036.9033203125, + 2711563.0, + 2854179.0, + 2918077.75, + 2945814.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001862754113972187, + 0.0007525583496317267, + 0.0007525330875068903, + 0.0007526627741754055, + 0.0007525623659603298 + ], + "gamma_dfa": 0.02487885858863592, + "gamma_dfa_per_layer": [ + 0.29685819149017334, + -0.08635345101356506, + -0.056181322783231735, + -0.054807983338832855 + ], + "acc_eval": 0.1435546875, + "loss_eval": 7513.36376953125, + "epoch": 36 + }, + { + "hidden_norms": [ + 6188.01611328125, + 2906995.5, + 3054202.25, + 3121279.0, + 3149996.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013340733712539077, + 0.0007529910071752965, + 0.0007524905377067626, + 0.0007527912384830415, + 0.0007525555556640029 + ], + "gamma_dfa": 0.027058321982622147, + "gamma_dfa_per_layer": [ + 0.25763267278671265, + -0.06575162708759308, + -0.04412994533777237, + -0.03951781243085861 + ], + "acc_eval": 0.2431640625, + "loss_eval": 12329.697265625, + "epoch": 37 + }, + { + "hidden_norms": [ + 6390.7060546875, + 3133419.5, + 3288636.0, + 3360502.75, + 3390539.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014776778407394886, + 0.0007607035804539919, + 0.0007607110310345888, + 0.0007606975850649178, + 0.000760715629439801 + ], + "gamma_dfa": 0.022189474664628506, + "gamma_dfa_per_layer": [ + 0.2616554796695709, + -0.07128072530031204, + -0.06259018927812576, + -0.039026666432619095 + ], + "acc_eval": 0.173828125, + "loss_eval": 6832.28955078125, + "epoch": 38 + }, + { + "hidden_norms": [ + 6548.68115234375, + 3356773.75, + 3517968.25, + 3593598.5, + 3624375.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002129003871232271, + 0.0007741872104816139, + 0.000774160900618881, + 0.0007743749301880598, + 0.0007743173046037555 + ], + "gamma_dfa": 0.034090133383870125, + "gamma_dfa_per_layer": [ + 0.3182219862937927, + -0.08398662507534027, + -0.06546281278133392, + -0.03241201490163803 + ], + "acc_eval": 0.1904296875, + "loss_eval": 5371.0859375, + "epoch": 39 + }, + { + "hidden_norms": [ + 6723.9697265625, + 3592963.25, + 3757696.25, + 3837777.75, + 3868088.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018772021867334843, + 0.0007547365385107696, + 0.0007547002169303596, + 0.0007546909037046134, + 0.000754650856833905 + ], + "gamma_dfa": 0.003609549254179001, + "gamma_dfa_per_layer": [ + 0.282962441444397, + -0.10840916633605957, + -0.10053665935993195, + -0.05957841873168945 + ], + "acc_eval": 0.1376953125, + "loss_eval": 8650.76953125, + "epoch": 40 + }, + { + "hidden_norms": [ + 6887.81005859375, + 3829273.5, + 3999416.75, + 4084005.5, + 4113581.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020062020048499107, + 0.0007521071238443255, + 0.0007519447826780379, + 0.0007520412327721715, + 0.0007518909987993538 + ], + "gamma_dfa": 0.01951257325708866, + "gamma_dfa_per_layer": [ + 0.2743881344795227, + -0.08543786406517029, + -0.05402272939682007, + -0.056877247989177704 + ], + "acc_eval": 0.1796875, + "loss_eval": 15509.98828125, + "epoch": 41 + }, + { + "hidden_norms": [ + 7027.42626953125, + 4050130.5, + 4223340.0, + 4310667.5, + 4340882.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016777552664279938, + 0.0007508718408644199, + 0.0007508369744755328, + 0.0007509454735554755, + 0.0007508718408644199 + ], + "gamma_dfa": 0.02786387037485838, + "gamma_dfa_per_layer": [ + 0.2803051769733429, + -0.07360324263572693, + -0.04823639243841171, + -0.04701006039977074 + ], + "acc_eval": 0.2275390625, + "loss_eval": 7618.71533203125, + "epoch": 42 + }, + { + "hidden_norms": [ + 7157.845703125, + 4292685.0, + 4471049.5, + 4562175.0, + 4591811.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016224944265559316, + 0.0007538175559602678, + 0.0007538740755990148, + 0.0007538648205809295, + 0.0007538393838331103 + ], + "gamma_dfa": 0.0053657907992601395, + "gamma_dfa_per_layer": [ + 0.26428842544555664, + -0.10051027685403824, + -0.08806045353412628, + -0.05425453186035156 + ], + "acc_eval": 0.166015625, + "loss_eval": 7869.64111328125, + "epoch": 43 + }, + { + "hidden_norms": [ + 7275.4365234375, + 4532040.5, + 4714971.5, + 4809776.0, + 4839258.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002823092043399811, + 0.0007887987303547561, + 0.0007888769032433629, + 0.0007889135158620775, + 0.0007889300468377769 + ], + "gamma_dfa": 0.008974121417850256, + "gamma_dfa_per_layer": [ + 0.25932246446609497, + -0.10199789702892303, + 0.012336602434515953, + -0.13376468420028687 + ], + "acc_eval": 0.091796875, + "loss_eval": 19789.41796875, + "epoch": 44 + }, + { + "hidden_norms": [ + 7393.93212890625, + 4772152.5, + 4958566.0, + 5058113.0, + 5086560.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019131727749481797, + 0.0007677456014789641, + 0.0007676532259210944, + 0.000767527730204165, + 0.0007678664987906814 + ], + "gamma_dfa": 0.014807725325226784, + "gamma_dfa_per_layer": [ + 0.23344306647777557, + -0.08349616825580597, + -0.0560825914144516, + -0.03463340550661087 + ], + "acc_eval": 0.224609375, + "loss_eval": 12636.65625, + "epoch": 45 + }, + { + "hidden_norms": [ + 7527.99462890625, + 5048336.0, + 5239027.5, + 5342244.0, + 5370085.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018555351998656988, + 0.000769329781178385, + 0.0007686647586524487, + 0.0007689501508139074, + 0.0007690390921197832 + ], + "gamma_dfa": 0.004876136779785156, + "gamma_dfa_per_layer": [ + 0.21739649772644043, + -0.08506827056407928, + -0.03674054145812988, + -0.07608313858509064 + ], + "acc_eval": 0.232421875, + "loss_eval": 12248.12109375, + "epoch": 46 + }, + { + "hidden_norms": [ + 7638.85693359375, + 5287113.0, + 5479795.0, + 5586404.5, + 5613225.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0025236238725483418, + 0.0007688805344514549, + 0.000768228666856885, + 0.0007684807060286403, + 0.0007685597520321608 + ], + "gamma_dfa": -0.006854387931525707, + "gamma_dfa_per_layer": [ + 0.17993390560150146, + -0.08751687407493591, + -0.030272338539361954, + -0.08956224471330643 + ], + "acc_eval": 0.1796875, + "loss_eval": 18537.177734375, + "epoch": 47 + }, + { + "hidden_norms": [ + 7754.390625, + 5527426.0, + 5724221.0, + 5833576.5, + 5860100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020714402198791504, + 0.0007631001644767821, + 0.0007630567415617406, + 0.0007630541222169995, + 0.0007631017942912877 + ], + "gamma_dfa": 0.02875693328678608, + "gamma_dfa_per_layer": [ + 0.29564130306243896, + -0.08437579870223999, + -0.050235565751791, + -0.04600220546126366 + ], + "acc_eval": 0.208984375, + "loss_eval": 10527.2578125, + "epoch": 48 + }, + { + "hidden_norms": [ + 7888.46923828125, + 5787159.5, + 5987915.0, + 6101035.0, + 6127097.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0026283818297088146, + 0.0007835617288947105, + 0.0007836156873963773, + 0.000783648225478828, + 0.0007836673175916076 + ], + "gamma_dfa": 0.011204172391444445, + "gamma_dfa_per_layer": [ + 0.26796066761016846, + -0.10181419551372528, + 0.010023357346653938, + -0.13135313987731934 + ], + "acc_eval": 0.0966796875, + "loss_eval": 15481.84375, + "epoch": 49 + }, + { + "hidden_norms": [ + 7975.13671875, + 6029198.0, + 6234359.5, + 6352162.0, + 6377873.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001740386476740241, + 0.0007632866618223488, + 0.0007632256019860506, + 0.0007631148328073323, + 0.0007634586072526872 + ], + "gamma_dfa": -0.000985240563750267, + "gamma_dfa_per_layer": [ + 0.20569762587547302, + -0.0866088718175888, + -0.04746733605861664, + -0.07556238025426865 + ], + "acc_eval": 0.2001953125, + "loss_eval": 12020.572265625, + "epoch": 50 + }, + { + "hidden_norms": [ + 8109.23095703125, + 6280213.0, + 6488845.5, + 6610432.5, + 6636101.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018630403792485595, + 0.0007671525236219168, + 0.000766951881814748, + 0.0007671291241422296, + 0.0007672281353734434 + ], + "gamma_dfa": -0.0027379142120480537, + "gamma_dfa_per_layer": [ + 0.22697225213050842, + -0.10085368156433105, + -0.059774767607450485, + -0.0772954598069191 + ], + "acc_eval": 0.13671875, + "loss_eval": 12490.904296875, + "epoch": 51 + }, + { + "hidden_norms": [ + 8223.3388671875, + 6520398.5, + 6731145.5, + 6855487.0, + 6880542.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020134998485445976, + 0.0007573508773930371, + 0.0007573754992336035, + 0.0007574421470053494, + 0.0007576147909276187 + ], + "gamma_dfa": 0.00887075625360012, + "gamma_dfa_per_layer": [ + 0.260132372379303, + -0.08125708997249603, + -0.07711100578308105, + -0.06628125160932541 + ], + "acc_eval": 0.12890625, + "loss_eval": 13286.50390625, + "epoch": 52 + }, + { + "hidden_norms": [ + 8317.2099609375, + 6773551.0, + 6990263.5, + 7117609.5, + 7143509.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016349060460925102, + 0.000744542689062655, + 0.0007445236551575363, + 0.000744638848118484, + 0.0007445821538567543 + ], + "gamma_dfa": 0.036132486537098885, + "gamma_dfa_per_layer": [ + 0.35822737216949463, + -0.09246134012937546, + -0.05995674431324005, + -0.06127934157848358 + ], + "acc_eval": 0.1318359375, + "loss_eval": 12961.923828125, + "epoch": 53 + }, + { + "hidden_norms": [ + 8396.16015625, + 7036334.0, + 7256480.5, + 7388541.0, + 7414023.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016424244968220592, + 0.0007655483204871416, + 0.0007653584470972419, + 0.0007655261433683336, + 0.0007656112429685891 + ], + "gamma_dfa": 0.00855250470340252, + "gamma_dfa_per_layer": [ + 0.31318342685699463, + -0.11486171185970306, + -0.07210143655538559, + -0.0920102596282959 + ], + "acc_eval": 0.0986328125, + "loss_eval": 14289.1396484375, + "epoch": 54 + }, + { + "hidden_norms": [ + 8425.91796875, + 7268265.0, + 7491250.5, + 7626377.5, + 7651502.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014321975177153945, + 0.0007547372952103615, + 0.0007547161658294499, + 0.0007547704153694212, + 0.000754979089833796 + ], + "gamma_dfa": 0.019777772948145866, + "gamma_dfa_per_layer": [ + 0.3146383762359619, + -0.0827077254652977, + -0.0876566469669342, + -0.06516291201114655 + ], + "acc_eval": 0.0908203125, + "loss_eval": 12761.185546875, + "epoch": 55 + }, + { + "hidden_norms": [ + 8519.505859375, + 7514964.5, + 7741589.0, + 7880037.0, + 7905207.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017787133110687137, + 0.0007505406392738223, + 0.0007507357513532043, + 0.0007507326663471758, + 0.0007507237605750561 + ], + "gamma_dfa": -0.012186199426651001, + "gamma_dfa_per_layer": [ + 0.2306034117937088, + -0.11392365396022797, + -0.1025918573141098, + -0.06283269822597504 + ], + "acc_eval": 0.1455078125, + "loss_eval": 8573.3310546875, + "epoch": 56 + }, + { + "hidden_norms": [ + 8575.814453125, + 7701015.5, + 7930432.0, + 8070523.0, + 8095346.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013273135991767049, + 0.0007214294746518135, + 0.0007213159115053713, + 0.0007215962978079915, + 0.0007215975201688707 + ], + "gamma_dfa": 0.02046024613082409, + "gamma_dfa_per_layer": [ + 0.2830252945423126, + -0.09345690906047821, + -0.06962529569864273, + -0.038102105259895325 + ], + "acc_eval": 0.1923828125, + "loss_eval": 6201.162109375, + "epoch": 57 + }, + { + "hidden_norms": [ + 8635.1220703125, + 7939687.0, + 8172801.5, + 8315327.5, + 8340462.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002125338651239872, + 0.0007551790331490338, + 0.0007551065064035356, + 0.0007549694273620844, + 0.000755314074922353 + ], + "gamma_dfa": 0.019076894968748093, + "gamma_dfa_per_layer": [ + 0.25508445501327515, + -0.07673472911119461, + -0.04303552210330963, + -0.059006623923778534 + ], + "acc_eval": 0.1865234375, + "loss_eval": 12055.595703125, + "epoch": 58 + }, + { + "hidden_norms": [ + 8706.6689453125, + 8158003.0, + 8394169.0, + 8539798.0, + 8565165.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001350156613625586, + 0.0007560249068774283, + 0.0007559725781902671, + 0.0007558663492091, + 0.0007561935926787555 + ], + "gamma_dfa": 0.028152598068118095, + "gamma_dfa_per_layer": [ + 0.28580546379089355, + -0.08475945889949799, + -0.05238167941570282, + -0.03605393320322037 + ], + "acc_eval": 0.220703125, + "loss_eval": 12085.9541015625, + "epoch": 59 + }, + { + "hidden_norms": [ + 8758.453125, + 8374766.0, + 8613513.0, + 8761622.0, + 8786363.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002377285622060299, + 0.0007197813247330487, + 0.0007195555372163653, + 0.0007198317907750607, + 0.000719684932846576 + ], + "gamma_dfa": 0.025455349124968052, + "gamma_dfa_per_layer": [ + 0.27419814467430115, + -0.08699844777584076, + -0.04594934359192848, + -0.0394289568066597 + ], + "acc_eval": 0.1669921875, + "loss_eval": 13302.744140625, + "epoch": 60 + }, + { + "hidden_norms": [ + 8795.5654296875, + 8572136.0, + 8812910.0, + 8963599.0, + 8987706.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015984047204256058, + 0.0007187420851550996, + 0.0007185072172433138, + 0.000718816474545747, + 0.000718718278221786 + ], + "gamma_dfa": 0.020128127187490463, + "gamma_dfa_per_layer": [ + 0.3066103458404541, + -0.1022094339132309, + -0.07834567129611969, + -0.04554273188114166 + ], + "acc_eval": 0.1181640625, + "loss_eval": 6553.7236328125, + "epoch": 61 + }, + { + "hidden_norms": [ + 8811.46875, + 8766653.0, + 9009529.0, + 9162389.0, + 9185680.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019123096717521548, + 0.0007724921451881528, + 0.0007725215400569141, + 0.0007725482573732734, + 0.0007725649629719555 + ], + "gamma_dfa": 0.03271363768726587, + "gamma_dfa_per_layer": [ + 0.2947639226913452, + -0.08735189586877823, + -0.04557036980986595, + -0.030987106263637543 + ], + "acc_eval": 0.18359375, + "loss_eval": 11607.7158203125, + "epoch": 62 + }, + { + "hidden_norms": [ + 8860.6220703125, + 8977001.0, + 9224122.0, + 9379773.0, + 9402851.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013403806369751692, + 0.0007685344316996634, + 0.0007685531745664775, + 0.0007685986929573119, + 0.0007685821619816124 + ], + "gamma_dfa": 0.020242065889760852, + "gamma_dfa_per_layer": [ + 0.30239802598953247, + -0.09480112791061401, + -0.014634584076702595, + -0.11199405044317245 + ], + "acc_eval": 0.1337890625, + "loss_eval": 9788.81640625, + "epoch": 63 + }, + { + "hidden_norms": [ + 8904.9482421875, + 9185937.0, + 9436793.0, + 9595000.0, + 9618183.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012845145538449287, + 0.0007421535556204617, + 0.0007421503541991115, + 0.0007421293412335217, + 0.0007421668851748109 + ], + "gamma_dfa": 0.02229973580688238, + "gamma_dfa_per_layer": [ + 0.2927352786064148, + -0.08628389239311218, + -0.060364432632923126, + -0.05688801035284996 + ], + "acc_eval": 0.1728515625, + "loss_eval": 8114.20458984375, + "epoch": 64 + }, + { + "hidden_norms": [ + 8892.296875, + 9356716.0, + 9611136.0, + 9771064.0, + 9794530.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001351315644569695, + 0.0007599962409585714, + 0.0007597811054438353, + 0.0007599799428135157, + 0.0007600505487062037 + ], + "gamma_dfa": 0.019069598987698555, + "gamma_dfa_per_layer": [ + 0.29072487354278564, + -0.0944916158914566, + -0.05359811335802078, + -0.06635674834251404 + ], + "acc_eval": 0.169921875, + "loss_eval": 8773.3408203125, + "epoch": 65 + }, + { + "hidden_norms": [ + 8905.83984375, + 9511506.0, + 9766884.0, + 9928659.0, + 9951002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017338081961497664, + 0.0007696599350310862, + 0.0007696837419643998, + 0.0007697126129642129, + 0.0007697291439399123 + ], + "gamma_dfa": 0.028427925892174244, + "gamma_dfa_per_layer": [ + 0.3319295644760132, + -0.09938425570726395, + 0.004324089735746384, + -0.12315769493579865 + ], + "acc_eval": 0.1142578125, + "loss_eval": 12823.435546875, + "epoch": 66 + }, + { + "hidden_norms": [ + 8944.53125, + 9692436.0, + 9950194.0, + 10113948.0, + 10136307.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017030658200383186, + 0.000714489258825779, + 0.0007141575333662331, + 0.0007145405979827046, + 0.0007144163828343153 + ], + "gamma_dfa": 0.055724941194057465, + "gamma_dfa_per_layer": [ + 0.3514706492424011, + -0.07685236632823944, + -0.031716104596853256, + -0.020002413541078568 + ], + "acc_eval": 0.18359375, + "loss_eval": 10412.890625, + "epoch": 67 + }, + { + "hidden_norms": [ + 8926.98828125, + 9838798.0, + 10099141.0, + 10264565.0, + 10286604.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015448650810867548, + 0.0007684402517043054, + 0.0007684584707021713, + 0.0007684882148168981, + 0.0007685049204155803 + ], + "gamma_dfa": 0.032529132440686226, + "gamma_dfa_per_layer": [ + 0.3082513213157654, + -0.0888272076845169, + -0.032446227967739105, + -0.056861355900764465 + ], + "acc_eval": 0.19921875, + "loss_eval": 8345.18359375, + "epoch": 68 + }, + { + "hidden_norms": [ + 8903.689453125, + 10005445.0, + 10266980.0, + 10434005.0, + 10454617.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017746278317645192, + 0.0007130402373149991, + 0.0007127230055630207, + 0.0007131076999939978, + 0.0007130174781195819 + ], + "gamma_dfa": 0.05443635303527117, + "gamma_dfa_per_layer": [ + 0.35508570075035095, + -0.08241431415081024, + -0.03841204196214676, + -0.01651393249630928 + ], + "acc_eval": 0.140625, + "loss_eval": 7877.36181640625, + "epoch": 69 + }, + { + "hidden_norms": [ + 8910.42578125, + 10173785.0, + 10439506.0, + 10609011.0, + 10630571.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011222161119803786, + 0.0007312637171708047, + 0.0007313191890716553, + 0.0007313672685995698, + 0.0007313768728636205 + ], + "gamma_dfa": 0.023520448245108128, + "gamma_dfa_per_layer": [ + 0.29335978627204895, + -0.08935706317424774, + -0.06947942078113556, + -0.04044150933623314 + ], + "acc_eval": 0.2421875, + "loss_eval": 5653.23388671875, + "epoch": 70 + }, + { + "hidden_norms": [ + 8876.2041015625, + 10317365.0, + 10586095.0, + 10757344.0, + 10779691.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011208312353119254, + 0.0007571111200377345, + 0.0007568965083919466, + 0.0007570943562313914, + 0.0007571595488116145 + ], + "gamma_dfa": 0.025294490158557892, + "gamma_dfa_per_layer": [ + 0.331506609916687, + -0.09467847645282745, + -0.06287634372711182, + -0.07277382910251617 + ], + "acc_eval": 0.1884765625, + "loss_eval": 3869.094970703125, + "epoch": 71 + }, + { + "hidden_norms": [ + 8852.7001953125, + 10449657.0, + 10719980.0, + 10891483.0, + 10913594.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001109768869355321, + 0.0007331773522309959, + 0.0007331601809710264, + 0.0007332302629947662, + 0.0007332285749725997 + ], + "gamma_dfa": 0.03539558406919241, + "gamma_dfa_per_layer": [ + 0.3268349766731262, + -0.08062416315078735, + -0.055393531918525696, + -0.04923494532704353 + ], + "acc_eval": 0.2353515625, + "loss_eval": 7111.935546875, + "epoch": 72 + }, + { + "hidden_norms": [ + 8827.3955078125, + 10582167.0, + 10855077.0, + 11028114.0, + 11050690.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001240618177689612, + 0.0007623998681083322, + 0.0007624404970556498, + 0.0007624777499586344, + 0.0007624629070051014 + ], + "gamma_dfa": 0.03839550958946347, + "gamma_dfa_per_layer": [ + 0.36802345514297485, + -0.09764832258224487, + -0.0042990874499082565, + -0.11249400675296783 + ], + "acc_eval": 0.1357421875, + "loss_eval": 6752.0322265625, + "epoch": 73 + }, + { + "hidden_norms": [ + 8814.1962890625, + 10696667.0, + 10971925.0, + 11146316.0, + 11168931.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001309843035414815, + 0.0007403214112855494, + 0.0007405314245261252, + 0.0007405264186672866, + 0.0007405087817460299 + ], + "gamma_dfa": 0.038134077563881874, + "gamma_dfa_per_layer": [ + 0.3364037275314331, + -0.08192241191864014, + -0.03633008152246475, + -0.06561492383480072 + ], + "acc_eval": 0.212890625, + "loss_eval": 6998.021484375, + "epoch": 74 + }, + { + "hidden_norms": [ + 8779.0400390625, + 10798076.0, + 11075004.0, + 11250115.0, + 11272600.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011087025050073862, + 0.0007316112169064581, + 0.0007316232076846063, + 0.0007316932315006852, + 0.00073169672396034 + ], + "gamma_dfa": 0.04451032355427742, + "gamma_dfa_per_layer": [ + 0.34500744938850403, + -0.07661331444978714, + -0.04388073831796646, + -0.04647210240364075 + ], + "acc_eval": 0.2490234375, + "loss_eval": 3624.614013671875, + "epoch": 75 + }, + { + "hidden_norms": [ + 8751.8486328125, + 10906611.0, + 11185716.0, + 11362176.0, + 11384611.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001067605335265398, + 0.0007393756532110274, + 0.0007396025466732681, + 0.000739598530344665, + 0.000739583745598793 + ], + "gamma_dfa": 0.03648093156516552, + "gamma_dfa_per_layer": [ + 0.31906285881996155, + -0.07843812555074692, + -0.051880721002817154, + -0.0428202860057354 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2816.3427734375, + "epoch": 76 + }, + { + "hidden_norms": [ + 8743.0078125, + 10999747.0, + 11279813.0, + 11457343.0, + 11479737.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010900371707975864, + 0.0007332717068493366, + 0.0007332694949582219, + 0.0007332508685067296, + 0.0007332859677262604 + ], + "gamma_dfa": 0.03520212788134813, + "gamma_dfa_per_layer": [ + 0.3010096549987793, + -0.07223288714885712, + -0.05185239389538765, + -0.036115862429142 + ], + "acc_eval": 0.2451171875, + "loss_eval": 3747.66748046875, + "epoch": 77 + }, + { + "hidden_norms": [ + 8693.3349609375, + 11081850.0, + 11362476.0, + 11540274.0, + 11562006.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010161141399294138, + 0.0007433417486026883, + 0.0007432828424498439, + 0.000743163691367954, + 0.0007434578728862107 + ], + "gamma_dfa": 0.04203554056584835, + "gamma_dfa_per_layer": [ + 0.3622134029865265, + -0.08443501591682434, + -0.020812533795833588, + -0.08882369101047516 + ], + "acc_eval": 0.1953125, + "loss_eval": 3283.453125, + "epoch": 78 + }, + { + "hidden_norms": [ + 8679.0673828125, + 11176062.0, + 11458995.0, + 11637744.0, + 11660108.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010180213721469045, + 0.0007298000273294747, + 0.000729813240468502, + 0.0007298758719116449, + 0.0007298807031475008 + ], + "gamma_dfa": 0.03867925424128771, + "gamma_dfa_per_layer": [ + 0.3430703282356262, + -0.08001460134983063, + -0.05243712291121483, + -0.05590158700942993 + ], + "acc_eval": 0.22265625, + "loss_eval": 3249.233154296875, + "epoch": 79 + }, + { + "hidden_norms": [ + 8630.8896484375, + 11249126.0, + 11532709.0, + 11711592.0, + 11733760.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001043561496771872, + 0.0007425911608152092, + 0.0007425197982229292, + 0.0007423801580443978, + 0.000742721778806299 + ], + "gamma_dfa": 0.028339628130197525, + "gamma_dfa_per_layer": [ + 0.32279035449028015, + -0.09357395768165588, + -0.06377816200256348, + -0.05207972228527069 + ], + "acc_eval": 0.1904296875, + "loss_eval": 3085.4638671875, + "epoch": 80 + }, + { + "hidden_norms": [ + 8578.060546875, + 11304050.0, + 11589802.0, + 11769234.0, + 11792299.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000967628788203001, + 0.0007289479253813624, + 0.0007289598579518497, + 0.0007290169014595449, + 0.0007290222565643489 + ], + "gamma_dfa": 0.02121756039559841, + "gamma_dfa_per_layer": [ + 0.31049084663391113, + -0.09504136443138123, + -0.07916043698787689, + -0.05141880363225937 + ], + "acc_eval": 0.236328125, + "loss_eval": 1885.889404296875, + "epoch": 81 + }, + { + "hidden_norms": [ + 8522.4794921875, + 11393685.0, + 11680880.0, + 11860855.0, + 11883774.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010794082190841436, + 0.0007521919906139374, + 0.0007519960636273026, + 0.0007521732477471232, + 0.0007522284286096692 + ], + "gamma_dfa": 0.026587368920445442, + "gamma_dfa_per_layer": [ + 0.37745779752731323, + -0.11168865859508514, + -0.0728297159075737, + -0.08658994734287262 + ], + "acc_eval": 0.1220703125, + "loss_eval": 2588.15478515625, + "epoch": 82 + }, + { + "hidden_norms": [ + 8482.1484375, + 11447732.0, + 11736021.0, + 11916302.0, + 11939110.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009376976522617042, + 0.0007250583730638027, + 0.000724694284144789, + 0.0007250410853885114, + 0.0007250093622133136 + ], + "gamma_dfa": 0.0355191919952631, + "gamma_dfa_per_layer": [ + 0.31943440437316895, + -0.07911509275436401, + -0.0536213181912899, + -0.04462122544646263 + ], + "acc_eval": 0.2783203125, + "loss_eval": 1507.2919921875, + "epoch": 83 + }, + { + "hidden_norms": [ + 8430.1455078125, + 11492522.0, + 11781554.0, + 11962317.0, + 11985175.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009387033060193062, + 0.0007079826318658888, + 0.0007078545750118792, + 0.0007080811192281544, + 0.0007080849609337747 + ], + "gamma_dfa": 0.036465028300881386, + "gamma_dfa_per_layer": [ + 0.3066443204879761, + -0.07488954067230225, + -0.03129498288035393, + -0.05459968373179436 + ], + "acc_eval": 0.275390625, + "loss_eval": 1614.5029296875, + "epoch": 84 + }, + { + "hidden_norms": [ + 8369.6298828125, + 11532036.0, + 11821641.0, + 12002443.0, + 12025323.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009389162878505886, + 0.0007232772768475115, + 0.0007233347278088331, + 0.0007233632495626807, + 0.000723376520909369 + ], + "gamma_dfa": 0.040183850564062595, + "gamma_dfa_per_layer": [ + 0.34539365768432617, + -0.08373545110225677, + -0.05380668863654137, + -0.04711611568927765 + ], + "acc_eval": 0.25, + "loss_eval": 1501.9444580078125, + "epoch": 85 + }, + { + "hidden_norms": [ + 8319.4169921875, + 11569238.0, + 11860199.0, + 12041371.0, + 12064573.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009176665917038918, + 0.0007041870849207044, + 0.0007039242191240191, + 0.0007042758516035974, + 0.0007042170618660748 + ], + "gamma_dfa": 0.035514961928129196, + "gamma_dfa_per_layer": [ + 0.2879785895347595, + -0.07180146872997284, + -0.037917762994766235, + -0.03619951009750366 + ], + "acc_eval": 0.30859375, + "loss_eval": 1078.8165283203125, + "epoch": 86 + }, + { + "hidden_norms": [ + 8282.478515625, + 11596869.0, + 11888039.0, + 12069453.0, + 12092582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00098571612033993, + 0.000731602602172643, + 0.0007312855450436473, + 0.0007312477100640535, + 0.0007316134287975729 + ], + "gamma_dfa": 0.04066215269267559, + "gamma_dfa_per_layer": [ + 0.33381348848342896, + -0.08063024282455444, + -0.055662885308265686, + -0.034871749579906464 + ], + "acc_eval": 0.234375, + "loss_eval": 1841.648193359375, + "epoch": 87 + }, + { + "hidden_norms": [ + 8242.1005859375, + 11624052.0, + 11916218.0, + 12098548.0, + 12121911.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009184937225654721, + 0.0007233315263874829, + 0.000723001197911799, + 0.0007232833886519074, + 0.0007232468342408538 + ], + "gamma_dfa": 0.03233872726559639, + "gamma_dfa_per_layer": [ + 0.2990570068359375, + -0.07802218198776245, + -0.04814079403877258, + -0.04353912174701691 + ], + "acc_eval": 0.2890625, + "loss_eval": 980.395751953125, + "epoch": 88 + }, + { + "hidden_norms": [ + 8216.91796875, + 11647355.0, + 11939175.0, + 12121172.0, + 12144056.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008776114555075765, + 0.0007067625410854816, + 0.0007066249381750822, + 0.0007068619015626609, + 0.0007068667327985168 + ], + "gamma_dfa": 0.027417242527008057, + "gamma_dfa_per_layer": [ + 0.28433892130851746, + -0.07622525095939636, + -0.050822652876377106, + -0.04762204736471176 + ], + "acc_eval": 0.326171875, + "loss_eval": 776.0946044921875, + "epoch": 89 + }, + { + "hidden_norms": [ + 8169.76513671875, + 11658648.0, + 11950474.0, + 12132456.0, + 12155182.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008986471802927554, + 0.0007065801764838398, + 0.0007064181263558567, + 0.000706693041138351, + 0.0007066999096423388 + ], + "gamma_dfa": 0.03352018166333437, + "gamma_dfa_per_layer": [ + 0.296892374753952, + -0.07546264678239822, + -0.04814247041940689, + -0.03920653089880943 + ], + "acc_eval": 0.3095703125, + "loss_eval": 893.558349609375, + "epoch": 90 + }, + { + "hidden_norms": [ + 8142.11669921875, + 11667783.0, + 11959690.0, + 12141714.0, + 12164439.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009172433638013899, + 0.0007064292440190911, + 0.0007062776712700725, + 0.0007065359968692064, + 0.000706541701219976 + ], + "gamma_dfa": 0.03799809701740742, + "gamma_dfa_per_layer": [ + 0.31104975938796997, + -0.07753260433673859, + -0.04483959078788757, + -0.03668517619371414 + ], + "acc_eval": 0.2763671875, + "loss_eval": 918.902099609375, + "epoch": 91 + }, + { + "hidden_norms": [ + 8113.36474609375, + 11673688.0, + 11965558.0, + 12147558.0, + 12170198.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009179572225548327, + 0.0007257050601765513, + 0.0007257269462570548, + 0.0007257769466377795, + 0.0007257869001477957 + ], + "gamma_dfa": 0.03620104119181633, + "gamma_dfa_per_layer": [ + 0.3097808361053467, + -0.07722775638103485, + -0.0500766858458519, + -0.03767222911119461 + ], + "acc_eval": 0.2880859375, + "loss_eval": 1033.579833984375, + "epoch": 92 + }, + { + "hidden_norms": [ + 8085.35595703125, + 11678927.0, + 11970798.0, + 12152808.0, + 12175446.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008720594923943281, + 0.0007061808719299734, + 0.0007060291827656329, + 0.0007062855875119567, + 0.0007062909426167607 + ], + "gamma_dfa": 0.03221010882407427, + "gamma_dfa_per_layer": [ + 0.2895042598247528, + -0.07448285818099976, + -0.04004380851984024, + -0.04613715782761574 + ], + "acc_eval": 0.3046875, + "loss_eval": 827.44140625, + "epoch": 93 + }, + { + "hidden_norms": [ + 8072.322265625, + 11682684.0, + 11974490.0, + 12156499.0, + 12179080.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008837314089760184, + 0.0007061065407469869, + 0.0007059663184918463, + 0.00070620869519189, + 0.000706215447280556 + ], + "gamma_dfa": 0.026722624897956848, + "gamma_dfa_per_layer": [ + 0.28959959745407104, + -0.08210700005292892, + -0.05253326892852783, + -0.048068828880786896 + ], + "acc_eval": 0.291015625, + "loss_eval": 795.6766357421875, + "epoch": 94 + }, + { + "hidden_norms": [ + 8063.02001953125, + 11684947.0, + 11976758.0, + 12158785.0, + 12181362.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008943622815422714, + 0.0007086708792485297, + 0.0007086790283210576, + 0.0007087094127200544, + 0.0007087020785547793 + ], + "gamma_dfa": 0.02946585137397051, + "gamma_dfa_per_layer": [ + 0.29232603311538696, + -0.08056485652923584, + -0.05102770775556564, + -0.042870063334703445 + ], + "acc_eval": 0.2919921875, + "loss_eval": 839.8633422851562, + "epoch": 95 + }, + { + "hidden_norms": [ + 8055.40576171875, + 11685775.0, + 11977584.0, + 12159594.0, + 12182165.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008769903797656298, + 0.0007059753406792879, + 0.0007058423361741006, + 0.0007060715579427779, + 0.0007060769130475819 + ], + "gamma_dfa": 0.02765239030122757, + "gamma_dfa_per_layer": [ + 0.2855387032032013, + -0.07872132211923599, + -0.051525406539440155, + -0.04468241333961487 + ], + "acc_eval": 0.3115234375, + "loss_eval": 736.9282836914062, + "epoch": 96 + }, + { + "hidden_norms": [ + 8050.93310546875, + 11685670.0, + 11977453.0, + 12159452.0, + 12182004.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008705379441380501, + 0.0007085780380293727, + 0.0007085860124789178, + 0.0007086164550855756, + 0.0007086091791279614 + ], + "gamma_dfa": 0.026861276477575302, + "gamma_dfa_per_layer": [ + 0.2898082733154297, + -0.07899712026119232, + -0.046087510883808136, + -0.05727853626012802 + ], + "acc_eval": 0.302734375, + "loss_eval": 737.6731567382812, + "epoch": 97 + }, + { + "hidden_norms": [ + 8048.384765625, + 11685821.0, + 11977554.0, + 12159347.0, + 12182068.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008696588920429349, + 0.0007085675024427474, + 0.0007085754186846316, + 0.0007086056284606457, + 0.0007085986435413361 + ], + "gamma_dfa": 0.02852465771138668, + "gamma_dfa_per_layer": [ + 0.2933640480041504, + -0.07862062007188797, + -0.04777185618877411, + -0.05287294089794159 + ], + "acc_eval": 0.30859375, + "loss_eval": 716.3431396484375, + "epoch": 98 + }, + { + "hidden_norms": [ + 8047.294921875, + 11685550.0, + 11977281.0, + 12159072.0, + 12181796.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000868224713485688, + 0.0007059023482725024, + 0.0007057614857330918, + 0.0007060033385641873, + 0.0007060095085762441 + ], + "gamma_dfa": 0.026804575696587563, + "gamma_dfa_per_layer": [ + 0.2827316224575043, + -0.07767541706562042, + -0.051301658153533936, + -0.046536244451999664 + ], + "acc_eval": 0.32421875, + "loss_eval": 693.041259765625, + "epoch": 99 + }, + { + "hidden_norms": [ + 8047.01025390625, + 11685479.0, + 11977214.0, + 12159006.0, + 12181733.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008688519592396915, + 0.0007085604593157768, + 0.0007085682009346783, + 0.0007085984107106924, + 0.0007085916586220264 + ], + "gamma_dfa": 0.027284779585897923, + "gamma_dfa_per_layer": [ + 0.2883991003036499, + -0.07865853607654572, + -0.04951424151659012, + -0.05108720436692238 + ], + "acc_eval": 0.3134765625, + "loss_eval": 705.9644775390625, + "epoch": 100 + } + ] +}
\ No newline at end of file |
