From aa73718eb6427d7da3b9cb416275802d90c4b2ed Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Sun, 14 Jun 2026 04:06:32 -0500 Subject: Add new experiment scripts, figures, and paper assets; untrack pyc/build artifacts Co-Authored-By: Claude Opus 4.8 (1M context) --- .../alpha_sweep_scaffold/alpha_sweep_t5_s42.json | 6489 ++++++++++++++++++++ results/audit_d512_L2_4method.log | 16 + results/audit_d512_L2_6method.log | 35 + results/blend_dissection/dissection_t5_s42.json | 4311 +++++++++++++ .../ablation_a1.0_L4_s42.json | 90 + .../ablation_a1.0_L4_s123.json | 46 + .../ablation_a1.0_L4_s456.json | 46 + .../ablation_a1.0_L4_s42.json | 90 + .../ablation_a1.0_L4_s42.json | 90 + .../ablation_a1.0_L4_s42.json | 90 + results/bp_with_penalty_run.log | 18 + results/checkpointed_handoff/handoff_s42.json | 5828 ++++++++++++++++++ results/cifar100_protocol_validation.log | 371 ++ .../results_cifar100.json | 3467 +++++++++++ results/cifar100_scan.log | 179 +- results/cifar_deltaL/cb_deltaL_d512_L4_s42.json | 428 ++ results/cifar_depth_scan_multiseed.log | 81 + .../cifar_depth_scan_multiseed/d512_L4_s123.json | 838 +++ .../cifar_depth_scan_multiseed/d512_L4_s456.json | 838 +++ results/cifar_depth_scan_multiseed/summary.json | 78 + results/cifar_depth_scan_s42/d512_L12_s42.json | 1421 +++++ results/cifar_depth_scan_s42/d512_L2_s42.json | 1151 ++++ results/cifar_depth_scan_s42/d512_L4_s42.json | 1205 ++++ results/cifar_depth_scan_s42/d512_L6_s42.json | 1259 ++++ results/cifar_depth_scan_s42/d512_L8_s42.json | 1313 ++++ results/cifar_depth_scan_s42/summary.json | 186 + .../confirmatory/T1_cifar_full_metrics_gpu1.csv | 41 + results/confirmatory/T2_support_sparsity_FIXED.csv | 961 +++ results/confirmatory/T2_support_sparsity_gpu1.csv | 801 +++ results/confirmatory/T4_active_gamma_gpu1.csv | 101 + .../element_grad_concentration_gpu1.csv | 49 + results/deeper_L_multiseed_scan.log | 1090 ++++ results/dfa_canonical_freshB.log | 13 + .../freshB_null_canonical_s42.json | 56 + .../results_cifar10.json | 549 ++ .../results_cifar10.json | 549 ++ results/dfa_canonical_penalty_sweep.log | 77 + results/dfa_canonical_penalty_trajectory.json | 1700 +++++ results/dfa_canonical_penalty_trajectory.log | 47 + results/dfa_direction_quality_run.log | 3 + results/dfa_pen_short_lam1e-1.log | 15 + results/dfa_pen_short_lam1e-4.log | 15 + results/dfa_pen_short_lam1e-4_s123.log | 15 + results/dfa_pen_short_lam1e-4_s456.log | 15 + results/dfa_pen_short_run.log | 15 + results/dfa_pen_short_s123.log | 15 + results/dfa_pen_short_s456.log | 15 + .../dfa_residual_penalty/dfa_pen_lam0.001_s42.json | 85 + .../dfa_residual_penalty/dfa_pen_lam0.01_s123.json | 85 + .../dfa_residual_penalty/dfa_pen_lam0.01_s42.json | 85 + .../dfa_residual_penalty/dfa_pen_lam0.01_s456.json | 85 + results/dfa_residual_penalty/run_lam1e-1_s42.log | 7 + results/dfa_residual_penalty/run_lam1e-2_s123.log | 21 + results/dfa_residual_penalty/run_lam1e-2_s42.log | 21 + results/dfa_residual_penalty/run_lam1e-2_s456.log | 21 + results/dfa_residual_penalty/run_lam1e-3_s123.log | 7 + results/dfa_residual_penalty/run_lam1e-3_s42.log | 21 + results/dfa_residual_penalty/run_lam1e-3_s456.log | 7 + results/ep_baseline/ep_s2048.json | 23 + .../exploit_linesearch/linesearch_L4_d256_s42.json | 112 + .../linesearch_L4_d256_s42.json | 1850 ++++++ .../fa_canonical_lam1e-2_30ep/results_cifar10.json | 549 ++ .../fa_canonical_lam1e-4_30ep/results_cifar10.json | 549 ++ results/fa_canonical_penalty_sweep.log | 76 + results/figures/figure_snapshot_resmlp.pdf | Bin 0 -> 40868 bytes results/figures/figure_snapshot_vit.pdf | Bin 0 -> 28184 bytes .../freeze_with_decay_t5_s42.json | 5762 +++++++++++++++++ results/frozen_baselines_crossarch.json | 14 + results/frozen_baselines_crossarch.log | 120 + results/frozen_cifar/frozen_L4_d256_s42.json | 174 + results/frozen_cifar/frozen_L4_d512_s42.json | 174 + results/frozen_cifar/frozen_L6_d256_s42.json | 216 + .../frozen_cifar_vec/frozen_vec_L4_d256_s42.json | 188 + results/h2_no_residual_full_s123.log | 107 + .../snapshot_evolution_s123.json | 2749 +++++++++ results/h2_no_residual_full_s42.log | 210 + .../snapshot_evolution_s42.json | 5475 +++++++++++++++++ results/h2_no_residual_full_s456.log | 107 + .../snapshot_evolution_s456.json | 2749 +++++++++ results/h2_no_residual_s42.log | 16 + results/h2_smoke_w0.1/snapshot_evolution_s42.json | 237 + results/h2_smoke_w0.2/snapshot_evolution_s42.json | 237 + results/h2_smoke_w0.5/snapshot_evolution_s42.json | 237 + results/h2_smoketest/snapshot_evolution_s42.json | 129 + .../minimal_aux_compression_t5_s42.json | 5768 +++++++++++++++++ results/online_shallow/scan_s42.json | 422 ++ results/online_shallow_3seed/scan_s123.json | 62 + results/online_shallow_3seed/scan_s42.json | 62 + results/online_shallow_3seed/scan_s456.json | 62 + results/online_vec_pilot/pilot_s42.json | 177 + results/optionA_random_targets_s42.log | 107 + .../snapshot_evolution_s42.json | 2749 +++++++++ results/optionA_smoke/snapshot_evolution_s42.json | 130 + results/optionEP_random_targets_full.log | 7 + .../ep_random_s42.json | 23 + results/optionEP_smoke/ep_random_s42.json | 23 + results/optionSBCB_random_targets_s42.log | 36 + .../results_cifar10.json | 996 +++ results/optionSBCB_smoke/results_cifar10.json | 220 + results/periodic_refit/periodic_refit_s42.json | 414 ++ results/prefit_threshold/prefit_curve_t5_s42.json | 330 + results/resmlp_frozen_blocks_s123.log | 73 + results/resmlp_frozen_blocks_s42.log | 73 + results/resmlp_frozen_blocks_s456.log | 73 + results/resnet_baseline_s42.log | 6 + results/resnet_frozen_blocks_s42.log | 5 + results/resnet_protocol_validation.json | 2999 +++++++++ results/resnet_protocol_validation.log | 161 + results/round38_cb_penalty_30ep_s123.log | 15 + .../results_cifar10.json | 233 + results/round38_cb_penalty_30ep_s456.log | 15 + .../results_cifar10.json | 233 + results/round38_sb_penalty_30ep_s123.log | 14 + .../results_cifar10.json | 233 + results/round38_sb_penalty_30ep_s456.log | 14 + .../results_cifar10.json | 233 + results/round38_sbcb_baseline_30ep.log | 22 + .../results_cifar10.json | 437 ++ results/round38_sbcb_penalty_30ep.log | 22 + .../round38_sbcb_penalty_30ep/results_cifar10.json | 437 ++ .../round38_smoke_sbcb_pen/results_cifar10.json | 213 + results/round41_dfa_penalty_30ep.log | 14 + .../round41_dfa_penalty_30ep/results_cifar10.json | 201 + results/round41_dfa_penalty_30ep_s123.log | 14 + .../results_cifar10.json | 201 + results/round41_dfa_penalty_30ep_s456.log | 14 + .../results_cifar10.json | 201 + results/scaffold_replication/replication.json | 38 + results/schedule_timing/schedules_s42.json | 2018 ++++++ results/snapshot_evolution_v2/run_s123.log | 210 + results/snapshot_evolution_v2/run_s42.log | 210 + results/snapshot_evolution_v2/run_s456.log | 210 + .../snapshot_evolution_s123.json | 5473 +++++++++++++++++ .../snapshot_evolution_s42.json | 5473 +++++++++++++++++ .../snapshot_evolution_s456.json | 5473 +++++++++++++++++ .../snapshot_fa_canonical_s42.json | 2734 +++++++++ results/snapshot_evolution_v2/snapshot_fa_s42.json | 2734 +++++++++ results/snapshot_evolution_v3_fa.log | 1 + results/snapshot_exploit/snapshot_L4_d256_s42.json | 209 + results/snapshot_fa_canonical_all.log | 142 + results/snapshot_fa_canonical_noln.log | 13 + results/snapshot_fa_crossarch.log | 28 + results/snapshot_fa_evolution.log | 103 + results/snapshot_fa_studentnet_vit.log | 37 + results/snapshot_no_outln_v1/run_s123.log | 51 + results/snapshot_no_outln_v1/run_s42.log | 51 + results/snapshot_no_outln_v1/run_s456.log | 51 + .../snapshot_fa_canonical_noln_s42.json | 1824 ++++++ .../snapshot_no_outln_v1/snapshot_fa_noln_s42.json | 1824 ++++++ .../snapshot_no_outln_v1/snapshot_noLN_s123.json | 4766 ++++++++++++++ .../snapshot_no_outln_v1/snapshot_noLN_s42.json | 4766 ++++++++++++++ .../snapshot_no_outln_v1/snapshot_noLN_s456.json | 4766 ++++++++++++++ results/snapshot_synth_v1/run_a1.0_s42.log | 44 + .../snapshot_fa_canonical_s42.json | 2276 +++++++ .../snapshot_fa_synth_a1.0_L4_s42.json | 2276 +++++++ .../snapshot_synth_a1.0_L4_s42.json | 4960 +++++++++++++++ results/snapshot_time/time_sweep_L4_d256_s42.json | 128 + results/snapshot_vit_v1/run_s123.log | 36 + results/snapshot_vit_v1/run_s42.log | 36 + results/snapshot_vit_v1/run_s456.log | 36 + .../snapshot_vit_v1/snapshot_fa_canonical_s42.json | 1104 ++++ results/snapshot_vit_v1/snapshot_fa_vit_s42.json | 1104 ++++ results/snapshot_vit_v1/snapshot_vit_s123.json | 4594 ++++++++++++++ results/snapshot_vit_v1/snapshot_vit_s42.json | 4594 ++++++++++++++ results/snapshot_vit_v1/snapshot_vit_s456.json | 4594 ++++++++++++++ results/structured_aux/structured_aux_t5_s42.json | 6481 +++++++++++++++++++ results/synth_ladder_smoke/config.json | 30 + results/synth_ladder_smoke/summary.json | 782 +++ results/synth_ladder_smoke/synth_a0.0_L2_s42.json | 1172 ++++ results/synth_ladder_smoke/synth_a0.0_L8_s42.json | 1298 ++++ results/synth_ladder_smoke/synth_a0.5_L2_s42.json | 1172 ++++ results/synth_ladder_smoke/synth_a0.5_L8_s42.json | 1298 ++++ results/synth_ladder_smoke/synth_a1.0_L2_s42.json | 1172 ++++ results/synth_ladder_smoke/synth_a1.0_L8_s42.json | 1298 ++++ results/synth_ladder_v2_hi/config.json | 33 + results/synth_ladder_v2_hi/summary.json | 3590 +++++++++++ .../synth_ladder_v2_hi/synth_a0.5_L12_s123.json | 1722 ++++++ results/synth_ladder_v2_hi/synth_a0.5_L12_s42.json | 1722 ++++++ .../synth_ladder_v2_hi/synth_a0.5_L12_s456.json | 1722 ++++++ results/synth_ladder_v2_hi/synth_a0.5_L2_s123.json | 1512 +++++ results/synth_ladder_v2_hi/synth_a0.5_L2_s42.json | 1512 +++++ results/synth_ladder_v2_hi/synth_a0.5_L2_s456.json | 1512 +++++ results/synth_ladder_v2_hi/synth_a0.5_L4_s123.json | 1554 +++++ results/synth_ladder_v2_hi/synth_a0.5_L4_s42.json | 1554 +++++ results/synth_ladder_v2_hi/synth_a0.5_L4_s456.json | 1554 +++++ results/synth_ladder_v2_hi/synth_a0.5_L8_s123.json | 1638 +++++ results/synth_ladder_v2_hi/synth_a0.5_L8_s42.json | 1638 +++++ results/synth_ladder_v2_hi/synth_a0.5_L8_s456.json | 1638 +++++ .../synth_ladder_v2_hi/synth_a1.0_L12_s123.json | 1722 ++++++ results/synth_ladder_v2_hi/synth_a1.0_L12_s42.json | 1722 ++++++ .../synth_ladder_v2_hi/synth_a1.0_L12_s456.json | 1722 ++++++ results/synth_ladder_v2_hi/synth_a1.0_L2_s123.json | 1512 +++++ results/synth_ladder_v2_hi/synth_a1.0_L2_s42.json | 1512 +++++ results/synth_ladder_v2_hi/synth_a1.0_L2_s456.json | 1512 +++++ results/synth_ladder_v2_hi/synth_a1.0_L4_s123.json | 1554 +++++ results/synth_ladder_v2_hi/synth_a1.0_L4_s42.json | 1554 +++++ results/synth_ladder_v2_hi/synth_a1.0_L4_s456.json | 1554 +++++ results/synth_ladder_v2_hi/synth_a1.0_L8_s123.json | 1638 +++++ results/synth_ladder_v2_hi/synth_a1.0_L8_s42.json | 1638 +++++ results/synth_ladder_v2_hi/synth_a1.0_L8_s456.json | 1638 +++++ results/synth_ladder_v2_lo/config.json | 33 + results/synth_ladder_v2_lo/summary.json | 3590 +++++++++++ .../synth_ladder_v2_lo/synth_a0.0_L12_s123.json | 1722 ++++++ results/synth_ladder_v2_lo/synth_a0.0_L12_s42.json | 1722 ++++++ .../synth_ladder_v2_lo/synth_a0.0_L12_s456.json | 1722 ++++++ results/synth_ladder_v2_lo/synth_a0.0_L2_s123.json | 1512 +++++ results/synth_ladder_v2_lo/synth_a0.0_L2_s42.json | 1512 +++++ results/synth_ladder_v2_lo/synth_a0.0_L2_s456.json | 1512 +++++ results/synth_ladder_v2_lo/synth_a0.0_L4_s123.json | 1554 +++++ results/synth_ladder_v2_lo/synth_a0.0_L4_s42.json | 1554 +++++ results/synth_ladder_v2_lo/synth_a0.0_L4_s456.json | 1554 +++++ results/synth_ladder_v2_lo/synth_a0.0_L8_s123.json | 1638 +++++ results/synth_ladder_v2_lo/synth_a0.0_L8_s42.json | 1638 +++++ results/synth_ladder_v2_lo/synth_a0.0_L8_s456.json | 1638 +++++ .../synth_ladder_v2_lo/synth_a0.25_L12_s123.json | 1722 ++++++ .../synth_ladder_v2_lo/synth_a0.25_L12_s42.json | 1722 ++++++ .../synth_ladder_v2_lo/synth_a0.25_L12_s456.json | 1722 ++++++ .../synth_ladder_v2_lo/synth_a0.25_L2_s123.json | 1512 +++++ results/synth_ladder_v2_lo/synth_a0.25_L2_s42.json | 1512 +++++ .../synth_ladder_v2_lo/synth_a0.25_L2_s456.json | 1512 +++++ .../synth_ladder_v2_lo/synth_a0.25_L4_s123.json | 1554 +++++ results/synth_ladder_v2_lo/synth_a0.25_L4_s42.json | 1554 +++++ .../synth_ladder_v2_lo/synth_a0.25_L4_s456.json | 1554 +++++ .../synth_ladder_v2_lo/synth_a0.25_L8_s123.json | 1638 +++++ results/synth_ladder_v2_lo/synth_a0.25_L8_s42.json | 1638 +++++ .../synth_ladder_v2_lo/synth_a0.25_L8_s456.json | 1638 +++++ results/topdown_curriculum/topdown_s42.json | 620 ++ results/update_swap/update_swap_L4_d256_s42.json | 326 + results/vector_audit/audit_results.json | 184 + results/vector_audit_full/audit_results.json | 1346 ++++ results/vector_credit_pilot/results.json | 590 ++ results/vit_dfa_train_s42.log | 4 + results/vit_frozen_blocks_s123.log | 34 + results/vit_frozen_blocks_s42.log | 34 + results/vit_frozen_blocks_s456.log | 34 + results/vit_shallow_baseline_s42.log | 28 + results/vit_test/snapshot_vit_s42.json | 244 + 237 files changed, 247844 insertions(+), 3 deletions(-) create mode 100644 results/alpha_sweep_scaffold/alpha_sweep_t5_s42.json create mode 100644 results/audit_d512_L2_4method.log create mode 100644 results/audit_d512_L2_6method.log create mode 100644 results/blend_dissection/dissection_t5_s42.json create mode 100644 results/boundary_ablation_deltaL_wr/ablation_a1.0_L4_s42.json create mode 100644 results/boundary_ablation_s123/ablation_a1.0_L4_s123.json create mode 100644 results/boundary_ablation_s456/ablation_a1.0_L4_s456.json create mode 100644 results/boundary_ablation_s_sweep/ablation_a1.0_L4_s42.json create mode 100644 results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json create mode 100644 results/boundary_ablation_wr_sweep/ablation_a1.0_L4_s42.json create mode 100644 results/bp_with_penalty_run.log create mode 100644 results/checkpointed_handoff/handoff_s42.json create mode 100644 results/cifar100_protocol_validation.log create mode 100644 results/cifar100_protocol_validation/results_cifar100.json create mode 100644 results/cifar_deltaL/cb_deltaL_d512_L4_s42.json create mode 100644 results/cifar_depth_scan_multiseed.log create mode 100644 results/cifar_depth_scan_multiseed/d512_L4_s123.json create mode 100644 results/cifar_depth_scan_multiseed/d512_L4_s456.json create mode 100644 results/cifar_depth_scan_multiseed/summary.json create mode 100644 results/cifar_depth_scan_s42/d512_L12_s42.json create mode 100644 results/cifar_depth_scan_s42/d512_L2_s42.json create mode 100644 results/cifar_depth_scan_s42/d512_L4_s42.json create mode 100644 results/cifar_depth_scan_s42/d512_L6_s42.json create mode 100644 results/cifar_depth_scan_s42/d512_L8_s42.json create mode 100644 results/cifar_depth_scan_s42/summary.json create mode 100644 results/confirmatory/T1_cifar_full_metrics_gpu1.csv create mode 100644 results/confirmatory/T2_support_sparsity_FIXED.csv create mode 100644 results/confirmatory/T2_support_sparsity_gpu1.csv create mode 100644 results/confirmatory/T4_active_gamma_gpu1.csv create mode 100644 results/confirmatory/element_grad_concentration_gpu1.csv create mode 100644 results/deeper_L_multiseed_scan.log create mode 100644 results/dfa_canonical_freshB.log create mode 100644 results/dfa_canonical_freshB/freshB_null_canonical_s42.json create mode 100644 results/dfa_canonical_lam1e-2_30ep/results_cifar10.json create mode 100644 results/dfa_canonical_lam1e-4_30ep/results_cifar10.json create mode 100644 results/dfa_canonical_penalty_sweep.log create mode 100644 results/dfa_canonical_penalty_trajectory.json create mode 100644 results/dfa_canonical_penalty_trajectory.log create mode 100644 results/dfa_direction_quality_run.log create mode 100644 results/dfa_pen_short_lam1e-1.log create mode 100644 results/dfa_pen_short_lam1e-4.log create mode 100644 results/dfa_pen_short_lam1e-4_s123.log create mode 100644 results/dfa_pen_short_lam1e-4_s456.log create mode 100644 results/dfa_pen_short_run.log create mode 100644 results/dfa_pen_short_s123.log create mode 100644 results/dfa_pen_short_s456.log create mode 100644 results/dfa_residual_penalty/dfa_pen_lam0.001_s42.json create mode 100644 results/dfa_residual_penalty/dfa_pen_lam0.01_s123.json create mode 100644 results/dfa_residual_penalty/dfa_pen_lam0.01_s42.json create mode 100644 results/dfa_residual_penalty/dfa_pen_lam0.01_s456.json create mode 100644 results/dfa_residual_penalty/run_lam1e-1_s42.log create mode 100644 results/dfa_residual_penalty/run_lam1e-2_s123.log create mode 100644 results/dfa_residual_penalty/run_lam1e-2_s42.log create mode 100644 results/dfa_residual_penalty/run_lam1e-2_s456.log create mode 100644 results/dfa_residual_penalty/run_lam1e-3_s123.log create mode 100644 results/dfa_residual_penalty/run_lam1e-3_s42.log create mode 100644 results/dfa_residual_penalty/run_lam1e-3_s456.log create mode 100644 results/ep_baseline/ep_s2048.json create mode 100644 results/exploit_linesearch/linesearch_L4_d256_s42.json create mode 100644 results/exploit_linesearch_full/linesearch_L4_d256_s42.json create mode 100644 results/fa_canonical_lam1e-2_30ep/results_cifar10.json create mode 100644 results/fa_canonical_lam1e-4_30ep/results_cifar10.json create mode 100644 results/fa_canonical_penalty_sweep.log create mode 100644 results/figures/figure_snapshot_resmlp.pdf create mode 100644 results/figures/figure_snapshot_vit.pdf create mode 100644 results/freeze_with_decay/freeze_with_decay_t5_s42.json create mode 100644 results/frozen_baselines_crossarch.json create mode 100644 results/frozen_baselines_crossarch.log create mode 100644 results/frozen_cifar/frozen_L4_d256_s42.json create mode 100644 results/frozen_cifar/frozen_L4_d512_s42.json create mode 100644 results/frozen_cifar/frozen_L6_d256_s42.json create mode 100644 results/frozen_cifar_vec/frozen_vec_L4_d256_s42.json create mode 100644 results/h2_no_residual_full_s123.log create mode 100644 results/h2_no_residual_full_s123/snapshot_evolution_s123.json create mode 100644 results/h2_no_residual_full_s42.log create mode 100644 results/h2_no_residual_full_s42/snapshot_evolution_s42.json create mode 100644 results/h2_no_residual_full_s456.log create mode 100644 results/h2_no_residual_full_s456/snapshot_evolution_s456.json create mode 100644 results/h2_no_residual_s42.log create mode 100644 results/h2_smoke_w0.1/snapshot_evolution_s42.json create mode 100644 results/h2_smoke_w0.2/snapshot_evolution_s42.json create mode 100644 results/h2_smoke_w0.5/snapshot_evolution_s42.json create mode 100644 results/h2_smoketest/snapshot_evolution_s42.json create mode 100644 results/minimal_aux_compression/minimal_aux_compression_t5_s42.json create mode 100644 results/online_shallow/scan_s42.json create mode 100644 results/online_shallow_3seed/scan_s123.json create mode 100644 results/online_shallow_3seed/scan_s42.json create mode 100644 results/online_shallow_3seed/scan_s456.json create mode 100644 results/online_vec_pilot/pilot_s42.json create mode 100644 results/optionA_random_targets_s42.log create mode 100644 results/optionA_random_targets_s42/snapshot_evolution_s42.json create mode 100644 results/optionA_smoke/snapshot_evolution_s42.json create mode 100644 results/optionEP_random_targets_full.log create mode 100644 results/optionEP_random_targets_full/ep_random_s42.json create mode 100644 results/optionEP_smoke/ep_random_s42.json create mode 100644 results/optionSBCB_random_targets_s42.log create mode 100644 results/optionSBCB_random_targets_s42/results_cifar10.json create mode 100644 results/optionSBCB_smoke/results_cifar10.json create mode 100644 results/periodic_refit/periodic_refit_s42.json create mode 100644 results/prefit_threshold/prefit_curve_t5_s42.json create mode 100644 results/resmlp_frozen_blocks_s123.log create mode 100644 results/resmlp_frozen_blocks_s42.log create mode 100644 results/resmlp_frozen_blocks_s456.log create mode 100644 results/resnet_baseline_s42.log create mode 100644 results/resnet_frozen_blocks_s42.log create mode 100644 results/resnet_protocol_validation.json create mode 100644 results/resnet_protocol_validation.log create mode 100644 results/round38_cb_penalty_30ep_s123.log create mode 100644 results/round38_cb_penalty_30ep_s123/results_cifar10.json create mode 100644 results/round38_cb_penalty_30ep_s456.log create mode 100644 results/round38_cb_penalty_30ep_s456/results_cifar10.json create mode 100644 results/round38_sb_penalty_30ep_s123.log create mode 100644 results/round38_sb_penalty_30ep_s123/results_cifar10.json create mode 100644 results/round38_sb_penalty_30ep_s456.log create mode 100644 results/round38_sb_penalty_30ep_s456/results_cifar10.json create mode 100644 results/round38_sbcb_baseline_30ep.log create mode 100644 results/round38_sbcb_baseline_30ep/results_cifar10.json create mode 100644 results/round38_sbcb_penalty_30ep.log create mode 100644 results/round38_sbcb_penalty_30ep/results_cifar10.json create mode 100644 results/round38_smoke_sbcb_pen/results_cifar10.json create mode 100644 results/round41_dfa_penalty_30ep.log create mode 100644 results/round41_dfa_penalty_30ep/results_cifar10.json create mode 100644 results/round41_dfa_penalty_30ep_s123.log create mode 100644 results/round41_dfa_penalty_30ep_s123/results_cifar10.json create mode 100644 results/round41_dfa_penalty_30ep_s456.log create mode 100644 results/round41_dfa_penalty_30ep_s456/results_cifar10.json create mode 100644 results/scaffold_replication/replication.json create mode 100644 results/schedule_timing/schedules_s42.json create mode 100644 results/snapshot_evolution_v2/run_s123.log create mode 100644 results/snapshot_evolution_v2/run_s42.log create mode 100644 results/snapshot_evolution_v2/run_s456.log create mode 100644 results/snapshot_evolution_v2/snapshot_evolution_s123.json create mode 100644 results/snapshot_evolution_v2/snapshot_evolution_s42.json create mode 100644 results/snapshot_evolution_v2/snapshot_evolution_s456.json create mode 100644 results/snapshot_evolution_v2/snapshot_fa_canonical_s42.json create mode 100644 results/snapshot_evolution_v2/snapshot_fa_s42.json create mode 100644 results/snapshot_evolution_v3_fa.log create mode 100644 results/snapshot_exploit/snapshot_L4_d256_s42.json create mode 100644 results/snapshot_fa_canonical_all.log create mode 100644 results/snapshot_fa_canonical_noln.log create mode 100644 results/snapshot_fa_crossarch.log create mode 100644 results/snapshot_fa_evolution.log create mode 100644 results/snapshot_fa_studentnet_vit.log create mode 100644 results/snapshot_no_outln_v1/run_s123.log create mode 100644 results/snapshot_no_outln_v1/run_s42.log create mode 100644 results/snapshot_no_outln_v1/run_s456.log create mode 100644 results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json create mode 100644 results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json create mode 100644 results/snapshot_no_outln_v1/snapshot_noLN_s123.json create mode 100644 results/snapshot_no_outln_v1/snapshot_noLN_s42.json create mode 100644 results/snapshot_no_outln_v1/snapshot_noLN_s456.json create mode 100644 results/snapshot_synth_v1/run_a1.0_s42.log create mode 100644 results/snapshot_synth_v1/snapshot_fa_canonical_s42.json create mode 100644 results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json create mode 100644 results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json create mode 100644 results/snapshot_time/time_sweep_L4_d256_s42.json create mode 100644 results/snapshot_vit_v1/run_s123.log create mode 100644 results/snapshot_vit_v1/run_s42.log create mode 100644 results/snapshot_vit_v1/run_s456.log create mode 100644 results/snapshot_vit_v1/snapshot_fa_canonical_s42.json create mode 100644 results/snapshot_vit_v1/snapshot_fa_vit_s42.json create mode 100644 results/snapshot_vit_v1/snapshot_vit_s123.json create mode 100644 results/snapshot_vit_v1/snapshot_vit_s42.json create mode 100644 results/snapshot_vit_v1/snapshot_vit_s456.json create mode 100644 results/structured_aux/structured_aux_t5_s42.json create mode 100644 results/synth_ladder_smoke/config.json create mode 100644 results/synth_ladder_smoke/summary.json create mode 100644 results/synth_ladder_smoke/synth_a0.0_L2_s42.json create mode 100644 results/synth_ladder_smoke/synth_a0.0_L8_s42.json create mode 100644 results/synth_ladder_smoke/synth_a0.5_L2_s42.json create mode 100644 results/synth_ladder_smoke/synth_a0.5_L8_s42.json create mode 100644 results/synth_ladder_smoke/synth_a1.0_L2_s42.json create mode 100644 results/synth_ladder_smoke/synth_a1.0_L8_s42.json create mode 100644 results/synth_ladder_v2_hi/config.json create mode 100644 results/synth_ladder_v2_hi/summary.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L12_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L12_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L12_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L2_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L2_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L2_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L4_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L4_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L4_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L8_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L8_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a0.5_L8_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L12_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L12_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L12_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L2_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L2_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L2_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L4_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L4_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L4_s456.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L8_s123.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L8_s42.json create mode 100644 results/synth_ladder_v2_hi/synth_a1.0_L8_s456.json create mode 100644 results/synth_ladder_v2_lo/config.json create mode 100644 results/synth_ladder_v2_lo/summary.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L12_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L12_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L12_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L2_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L2_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L2_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L4_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L4_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L4_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L8_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L8_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.0_L8_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L12_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L12_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L12_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L2_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L2_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L2_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L4_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L4_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L4_s456.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L8_s123.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L8_s42.json create mode 100644 results/synth_ladder_v2_lo/synth_a0.25_L8_s456.json create mode 100644 results/topdown_curriculum/topdown_s42.json create mode 100644 results/update_swap/update_swap_L4_d256_s42.json create mode 100644 results/vector_audit/audit_results.json create mode 100644 results/vector_audit_full/audit_results.json create mode 100644 results/vector_credit_pilot/results.json create mode 100644 results/vit_dfa_train_s42.log create mode 100644 results/vit_frozen_blocks_s123.log create mode 100644 results/vit_frozen_blocks_s42.log create mode 100644 results/vit_frozen_blocks_s456.log create mode 100644 results/vit_shallow_baseline_s42.log create mode 100644 results/vit_test/snapshot_vit_s42.json (limited to 'results') diff --git a/results/alpha_sweep_scaffold/alpha_sweep_t5_s42.json b/results/alpha_sweep_scaffold/alpha_sweep_t5_s42.json new file mode 100644 index 0000000..6ca3952 --- /dev/null +++ b/results/alpha_sweep_scaffold/alpha_sweep_t5_s42.json @@ -0,0 +1,6489 @@ +{ + "args": { + "num_blocks": 4, + "d_hidden": 256, + "batch_size": 128, + "epochs": 100, + "t0": 5, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "M": 4, + "seed": 42, + "gpu": 3, + "output_dir": "/home/yurenh2/fa/results/alpha_sweep_scaffold" + }, + "dfa_ckpt_acc": 0.304, + "dfa_final_acc": 0.3115, + "continue_DFA": { + "alpha": 0.0, + "test_acc": [ + 0.2982, + 0.3109, + 0.3125, + 0.3038, + 0.3113, + 0.3135, + 0.302, + 0.3075, + 0.3097, + 0.3101, + 0.3029, + 0.3054, + 0.3108, + 0.3095, + 0.3047, + 0.3164, + 0.3031, + 0.3083, + 0.3171, + 0.3029, + 0.2979, + 0.2958, + 0.3099, + 0.2966, + 0.2959, + 0.3017, + 0.3082, + 0.3046, + 0.306, + 0.292, + 0.281, + 0.3129, + 0.3075, + 0.3115, + 0.3141, + 0.3111, + 0.3151, + 0.2969, + 0.3097, + 0.321, + 0.3058, + 0.3145, + 0.32, + 0.303, + 0.3093, + 0.3071, + 0.3118, + 0.3043, + 0.3104, + 0.3127, + 0.3148, + 0.3203, + 0.3112, + 0.3016, + 0.315, + 0.312, + 0.3134, + 0.3129, + 0.3049, + 0.3125, + 0.3142, + 0.3164, + 0.314, + 0.309, + 0.3142, + 0.3165, + 0.3125, + 0.3095, + 0.3104, + 0.3188, + 0.3149, + 0.3142, + 0.3119, + 0.3166, + 0.3118, + 0.3119, + 0.3127, + 0.311, + 0.3141, + 0.3164, + 0.3123, + 0.3128, + 0.3126, + 0.3091, + 0.3115, + 0.3127, + 0.3121, + 0.3123, + 0.3127, + 0.3132, + 0.3118, + 0.3118, + 0.3117, + 0.3114, + 0.3115 + ], + "train_loss": [ + 1.989790809059143, + 1.990307411880493, + 1.9905100513458251, + 1.9918334338378907, + 1.9863724251937867, + 1.9870153832244872, + 1.9874663953399658, + 1.9870845441055298, + 1.9880484677505492, + 1.9872064337539672, + 1.9897905487823486, + 1.9892820449066162, + 1.9874972410583496, + 1.9877921746444702, + 1.9876875100708007, + 1.9888226028060914, + 1.9874765905761718, + 1.9867966274642945, + 1.987537554550171, + 1.9880204120254517, + 1.9879772283935546, + 1.987797650413513, + 1.9874019779968262, + 1.9876940496063233, + 1.986886355819702, + 1.9884147914123536, + 1.9890670285797118, + 1.9873397811889648, + 1.9847210833740234, + 1.9871949213027955, + 1.9887558262634277, + 1.9838399686431885, + 1.9857967501068114, + 1.9860699237060546, + 1.9850847225952148, + 1.987654845123291, + 1.983670299758911, + 1.987481754837036, + 1.9858247266387938, + 1.9868243627166748, + 1.9862985388946532, + 1.984481724205017, + 1.9851255657958984, + 1.9881289917373657, + 1.9866780487442017, + 1.9885919563293457, + 1.9857788675308228, + 1.9890421838378907, + 1.9863371643066405, + 1.986637942276001, + 1.9849364169311523, + 1.9842691050720216, + 1.9856912046051025, + 1.988491299057007, + 1.9852929847717284, + 1.9856826776123047, + 1.9851847518920898, + 1.9835067967987061, + 1.9865730474853516, + 1.9850236835479735, + 1.9849657077789307, + 1.9844414936065673, + 1.9851242599105834, + 1.9842400899505614, + 1.9859014458847046, + 1.9850837426757812, + 1.985779475440979, + 1.985046662750244, + 1.9846652752685547, + 1.9845653623199462, + 1.984431827697754, + 1.9861651288223268, + 1.9833351360702514, + 1.9858753430175782, + 1.9859362523651123, + 1.9840349249649047, + 1.9841974882507325, + 1.9834141875457765, + 1.9854680131530762, + 1.9825797986221314, + 1.9835828475570678, + 1.9841230081176757, + 1.9844115731811522, + 1.9840126071548463, + 1.9844582679748535, + 1.9840802533340454, + 1.9842612131118775, + 1.984658988571167, + 1.9846206958770751, + 1.983520182762146, + 1.981859715309143, + 1.9833977752304077, + 1.9841900691986083, + 1.982843738861084, + 1.9838121879577637 + ], + "gamma": [ + [ + 6, + 0.0821653357706964 + ], + [ + 7, + 0.083711032057181 + ], + [ + 8, + 0.08393650152720511 + ], + [ + 9, + 0.08384976850356907 + ], + [ + 10, + 0.08560753799974918 + ], + [ + 13, + 0.0868276598630473 + ], + [ + 15, + 0.08848524722270668 + ], + [ + 20, + 0.08918609796091914 + ], + [ + 25, + 0.09372491284739226 + ], + [ + 35, + 0.09340126946335658 + ], + [ + 45, + 0.09817965375259519 + ], + [ + 55, + 0.09978153288830072 + ], + [ + 65, + 0.1001084745512344 + ], + [ + 75, + 0.1013008076697588 + ], + [ + 85, + 0.1014239476644434 + ], + [ + 95, + 0.10141936334548518 + ], + [ + 100, + 0.10145300498697907 + ] + ], + "rho": [ + [ + 6, + 0.019282110035419464 + ], + [ + 7, + 0.006952052121050656 + ], + [ + 8, + 0.008748143445700407 + ], + [ + 9, + 0.008938514394685626 + ], + [ + 10, + 0.01805932994466275 + ], + [ + 13, + 0.01803369668778032 + ], + [ + 15, + 0.0023002898087725043 + ], + [ + 20, + 0.012751705711707473 + ], + [ + 25, + 0.0011155498214066029 + ], + [ + 35, + 0.009300894802436233 + ], + [ + 45, + -0.0039156777784228325 + ], + [ + 55, + -0.007268198300153017 + ], + [ + 65, + 0.008430896326899529 + ], + [ + 75, + 0.004795442800968885 + ], + [ + 85, + -0.0030130266677588224 + ], + [ + 95, + 0.006304946728050709 + ], + [ + 100, + 0.004224925301969051 + ] + ], + "alpha_eff": [ + [ + 6, + 0.0 + ], + [ + 7, + 0.0 + ], + [ + 8, + 0.0 + ], + [ + 9, + 0.0 + ], + [ + 10, + 0.0 + ], + [ + 11, + 0.0 + ], + [ + 12, + 0.0 + ], + [ + 13, + 0.0 + ], + [ + 14, + 0.0 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + }, + "blend_perlayer_vector_alpha025": { + "alpha": 0.25, + "test_acc": [ + 0.3059, + 0.3134, + 0.3123, + 0.3027, + 0.3018, + 0.2983, + 0.3026, + 0.3085, + 0.2995, + 0.309, + 0.32, + 0.3066, + 0.3078, + 0.292, + 0.3148, + 0.3093, + 0.3138, + 0.3203, + 0.3104, + 0.3125, + 0.3131, + 0.3109, + 0.3155, + 0.3017, + 0.2953, + 0.3003, + 0.3192, + 0.3038, + 0.2993, + 0.3093, + 0.3122, + 0.3103, + 0.3157, + 0.3056, + 0.3163, + 0.3008, + 0.3168, + 0.3076, + 0.3191, + 0.2972, + 0.3109, + 0.3154, + 0.3106, + 0.3057, + 0.2987, + 0.2986, + 0.2998, + 0.3103, + 0.3066, + 0.2939, + 0.3131, + 0.3157, + 0.3075, + 0.3084, + 0.3134, + 0.304, + 0.3125, + 0.3086, + 0.3127, + 0.3062, + 0.3115, + 0.3095, + 0.3136, + 0.3181, + 0.3079, + 0.305, + 0.3098, + 0.3092, + 0.3121, + 0.3123, + 0.3019, + 0.3064, + 0.3185, + 0.3061, + 0.314, + 0.3095, + 0.3082, + 0.3099, + 0.3077, + 0.3074, + 0.309, + 0.3084, + 0.3071, + 0.3117, + 0.3135, + 0.3103, + 0.3108, + 0.3128, + 0.311, + 0.3125, + 0.311, + 0.3116, + 0.3116, + 0.3114, + 0.3113 + ], + "train_loss": [ + 1.9946389611434936, + 1.9873730335998536, + 1.9877911005020141, + 1.9842363983154296, + 1.9815330656433106, + 1.980721904220581, + 1.9785015773773194, + 1.9797889567565918, + 1.9816056001281739, + 1.9788435654449463, + 1.9812182509613037, + 1.9796995071792602, + 1.9816956015396119, + 1.9824337406921386, + 1.979214592666626, + 1.9782327182769774, + 1.983439411239624, + 1.9820835842895508, + 1.982200440979004, + 1.9838852446746826, + 1.9820847830963135, + 1.9821476971435548, + 1.9841077730560304, + 1.984079453048706, + 1.981676795501709, + 1.981983535079956, + 1.9816267264175416, + 1.9832186078262328, + 1.9813471504974365, + 1.983914895172119, + 1.980699147644043, + 1.9799334463500977, + 1.981280658531189, + 1.981482693939209, + 1.981354609375, + 1.9822732683563233, + 1.981365751876831, + 1.9825617141723633, + 1.9832577297210694, + 1.982207321434021, + 1.981124991416931, + 1.9847596619415284, + 1.9812841805648804, + 1.9833404195404052, + 1.9824105700683594, + 1.9793556769561769, + 1.9829961922454833, + 1.983497814025879, + 1.9825690042495727, + 1.9819972144317628, + 1.9813205464172363, + 1.9805747171783448, + 1.981684338645935, + 1.981287991065979, + 1.9817047914886474, + 1.9801208978652953, + 1.982117232284546, + 1.9809979217910767, + 1.9817907106781005, + 1.9819589037704468, + 1.980901844406128, + 1.979100549545288, + 1.9783411534118653, + 1.982215822982788, + 1.9786703715515137, + 1.9790553332138061, + 1.9795003827285766, + 1.9804647981262207, + 1.9805792209243775, + 1.9786001267242432, + 1.980303563232422, + 1.9798223697280883, + 1.9818306106948853, + 1.9783708667755127, + 1.9785375136947632, + 1.9783638653945923, + 1.9782444370269776, + 1.9777508059692384, + 1.9798192587280274, + 1.9783385585021973, + 1.9803018301773072, + 1.977279466819763, + 1.9773743700790405, + 1.9787853107452393, + 1.9787623846054077, + 1.9773602225112914, + 1.978456362953186, + 1.9782572579956055, + 1.9804483145141603, + 1.9793778206634522, + 1.9739930397033691, + 1.979039264907837, + 1.9762582428359985, + 1.977005643081665, + 1.9782807824707032 + ], + "gamma": [ + [ + 6, + 0.07866817025933415 + ], + [ + 7, + 0.08171852119266987 + ], + [ + 8, + 0.0832369290292263 + ], + [ + 9, + 0.08300935570150614 + ], + [ + 10, + 0.08633468067273498 + ], + [ + 13, + 0.08728862018324435 + ], + [ + 15, + 0.08539568376727402 + ], + [ + 20, + 0.0892858924344182 + ], + [ + 25, + 0.08779954141937196 + ], + [ + 35, + 0.089820038061589 + ], + [ + 45, + 0.09298557415604591 + ], + [ + 55, + 0.09603138081729412 + ], + [ + 65, + 0.09451595041900873 + ], + [ + 75, + 0.09730265894904733 + ], + [ + 85, + 0.09736149618402123 + ], + [ + 95, + 0.09684902639128268 + ], + [ + 100, + 0.09718019678257406 + ] + ], + "rho": [ + [ + 6, + 0.01853559073060751 + ], + [ + 7, + 0.0021537072025239468 + ], + [ + 8, + 0.022916836314834654 + ], + [ + 9, + 0.017495981883257627 + ], + [ + 10, + -0.007019296521320939 + ], + [ + 13, + 0.020411364268511534 + ], + [ + 15, + 0.008924664638470858 + ], + [ + 20, + 0.009920771466568112 + ], + [ + 25, + 0.0004479335620999336 + ], + [ + 35, + -0.00826605735346675 + ], + [ + 45, + 0.0026894344482570887 + ], + [ + 55, + -0.0041805449873209 + ], + [ + 65, + 0.0017762749921530485 + ], + [ + 75, + 0.0005749878473579884 + ], + [ + 85, + 0.0030663725920021534 + ], + [ + 95, + 0.01072357571683824 + ], + [ + 100, + -0.002892943099141121 + ] + ], + "alpha_eff": [ + [ + 6, + 0.24972248771260733 + ], + [ + 7, + 0.24947935032695043 + ], + [ + 8, + 0.24948230432577714 + ], + [ + 9, + 0.24949492228305725 + ], + [ + 10, + 0.24948454982935764 + ], + [ + 11, + 0.24949888452990227 + ], + [ + 12, + 0.24948282668432062 + ], + [ + 13, + 0.24949142674491542 + ], + [ + 14, + 0.24948863864376475 + ], + [ + 15, + 0.249494092781818 + ], + [ + 16, + 0.2494879335982677 + ], + [ + 17, + 0.24949017029823428 + ], + [ + 18, + 0.24947683994673858 + ], + [ + 19, + 0.24948694720682202 + ], + [ + 20, + 0.24948447549318925 + ], + [ + 21, + 0.24948920513186867 + ], + [ + 22, + 0.2494920286991675 + ], + [ + 23, + 0.24949015605792602 + ], + [ + 24, + 0.24947783867079276 + ], + [ + 25, + 0.2494776485658948 + ], + [ + 26, + 0.2494743912586451 + ], + [ + 27, + 0.24945635304586694 + ], + [ + 28, + 0.2494817281764155 + ], + [ + 29, + 0.24947529417163083 + ], + [ + 30, + 0.24948553835581308 + ], + [ + 31, + 0.24947934118373832 + ], + [ + 32, + 0.2494931516826185 + ], + [ + 33, + 0.24948261801326022 + ], + [ + 34, + 0.24948319727456705 + ], + [ + 35, + 0.24947981390237856 + ], + [ + 36, + 0.2494862019543101 + ], + [ + 37, + 0.24948648091286968 + ], + [ + 38, + 0.24948492864362595 + ], + [ + 39, + 0.2494821003855004 + ], + [ + 40, + 0.24947632642287987 + ], + [ + 41, + 0.24947967624534692 + ], + [ + 42, + 0.24947886875613925 + ], + [ + 43, + 0.24948325688500178 + ], + [ + 44, + 0.2494944341907901 + ], + [ + 45, + 0.24948371186478835 + ], + [ + 46, + 0.2494850860984326 + ], + [ + 47, + 0.2494756676395805 + ], + [ + 48, + 0.24947560985496792 + ], + [ + 49, + 0.24949731965623512 + ], + [ + 50, + 0.24947536293189315 + ], + [ + 51, + 0.24946844536101623 + ], + [ + 52, + 0.24947678739963527 + ], + [ + 53, + 0.24947438884654782 + ], + [ + 54, + 0.24949042802970364 + ], + [ + 55, + 0.2494939425232515 + ], + [ + 56, + 0.24948793523593268 + ], + [ + 57, + 0.24949688396885342 + ], + [ + 58, + 0.24948035040414968 + ], + [ + 59, + 0.24945642654825334 + ], + [ + 60, + 0.24948242856112499 + ], + [ + 61, + 0.24948100071931803 + ], + [ + 62, + 0.24949957614031087 + ], + [ + 63, + 0.24948502855966503 + ], + [ + 64, + 0.24948644180485893 + ], + [ + 65, + 0.24947477087551181 + ], + [ + 66, + 0.24946816015729842 + ], + [ + 67, + 0.2494722537208322 + ], + [ + 68, + 0.2494809632315978 + ], + [ + 69, + 0.24949564815756167 + ], + [ + 70, + 0.24946268715863537 + ], + [ + 71, + 0.24948731809190608 + ], + [ + 72, + 0.24948537374072835 + ], + [ + 73, + 0.24948555141221207 + ], + [ + 74, + 0.249494409075237 + ], + [ + 75, + 0.24947960040422168 + ], + [ + 76, + 0.2494949614662781 + ], + [ + 77, + 0.24949650212563007 + ], + [ + 78, + 0.24949114084876567 + ], + [ + 79, + 0.249489902312524 + ], + [ + 80, + 0.24946300410005345 + ], + [ + 81, + 0.24947569553155974 + ], + [ + 82, + 0.24948523532543226 + ], + [ + 83, + 0.24948210614594962 + ], + [ + 84, + 0.24947225552035546 + ], + [ + 85, + 0.24947941896357276 + ], + [ + 86, + 0.24948837982560348 + ], + [ + 87, + 0.24947696381396076 + ], + [ + 88, + 0.24947869451986296 + ], + [ + 89, + 0.24945727642174398 + ], + [ + 90, + 0.24946828940090288 + ], + [ + 91, + 0.24947728166379377 + ], + [ + 92, + 0.24947517484195078 + ], + [ + 93, + 0.24948233253009675 + ], + [ + 94, + 0.2494779532154209 + ], + [ + 95, + 0.24947562515897356 + ], + [ + 96, + 0.2494888820429275 + ], + [ + 97, + 0.2494965139146254 + ], + [ + 98, + 0.24947869341928813 + ], + [ + 99, + 0.24948464951129232 + ], + [ + 100, + 0.24947761844822447 + ] + ] + }, + "blend_perlayer_vector_alpha050": { + "alpha": 0.5, + "test_acc": [ + 0.3023, + 0.3096, + 0.3145, + 0.3032, + 0.3072, + 0.2997, + 0.3137, + 0.3118, + 0.3058, + 0.3109, + 0.3207, + 0.3091, + 0.3121, + 0.2956, + 0.32, + 0.312, + 0.3177, + 0.3197, + 0.3224, + 0.3198, + 0.318, + 0.3172, + 0.3178, + 0.3128, + 0.2978, + 0.3098, + 0.32, + 0.3142, + 0.3047, + 0.3156, + 0.3106, + 0.3144, + 0.3143, + 0.312, + 0.3241, + 0.3061, + 0.3211, + 0.3149, + 0.319, + 0.3059, + 0.3164, + 0.315, + 0.3141, + 0.3046, + 0.3048, + 0.3037, + 0.3057, + 0.3178, + 0.3129, + 0.3019, + 0.3178, + 0.3198, + 0.3123, + 0.3085, + 0.3157, + 0.3089, + 0.3156, + 0.3123, + 0.3181, + 0.3123, + 0.3148, + 0.3144, + 0.3168, + 0.3198, + 0.3121, + 0.3111, + 0.3151, + 0.3155, + 0.3144, + 0.3164, + 0.3099, + 0.3103, + 0.3255, + 0.3112, + 0.3223, + 0.313, + 0.3094, + 0.3146, + 0.311, + 0.3155, + 0.3148, + 0.3139, + 0.3125, + 0.3138, + 0.3151, + 0.316, + 0.3156, + 0.3154, + 0.3165, + 0.3167, + 0.3163, + 0.3171, + 0.3171, + 0.3171, + 0.3171 + ], + "train_loss": [ + 1.9917561831665038, + 1.9829305992126465, + 1.9812401902008057, + 1.9778941026306152, + 1.9752952905273438, + 1.974818321762085, + 1.9736881392669678, + 1.974170976486206, + 1.9745802745056151, + 1.9709150112533569, + 1.9729148027801513, + 1.9720560794830322, + 1.9740230810928345, + 1.9755329774475097, + 1.9731374980163574, + 1.9692442362213134, + 1.9725708643341064, + 1.9713253354644775, + 1.970638151473999, + 1.9699185414886475, + 1.9683959786224365, + 1.967863571510315, + 1.9711056298828125, + 1.972366621360779, + 1.9698165482330323, + 1.9716122170257568, + 1.969995245361328, + 1.971645417175293, + 1.9680979971313477, + 1.9714557960510255, + 1.9684885326766968, + 1.9681451354599, + 1.9684070782089234, + 1.9694038621520995, + 1.9699225545501708, + 1.9718246128082275, + 1.97034676486969, + 1.9717714920425415, + 1.9720078167724608, + 1.9701439580535889, + 1.9689175207901002, + 1.974075308189392, + 1.9706641263580322, + 1.9716036338043212, + 1.97032455657959, + 1.9667090301513672, + 1.970846530380249, + 1.9712551027679444, + 1.9709385818862915, + 1.9708643013763427, + 1.9695846894073485, + 1.9686976073837281, + 1.9692375783920288, + 1.9684447635650635, + 1.9694693069458007, + 1.9663859380722046, + 1.9694285501861573, + 1.9679479430389404, + 1.9683449375152589, + 1.9691200702667235, + 1.9684226276397705, + 1.965940485496521, + 1.9654108630371094, + 1.9689697052764892, + 1.9656564891052246, + 1.9655308631134034, + 1.9673858330917358, + 1.9679986907196045, + 1.9682127925872803, + 1.9662462731933594, + 1.9673945916366578, + 1.9669571544647217, + 1.969510202255249, + 1.9656707555770874, + 1.9662874362945557, + 1.9652958306503296, + 1.9660377970886231, + 1.9649639958953857, + 1.9671108046722412, + 1.9657821132659912, + 1.9678813097763062, + 1.9645460061645508, + 1.9649910687637329, + 1.9668921905899048, + 1.9659738945770264, + 1.964272243347168, + 1.965306146583557, + 1.96566610496521, + 1.967940728225708, + 1.9675999630737304, + 1.96113099899292, + 1.966398711013794, + 1.963310030479431, + 1.96448876953125, + 1.9661073540496825 + ], + "gamma": [ + [ + 6, + 0.06322180852293968 + ], + [ + 7, + 0.06429825956001878 + ], + [ + 8, + 0.06493996377685107 + ], + [ + 9, + 0.06486295888316818 + ], + [ + 10, + 0.06457511300686747 + ], + [ + 13, + 0.0671108040260151 + ], + [ + 15, + 0.0674042459577322 + ], + [ + 20, + 0.07273604930378497 + ], + [ + 25, + 0.06582908588461578 + ], + [ + 35, + 0.06825429387390614 + ], + [ + 45, + 0.07122062100097537 + ], + [ + 55, + 0.0672054453752935 + ], + [ + 65, + 0.06926454044878483 + ], + [ + 75, + 0.06559235090389848 + ], + [ + 85, + 0.06751847686246037 + ], + [ + 95, + 0.06816108210477978 + ], + [ + 100, + 0.06730447930749506 + ] + ], + "rho": [ + [ + 6, + 0.0200467340182513 + ], + [ + 7, + 0.013113802997395396 + ], + [ + 8, + -0.003037167713046074 + ], + [ + 9, + 0.0035772863775491714 + ], + [ + 10, + -0.006673132302239537 + ], + [ + 13, + 0.010507516213692725 + ], + [ + 15, + 0.006647368194535375 + ], + [ + 20, + 0.014684727881103754 + ], + [ + 25, + -0.006462351040681824 + ], + [ + 35, + 0.006036010920070112 + ], + [ + 45, + 0.00909994961693883 + ], + [ + 55, + 0.008473677095025778 + ], + [ + 65, + 0.00033604807686060667 + ], + [ + 75, + 0.0012597318273037672 + ], + [ + 85, + 0.004310714080929756 + ], + [ + 95, + 0.0027081522857770324 + ], + [ + 100, + 0.003070657607167959 + ] + ], + "alpha_eff": [ + [ + 6, + 0.4996261993362568 + ], + [ + 7, + 0.4993391021476833 + ], + [ + 8, + 0.49931185811976125 + ], + [ + 9, + 0.4993096364983503 + ], + [ + 10, + 0.4993144600555052 + ], + [ + 11, + 0.4993251101963492 + ], + [ + 12, + 0.4993212678677952 + ], + [ + 13, + 0.4993213098394563 + ], + [ + 14, + 0.4993075194350882 + ], + [ + 15, + 0.4993074665095068 + ], + [ + 16, + 0.4993121157349748 + ], + [ + 17, + 0.49932483488099205 + ], + [ + 18, + 0.49931736472090327 + ], + [ + 19, + 0.4993086092610733 + ], + [ + 20, + 0.4993029887170185 + ], + [ + 21, + 0.4992957905314217 + ], + [ + 22, + 0.49929552812098327 + ], + [ + 23, + 0.49931472694487866 + ], + [ + 24, + 0.49932052243153885 + ], + [ + 25, + 0.4993186115711273 + ], + [ + 26, + 0.49932203807715797 + ], + [ + 27, + 0.49931577169005587 + ], + [ + 28, + 0.49930774133195877 + ], + [ + 29, + 0.4993113354669589 + ], + [ + 30, + 0.4993269110739146 + ], + [ + 31, + 0.4992846764001769 + ], + [ + 32, + 0.4993147888204103 + ], + [ + 33, + 0.4992991821444239 + ], + [ + 34, + 0.499315539341136 + ], + [ + 35, + 0.49929300368544605 + ], + [ + 36, + 0.4993135312110566 + ], + [ + 37, + 0.499312173433516 + ], + [ + 38, + 0.49928442076505974 + ], + [ + 39, + 0.4992879848127134 + ], + [ + 40, + 0.4993209541877065 + ], + [ + 41, + 0.499310149841278 + ], + [ + 42, + 0.4993123354568663 + ], + [ + 43, + 0.4993222357028763 + ], + [ + 44, + 0.4993008995468193 + ], + [ + 45, + 0.4993061526558331 + ], + [ + 46, + 0.4993149831092503 + ], + [ + 47, + 0.4992837521548189 + ], + [ + 48, + 0.49930527816737597 + ], + [ + 49, + 0.49931959987404495 + ], + [ + 50, + 0.49929977286637234 + ], + [ + 51, + 0.4993105151789878 + ], + [ + 52, + 0.4992952907262145 + ], + [ + 53, + 0.49932079464976303 + ], + [ + 54, + 0.4993199948848364 + ], + [ + 55, + 0.499329275416757 + ], + [ + 56, + 0.4993268754767892 + ], + [ + 57, + 0.49933033291600765 + ], + [ + 58, + 0.4993347317146705 + ], + [ + 59, + 0.4993103629058204 + ], + [ + 60, + 0.4993249711709759 + ], + [ + 61, + 0.49930806472910405 + ], + [ + 62, + 0.49934650968638655 + ], + [ + 63, + 0.499318712547547 + ], + [ + 64, + 0.49930730074876145 + ], + [ + 65, + 0.499297153457682 + ], + [ + 66, + 0.4993050258252328 + ], + [ + 67, + 0.4993109057142996 + ], + [ + 68, + 0.4993250766214407 + ], + [ + 69, + 0.49931206114113486 + ], + [ + 70, + 0.4992909524624259 + ], + [ + 71, + 0.4993036393420284 + ], + [ + 72, + 0.49928560112304887 + ], + [ + 73, + 0.49928474530212236 + ], + [ + 74, + 0.4993115701930791 + ], + [ + 75, + 0.49932136828439816 + ], + [ + 76, + 0.49933078556097654 + ], + [ + 77, + 0.49931148991954166 + ], + [ + 78, + 0.4993258145434325 + ], + [ + 79, + 0.49929900535780325 + ], + [ + 80, + 0.4993166113977388 + ], + [ + 81, + 0.49933789130753126 + ], + [ + 82, + 0.49931904675707844 + ], + [ + 83, + 0.4993120953828435 + ], + [ + 84, + 0.49931019143782207 + ], + [ + 85, + 0.49933704079924096 + ], + [ + 86, + 0.4993145677080777 + ], + [ + 87, + 0.49930384335673567 + ], + [ + 88, + 0.499322289517738 + ], + [ + 89, + 0.49929241445598693 + ], + [ + 90, + 0.4992949648031173 + ], + [ + 91, + 0.4993037293404372 + ], + [ + 92, + 0.4993026274800937 + ], + [ + 93, + 0.4993259323893475 + ], + [ + 94, + 0.4993038912299493 + ], + [ + 95, + 0.4993109706485008 + ], + [ + 96, + 0.4993138731485378 + ], + [ + 97, + 0.49931836748686986 + ], + [ + 98, + 0.4993113804309337 + ], + [ + 99, + 0.4992930082988331 + ], + [ + 100, + 0.4992933031719118 + ] + ] + }, + "blend_perlayer_vector_alpha075": { + "alpha": 0.75, + "test_acc": [ + 0.3069, + 0.3117, + 0.3134, + 0.3102, + 0.3043, + 0.3044, + 0.3067, + 0.3087, + 0.3081, + 0.3071, + 0.3231, + 0.3151, + 0.3161, + 0.3, + 0.3232, + 0.3145, + 0.3203, + 0.3116, + 0.3031, + 0.3142, + 0.3144, + 0.3131, + 0.3144, + 0.3083, + 0.3032, + 0.314, + 0.3217, + 0.3134, + 0.3115, + 0.3174, + 0.3138, + 0.3208, + 0.3169, + 0.3148, + 0.3267, + 0.3132, + 0.3244, + 0.3238, + 0.3246, + 0.3124, + 0.3231, + 0.3273, + 0.3208, + 0.3184, + 0.3131, + 0.3126, + 0.3145, + 0.3219, + 0.3236, + 0.3125, + 0.3258, + 0.3232, + 0.3253, + 0.3178, + 0.3239, + 0.3178, + 0.3258, + 0.3196, + 0.3233, + 0.3198, + 0.3233, + 0.3256, + 0.3257, + 0.3272, + 0.322, + 0.3216, + 0.3197, + 0.3245, + 0.3215, + 0.3198, + 0.3168, + 0.3195, + 0.3252, + 0.3238, + 0.3253, + 0.3194, + 0.3212, + 0.3215, + 0.321, + 0.3206, + 0.3216, + 0.3216, + 0.3208, + 0.3243, + 0.3234, + 0.3221, + 0.3212, + 0.3217, + 0.3227, + 0.3219, + 0.3222, + 0.3219, + 0.322, + 0.3221, + 0.3221 + ], + "train_loss": [ + 1.9939408515167236, + 1.9861596878051757, + 1.9854449212646483, + 1.9809263521575928, + 1.97566344871521, + 1.9728280086517334, + 1.974452314453125, + 1.9807431080627442, + 1.9744162216949463, + 1.9669867644882202, + 1.9692662822723388, + 1.9678162953948974, + 1.9709133194732666, + 1.972092370071411, + 1.9702331074523927, + 1.9634329458618165, + 1.9693690857696533, + 1.9714275366973877, + 1.9736647372436524, + 1.9713019152069091, + 1.967839783554077, + 1.9648340505981445, + 1.9675980786895753, + 1.9694680223846435, + 1.9661734999847411, + 1.9668920111465453, + 1.9645757045745849, + 1.9667655364608765, + 1.9594652931976317, + 1.9621334440612792, + 1.9592414768218993, + 1.9580158362579345, + 1.9570839422988893, + 1.9565859017181397, + 1.9596544408416747, + 1.9624952820587158, + 1.9606676049804688, + 1.9625141510009765, + 1.9646410295104981, + 1.9604910164642333, + 1.9581072945404052, + 1.9628234854507447, + 1.9590881076049804, + 1.9604977954101563, + 1.9603009243774414, + 1.956119110031128, + 1.9611696166610717, + 1.9605925281143188, + 1.9598565783309936, + 1.9586773540496827, + 1.9580707284545897, + 1.9566046767807006, + 1.9583141498184204, + 1.9575138668823242, + 1.9584173246002197, + 1.9545537184906006, + 1.9576402924346923, + 1.9552772137069703, + 1.955228793106079, + 1.956446703186035, + 1.9568019944000243, + 1.9528450647735596, + 1.9516719250488281, + 1.9547899242401123, + 1.9507095720672607, + 1.951067873840332, + 1.9530513054656982, + 1.9538879953765869, + 1.953553825111389, + 1.9515541619110108, + 1.9523499368667603, + 1.9517578278350831, + 1.9545308373260497, + 1.9503954576873779, + 1.951339678955078, + 1.950171506958008, + 1.951169235610962, + 1.9501886684417724, + 1.9523463172149658, + 1.950947571105957, + 1.9535913979339599, + 1.949757958946228, + 1.9497659448623657, + 1.9515488370513916, + 1.9508306390380858, + 1.9497578717803956, + 1.9498168933105469, + 1.9509752071380615, + 1.9535040804672241, + 1.9524465697860718, + 1.9461274175643921, + 1.9513143978118896, + 1.9484365969848634, + 1.9497413010406495, + 1.9511626023101807 + ], + "gamma": [ + [ + 6, + 0.029690025316085666 + ], + [ + 7, + 0.03211108082905412 + ], + [ + 8, + 0.02919765340629965 + ], + [ + 9, + 0.02874648931901902 + ], + [ + 10, + 0.029019907349720597 + ], + [ + 13, + 0.0342491683550179 + ], + [ + 15, + 0.03304886294063181 + ], + [ + 20, + 0.03220415679970756 + ], + [ + 25, + 0.027112489042337984 + ], + [ + 35, + 0.03040921490173787 + ], + [ + 45, + 0.026454357663169503 + ], + [ + 55, + 0.03050265001365915 + ], + [ + 65, + 0.022586700739338994 + ], + [ + 75, + 0.03416337142698467 + ], + [ + 85, + 0.030736169428564608 + ], + [ + 95, + 0.03216187539510429 + ], + [ + 100, + 0.03935998142696917 + ] + ], + "rho": [ + [ + 6, + 0.015949245484080166 + ], + [ + 7, + 0.01342307054437697 + ], + [ + 8, + 0.004009846597909927 + ], + [ + 9, + 0.025402148254215717 + ], + [ + 10, + 0.008257870795205235 + ], + [ + 13, + 0.006433822971303016 + ], + [ + 15, + -0.017903955653309822 + ], + [ + 20, + 0.008053621626459062 + ], + [ + 25, + 0.011718281777575612 + ], + [ + 35, + -0.004712250549346209 + ], + [ + 45, + -0.0023677245480939746 + ], + [ + 55, + 0.014406869537197053 + ], + [ + 65, + 0.012566582299768925 + ], + [ + 75, + 0.0038452057633548975 + ], + [ + 85, + 0.005002687452360988 + ], + [ + 95, + -0.005955582018941641 + ], + [ + 100, + -0.00363031099550426 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7497128513850779 + ], + [ + 7, + 0.7495006479403842 + ], + [ + 8, + 0.7494898494059449 + ], + [ + 9, + 0.7494894703915523 + ], + [ + 10, + 0.7494910522493321 + ], + [ + 11, + 0.7494916838514811 + ], + [ + 12, + 0.7494720897153492 + ], + [ + 13, + 0.7494797446246886 + ], + [ + 14, + 0.7494986754725924 + ], + [ + 15, + 0.7494939935776234 + ], + [ + 16, + 0.7494804065708064 + ], + [ + 17, + 0.7495019121324088 + ], + [ + 18, + 0.7495100362494223 + ], + [ + 19, + 0.7494826293182024 + ], + [ + 20, + 0.7494933775064284 + ], + [ + 21, + 0.7494798413342856 + ], + [ + 22, + 0.7494969511168854 + ], + [ + 23, + 0.7494865050193906 + ], + [ + 24, + 0.7494881104692075 + ], + [ + 25, + 0.7494846218186876 + ], + [ + 26, + 0.7494853043551933 + ], + [ + 27, + 0.7494773243484152 + ], + [ + 28, + 0.74949463029463 + ], + [ + 29, + 0.7494757489504915 + ], + [ + 30, + 0.7494804237637255 + ], + [ + 31, + 0.7494909548788173 + ], + [ + 32, + 0.7494900723300271 + ], + [ + 33, + 0.7494941878746446 + ], + [ + 34, + 0.7494877638886531 + ], + [ + 35, + 0.7494897202151976 + ], + [ + 36, + 0.7494963330719294 + ], + [ + 37, + 0.7494808239403828 + ], + [ + 38, + 0.7494753657764512 + ], + [ + 39, + 0.7494608971844654 + ], + [ + 40, + 0.7494808497354714 + ], + [ + 41, + 0.74946907683424 + ], + [ + 42, + 0.7494659161119482 + ], + [ + 43, + 0.7494800591210298 + ], + [ + 44, + 0.7494823127125755 + ], + [ + 45, + 0.7494831127329752 + ], + [ + 46, + 0.7494868941304027 + ], + [ + 47, + 0.7494760497503494 + ], + [ + 48, + 0.7494636843509664 + ], + [ + 49, + 0.7494856075038441 + ], + [ + 50, + 0.7494714868603383 + ], + [ + 51, + 0.7494691888956687 + ], + [ + 52, + 0.749490003547161 + ], + [ + 53, + 0.7494840879178268 + ], + [ + 54, + 0.7494897896890308 + ], + [ + 55, + 0.74948246129217 + ], + [ + 56, + 0.7494876378303129 + ], + [ + 57, + 0.7494846458457998 + ], + [ + 58, + 0.7494881171334334 + ], + [ + 59, + 0.7494740839123716 + ], + [ + 60, + 0.7494890395866025 + ], + [ + 61, + 0.7494802380837144 + ], + [ + 62, + 0.7495076806478569 + ], + [ + 63, + 0.7494821568138585 + ], + [ + 64, + 0.7494822141688123 + ], + [ + 65, + 0.7494636815466068 + ], + [ + 66, + 0.7494762624940223 + ], + [ + 67, + 0.7494929011143916 + ], + [ + 68, + 0.7494633290311189 + ], + [ + 69, + 0.7494907818954 + ], + [ + 70, + 0.7494698129657793 + ], + [ + 71, + 0.7494802658543539 + ], + [ + 72, + 0.7494772070406521 + ], + [ + 73, + 0.7494757257563516 + ], + [ + 74, + 0.7494800816258608 + ], + [ + 75, + 0.7494901063270729 + ], + [ + 76, + 0.7494993449623615 + ], + [ + 77, + 0.7495025094752598 + ], + [ + 78, + 0.7494899987239635 + ], + [ + 79, + 0.7494908590412915 + ], + [ + 80, + 0.7494663255005782 + ], + [ + 81, + 0.7494692173356918 + ], + [ + 82, + 0.7494787389196118 + ], + [ + 83, + 0.7494800861725361 + ], + [ + 84, + 0.749475234405983 + ], + [ + 85, + 0.7494909942691758 + ], + [ + 86, + 0.7494746851469412 + ], + [ + 87, + 0.749478037434971 + ], + [ + 88, + 0.7494801549497961 + ], + [ + 89, + 0.749456032036178 + ], + [ + 90, + 0.7494693929095732 + ], + [ + 91, + 0.749480378399538 + ], + [ + 92, + 0.7494707978635028 + ], + [ + 93, + 0.749493460356757 + ], + [ + 94, + 0.7494840322166019 + ], + [ + 95, + 0.7494808940938613 + ], + [ + 96, + 0.7495053216308006 + ], + [ + 97, + 0.7494823938620113 + ], + [ + 98, + 0.7494855984799902 + ], + [ + 99, + 0.7494825074497661 + ], + [ + 100, + 0.7494873096472457 + ] + ] + }, + "blend_perlayer_vector_alpha090": { + "alpha": 0.9, + "test_acc": [ + 0.3069, + 0.3092, + 0.3164, + 0.3052, + 0.3059, + 0.2984, + 0.2973, + 0.2947, + 0.2982, + 0.3095, + 0.3037, + 0.2972, + 0.2966, + 0.2832, + 0.3005, + 0.3075, + 0.3059, + 0.3057, + 0.3103, + 0.3071, + 0.3066, + 0.3057, + 0.2968, + 0.3149, + 0.2998, + 0.3032, + 0.3059, + 0.2894, + 0.2553, + 0.276, + 0.2692, + 0.2751, + 0.2626, + 0.2736, + 0.2803, + 0.2831, + 0.2905, + 0.2837, + 0.2877, + 0.2887, + 0.2928, + 0.2954, + 0.2928, + 0.2862, + 0.2882, + 0.2838, + 0.2886, + 0.2929, + 0.2915, + 0.2865, + 0.2984, + 0.299, + 0.2878, + 0.296, + 0.2927, + 0.2884, + 0.2999, + 0.29, + 0.2963, + 0.2913, + 0.2989, + 0.2929, + 0.3013, + 0.2986, + 0.2953, + 0.2932, + 0.2908, + 0.2978, + 0.291, + 0.2916, + 0.2903, + 0.2934, + 0.2984, + 0.2947, + 0.298, + 0.2972, + 0.2956, + 0.2959, + 0.2951, + 0.2946, + 0.2971, + 0.2956, + 0.296, + 0.297, + 0.2973, + 0.2972, + 0.2969, + 0.2968, + 0.2969, + 0.2974, + 0.2975, + 0.2977, + 0.2977, + 0.2977, + 0.2977 + ], + "train_loss": [ + 1.997782850074768, + 1.9959279607391358, + 1.9895094528961181, + 1.981425369491577, + 1.987436777191162, + 1.9854413581085204, + 1.9890507335662841, + 1.999713560562134, + 2.0028857360839845, + 1.9928191792297363, + 2.0108930098724365, + 2.0137152437973023, + 2.0112061127090453, + 2.0165509329223634, + 2.0117236939239502, + 2.003053000869751, + 2.002287318687439, + 1.9908985527801513, + 1.9845779376983643, + 1.98173641166687, + 1.9821000887298583, + 1.9811158957290649, + 1.9879641247558595, + 1.9877586428833007, + 1.9778228791809083, + 1.9733421154785156, + 1.972704354248047, + 1.9742003258514405, + 1.9950288501358033, + 2.002638019256592, + 2.0036745891571046, + 2.0020674619293213, + 1.9996952025985717, + 1.9941947059631349, + 1.994228055343628, + 1.9943625868988037, + 1.9882129996490479, + 1.9930521758270263, + 1.9930853601074219, + 1.9859523449325562, + 1.9788912723541259, + 1.984332553024292, + 1.9792242436981202, + 1.9806055389404298, + 1.9804424798202516, + 1.9772218966293336, + 1.9814973215103149, + 1.97999455078125, + 1.9773017657089234, + 1.976198729248047, + 1.9766320819091796, + 1.9745968744277953, + 1.976400178565979, + 1.9745356512832641, + 1.972631764678955, + 1.970634806175232, + 1.9749352013397217, + 1.9714062850952148, + 1.9663891560363769, + 1.9686513556671144, + 1.967209598388672, + 1.9641500353622436, + 1.9615454802703858, + 1.965209234046936, + 1.9620319871520997, + 1.9626867557525636, + 1.9641366138076781, + 1.9657211672210693, + 1.963914808883667, + 1.963132495651245, + 1.9641750479125977, + 1.9627278024673462, + 1.9663054087066651, + 1.962103825340271, + 1.963687724533081, + 1.9598489971923827, + 1.9601465383148193, + 1.9602603670501708, + 1.9618255139923095, + 1.9606169825744628, + 1.9639963116836547, + 1.959268245162964, + 1.9602994772338866, + 1.9610898205947875, + 1.9605756457901, + 1.9586503783416749, + 1.960484585647583, + 1.9599338275909424, + 1.9627701279449463, + 1.962965354270935, + 1.9585062088012695, + 1.9599010592269897, + 1.9586225860214233, + 1.9604066236114501, + 1.9609591567230225 + ], + "gamma": [ + [ + 6, + 0.0012919941218569875 + ], + [ + 7, + 0.013235294725745916 + ], + [ + 8, + 0.005836346885189414 + ], + [ + 9, + 0.007337209477555007 + ], + [ + 10, + 0.01136046287138015 + ], + [ + 13, + 0.013101757591357455 + ], + [ + 15, + 0.0105974708130816 + ], + [ + 20, + 0.01104156908695586 + ], + [ + 25, + 0.005037317343521863 + ], + [ + 35, + 0.016087420284748077 + ], + [ + 45, + 0.009149214645731263 + ], + [ + 55, + 0.007499612169340253 + ], + [ + 65, + 0.018092090846039355 + ], + [ + 75, + 0.011558135156519711 + ], + [ + 85, + 0.012031848134938627 + ], + [ + 95, + 0.012515450536739081 + ], + [ + 100, + 0.007372630410827696 + ] + ], + "rho": [ + [ + 6, + -0.010041043860837817 + ], + [ + 7, + 0.0027252465952187777 + ], + [ + 8, + -0.001453035045415163 + ], + [ + 9, + -0.009528452530503273 + ], + [ + 10, + -0.023047671420499682 + ], + [ + 13, + -0.007210864219814539 + ], + [ + 15, + 0.0055196997709572315 + ], + [ + 20, + 0.004364048421848565 + ], + [ + 25, + 0.0042708017863333225 + ], + [ + 35, + 0.014436901547014713 + ], + [ + 45, + 0.0030632668640464544 + ], + [ + 55, + 0.014385869493708014 + ], + [ + 65, + -0.009030808927491307 + ], + [ + 75, + -0.00455438275821507 + ], + [ + 85, + 0.006564809940755367 + ], + [ + 95, + -0.002711795154027641 + ], + [ + 100, + -0.018319898284971714 + ] + ], + "alpha_eff": [ + [ + 6, + 0.8998637034742774 + ], + [ + 7, + 0.8997563326857774 + ], + [ + 8, + 0.8997523543230196 + ], + [ + 9, + 0.8997494678808297 + ], + [ + 10, + 0.8997527853654496 + ], + [ + 11, + 0.8997554477200242 + ], + [ + 12, + 0.8997461976186043 + ], + [ + 13, + 0.8997534205024557 + ], + [ + 14, + 0.8997589831013083 + ], + [ + 15, + 0.8997533015536816 + ], + [ + 16, + 0.899759264603019 + ], + [ + 17, + 0.8997603646560224 + ], + [ + 18, + 0.899744551444836 + ], + [ + 19, + 0.8997519522531576 + ], + [ + 20, + 0.8997514759915216 + ], + [ + 21, + 0.8997469126131926 + ], + [ + 22, + 0.8997551999292398 + ], + [ + 23, + 0.8997531225692526 + ], + [ + 24, + 0.8997492362557167 + ], + [ + 25, + 0.8997548329971168 + ], + [ + 26, + 0.8997452556978576 + ], + [ + 27, + 0.8997449194113881 + ], + [ + 28, + 0.899748204397291 + ], + [ + 29, + 0.8997564658103022 + ], + [ + 30, + 0.8997560852420976 + ], + [ + 31, + 0.899745100011646 + ], + [ + 32, + 0.8997443665296799 + ], + [ + 33, + 0.8997538987615857 + ], + [ + 34, + 0.8997562560855241 + ], + [ + 35, + 0.8997577694863691 + ], + [ + 36, + 0.8997531511549263 + ], + [ + 37, + 0.8997498077332158 + ], + [ + 38, + 0.8997471279800556 + ], + [ + 39, + 0.8997470251827299 + ], + [ + 40, + 0.8997483266806293 + ], + [ + 41, + 0.899755457365203 + ], + [ + 42, + 0.8997535806917598 + ], + [ + 43, + 0.8997482846351207 + ], + [ + 44, + 0.8997564019689559 + ], + [ + 45, + 0.899755343975014 + ], + [ + 46, + 0.899753419242508 + ], + [ + 47, + 0.8997497203084536 + ], + [ + 48, + 0.8997497351657013 + ], + [ + 49, + 0.8997573738207715 + ], + [ + 50, + 0.8997540927136419 + ], + [ + 51, + 0.8997470542451639 + ], + [ + 52, + 0.8997551731091843 + ], + [ + 53, + 0.8997503267897882 + ], + [ + 54, + 0.8997541813397864 + ], + [ + 55, + 0.8997525896849798 + ], + [ + 56, + 0.8997549450950412 + ], + [ + 57, + 0.8997491197190708 + ], + [ + 58, + 0.8997518755081857 + ], + [ + 59, + 0.8997480943804367 + ], + [ + 60, + 0.899753113172218 + ], + [ + 61, + 0.8997530148003327 + ], + [ + 62, + 0.8997619302848505 + ], + [ + 63, + 0.8997553120039977 + ], + [ + 64, + 0.8997560414549803 + ], + [ + 65, + 0.8997569489272897 + ], + [ + 66, + 0.8997469547600226 + ], + [ + 67, + 0.8997601259492954 + ], + [ + 68, + 0.8997641942648589 + ], + [ + 69, + 0.8997522213318294 + ], + [ + 70, + 0.8997532461835194 + ], + [ + 71, + 0.8997499700423474 + ], + [ + 72, + 0.8997493443402218 + ], + [ + 73, + 0.8997523293564776 + ], + [ + 74, + 0.899754103669039 + ], + [ + 75, + 0.8997519753496676 + ], + [ + 76, + 0.8997513374171273 + ], + [ + 77, + 0.8997519755200604 + ], + [ + 78, + 0.8997566013902689 + ], + [ + 79, + 0.8997531982405848 + ], + [ + 80, + 0.8997471969888591 + ], + [ + 81, + 0.8997520879056414 + ], + [ + 82, + 0.8997545979206795 + ], + [ + 83, + 0.8997494490540048 + ], + [ + 84, + 0.8997460583559757 + ], + [ + 85, + 0.8997473555098748 + ], + [ + 86, + 0.8997510402160203 + ], + [ + 87, + 0.8997478383467744 + ], + [ + 88, + 0.8997539129293753 + ], + [ + 89, + 0.8997414488573269 + ], + [ + 90, + 0.8997540890154373 + ], + [ + 91, + 0.8997432008102813 + ], + [ + 92, + 0.8997552213896457 + ], + [ + 93, + 0.8997529959770517 + ], + [ + 94, + 0.8997478145754266 + ], + [ + 95, + 0.8997567217736824 + ], + [ + 96, + 0.8997592502084472 + ], + [ + 97, + 0.8997512810017133 + ], + [ + 98, + 0.8997578958982544 + ], + [ + 99, + 0.8997540308265919 + ], + [ + 100, + 0.8997528533801658 + ] + ] + }, + "blend_random_trainable_alpha025": { + "alpha": 0.25, + "test_acc": [ + 0.3057, + 0.3113, + 0.3171, + 0.3057, + 0.3103, + 0.3051, + 0.299, + 0.2961, + 0.2919, + 0.2998, + 0.3092, + 0.3096, + 0.319, + 0.3049, + 0.3063, + 0.2969, + 0.31, + 0.3108, + 0.3048, + 0.302, + 0.2983, + 0.3143, + 0.2984, + 0.3035, + 0.2974, + 0.3054, + 0.2983, + 0.3046, + 0.3029, + 0.3079, + 0.3096, + 0.2971, + 0.3078, + 0.2992, + 0.3089, + 0.3024, + 0.3186, + 0.317, + 0.3028, + 0.3157, + 0.3045, + 0.2984, + 0.3065, + 0.3089, + 0.2953, + 0.2998, + 0.3084, + 0.2948, + 0.2979, + 0.3127, + 0.3008, + 0.3063, + 0.3108, + 0.3017, + 0.3002, + 0.3108, + 0.3082, + 0.3142, + 0.3089, + 0.3083, + 0.312, + 0.3163, + 0.3164, + 0.3199, + 0.2936, + 0.3038, + 0.31, + 0.312, + 0.313, + 0.306, + 0.3075, + 0.3148, + 0.3082, + 0.3128, + 0.3049, + 0.3151, + 0.3092, + 0.3095, + 0.3086, + 0.3109, + 0.3122, + 0.3145, + 0.3159, + 0.3119, + 0.314, + 0.3121, + 0.3128, + 0.3109, + 0.3113, + 0.3116, + 0.3128, + 0.3124, + 0.3124, + 0.3124, + 0.3124 + ], + "train_loss": [ + 1.992463056564331, + 1.9916953456115722, + 1.9931287091827392, + 1.9910267595672608, + 1.995366346435547, + 1.9881870716094971, + 1.9875581604003907, + 1.9898411698150635, + 1.9859656770324707, + 1.9878472745513915, + 1.9862687158966064, + 1.9826919412612916, + 1.9842528048324586, + 1.9822434168243408, + 1.9832794903564452, + 1.983619165649414, + 1.9822709893035888, + 1.985293566017151, + 1.9828473961639403, + 1.9828178525543212, + 1.9830375411987304, + 1.9841897015762329, + 1.9822585163116455, + 1.9849855586242675, + 1.9855137767028808, + 1.982492109375, + 1.9817083055877684, + 1.983814546470642, + 1.9830951291656493, + 1.9834409854888917, + 1.9843923540496826, + 1.9837786234283448, + 1.9858489233398438, + 1.9843562865829467, + 1.985345831375122, + 1.984080626373291, + 1.984860789489746, + 1.9836374221801758, + 1.9838351998138428, + 1.985522770690918, + 1.984236577987671, + 1.9826813336181641, + 1.984687279624939, + 1.9871889962387086, + 1.985666301612854, + 1.9821212170028686, + 1.9843766479492186, + 1.9833683200454713, + 1.9826139880371094, + 1.9830137462615967, + 1.9837637259292602, + 1.9805976415252686, + 1.9828971029281617, + 1.9823104657363892, + 1.9834304161071776, + 1.9824106423187255, + 1.9827309079742432, + 1.9808049842834472, + 1.9814650936508178, + 1.9820775619888307, + 1.982669534263611, + 1.9827197716522216, + 1.9821792037200927, + 1.9798552976989745, + 1.979809619369507, + 1.9808402716064453, + 1.9794260027313233, + 1.9834764907836915, + 1.981304560585022, + 1.981673750038147, + 1.9809300524902345, + 1.9807403813934326, + 1.9815810343170166, + 1.9786591122436523, + 1.980813638343811, + 1.9796091654968262, + 1.9807487456893922, + 1.9808974559020995, + 1.9807395389556886, + 1.9779186904907227, + 1.9808351560211181, + 1.9781523110580443, + 1.9806969366836549, + 1.9775474491119385, + 1.9770090746307374, + 1.979831170310974, + 1.978646503868103, + 1.978791363143921, + 1.978567936706543, + 1.975908480529785, + 1.980026588821411, + 1.980623605003357, + 1.9787831642913818, + 1.9771810034179687, + 1.981867674217224 + ], + "gamma": [ + [ + 6, + 0.08240128122270107 + ], + [ + 7, + 0.08177360892295837 + ], + [ + 8, + 0.0865556257776916 + ], + [ + 9, + 0.08398968121036887 + ], + [ + 10, + 0.08614908019080758 + ], + [ + 13, + 0.0879793162457645 + ], + [ + 15, + 0.08577868971042335 + ], + [ + 20, + 0.08392585255205631 + ], + [ + 25, + 0.09226418123580515 + ], + [ + 35, + 0.09257616940885782 + ], + [ + 45, + 0.09423351753503084 + ], + [ + 55, + 0.09354621008969843 + ], + [ + 65, + 0.09582796646282077 + ], + [ + 75, + 0.09583176532760262 + ], + [ + 85, + 0.09660185943357646 + ], + [ + 95, + 0.09697433561086655 + ], + [ + 100, + 0.09696925128810108 + ] + ], + "rho": [ + [ + 6, + 0.026699657319113612 + ], + [ + 7, + 0.024797862162813544 + ], + [ + 8, + 0.016839083284139633 + ], + [ + 9, + 0.01808858383446932 + ], + [ + 10, + 0.013804351910948753 + ], + [ + 13, + 0.026929726358503103 + ], + [ + 15, + 0.01636372960638255 + ], + [ + 20, + 0.001426217146217823 + ], + [ + 25, + 0.0031939256004989147 + ], + [ + 35, + 0.0024604005739092827 + ], + [ + 45, + 0.014439057791605592 + ], + [ + 55, + 0.011355152353644371 + ], + [ + 65, + 0.014422241831198335 + ], + [ + 75, + 0.0033052514772862196 + ], + [ + 85, + 0.001998395542614162 + ], + [ + 95, + 0.005214786971919239 + ], + [ + 100, + 0.000343971885740757 + ] + ], + "alpha_eff": [ + [ + 6, + 0.2499213730869882 + ], + [ + 7, + 0.2498478211316315 + ], + [ + 8, + 0.24980691583613213 + ], + [ + 9, + 0.2497380500065483 + ], + [ + 10, + 0.24969213367824736 + ], + [ + 11, + 0.2496609270495203 + ], + [ + 12, + 0.24960425423149746 + ], + [ + 13, + 0.24956507486919746 + ], + [ + 14, + 0.2495778302328802 + ], + [ + 15, + 0.24950300901182632 + ], + [ + 16, + 0.24947434297956608 + ], + [ + 17, + 0.24955579869915723 + ], + [ + 18, + 0.24945036082955535 + ], + [ + 19, + 0.2494441338902135 + ], + [ + 20, + 0.24941560827274628 + ], + [ + 21, + 0.24941500229898922 + ], + [ + 22, + 0.24940152800170728 + ], + [ + 23, + 0.24941301736596458 + ], + [ + 24, + 0.24942289937005896 + ], + [ + 25, + 0.24943153562055728 + ], + [ + 26, + 0.2493944244004199 + ], + [ + 27, + 0.2493841483672213 + ], + [ + 28, + 0.24939026444232057 + ], + [ + 29, + 0.2493861962498303 + ], + [ + 30, + 0.2494033750456337 + ], + [ + 31, + 0.24938243676234567 + ], + [ + 32, + 0.24939319423626036 + ], + [ + 33, + 0.24939562419949676 + ], + [ + 34, + 0.24938205925404472 + ], + [ + 35, + 0.2493830925597816 + ], + [ + 36, + 0.2493944349979185 + ], + [ + 37, + 0.24938788290342598 + ], + [ + 38, + 0.24936400395985633 + ], + [ + 39, + 0.2493850344676143 + ], + [ + 40, + 0.24939985723679156 + ], + [ + 41, + 0.24939008893879183 + ], + [ + 42, + 0.24937747852341605 + ], + [ + 43, + 0.2493874785149169 + ], + [ + 44, + 0.24939919036674274 + ], + [ + 45, + 0.24939671759793644 + ], + [ + 46, + 0.2493911499053157 + ], + [ + 47, + 0.24938359107234617 + ], + [ + 48, + 0.24938592302378676 + ], + [ + 49, + 0.24939079277922477 + ], + [ + 50, + 0.2493865861851642 + ], + [ + 51, + 0.24938631211078413 + ], + [ + 52, + 0.2493991330587277 + ], + [ + 53, + 0.24939046190218817 + ], + [ + 54, + 0.24940303265783006 + ], + [ + 55, + 0.24939970424987953 + ], + [ + 56, + 0.24940813219908353 + ], + [ + 57, + 0.2494083824609693 + ], + [ + 58, + 0.24939771728527144 + ], + [ + 59, + 0.2493876792301662 + ], + [ + 60, + 0.2494002168938244 + ], + [ + 61, + 0.24940474481600178 + ], + [ + 62, + 0.24941695923309265 + ], + [ + 63, + 0.24939676061118335 + ], + [ + 64, + 0.24939502011458942 + ], + [ + 65, + 0.24939994227754606 + ], + [ + 66, + 0.24939422481077445 + ], + [ + 67, + 0.24938903324548542 + ], + [ + 68, + 0.2493852272043755 + ], + [ + 69, + 0.24939771266287739 + ], + [ + 70, + 0.24938762919778643 + ], + [ + 71, + 0.2493922112905308 + ], + [ + 72, + 0.24939185406299313 + ], + [ + 73, + 0.24938339641701565 + ], + [ + 74, + 0.24940474663816414 + ], + [ + 75, + 0.24939512209537285 + ], + [ + 76, + 0.24940129882528578 + ], + [ + 77, + 0.24941330412838525 + ], + [ + 78, + 0.24941724034515972 + ], + [ + 79, + 0.24940367609896208 + ], + [ + 80, + 0.2494165335645714 + ], + [ + 81, + 0.24941158939486094 + ], + [ + 82, + 0.2493936464817174 + ], + [ + 83, + 0.24938938208789213 + ], + [ + 84, + 0.24939251169705332 + ], + [ + 85, + 0.24939146172130572 + ], + [ + 86, + 0.24938545924827824 + ], + [ + 87, + 0.24939188685283167 + ], + [ + 88, + 0.24938399198640737 + ], + [ + 89, + 0.249372010405215 + ], + [ + 90, + 0.24938619307549603 + ], + [ + 91, + 0.24938151487506702 + ], + [ + 92, + 0.24938646258998595 + ], + [ + 93, + 0.2494060045181368 + ], + [ + 94, + 0.2493982639873303 + ], + [ + 95, + 0.24939781273659428 + ], + [ + 96, + 0.24937664426383271 + ], + [ + 97, + 0.249376480147334 + ], + [ + 98, + 0.2493897912286789 + ], + [ + 99, + 0.24939717074066392 + ], + [ + 100, + 0.2494029934547596 + ] + ] + }, + "blend_random_trainable_alpha050": { + "alpha": 0.5, + "test_acc": [ + 0.3071, + 0.3153, + 0.3159, + 0.3073, + 0.3107, + 0.3048, + 0.3066, + 0.3002, + 0.2956, + 0.3025, + 0.3134, + 0.3098, + 0.3238, + 0.3106, + 0.3069, + 0.3009, + 0.3152, + 0.3153, + 0.3102, + 0.3059, + 0.305, + 0.3192, + 0.3077, + 0.3096, + 0.3039, + 0.3099, + 0.3109, + 0.3063, + 0.3103, + 0.3126, + 0.3141, + 0.3057, + 0.3133, + 0.3062, + 0.3146, + 0.3102, + 0.3179, + 0.325, + 0.3137, + 0.3186, + 0.3054, + 0.3068, + 0.3147, + 0.3127, + 0.3052, + 0.3089, + 0.3136, + 0.301, + 0.3065, + 0.3139, + 0.3091, + 0.3119, + 0.3171, + 0.3044, + 0.3084, + 0.3115, + 0.3155, + 0.3168, + 0.3097, + 0.3124, + 0.316, + 0.32, + 0.3188, + 0.3243, + 0.3033, + 0.3073, + 0.3149, + 0.3198, + 0.3143, + 0.3103, + 0.3134, + 0.3189, + 0.3155, + 0.3144, + 0.3076, + 0.3201, + 0.3123, + 0.316, + 0.314, + 0.3144, + 0.32, + 0.3188, + 0.32, + 0.3159, + 0.3167, + 0.3159, + 0.316, + 0.3153, + 0.315, + 0.316, + 0.3155, + 0.3159, + 0.3158, + 0.3158, + 0.3156 + ], + "train_loss": [ + 1.9908838816833496, + 1.9877498167419434, + 1.9915257918930054, + 1.98690866355896, + 1.990242875289917, + 1.982980037765503, + 1.9806120121002198, + 1.981981626815796, + 1.9789552877044678, + 1.9801098787689209, + 1.9775814321899414, + 1.9735393454742431, + 1.97612149017334, + 1.9740667019271851, + 1.9752808430480957, + 1.9748608548736573, + 1.9725629011535644, + 1.975950546951294, + 1.9726420166778564, + 1.9719942540740967, + 1.972226925048828, + 1.9718828250122071, + 1.9702325133514405, + 1.972721547088623, + 1.9749690441894532, + 1.970941196937561, + 1.9705127066802979, + 1.9721903118515014, + 1.9724419820404053, + 1.9722332624816894, + 1.9732470855712891, + 1.9714836350250244, + 1.9737400853729248, + 1.9724387300872803, + 1.9739704666900635, + 1.9718335093688966, + 1.9735708393096925, + 1.9722440079498291, + 1.972540139389038, + 1.9745972146987916, + 1.9730849907684327, + 1.971971201171875, + 1.9731891180038452, + 1.977160333328247, + 1.9752889443969726, + 1.9720553560638427, + 1.9734648179626464, + 1.972916893234253, + 1.9725440413665771, + 1.9729121141815185, + 1.973689049911499, + 1.9710198628997804, + 1.973855771446228, + 1.9726994828033446, + 1.9739762287902831, + 1.9727908270645143, + 1.9747351895904541, + 1.9715166574096679, + 1.9719487404632567, + 1.9724699239730834, + 1.973008492050171, + 1.9730079955291748, + 1.9727294918060303, + 1.9705677117538452, + 1.9700410662841796, + 1.9705747305679322, + 1.9694746914672852, + 1.9736025182724, + 1.9716221771240234, + 1.9716520706939697, + 1.9713862493133545, + 1.970648483581543, + 1.9720281861877442, + 1.9689332669830322, + 1.9710357287979126, + 1.9701062538146972, + 1.9711170873641968, + 1.9709298823547363, + 1.9700459471130372, + 1.967672025527954, + 1.9714107075500489, + 1.9676781567764283, + 1.9705823202896118, + 1.9675492962646484, + 1.9665284505462646, + 1.9696068994140625, + 1.9690539211654663, + 1.9694294802856445, + 1.9689524176788331, + 1.9657572605895997, + 1.9702196077728271, + 1.9710681314468383, + 1.9685678855895996, + 1.9667935219955444, + 1.9720542455291747 + ], + "gamma": [ + [ + 6, + 0.06159791396930814 + ], + [ + 7, + 0.058924108219798654 + ], + [ + 8, + 0.0625917793950066 + ], + [ + 9, + 0.06508902739733458 + ], + [ + 10, + 0.06468426494393498 + ], + [ + 13, + 0.064562008890789 + ], + [ + 15, + 0.06312858680030331 + ], + [ + 20, + 0.06455998323508538 + ], + [ + 25, + 0.07518586772494018 + ], + [ + 35, + 0.07322781311813742 + ], + [ + 45, + 0.06869896280113608 + ], + [ + 55, + 0.06770999490981922 + ], + [ + 65, + 0.06603386749338824 + ], + [ + 75, + 0.0666171737248078 + ], + [ + 85, + 0.07043640181655064 + ], + [ + 95, + 0.06907140363182407 + ], + [ + 100, + 0.0720302565023303 + ] + ], + "rho": [ + [ + 6, + 0.01675456902012229 + ], + [ + 7, + 0.01637683156877756 + ], + [ + 8, + 0.014717273181304336 + ], + [ + 9, + 0.011490113567560911 + ], + [ + 10, + 0.01329625304788351 + ], + [ + 13, + 0.005268331617116928 + ], + [ + 15, + 0.010573521489277482 + ], + [ + 20, + 0.007580187520943582 + ], + [ + 25, + 0.015451677609235048 + ], + [ + 35, + 0.016363009715860244 + ], + [ + 45, + 0.009572957176715136 + ], + [ + 55, + 0.020591675187461078 + ], + [ + 65, + 0.0008253897540271282 + ], + [ + 75, + 0.018082315160427243 + ], + [ + 85, + 0.004077966790646315 + ], + [ + 95, + 0.0056699051056057215 + ], + [ + 100, + 0.00042029470205307007 + ] + ], + "alpha_eff": [ + [ + 6, + 0.49989725988622363 + ], + [ + 7, + 0.49979735055626884 + ], + [ + 8, + 0.4997228360573307 + ], + [ + 9, + 0.49965275979738544 + ], + [ + 10, + 0.49958351357846775 + ], + [ + 11, + 0.49952551324310107 + ], + [ + 12, + 0.4994794246524265 + ], + [ + 13, + 0.4995562578955705 + ], + [ + 14, + 0.49938075811023797 + ], + [ + 15, + 0.49933156874722834 + ], + [ + 16, + 0.4993205764172403 + ], + [ + 17, + 0.4992995361849271 + ], + [ + 18, + 0.499288721696257 + ], + [ + 19, + 0.4992492484545191 + ], + [ + 20, + 0.49924901244261427 + ], + [ + 21, + 0.49924637408738043 + ], + [ + 22, + 0.4992184335676231 + ], + [ + 23, + 0.49921578349900986 + ], + [ + 24, + 0.49922592091700196 + ], + [ + 25, + 0.49923121253047503 + ], + [ + 26, + 0.4992126275079129 + ], + [ + 27, + 0.4991961502573495 + ], + [ + 28, + 0.4991821145312485 + ], + [ + 29, + 0.49919672315265506 + ], + [ + 30, + 0.4991906685158188 + ], + [ + 31, + 0.4991706533861234 + ], + [ + 32, + 0.4991725657775582 + ], + [ + 33, + 0.499173431494215 + ], + [ + 34, + 0.4991801839979003 + ], + [ + 35, + 0.49917648037211526 + ], + [ + 36, + 0.4991798443560795 + ], + [ + 37, + 0.4991831958540486 + ], + [ + 38, + 0.49917732217336347 + ], + [ + 39, + 0.49916182153597827 + ], + [ + 40, + 0.4991891533621105 + ], + [ + 41, + 0.49917867210464356 + ], + [ + 42, + 0.49918224555863994 + ], + [ + 43, + 0.49919490290287694 + ], + [ + 44, + 0.49922504713982274 + ], + [ + 45, + 0.4991974079788523 + ], + [ + 46, + 0.4991875999343034 + ], + [ + 47, + 0.49915751473944203 + ], + [ + 48, + 0.4991624911963996 + ], + [ + 49, + 0.49919186485919353 + ], + [ + 50, + 0.49917108740313154 + ], + [ + 51, + 0.4991606516524022 + ], + [ + 52, + 0.49917049827456755 + ], + [ + 53, + 0.4991804268264333 + ], + [ + 54, + 0.4992850830997803 + ], + [ + 55, + 0.49926025122092216 + ], + [ + 56, + 0.4992252067028678 + ], + [ + 57, + 0.49922797896930804 + ], + [ + 58, + 0.4992153532644955 + ], + [ + 59, + 0.49920003195065593 + ], + [ + 60, + 0.49920019451594494 + ], + [ + 61, + 0.4991897607897768 + ], + [ + 62, + 0.4992129324487871 + ], + [ + 63, + 0.499182074732644 + ], + [ + 64, + 0.49917155802631125 + ], + [ + 65, + 0.49919449559465245 + ], + [ + 66, + 0.4991937913452975 + ], + [ + 67, + 0.4991794039404566 + ], + [ + 68, + 0.49917882367874006 + ], + [ + 69, + 0.4992004154626366 + ], + [ + 70, + 0.4991786464503386 + ], + [ + 71, + 0.4991943976881417 + ], + [ + 72, + 0.4992084133590561 + ], + [ + 73, + 0.49919357186411856 + ], + [ + 74, + 0.49921211436505386 + ], + [ + 75, + 0.4991929743768104 + ], + [ + 76, + 0.4992041790551587 + ], + [ + 77, + 0.49918873023025095 + ], + [ + 78, + 0.49919151095021985 + ], + [ + 79, + 0.4991981630858893 + ], + [ + 80, + 0.4991842623630541 + ], + [ + 81, + 0.49918613368125275 + ], + [ + 82, + 0.499202557557044 + ], + [ + 83, + 0.4992060318878455 + ], + [ + 84, + 0.4991915450073312 + ], + [ + 85, + 0.4991825420377337 + ], + [ + 86, + 0.4991920382638308 + ], + [ + 87, + 0.4991819721839756 + ], + [ + 88, + 0.4991836322841509 + ], + [ + 89, + 0.49916824998324905 + ], + [ + 90, + 0.4991779286550408 + ], + [ + 91, + 0.49917084890951546 + ], + [ + 92, + 0.49917853233370346 + ], + [ + 93, + 0.4991865933238822 + ], + [ + 94, + 0.49917952327598253 + ], + [ + 95, + 0.49918596799442716 + ], + [ + 96, + 0.49919212982497696 + ], + [ + 97, + 0.49919001650648115 + ], + [ + 98, + 0.49919079738614003 + ], + [ + 99, + 0.49918675694839687 + ], + [ + 100, + 0.49918872952896104 + ] + ] + }, + "blend_random_trainable_alpha075": { + "alpha": 0.75, + "test_acc": [ + 0.3034, + 0.3123, + 0.3089, + 0.3033, + 0.3088, + 0.3043, + 0.3017, + 0.2996, + 0.2881, + 0.2957, + 0.3089, + 0.3049, + 0.3084, + 0.3074, + 0.306, + 0.3032, + 0.3122, + 0.3096, + 0.309, + 0.3037, + 0.3015, + 0.3162, + 0.3072, + 0.3088, + 0.3035, + 0.3113, + 0.3108, + 0.3164, + 0.3061, + 0.3093, + 0.3161, + 0.3102, + 0.3104, + 0.3092, + 0.317, + 0.3135, + 0.3166, + 0.3193, + 0.3132, + 0.321, + 0.3138, + 0.3106, + 0.3148, + 0.3154, + 0.3107, + 0.3126, + 0.3175, + 0.3097, + 0.3109, + 0.3177, + 0.3114, + 0.3165, + 0.3205, + 0.3109, + 0.3134, + 0.3142, + 0.3192, + 0.3161, + 0.3129, + 0.3146, + 0.3184, + 0.3207, + 0.3196, + 0.3259, + 0.309, + 0.3131, + 0.3182, + 0.3223, + 0.32, + 0.3143, + 0.3178, + 0.3211, + 0.3199, + 0.318, + 0.3125, + 0.3211, + 0.3159, + 0.3194, + 0.3163, + 0.3181, + 0.3222, + 0.3221, + 0.3212, + 0.3191, + 0.3201, + 0.3193, + 0.3186, + 0.3173, + 0.3182, + 0.3194, + 0.3194, + 0.3193, + 0.3194, + 0.3193, + 0.3192 + ], + "train_loss": [ + 1.987240170211792, + 1.9871271530914307, + 1.9845678861236573, + 1.983582562904358, + 1.9888756177520752, + 1.986539323387146, + 1.9845917708587646, + 1.985333621673584, + 1.9822719374084472, + 1.9816022521972656, + 1.9779683029937745, + 1.971929577407837, + 1.9722519189834595, + 1.9687975677490235, + 1.969152216873169, + 1.9684696987915038, + 1.9655458721542358, + 1.9683702281951905, + 1.9652744570159912, + 1.9654630448150634, + 1.9655610497283935, + 1.964896211166382, + 1.9623671910858154, + 1.9632857027435302, + 1.9660598248291015, + 1.9606867895507814, + 1.960700237426758, + 1.9627517392349243, + 1.96167004032135, + 1.96215058883667, + 1.9626673681640625, + 1.9613383666610718, + 1.9638981309509278, + 1.9615884679412843, + 1.9643639147567749, + 1.9602514279174805, + 1.9618201668930053, + 1.9615961993408204, + 1.961815823097229, + 1.9646509646224977, + 1.9624934663391114, + 1.960718916244507, + 1.9623830725860596, + 1.9652647049331664, + 1.9634992519760133, + 1.959999230041504, + 1.9619419541931153, + 1.9603431912231446, + 1.9606768273162842, + 1.9610141585540772, + 1.9610223788452148, + 1.9585339109039306, + 1.9616724869155884, + 1.9590482375717162, + 1.961669761428833, + 1.9600498888778686, + 1.9626958881378174, + 1.9603246263885499, + 1.9605694396209716, + 1.9609092087554931, + 1.961390089111328, + 1.9620549584960938, + 1.9616080158996583, + 1.9578674816131592, + 1.9594170637512207, + 1.9593613959121705, + 1.957629048690796, + 1.9621257973861694, + 1.9598495999908447, + 1.9601541738891601, + 1.959862784500122, + 1.9588044677352905, + 1.9608067423248292, + 1.95737032913208, + 1.9599335641479492, + 1.9586967916107179, + 1.959671367111206, + 1.9605539001083374, + 1.9584323050689698, + 1.9562305585479736, + 1.9603590017700194, + 1.955668737487793, + 1.9594869439315796, + 1.9560476244354248, + 1.9548624114608764, + 1.9581794776153565, + 1.9577512713623046, + 1.9576651248168946, + 1.9579689697265625, + 1.954503147583008, + 1.9583285201263427, + 1.9600629302215575, + 1.9575826657485962, + 1.9553564596176147, + 1.9605778546905517 + ], + "gamma": [ + [ + 6, + 0.020075631327927113 + ], + [ + 7, + 0.020418883301317692 + ], + [ + 8, + 0.041572967427782714 + ], + [ + 9, + 0.034633477218449116 + ], + [ + 10, + 0.032537849212531 + ], + [ + 13, + 0.026815209886990488 + ], + [ + 15, + 0.027469406370073557 + ], + [ + 20, + 0.02724000324087683 + ], + [ + 25, + 0.026616851129801944 + ], + [ + 35, + 0.033171679242514074 + ], + [ + 45, + 0.030373239191249013 + ], + [ + 55, + 0.023685507534537464 + ], + [ + 65, + 0.02635520964395255 + ], + [ + 75, + 0.027785221464000642 + ], + [ + 85, + 0.0341503472882323 + ], + [ + 95, + 0.03362242935691029 + ], + [ + 100, + 0.03354454814689234 + ] + ], + "rho": [ + [ + 6, + 0.026563940104097128 + ], + [ + 7, + 0.009303744416683912 + ], + [ + 8, + -0.002133091911673546 + ], + [ + 9, + 0.028314012044575065 + ], + [ + 10, + 0.006396602489985526 + ], + [ + 13, + 0.007015988463535905 + ], + [ + 15, + 0.011417242116294801 + ], + [ + 20, + 0.0027145042549818754 + ], + [ + 25, + 0.005520312930457294 + ], + [ + 35, + -0.01181224372703582 + ], + [ + 45, + 0.016137104714289308 + ], + [ + 55, + -0.003447658964432776 + ], + [ + 65, + 0.0003238511271774769 + ], + [ + 75, + -5.083635915070772e-05 + ], + [ + 85, + 0.007546830922365189 + ], + [ + 95, + -0.00822349707596004 + ], + [ + 100, + -0.003206890542060137 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499192532525394 + ], + [ + 7, + 0.7498502609810094 + ], + [ + 8, + 0.7498018195944903 + ], + [ + 9, + 0.74974280153621 + ], + [ + 10, + 0.7496940813124257 + ], + [ + 11, + 0.7496545372701029 + ], + [ + 12, + 0.7495810472115972 + ], + [ + 13, + 0.749558732048481 + ], + [ + 14, + 0.7495275827741228 + ], + [ + 15, + 0.7495326757935619 + ], + [ + 16, + 0.7495022523737868 + ], + [ + 17, + 0.7495021004220415 + ], + [ + 18, + 0.7494640027781643 + ], + [ + 19, + 0.7494477251847736 + ], + [ + 20, + 0.7494261573039042 + ], + [ + 21, + 0.7494410834410338 + ], + [ + 22, + 0.7494386201277249 + ], + [ + 23, + 0.7494231009862471 + ], + [ + 24, + 0.7494020657321235 + ], + [ + 25, + 0.7494010221685214 + ], + [ + 26, + 0.7494057753731722 + ], + [ + 27, + 0.749389045099605 + ], + [ + 28, + 0.749384071241818 + ], + [ + 29, + 0.7493894289640239 + ], + [ + 30, + 0.7494117084122605 + ], + [ + 31, + 0.749385563060789 + ], + [ + 32, + 0.7493704445564451 + ], + [ + 33, + 0.7493706049375978 + ], + [ + 34, + 0.7493805366806727 + ], + [ + 35, + 0.7493874588228995 + ], + [ + 36, + 0.7493978847742617 + ], + [ + 37, + 0.7494017685499555 + ], + [ + 38, + 0.7493880230593533 + ], + [ + 39, + 0.7493769516761828 + ], + [ + 40, + 0.7494408632640851 + ], + [ + 41, + 0.7493989971123053 + ], + [ + 42, + 0.7493897648061398 + ], + [ + 43, + 0.7493895841945271 + ], + [ + 44, + 0.7493882939300405 + ], + [ + 45, + 0.7493841867438201 + ], + [ + 46, + 0.7493926980162646 + ], + [ + 47, + 0.7493867757744943 + ], + [ + 48, + 0.7493720257682946 + ], + [ + 49, + 0.7494728147215595 + ], + [ + 50, + 0.749414911835902 + ], + [ + 51, + 0.7494096663834889 + ], + [ + 52, + 0.7493995216109133 + ], + [ + 53, + 0.749396777072851 + ], + [ + 54, + 0.7493965331252112 + ], + [ + 55, + 0.7493923580980166 + ], + [ + 56, + 0.7494068358236006 + ], + [ + 57, + 0.7494184103961008 + ], + [ + 58, + 0.7494000625639603 + ], + [ + 59, + 0.7494034769879309 + ], + [ + 60, + 0.7493934865981208 + ], + [ + 61, + 0.7493903652907954 + ], + [ + 62, + 0.7494398632661997 + ], + [ + 63, + 0.7494094916387471 + ], + [ + 64, + 0.7493947113321128 + ], + [ + 65, + 0.7494024170011034 + ], + [ + 66, + 0.749398971814846 + ], + [ + 67, + 0.7494397440709936 + ], + [ + 68, + 0.7493945606505155 + ], + [ + 69, + 0.7494030530324994 + ], + [ + 70, + 0.7493775239285799 + ], + [ + 71, + 0.7493773878959508 + ], + [ + 72, + 0.7493824697180758 + ], + [ + 73, + 0.7493759069136149 + ], + [ + 74, + 0.7494055114912002 + ], + [ + 75, + 0.7493977227125793 + ], + [ + 76, + 0.7494091331388193 + ], + [ + 77, + 0.7494083440941964 + ], + [ + 78, + 0.7494013029090836 + ], + [ + 79, + 0.7493902673789514 + ], + [ + 80, + 0.7493761629049908 + ], + [ + 81, + 0.7493847590553622 + ], + [ + 82, + 0.7493947307932345 + ], + [ + 83, + 0.7494084699250041 + ], + [ + 84, + 0.7493976491047936 + ], + [ + 85, + 0.7493935376218088 + ], + [ + 86, + 0.7493913260946169 + ], + [ + 87, + 0.7493949209269184 + ], + [ + 88, + 0.7493897975263685 + ], + [ + 89, + 0.7493713406303161 + ], + [ + 90, + 0.7493740259292067 + ], + [ + 91, + 0.7493801858158619 + ], + [ + 92, + 0.7493910697674242 + ], + [ + 93, + 0.7494002957991308 + ], + [ + 94, + 0.7494018104351715 + ], + [ + 95, + 0.7493974601231723 + ], + [ + 96, + 0.7493904702338606 + ], + [ + 97, + 0.7493766092739566 + ], + [ + 98, + 0.7493959197929352 + ], + [ + 99, + 0.749394734893217 + ], + [ + 100, + 0.7493910770041978 + ] + ] + }, + "blend_random_trainable_alpha090": { + "alpha": 0.9, + "test_acc": [ + 0.299, + 0.304, + 0.3011, + 0.2798, + 0.301, + 0.2953, + 0.2991, + 0.2972, + 0.2835, + 0.2989, + 0.3027, + 0.2963, + 0.2943, + 0.294, + 0.2838, + 0.2818, + 0.3032, + 0.298, + 0.3001, + 0.288, + 0.2961, + 0.3002, + 0.2976, + 0.2961, + 0.2935, + 0.2971, + 0.2987, + 0.3023, + 0.3001, + 0.3019, + 0.3074, + 0.3007, + 0.3042, + 0.3036, + 0.3068, + 0.3051, + 0.3103, + 0.313, + 0.3015, + 0.3068, + 0.3068, + 0.3016, + 0.3074, + 0.312, + 0.3022, + 0.3071, + 0.3095, + 0.2999, + 0.3055, + 0.3127, + 0.304, + 0.3098, + 0.3112, + 0.3023, + 0.3033, + 0.3137, + 0.3138, + 0.3117, + 0.3067, + 0.3029, + 0.3127, + 0.3107, + 0.3114, + 0.3155, + 0.3012, + 0.3059, + 0.3067, + 0.3107, + 0.3123, + 0.3073, + 0.3084, + 0.3122, + 0.3134, + 0.3105, + 0.3051, + 0.3114, + 0.3109, + 0.3115, + 0.3115, + 0.3098, + 0.3124, + 0.3115, + 0.3132, + 0.3116, + 0.3121, + 0.3132, + 0.3111, + 0.3121, + 0.3105, + 0.3102, + 0.3103, + 0.3103, + 0.3104, + 0.3102, + 0.3104 + ], + "train_loss": [ + 1.9890508442687989, + 1.990648283843994, + 1.994727445678711, + 1.9898214043426514, + 1.9945692050552368, + 1.9881462112426758, + 1.9850170427703857, + 1.9874203789520264, + 1.9842438862609864, + 1.9827749535369874, + 1.9797347565078736, + 1.9834029346084594, + 1.988257053451538, + 1.9841754889678955, + 1.985011074142456, + 1.984129882659912, + 1.9779130119323731, + 1.9801474346542358, + 1.97670384223938, + 1.975082826385498, + 1.973111046295166, + 1.9703727652359009, + 1.9688108737182617, + 1.9692627041625976, + 1.9705071445083617, + 1.9649039663696288, + 1.9643345845794677, + 1.96681397605896, + 1.9641611499404907, + 1.9641723567199707, + 1.9648383374786378, + 1.9631840893936157, + 1.9648317515563964, + 1.9614055786895752, + 1.9650694213104247, + 1.961541328048706, + 1.9629750553131105, + 1.962144373550415, + 1.962860485305786, + 1.9636458072280885, + 1.9623364852905274, + 1.9610377810668946, + 1.9629042342376708, + 1.9655962491226195, + 1.9635980056762696, + 1.9599338647079467, + 1.9622287102508544, + 1.9611709561538697, + 1.9601466109848023, + 1.9616209969329834, + 1.960803759689331, + 1.9582552689361572, + 1.9611395385742187, + 1.9584340462875367, + 1.961097812576294, + 1.959400883255005, + 1.9609548767471314, + 1.9589200262069701, + 1.9589226739883423, + 1.958297335510254, + 1.9593491931915283, + 1.960762004852295, + 1.959771747894287, + 1.9566084023284913, + 1.956548022003174, + 1.9582088103866577, + 1.9569922626113891, + 1.9611940761566162, + 1.9581898126983643, + 1.9584559888076782, + 1.9579038101959227, + 1.957134034500122, + 1.9579114457702638, + 1.9553621417236329, + 1.958240584373474, + 1.9565584728622436, + 1.9576134494400024, + 1.9577414935684203, + 1.9558836351013185, + 1.95412816986084, + 1.957853369293213, + 1.9536584018707275, + 1.9573557986831664, + 1.953881487350464, + 1.9525489911270142, + 1.9555533562469483, + 1.9550897399520875, + 1.9547373791122435, + 1.9562894794464112, + 1.9520553144073487, + 1.956090751800537, + 1.9581266250610352, + 1.9547510679626465, + 1.9527177194213867, + 1.9579596255111695 + ], + "gamma": [ + [ + 6, + 0.020970277953892946 + ], + [ + 7, + 0.010939141269773245 + ], + [ + 8, + 0.015217388630844653 + ], + [ + 9, + -0.0042448341846466064 + ], + [ + 10, + 0.014619549445342273 + ], + [ + 13, + 0.006043761153705418 + ], + [ + 15, + 0.015412847453262657 + ], + [ + 20, + 0.008474407310131937 + ], + [ + 25, + 0.0068653663620352745 + ], + [ + 35, + 0.006590569159016013 + ], + [ + 45, + 0.017077833792427555 + ], + [ + 55, + 0.008733848109841347 + ], + [ + 65, + 0.013923669699579477 + ], + [ + 75, + 0.017147758801002055 + ], + [ + 85, + 0.007989586098119617 + ], + [ + 95, + 0.007280286401510239 + ], + [ + 100, + 0.004780605202540755 + ] + ], + "rho": [ + [ + 6, + 0.0234045252436772 + ], + [ + 7, + 0.007293196045793593 + ], + [ + 8, + -0.004426149884238839 + ], + [ + 9, + 0.006934044416993856 + ], + [ + 10, + 0.015940490178763866 + ], + [ + 13, + 0.00822709547355771 + ], + [ + 15, + -0.002329273382201791 + ], + [ + 20, + 0.00963468081317842 + ], + [ + 25, + -0.013927004765719175 + ], + [ + 35, + -0.015318268910050392 + ], + [ + 45, + 0.00814310647547245 + ], + [ + 55, + -0.0056371710961684585 + ], + [ + 65, + 0.005264427280053496 + ], + [ + 75, + -0.006690809037536383 + ], + [ + 85, + 0.02103410242125392 + ], + [ + 95, + 0.0006436840631067753 + ], + [ + 100, + 0.004339051432907581 + ] + ], + "alpha_eff": [ + [ + 6, + 0.8999630756881548 + ], + [ + 7, + 0.8999290295126786 + ], + [ + 8, + 0.899902619170082 + ], + [ + 9, + 0.8998760179499884 + ], + [ + 10, + 0.8998530249039248 + ], + [ + 11, + 0.8998271876043261 + ], + [ + 12, + 0.8998125385272272 + ], + [ + 13, + 0.8997871005381969 + ], + [ + 14, + 0.8997809391666968 + ], + [ + 15, + 0.8997644459866166 + ], + [ + 16, + 0.8997902300882685 + ], + [ + 17, + 0.8997535400184713 + ], + [ + 18, + 0.8997355777376747 + ], + [ + 19, + 0.8997289153744131 + ], + [ + 20, + 0.899722931653093 + ], + [ + 21, + 0.8997228981314278 + ], + [ + 22, + 0.8997144762755186 + ], + [ + 23, + 0.8997192063355121 + ], + [ + 24, + 0.8997157021832001 + ], + [ + 25, + 0.8997321245068026 + ], + [ + 26, + 0.8997285128442438 + ], + [ + 27, + 0.8997031268267427 + ], + [ + 28, + 0.8997031082162511 + ], + [ + 29, + 0.8997039632836831 + ], + [ + 30, + 0.8997145364640176 + ], + [ + 31, + 0.8997023406296571 + ], + [ + 32, + 0.8997020849440805 + ], + [ + 33, + 0.8997035311834697 + ], + [ + 34, + 0.8997063751061889 + ], + [ + 35, + 0.8997086170889398 + ], + [ + 36, + 0.8997108071445673 + ], + [ + 37, + 0.8997076995274622 + ], + [ + 38, + 0.8997031768711902 + ], + [ + 39, + 0.8996995302817202 + ], + [ + 40, + 0.8997065973709011 + ], + [ + 41, + 0.8997068631940662 + ], + [ + 42, + 0.899703036028811 + ], + [ + 43, + 0.899706049281201 + ], + [ + 44, + 0.8997102282322337 + ], + [ + 45, + 0.8997103121378697 + ], + [ + 46, + 0.8997192965751147 + ], + [ + 47, + 0.899705187170609 + ], + [ + 48, + 0.8996959242607423 + ], + [ + 49, + 0.899711522933519 + ], + [ + 50, + 0.899706037301123 + ], + [ + 51, + 0.8997002093214819 + ], + [ + 52, + 0.8997071771801318 + ], + [ + 53, + 0.8997081014789804 + ], + [ + 54, + 0.8997188554489542 + ], + [ + 55, + 0.899720778788983 + ], + [ + 56, + 0.899719698950363 + ], + [ + 57, + 0.8997175967443884 + ], + [ + 58, + 0.8997158655149179 + ], + [ + 59, + 0.8997115404828796 + ], + [ + 60, + 0.8997160153322658 + ], + [ + 61, + 0.899708785385546 + ], + [ + 62, + 0.899715713068994 + ], + [ + 63, + 0.8997065337151827 + ], + [ + 64, + 0.8997141056722793 + ], + [ + 65, + 0.8997136566544934 + ], + [ + 66, + 0.899702694273918 + ], + [ + 67, + 0.8997030763643339 + ], + [ + 68, + 0.8997057542746615 + ], + [ + 69, + 0.8997141589604338 + ], + [ + 70, + 0.8997088932789362 + ], + [ + 71, + 0.8997089861909919 + ], + [ + 72, + 0.8997062874596711 + ], + [ + 73, + 0.8997017510694443 + ], + [ + 74, + 0.8997142078393265 + ], + [ + 75, + 0.8997098150026078 + ], + [ + 76, + 0.8997117228573014 + ], + [ + 77, + 0.8997054817459939 + ], + [ + 78, + 0.8997646824729889 + ], + [ + 79, + 0.8997297471777584 + ], + [ + 80, + 0.8997190852472362 + ], + [ + 81, + 0.8997168875745091 + ], + [ + 82, + 0.8997159321584175 + ], + [ + 83, + 0.8997078933597031 + ], + [ + 84, + 0.8997014896847517 + ], + [ + 85, + 0.8997058110406619 + ], + [ + 86, + 0.8997117273849363 + ], + [ + 87, + 0.8997057470204033 + ], + [ + 88, + 0.8997055645964045 + ], + [ + 89, + 0.8996992502849522 + ], + [ + 90, + 0.8997053043136866 + ], + [ + 91, + 0.899701870877184 + ], + [ + 92, + 0.8997028730898097 + ], + [ + 93, + 0.8997091255880337 + ], + [ + 94, + 0.8997070845031366 + ], + [ + 95, + 0.8997101786387347 + ], + [ + 96, + 0.8997108956408635 + ], + [ + 97, + 0.899711030221111 + ], + [ + 98, + 0.8997101646986978 + ], + [ + 99, + 0.8997098436319917 + ], + [ + 100, + 0.8997112090139117 + ] + ] + } +} \ No newline at end of file diff --git a/results/audit_d512_L2_4method.log b/results/audit_d512_L2_4method.log new file mode 100644 index 0000000..5869475 --- /dev/null +++ b/results/audit_d512_L2_4method.log @@ -0,0 +1,16 @@ +=== 4-METHOD AUDIT (BP,EP,SB,CB only): d=512 L=2, seeds 1,2,5 === +FA and DFA already in results/fa_dfa_d512_L2_seed{1,2,5}/ +Start: Sun Apr 26 09:01:32 AM CDT 2026 + + seed=1 (Sun Apr 26 09:01:32 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 1 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=1.9296, train=0.3129, test=0.3920 + [BP] Epoch 10: loss=1.3859, train=0.4995, test=0.5210 + [BP] Epoch 20: loss=1.2614, train=0.5473, test=0.5560 + [BP] Epoch 30: loss=1.1744, train=0.5783, test=0.5708 diff --git a/results/audit_d512_L2_6method.log b/results/audit_d512_L2_6method.log new file mode 100644 index 0000000..c5ad667 --- /dev/null +++ b/results/audit_d512_L2_6method.log @@ -0,0 +1,35 @@ +=== 6-METHOD AUDIT: d=512 L=2, seeds 1,2,5 === +Start: Sun Apr 26 08:50:41 AM CDT 2026 + + seed=1 (Sun Apr 26 08:50:41 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 1 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=1.9296, train=0.3129, test=0.3920 + [BP] Epoch 10: loss=1.3859, train=0.4995, test=0.5210 + [BP] Epoch 20: loss=1.2614, train=0.5473, test=0.5560 + [BP] Epoch 30: loss=1.1744, train=0.5783, test=0.5708 + [BP] Epoch 40: loss=1.1065, train=0.6047, test=0.5824 + [BP] Epoch 50: loss=1.0347, train=0.6289, test=0.5947 + [BP] Epoch 60: loss=0.9762, train=0.6505, test=0.5996 + [BP] Epoch 70: loss=0.9339, train=0.6657, test=0.6027 + [BP] Epoch 80: loss=0.8948, train=0.6800, test=0.6057 + [BP] Epoch 90: loss=0.8688, train=0.6898, test=0.6049 + [BP] Epoch 100: loss=0.8640, train=0.6923, test=0.6061 + Final test acc: 0.6061 + +--- DFA --- + [DFA] Epoch 1: loss=2.0591, train=0.2454, test=0.2655 + [DFA] Epoch 10: loss=2.0095, train=0.2684, test=0.2903 + [DFA] Epoch 20: loss=2.0058, train=0.2681, test=0.2783 + [DFA] Epoch 30: loss=2.0053, train=0.2721, test=0.2762 + [DFA] Epoch 40: loss=2.0044, train=0.2712, test=0.2959 + [DFA] Epoch 50: loss=2.0005, train=0.2729, test=0.2901 + [DFA] Epoch 60: loss=1.9964, train=0.2742, test=0.2919 + [DFA] Epoch 70: loss=1.9982, train=0.2780, test=0.2913 + [DFA] Epoch 80: loss=1.9966, train=0.2753, test=0.2950 + [DFA] Epoch 90: loss=1.9938, train=0.2775, test=0.2936 diff --git a/results/blend_dissection/dissection_t5_s42.json b/results/blend_dissection/dissection_t5_s42.json new file mode 100644 index 0000000..5562a0e --- /dev/null +++ b/results/blend_dissection/dissection_t5_s42.json @@ -0,0 +1,4311 @@ +{ + "beta": 0.7907743990635343, + "continue_DFA": { + "test_acc": [ + 0.2963, + 0.3055, + 0.3037, + 0.3129, + 0.3085, + 0.3059, + 0.3142, + 0.3052, + 0.3048, + 0.295, + 0.3038, + 0.3109, + 0.303, + 0.3129, + 0.3181, + 0.3073, + 0.3138, + 0.2935, + 0.2724, + 0.2899, + 0.3043, + 0.304, + 0.3153, + 0.3162, + 0.3153, + 0.3011, + 0.3114, + 0.3036, + 0.3097, + 0.3118, + 0.3093, + 0.308, + 0.315, + 0.3028, + 0.3092, + 0.3124, + 0.3058, + 0.3095, + 0.3035, + 0.306, + 0.3082, + 0.3016, + 0.314, + 0.32, + 0.3034, + 0.2995, + 0.3072, + 0.3076, + 0.299, + 0.3123, + 0.3139, + 0.3077, + 0.3044, + 0.3051, + 0.3111, + 0.3095, + 0.304, + 0.3146, + 0.3128, + 0.3142, + 0.3086, + 0.3097, + 0.3075, + 0.3022, + 0.3179, + 0.3152, + 0.303, + 0.3041, + 0.3139, + 0.314, + 0.3077, + 0.3088, + 0.3072, + 0.3176, + 0.3104, + 0.3087, + 0.3064, + 0.3122, + 0.3071, + 0.315, + 0.3133, + 0.3125, + 0.311, + 0.3113, + 0.3123, + 0.3116, + 0.3112, + 0.3114, + 0.3099, + 0.3096, + 0.3106, + 0.3106, + 0.3103, + 0.3104, + 0.3105 + ], + "train_loss": [ + 1.9917153326416015, + 1.9914020665740966, + 1.9901976773071288, + 1.988933535003662, + 1.9858682497406006, + 1.9855058740615845, + 1.9855351746368408, + 1.9885486212158203, + 1.9854358833312988, + 1.9890342288208007, + 1.9882773254394532, + 1.9898943268203735, + 1.9858055562591552, + 1.9871372011566162, + 1.9864173832702636, + 1.9868827392578126, + 1.9849347032928466, + 1.9864702680969237, + 1.9879106298065186, + 1.9874647803497314, + 1.9868588120269774, + 1.9855480011367799, + 1.9865379638671874, + 1.9834296019744873, + 1.9872295205688477, + 1.9846305572891236, + 1.9842337454223633, + 1.9827104736328125, + 1.98434967338562, + 1.987197992401123, + 1.9876438945770263, + 1.9883500901031494, + 1.987552170639038, + 1.9858486380004883, + 1.985440172958374, + 1.9890925741577148, + 1.986767668838501, + 1.987451621360779, + 1.9835427057647705, + 1.9881386394500733, + 1.987318958129883, + 1.9880258861541749, + 1.989282262802124, + 1.9864823223876953, + 1.986908299560547, + 1.9868181982421875, + 1.9874914128112793, + 1.9840115883636475, + 1.9868999612045288, + 1.9878488900375366, + 1.9851782949066161, + 1.9862295052337646, + 1.9874154011535645, + 1.9858859173965455, + 1.9878456968688965, + 1.9853282151031495, + 1.985901883392334, + 1.9859509258270263, + 1.9890274000549317, + 1.9853982135009767, + 1.984879475479126, + 1.98574097114563, + 1.9858561849975587, + 1.9860091897964478, + 1.9858733835601807, + 1.9871158577728272, + 1.9840241395568847, + 1.9853334728240968, + 1.986361666946411, + 1.9839559393692017, + 1.984299683265686, + 1.9864232648468017, + 1.984328148651123, + 1.9850988402557372, + 1.982911961593628, + 1.9842189752960204, + 1.9847925899887084, + 1.9840286093521118, + 1.984117462081909, + 1.98515405418396, + 1.9852717823791504, + 1.9829368571472168, + 1.9830631381988526, + 1.9837770384979247, + 1.9852064317321778, + 1.982457720298767, + 1.9828754368591308, + 1.9826085054779052, + 1.9845606142807006, + 1.9855709371566772, + 1.9825187755966187, + 1.9828999655151367, + 1.9843557969665528, + 1.983104598236084, + 1.9826115587615967 + ], + "gamma": [ + [ + 6, + 0.08147912286221981 + ], + [ + 7, + 0.083942775381729 + ], + [ + 8, + 0.08335589081980288 + ], + [ + 9, + 0.08451867988333106 + ], + [ + 10, + 0.08567881945054978 + ], + [ + 13, + 0.08585492498241365 + ], + [ + 15, + 0.08818750991486013 + ], + [ + 20, + 0.09013927017804235 + ], + [ + 25, + 0.09144815686158836 + ], + [ + 35, + 0.09544415841810405 + ], + [ + 45, + 0.09857377805747092 + ], + [ + 55, + 0.1013135741231963 + ], + [ + 65, + 0.10160410939715803 + ], + [ + 75, + 0.10183499159757048 + ], + [ + 85, + 0.10208195971790701 + ], + [ + 95, + 0.10211039299611002 + ], + [ + 100, + 0.10216700565069914 + ] + ], + "rho": [ + [ + 6, + 0.022012292640283704 + ], + [ + 7, + 0.01926875812932849 + ], + [ + 8, + 0.005791868083178997 + ], + [ + 9, + 0.015724025666713715 + ], + [ + 10, + 0.03417299780994654 + ], + [ + 13, + 0.013052632100880146 + ], + [ + 15, + 0.003919541195500642 + ], + [ + 20, + 0.00705078081227839 + ], + [ + 25, + 0.0076473255176097155 + ], + [ + 35, + 0.00891413411591202 + ], + [ + 45, + 0.004709912231191993 + ], + [ + 55, + 0.004661331884562969 + ], + [ + 65, + 0.004180454183369875 + ], + [ + 75, + -0.005214415490627289 + ], + [ + 85, + -0.00544139719568193 + ], + [ + 95, + 0.0012514754198491573 + ], + [ + 100, + 0.0011127730831503868 + ] + ], + "alpha_eff": [ + [ + 6, + 0.0 + ], + [ + 7, + 0.0 + ], + [ + 8, + 0.0 + ], + [ + 9, + 0.0 + ], + [ + 10, + 0.0 + ], + [ + 11, + 0.0 + ], + [ + 12, + 0.0 + ], + [ + 13, + 0.0 + ], + [ + 14, + 0.0 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + }, + "blend_random_frozen": { + "test_acc": [ + 0.1857, + 0.1291, + 0.117, + 0.1118, + 0.1248, + 0.1312, + 0.1199, + 0.1369, + 0.1375, + 0.125, + 0.1145, + 0.1407, + 0.1155, + 0.1187, + 0.1281, + 0.1235, + 0.1161, + 0.1199, + 0.1289, + 0.1144, + 0.1142, + 0.1201, + 0.1353, + 0.1313, + 0.1246, + 0.1274, + 0.1247, + 0.1161, + 0.1397, + 0.1196, + 0.1263, + 0.1359, + 0.1209, + 0.1416, + 0.1226, + 0.1162, + 0.1332, + 0.1348, + 0.131, + 0.1259, + 0.133, + 0.1177, + 0.1263, + 0.1328, + 0.1418, + 0.1421, + 0.124, + 0.1402, + 0.1182, + 0.1118, + 0.1278, + 0.1156, + 0.1234, + 0.1395, + 0.1413, + 0.1206, + 0.1385, + 0.1086, + 0.1398, + 0.1233, + 0.1304, + 0.1313, + 0.1203, + 0.1195, + 0.1344, + 0.1388, + 0.1147, + 0.131, + 0.137, + 0.1168, + 0.14, + 0.1321, + 0.1297, + 0.1415, + 0.1389, + 0.1313, + 0.1226, + 0.1368, + 0.1382, + 0.1169, + 0.1245, + 0.1293, + 0.1306, + 0.1123, + 0.1316, + 0.1261, + 0.1379, + 0.1253, + 0.139, + 0.1138, + 0.1311, + 0.1284, + 0.1253, + 0.1262, + 0.126 + ], + "train_loss": [ + 2.077210623931885, + 2.2431990660095216, + 2.290568412475586, + 2.2990872356414793, + 2.304406560058594, + 2.302724478225708, + 2.303276051559448, + 2.304779994354248, + 2.300059924621582, + 2.3021979917907713, + 2.3029969697570802, + 2.3014632540130617, + 2.300812749786377, + 2.300768824920654, + 2.2993542736816406, + 2.2997050019836425, + 2.3000418968963623, + 2.301567208099365, + 2.299892781524658, + 2.2995775370025635, + 2.2988372010040283, + 2.2988756278991698, + 2.298202882614136, + 2.2971937602233887, + 2.2983451007843017, + 2.2980890339660642, + 2.2972370765686034, + 2.296438496246338, + 2.2960709575653078, + 2.2963922400665284, + 2.2985967403411864, + 2.297392815170288, + 2.295402819824219, + 2.295079497833252, + 2.2953191860198974, + 2.295060697174072, + 2.2955474838256835, + 2.2945937699890138, + 2.2936295893859864, + 2.2942492738342284, + 2.2945799352264404, + 2.2940659660339358, + 2.294150905303955, + 2.295430052947998, + 2.2934328555297854, + 2.292744130706787, + 2.2929725063323976, + 2.2918734077453613, + 2.2933706995391847, + 2.2920743852996828, + 2.2925622122192384, + 2.291407374420166, + 2.2910671371459963, + 2.2916195738220213, + 2.291281509552002, + 2.2912379996490477, + 2.291590235519409, + 2.290989848022461, + 2.290456315460205, + 2.2903050439453123, + 2.290454834365845, + 2.2907322105407717, + 2.28940681640625, + 2.290701127166748, + 2.2906121561431885, + 2.2893689794921874, + 2.288984686203003, + 2.2901946446228028, + 2.2899436653900147, + 2.2897436267852784, + 2.2897221459197996, + 2.2891692597961426, + 2.2897191500854492, + 2.288403730316162, + 2.2887934480285645, + 2.2886755839538573, + 2.2888823398590086, + 2.288241148300171, + 2.2888436951446534, + 2.2886351592254637, + 2.288302882003784, + 2.2883120162200927, + 2.287797662277222, + 2.28854989151001, + 2.2888951800537107, + 2.2881162230682373, + 2.288466665496826, + 2.2875457569885254, + 2.2886454067230226, + 2.288561104736328, + 2.287538832473755, + 2.2877361987304687, + 2.2882793353271484, + 2.287487026824951, + 2.287928214645386 + ], + "gamma": [ + [ + 6, + 0.09705849178135395 + ], + [ + 7, + 0.07987675396725535 + ], + [ + 8, + 0.07847554539330304 + ], + [ + 9, + 0.06686021399218589 + ], + [ + 10, + 0.054796886746771634 + ], + [ + 13, + 0.028864670486655086 + ], + [ + 15, + 0.016553362278500572 + ], + [ + 20, + 0.0022447525116149336 + ], + [ + 25, + 0.00010601917711028364 + ], + [ + 35, + -0.0019804608182312222 + ], + [ + 45, + -0.0017012776543197106 + ], + [ + 55, + -0.0020026571969538054 + ], + [ + 65, + -0.001736226889761383 + ], + [ + 75, + -0.0018044146279407869 + ], + [ + 85, + -0.001727562398855298 + ], + [ + 95, + -0.0017598790404917963 + ], + [ + 100, + -0.0017594303167243197 + ] + ], + "rho": [ + [ + 6, + -0.002870356140192598 + ], + [ + 7, + -0.020844032696913928 + ], + [ + 8, + -0.0065721028950065374 + ], + [ + 9, + 0.0031941549386829138 + ], + [ + 10, + 0.004641983890905976 + ], + [ + 13, + -0.0004568711156025529 + ], + [ + 15, + 0.002178539871238172 + ], + [ + 20, + 0.004280881490558386 + ], + [ + 25, + 0.0007321110460907221 + ], + [ + 35, + -0.006570447469130158 + ], + [ + 45, + 0.002107909880578518 + ], + [ + 55, + -0.0017221630550920963 + ], + [ + 65, + -0.005303161218762398 + ], + [ + 75, + 0.001089076278731227 + ], + [ + 85, + -0.006758960895240307 + ], + [ + 95, + -0.0025665550492703915 + ], + [ + 100, + -0.007264598738402128 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7033667214069578 + ], + [ + 7, + 0.7033355423498502 + ], + [ + 8, + 0.703341337654383 + ], + [ + 9, + 0.7033398915526489 + ], + [ + 10, + 0.7033469137142988 + ], + [ + 11, + 0.7033528203921838 + ], + [ + 12, + 0.703349631935409 + ], + [ + 13, + 0.7033556054835431 + ], + [ + 14, + 0.7033573467399955 + ], + [ + 15, + 0.7033585127713516 + ], + [ + 16, + 0.7033606313869974 + ], + [ + 17, + 0.7033594386167735 + ], + [ + 18, + 0.7033671048090361 + ], + [ + 19, + 0.7033617031610764 + ], + [ + 20, + 0.7033631114120102 + ], + [ + 21, + 0.7033684879417307 + ], + [ + 22, + 0.7033645952043742 + ], + [ + 23, + 0.7033701060730531 + ], + [ + 24, + 0.7033683947982355 + ], + [ + 25, + 0.7033682637594127 + ], + [ + 26, + 0.7033687384932725 + ], + [ + 27, + 0.7033697160393604 + ], + [ + 28, + 0.7033708260416804 + ], + [ + 29, + 0.7033711030388574 + ], + [ + 30, + 0.7033714754785831 + ], + [ + 31, + 0.7033720291691299 + ], + [ + 32, + 0.7033707667566945 + ], + [ + 33, + 0.7033725817548855 + ], + [ + 34, + 0.7033739800760702 + ], + [ + 35, + 0.7033681630264693 + ], + [ + 36, + 0.7033765694995706 + ], + [ + 37, + 0.703373384319045 + ], + [ + 38, + 0.7033701013445582 + ], + [ + 39, + 0.7033728931094333 + ], + [ + 40, + 0.7033736549166267 + ], + [ + 41, + 0.7033730176410118 + ], + [ + 42, + 0.7033740118920294 + ], + [ + 43, + 0.7033752262350167 + ], + [ + 44, + 0.7033772818090822 + ], + [ + 45, + 0.7033712921076286 + ], + [ + 46, + 0.7033728100265195 + ], + [ + 47, + 0.7033766031530017 + ], + [ + 48, + 0.7033713796996419 + ], + [ + 49, + 0.7033742263771229 + ], + [ + 50, + 0.7033749682923209 + ], + [ + 51, + 0.7033747108405795 + ], + [ + 52, + 0.7033767917382471 + ], + [ + 53, + 0.7033738078594078 + ], + [ + 54, + 0.7033752515487298 + ], + [ + 55, + 0.7033755963393229 + ], + [ + 56, + 0.7033732814953582 + ], + [ + 57, + 0.7033746217600133 + ], + [ + 58, + 0.7033786444182895 + ], + [ + 59, + 0.7033732916027474 + ], + [ + 60, + 0.7033739815385246 + ], + [ + 61, + 0.703377629525928 + ], + [ + 62, + 0.7033728224336424 + ], + [ + 63, + 0.7033765335638839 + ], + [ + 64, + 0.7033752288066356 + ], + [ + 65, + 0.7033736545360807 + ], + [ + 66, + 0.7033756682556455 + ], + [ + 67, + 0.7033761157760855 + ], + [ + 68, + 0.7033729582214312 + ], + [ + 69, + 0.7033766643374293 + ], + [ + 70, + 0.7033719770073115 + ], + [ + 71, + 0.7033767043497829 + ], + [ + 72, + 0.7033743330504698 + ], + [ + 73, + 0.7033767093442654 + ], + [ + 74, + 0.7033765244545683 + ], + [ + 75, + 0.7033772286271813 + ], + [ + 76, + 0.703377821922085 + ], + [ + 77, + 0.7033750672481118 + ], + [ + 78, + 0.7033763135715737 + ], + [ + 79, + 0.7033710082922844 + ], + [ + 80, + 0.7033734395170478 + ], + [ + 81, + 0.7033782704525657 + ], + [ + 82, + 0.7033740154550022 + ], + [ + 83, + 0.7033775118364295 + ], + [ + 84, + 0.7033791464760508 + ], + [ + 85, + 0.7033698482008165 + ], + [ + 86, + 0.7033807658668279 + ], + [ + 87, + 0.7033769820551344 + ], + [ + 88, + 0.7033774036258972 + ], + [ + 89, + 0.7033759531355517 + ], + [ + 90, + 0.7033756237618816 + ], + [ + 91, + 0.7033732726080191 + ], + [ + 92, + 0.7033769110082546 + ], + [ + 93, + 0.703371497962236 + ], + [ + 94, + 0.7033814102348596 + ], + [ + 95, + 0.7033817271064535 + ], + [ + 96, + 0.7033722352979139 + ], + [ + 97, + 0.7033719312619731 + ], + [ + 98, + 0.7033777498598163 + ], + [ + 99, + 0.703375456215777 + ], + [ + 100, + 0.7033768264757309 + ] + ] + }, + "blend_random_trainable": { + "test_acc": [ + 0.3057, + 0.313, + 0.3159, + 0.3074, + 0.3127, + 0.3075, + 0.2992, + 0.3017, + 0.2934, + 0.3036, + 0.3107, + 0.3157, + 0.3175, + 0.3067, + 0.3038, + 0.3036, + 0.3188, + 0.3151, + 0.3159, + 0.306, + 0.3065, + 0.3211, + 0.3101, + 0.3111, + 0.3086, + 0.3114, + 0.315, + 0.3177, + 0.3148, + 0.3155, + 0.3192, + 0.315, + 0.314, + 0.3112, + 0.3237, + 0.3152, + 0.3232, + 0.3246, + 0.315, + 0.322, + 0.3147, + 0.3138, + 0.3184, + 0.3186, + 0.3112, + 0.3167, + 0.3203, + 0.3108, + 0.3149, + 0.32, + 0.3166, + 0.319, + 0.3187, + 0.3122, + 0.3185, + 0.3175, + 0.3226, + 0.3188, + 0.3184, + 0.3178, + 0.3234, + 0.322, + 0.3222, + 0.3306, + 0.313, + 0.3163, + 0.3231, + 0.3259, + 0.3243, + 0.3182, + 0.3185, + 0.3235, + 0.3219, + 0.3217, + 0.317, + 0.324, + 0.3179, + 0.3234, + 0.3202, + 0.3218, + 0.3251, + 0.3246, + 0.3246, + 0.3222, + 0.3217, + 0.3228, + 0.3219, + 0.3212, + 0.3214, + 0.3226, + 0.3219, + 0.3226, + 0.3226, + 0.3224, + 0.3224 + ], + "train_loss": [ + 1.9863584661102296, + 1.9901082321166992, + 1.9899895672607422, + 1.9905559247207643, + 1.9933388582992553, + 1.9831242485809326, + 1.9819840459823608, + 1.9838320283508302, + 1.9812498509216308, + 1.980695964202881, + 1.9775935582733155, + 1.9746784218597413, + 1.9758756914520264, + 1.9731443271255493, + 1.9735053044128419, + 1.9710882552337647, + 1.9679033090591431, + 1.9719498504257202, + 1.96802033203125, + 1.9680989447021484, + 1.9678990168762207, + 1.9670032351303102, + 1.9651213776016236, + 1.9671727653503417, + 1.9690395525741577, + 1.9632393447494507, + 1.9625915707778931, + 1.9642795868301393, + 1.962284288253784, + 1.9620551160430908, + 1.9625657203674316, + 1.9611133654403687, + 1.9630646159362792, + 1.960646312789917, + 1.9632540558242797, + 1.9595271733093262, + 1.96106090385437, + 1.9597418651580811, + 1.9601698782730101, + 1.9627716778945923, + 1.960522246322632, + 1.9592057704925536, + 1.9605137160873414, + 1.9641116384506225, + 1.9620838027954102, + 1.9584725994873047, + 1.9602987656402588, + 1.9586591900253296, + 1.9589158935165405, + 1.9596970495605468, + 1.9598131320571899, + 1.9568223999023437, + 1.96024339012146, + 1.9578165494155884, + 1.9596277838134766, + 1.9579522448730469, + 1.9601750942230225, + 1.9571070608520509, + 1.9577818801116944, + 1.9579749005508422, + 1.958904959487915, + 1.9588295747375488, + 1.9592107725524903, + 1.9556558278656007, + 1.9566347140502929, + 1.9571185677337646, + 1.9556720935058594, + 1.960075058364868, + 1.9572499262237548, + 1.9573225322723389, + 1.9572704486465453, + 1.956118627243042, + 1.9577359083557129, + 1.9548047360229492, + 1.9568554579925537, + 1.9560601205444337, + 1.9569705477905273, + 1.9573911285018921, + 1.9555766596984863, + 1.9534356274032594, + 1.9576097611236571, + 1.9529308759307862, + 1.956716926498413, + 1.9529449435043336, + 1.9519823665618896, + 1.9550598822021485, + 1.95468404838562, + 1.9547595784759522, + 1.9551029265975952, + 1.9516690326690673, + 1.9553640102386474, + 1.9570171786880493, + 1.9546185680770873, + 1.9530967560577392, + 1.9577186687469483 + ], + "gamma": [ + [ + 6, + -0.004118485609069467 + ], + [ + 7, + 0.005376987275667489 + ], + [ + 8, + -0.00023444528051186353 + ], + [ + 9, + 0.005996660329401493 + ], + [ + 10, + -0.006186874001286924 + ], + [ + 13, + -0.006834868196165189 + ], + [ + 15, + -0.004276088788174093 + ], + [ + 20, + 0.0077267399756237864 + ], + [ + 25, + -0.003282535937614739 + ], + [ + 35, + -0.010988562135025859 + ], + [ + 45, + 0.0008946055895648897 + ], + [ + 55, + -0.007401655660942197 + ], + [ + 65, + -0.0035742081963689998 + ], + [ + 75, + -0.002076548000331968 + ], + [ + 85, + 0.00452860991936177 + ], + [ + 95, + 0.001453812321415171 + ], + [ + 100, + 0.0011978186666965485 + ] + ], + "rho": [ + [ + 6, + -0.007702916627749801 + ], + [ + 7, + -0.004025159869343042 + ], + [ + 8, + 0.021773064276203513 + ], + [ + 9, + -0.0036036039236932993 + ], + [ + 10, + -0.0019339255522936583 + ], + [ + 13, + 0.0074055485893040895 + ], + [ + 15, + -0.0007032814901322126 + ], + [ + 20, + -0.0010675000958144665 + ], + [ + 25, + 0.012549822218716145 + ], + [ + 35, + 0.007774165831506252 + ], + [ + 45, + -0.0026706024073064327 + ], + [ + 55, + -0.024923408403992653 + ], + [ + 65, + -0.006310549098998308 + ], + [ + 75, + 0.021657895063981414 + ], + [ + 85, + 0.0006069509545341134 + ], + [ + 95, + 0.0037721219705417752 + ], + [ + 100, + -0.0004379982128739357 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7033255782623484 + ], + [ + 7, + 0.7032452192264916 + ], + [ + 8, + 0.7032050016928376 + ], + [ + 9, + 0.703171796987776 + ], + [ + 10, + 0.7030983852125524 + ], + [ + 11, + 0.7030327350522556 + ], + [ + 12, + 0.7029979283071539 + ], + [ + 13, + 0.7029728943932545 + ], + [ + 14, + 0.7029575023468488 + ], + [ + 15, + 0.7029825013424166 + ], + [ + 16, + 0.7029338430132441 + ], + [ + 17, + 0.7029114040960175 + ], + [ + 18, + 0.7028689867828561 + ], + [ + 19, + 0.7028345513184494 + ], + [ + 20, + 0.7028593984699817 + ], + [ + 21, + 0.7028383329822545 + ], + [ + 22, + 0.7028438030389291 + ], + [ + 23, + 0.7028243180452911 + ], + [ + 24, + 0.7028346831254739 + ], + [ + 25, + 0.7028180286361645 + ], + [ + 26, + 0.7028014773850306 + ], + [ + 27, + 0.7027888179206988 + ], + [ + 28, + 0.7027863083218597 + ], + [ + 29, + 0.7028209930438672 + ], + [ + 30, + 0.7028279271831875 + ], + [ + 31, + 0.7027893018550231 + ], + [ + 32, + 0.7028124128060081 + ], + [ + 33, + 0.7028223737344558 + ], + [ + 34, + 0.7028201852469204 + ], + [ + 35, + 0.702787292812866 + ], + [ + 36, + 0.7028007631880852 + ], + [ + 37, + 0.702809109510097 + ], + [ + 38, + 0.7028038546552855 + ], + [ + 39, + 0.7027820295246561 + ], + [ + 40, + 0.7028060363890423 + ], + [ + 41, + 0.702801802489862 + ], + [ + 42, + 0.7027970512551064 + ], + [ + 43, + 0.7027816857911551 + ], + [ + 44, + 0.7028146974236424 + ], + [ + 45, + 0.7028108528244092 + ], + [ + 46, + 0.7028032662828714 + ], + [ + 47, + 0.7028106773101793 + ], + [ + 48, + 0.7028022876850725 + ], + [ + 49, + 0.7028333743877524 + ], + [ + 50, + 0.7028122615388537 + ], + [ + 51, + 0.7027948595351735 + ], + [ + 52, + 0.7027854272525506 + ], + [ + 53, + 0.7028041186634381 + ], + [ + 54, + 0.7028192758582721 + ], + [ + 55, + 0.702827106131425 + ], + [ + 56, + 0.7028275540300264 + ], + [ + 57, + 0.7028256401699401 + ], + [ + 58, + 0.7028067247308835 + ], + [ + 59, + 0.7027970731099571 + ], + [ + 60, + 0.7028207470398128 + ], + [ + 61, + 0.702814488660145 + ], + [ + 62, + 0.7028247185472278 + ], + [ + 63, + 0.7027922412187371 + ], + [ + 64, + 0.7028048580096842 + ], + [ + 65, + 0.702826426863984 + ], + [ + 66, + 0.7027851675507224 + ], + [ + 67, + 0.7028056438600826 + ], + [ + 68, + 0.702814753857548 + ], + [ + 69, + 0.702812968839077 + ], + [ + 70, + 0.7028016256474466 + ], + [ + 71, + 0.7028178008107661 + ], + [ + 72, + 0.7028044665369725 + ], + [ + 73, + 0.7027934503683306 + ], + [ + 74, + 0.7028170385562992 + ], + [ + 75, + 0.702816213251658 + ], + [ + 76, + 0.7028134797940632 + ], + [ + 77, + 0.7028168974149571 + ], + [ + 78, + 0.702814796642661 + ], + [ + 79, + 0.7028328657670465 + ], + [ + 80, + 0.702808031339876 + ], + [ + 81, + 0.7028109267678178 + ], + [ + 82, + 0.7028058159878949 + ], + [ + 83, + 0.7027879547376482 + ], + [ + 84, + 0.7027941171869214 + ], + [ + 85, + 0.7027849449106414 + ], + [ + 86, + 0.7027873690929133 + ], + [ + 87, + 0.7028192755752336 + ], + [ + 88, + 0.7028264756997268 + ], + [ + 89, + 0.7028008863027374 + ], + [ + 90, + 0.7028002023485964 + ], + [ + 91, + 0.7028032489220616 + ], + [ + 92, + 0.702777540454898 + ], + [ + 93, + 0.7028065339511926 + ], + [ + 94, + 0.7028124872167342 + ], + [ + 95, + 0.7028305131130029 + ], + [ + 96, + 0.7028279535369464 + ], + [ + 97, + 0.702820345056386 + ], + [ + 98, + 0.7028157220060052 + ], + [ + 99, + 0.7028204015749513 + ], + [ + 100, + 0.7028156186762927 + ] + ] + }, + "blend_shuffled_trainable": { + "test_acc": [ + 0.3072, + 0.3092, + 0.3089, + 0.2989, + 0.3149, + 0.3067, + 0.303, + 0.3018, + 0.3015, + 0.3072, + 0.3142, + 0.3181, + 0.3277, + 0.3162, + 0.3168, + 0.3073, + 0.3175, + 0.3207, + 0.3169, + 0.3102, + 0.3098, + 0.3244, + 0.3152, + 0.3161, + 0.3089, + 0.3137, + 0.3193, + 0.3187, + 0.3193, + 0.3165, + 0.322, + 0.3144, + 0.3172, + 0.3124, + 0.3258, + 0.3168, + 0.3248, + 0.3276, + 0.3205, + 0.3238, + 0.3185, + 0.3205, + 0.3213, + 0.3199, + 0.3133, + 0.3187, + 0.3245, + 0.3134, + 0.3173, + 0.3221, + 0.3182, + 0.3219, + 0.3222, + 0.3184, + 0.3198, + 0.3175, + 0.326, + 0.3223, + 0.319, + 0.3188, + 0.3257, + 0.3244, + 0.3236, + 0.3315, + 0.316, + 0.3178, + 0.3246, + 0.3246, + 0.3246, + 0.3222, + 0.3218, + 0.3264, + 0.3241, + 0.3237, + 0.3202, + 0.327, + 0.3205, + 0.3249, + 0.3226, + 0.3235, + 0.3273, + 0.326, + 0.3271, + 0.3233, + 0.325, + 0.324, + 0.3241, + 0.3231, + 0.3239, + 0.3246, + 0.3242, + 0.3237, + 0.3244, + 0.3246, + 0.3246 + ], + "train_loss": [ + 1.9879663883209229, + 1.9890402872467041, + 1.9952381700897217, + 1.9932921267700194, + 1.9911339688110352, + 1.9806355129241944, + 1.9793314032363891, + 1.980378553543091, + 1.9759705561828613, + 1.9773317337036134, + 1.9736765740585327, + 1.9703904146575928, + 1.9728017766952515, + 1.9694668106842041, + 1.9699617266082763, + 1.9694622762298584, + 1.9675536489105225, + 1.9719966775131226, + 1.9680718574523925, + 1.968003705444336, + 1.967256714553833, + 1.9672853146743774, + 1.964880690536499, + 1.965979939880371, + 1.9679325546264648, + 1.9625504761505126, + 1.9618715047836304, + 1.9649697366333008, + 1.963205277481079, + 1.9629014247894288, + 1.9639540438842773, + 1.963319803237915, + 1.9654156721496583, + 1.96292624294281, + 1.9647651282501222, + 1.9619133391571044, + 1.963123630142212, + 1.9621254228973388, + 1.9626237009048462, + 1.9647653387069701, + 1.9629008512878419, + 1.9611902642822265, + 1.9622716049957276, + 1.9655254000854492, + 1.964137872390747, + 1.9600657921600342, + 1.9621819856262206, + 1.9604503631591796, + 1.9604949105834961, + 1.9606080364990235, + 1.9609809567642211, + 1.9586302294158935, + 1.9622212756729125, + 1.959335130004883, + 1.9614084063720703, + 1.9598014483261108, + 1.9618542864227295, + 1.9592163647460938, + 1.959282341003418, + 1.9592253719711303, + 1.9599059103775025, + 1.9597750213623046, + 1.9604897107696533, + 1.9564096441268921, + 1.9573765369415284, + 1.9579895470428468, + 1.9563196194839478, + 1.9610270920562745, + 1.9584971033477783, + 1.9583748922348023, + 1.9581460390853882, + 1.9575567456436158, + 1.9587494486236572, + 1.9562542750549317, + 1.9581185290908814, + 1.9573783723449707, + 1.95829107963562, + 1.9588930324554443, + 1.9563945680236816, + 1.9548106145477295, + 1.9585965635681153, + 1.9541787635040284, + 1.9577070035171509, + 1.9542437261199952, + 1.9530290853881835, + 1.9563414603042601, + 1.9557864339447022, + 1.9560457189178466, + 1.9564100560760498, + 1.9526432427215576, + 1.9564164319610595, + 1.9582645511627197, + 1.9558721158599854, + 1.954110027694702, + 1.9587735888290405 + ], + "gamma": [ + [ + 6, + -0.009713975014165044 + ], + [ + 7, + -0.0041672863881103694 + ], + [ + 8, + 0.0017023678519763052 + ], + [ + 9, + -0.0016231403860729188 + ], + [ + 10, + 0.006231077190022916 + ], + [ + 13, + 0.0005289145046845078 + ], + [ + 15, + 0.001387338328640908 + ], + [ + 20, + -0.0053925951942801476 + ], + [ + 25, + 0.017255719751119614 + ], + [ + 35, + 0.008442985475994647 + ], + [ + 45, + -0.005755626174504869 + ], + [ + 55, + -0.0024627968086861074 + ], + [ + 65, + 0.0014147361507639289 + ], + [ + 75, + -0.002341967134270817 + ], + [ + 85, + 0.004121452220715582 + ], + [ + 95, + 0.0031763689476065338 + ], + [ + 100, + -0.0005143235466675833 + ] + ], + "rho": [ + [ + 6, + 0.002152219181880355 + ], + [ + 7, + -0.033379526576027274 + ], + [ + 8, + -0.011984863318502903 + ], + [ + 9, + 0.0029476822819560766 + ], + [ + 10, + -0.0029922070680186152 + ], + [ + 13, + 0.01654075738042593 + ], + [ + 15, + 0.018994803074747324 + ], + [ + 20, + 0.007151593221351504 + ], + [ + 25, + 0.014041082700714469 + ], + [ + 35, + -0.01747659279499203 + ], + [ + 45, + -0.00826160958968103 + ], + [ + 55, + 0.01035646814852953 + ], + [ + 65, + 0.0037725798320025206 + ], + [ + 75, + -0.004486699355766177 + ], + [ + 85, + -0.018721963511779904 + ], + [ + 95, + 0.006656181067228317 + ], + [ + 100, + -0.0036278615007176995 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7033339174499001 + ], + [ + 7, + 0.7032361200018741 + ], + [ + 8, + 0.7031762191512683 + ], + [ + 9, + 0.7031844815950166 + ], + [ + 10, + 0.7030993607574066 + ], + [ + 11, + 0.7030523094471233 + ], + [ + 12, + 0.702976516447472 + ], + [ + 13, + 0.7029754254894292 + ], + [ + 14, + 0.7029325368134507 + ], + [ + 15, + 0.7029050937706328 + ], + [ + 16, + 0.7030105891474726 + ], + [ + 17, + 0.7029323172969673 + ], + [ + 18, + 0.702834244610307 + ], + [ + 19, + 0.7028815203745374 + ], + [ + 20, + 0.7028589270867153 + ], + [ + 21, + 0.7028378005487591 + ], + [ + 22, + 0.7028346275872981 + ], + [ + 23, + 0.7028355932887045 + ], + [ + 24, + 0.7028302380748503 + ], + [ + 25, + 0.7028100432115536 + ], + [ + 26, + 0.7028366537211526 + ], + [ + 27, + 0.7028070675120949 + ], + [ + 28, + 0.7027893720289293 + ], + [ + 29, + 0.7028148357540881 + ], + [ + 30, + 0.7027788356845154 + ], + [ + 31, + 0.7027770661615153 + ], + [ + 32, + 0.7028071799802298 + ], + [ + 33, + 0.7028076010826527 + ], + [ + 34, + 0.7028142181529359 + ], + [ + 35, + 0.7027950159010475 + ], + [ + 36, + 0.7028097789176848 + ], + [ + 37, + 0.702799851950602 + ], + [ + 38, + 0.7027780540380907 + ], + [ + 39, + 0.7027803827595185 + ], + [ + 40, + 0.7028002047633005 + ], + [ + 41, + 0.7028111402359748 + ], + [ + 42, + 0.7027993858025785 + ], + [ + 43, + 0.7028177744642827 + ], + [ + 44, + 0.7027975135914483 + ], + [ + 45, + 0.7028445352253704 + ], + [ + 46, + 0.70281649881293 + ], + [ + 47, + 0.7028247795858051 + ], + [ + 48, + 0.7028098422602339 + ], + [ + 49, + 0.7028137396672447 + ], + [ + 50, + 0.702814586621834 + ], + [ + 51, + 0.7028078767292393 + ], + [ + 52, + 0.7028169988117405 + ], + [ + 53, + 0.7028302991990524 + ], + [ + 54, + 0.7028096623881444 + ], + [ + 55, + 0.7028140847582655 + ], + [ + 56, + 0.7028022164999655 + ], + [ + 57, + 0.7028335232728006 + ], + [ + 58, + 0.7028335849544588 + ], + [ + 59, + 0.7027932349232999 + ], + [ + 60, + 0.7028162757477675 + ], + [ + 61, + 0.7028306875026191 + ], + [ + 62, + 0.7028131360710491 + ], + [ + 63, + 0.7028241795978089 + ], + [ + 64, + 0.7028207905885385 + ], + [ + 65, + 0.7028356599351333 + ], + [ + 66, + 0.702815174170097 + ], + [ + 67, + 0.7028057297745339 + ], + [ + 68, + 0.7028060759122144 + ], + [ + 69, + 0.7027829770660874 + ], + [ + 70, + 0.7027938324593894 + ], + [ + 71, + 0.7027983038322353 + ], + [ + 72, + 0.7027959458054085 + ], + [ + 73, + 0.7028203285613996 + ], + [ + 74, + 0.7028592307212126 + ], + [ + 75, + 0.7028289591445176 + ], + [ + 76, + 0.7028212181835 + ], + [ + 77, + 0.7028389914681423 + ], + [ + 78, + 0.7028282505198481 + ], + [ + 79, + 0.702787021150262 + ], + [ + 80, + 0.7027912021258632 + ], + [ + 81, + 0.702769888694361 + ], + [ + 82, + 0.7027841236689804 + ], + [ + 83, + 0.7027907547876603 + ], + [ + 84, + 0.7028087220119643 + ], + [ + 85, + 0.7028211578756763 + ], + [ + 86, + 0.7027905592178233 + ], + [ + 87, + 0.7028016952077285 + ], + [ + 88, + 0.7028003592471743 + ], + [ + 89, + 0.7028142821317884 + ], + [ + 90, + 0.7028169041049376 + ], + [ + 91, + 0.7028386791655826 + ], + [ + 92, + 0.7028113598704812 + ], + [ + 93, + 0.7027831894648512 + ], + [ + 94, + 0.7028061516377985 + ], + [ + 95, + 0.702813675338315 + ], + [ + 96, + 0.7028069171747628 + ], + [ + 97, + 0.702797567775642 + ], + [ + 98, + 0.7027865161639475 + ], + [ + 99, + 0.7028180762199959 + ], + [ + 100, + 0.7028370504489405 + ] + ] + }, + "blend_gaussian_noise": { + "test_acc": [ + 0.2923, + 0.2893, + 0.3022, + 0.2995, + 0.3104, + 0.2977, + 0.3152, + 0.3044, + 0.3142, + 0.3045, + 0.3009, + 0.3202, + 0.3054, + 0.3214, + 0.3013, + 0.3061, + 0.3046, + 0.3051, + 0.3039, + 0.3138, + 0.3007, + 0.2997, + 0.2997, + 0.2962, + 0.3108, + 0.3017, + 0.2981, + 0.3043, + 0.3109, + 0.3072, + 0.3035, + 0.3094, + 0.2995, + 0.3035, + 0.31, + 0.3094, + 0.3075, + 0.3168, + 0.3068, + 0.3031, + 0.31, + 0.3137, + 0.306, + 0.3002, + 0.302, + 0.3104, + 0.3061, + 0.3054, + 0.307, + 0.3112, + 0.3089, + 0.307, + 0.3058, + 0.3061, + 0.301, + 0.3108, + 0.2957, + 0.2948, + 0.312, + 0.3081, + 0.3008, + 0.3056, + 0.3102, + 0.3025, + 0.3023, + 0.2971, + 0.3088, + 0.3127, + 0.301, + 0.3085, + 0.2993, + 0.3055, + 0.3043, + 0.3053, + 0.3094, + 0.3054, + 0.3065, + 0.3068, + 0.3064, + 0.3113, + 0.3058, + 0.3052, + 0.3103, + 0.3033, + 0.3069, + 0.3091, + 0.3078, + 0.3078, + 0.3091, + 0.307, + 0.3078, + 0.3075, + 0.308, + 0.3082, + 0.308 + ], + "train_loss": [ + 1.993203340988159, + 1.9910778423309325, + 1.99141674659729, + 1.9893118661499023, + 1.9885935766983032, + 1.9924972130966188, + 1.988737977218628, + 1.9893469274902345, + 1.989744023513794, + 1.9893734909057617, + 1.9869207611465454, + 1.990346015701294, + 1.9872243325042724, + 1.9895274951171875, + 1.9882190063476564, + 1.989698461227417, + 1.9893472623062134, + 1.9898485544204711, + 1.9900170107269286, + 1.989502276992798, + 1.9923988220596314, + 1.991524747619629, + 1.9925210540390015, + 1.9921520061492919, + 1.990912898864746, + 1.9911081723022461, + 1.990390337486267, + 1.994553267364502, + 1.9918868299102783, + 1.9919861629486084, + 1.9922139133071899, + 1.9942808624267578, + 1.9913640481567383, + 1.992362200050354, + 1.9930698289489746, + 1.9946385150909425, + 1.992706957321167, + 1.9911939100646974, + 1.991908963623047, + 1.991841597442627, + 1.9918154586791992, + 1.9941014937591552, + 1.9925166857910157, + 1.9932450345611572, + 1.993057201156616, + 1.9896164094543458, + 1.9924529732894898, + 1.9913356364440917, + 1.993225507850647, + 1.9949576287078858, + 1.990734895324707, + 1.994212381324768, + 1.993110608177185, + 1.9939460328674317, + 1.994380189437866, + 1.9940233193206787, + 1.9925984786224364, + 1.9929084342193604, + 1.9928766473388673, + 1.9908388400268555, + 1.9931877150726318, + 1.9923542861938477, + 1.9914218115234374, + 1.989885845298767, + 1.991323904800415, + 1.9923666381072997, + 1.9922850937652588, + 1.992446579322815, + 1.992551320877075, + 1.9928769355010987, + 1.9906947250366211, + 1.9921092461395264, + 1.9913399781799317, + 1.9916002709960938, + 1.9930710066986084, + 1.9895993492126465, + 1.9913664756011964, + 1.9913178414916992, + 1.9908054991912842, + 1.9906724109268188, + 1.9903135766601563, + 1.992289573097229, + 1.9921454113006591, + 1.990802325706482, + 1.9924688410949707, + 1.9917918102645873, + 1.9891820581817627, + 1.9913058753204345, + 1.9912357090759278, + 1.9914252561187744, + 1.9911018399810791, + 1.9911789398956299, + 1.9911635885238648, + 1.9902537596130372, + 1.990801071510315 + ], + "gamma": [ + [ + 6, + 0.08380796911660582 + ], + [ + 7, + 0.08333815913647413 + ], + [ + 8, + 0.08704009023495018 + ], + [ + 9, + 0.08895917236804962 + ], + [ + 10, + 0.08596491045318544 + ], + [ + 13, + 0.08832892146892846 + ], + [ + 15, + 0.09080104250460863 + ], + [ + 20, + 0.09193688485538587 + ], + [ + 25, + 0.09346445556730032 + ], + [ + 35, + 0.09449018631130457 + ], + [ + 45, + 0.09490034345071763 + ], + [ + 55, + 0.09678847156465054 + ], + [ + 65, + 0.09723592596128583 + ], + [ + 75, + 0.09813381871208549 + ], + [ + 85, + 0.09853162965737283 + ], + [ + 95, + 0.09864975488744676 + ], + [ + 100, + 0.09859528485685587 + ] + ], + "rho": [ + [ + 6, + 0.02303900895640254 + ], + [ + 7, + 0.012604618910700083 + ], + [ + 8, + 0.014456501696258783 + ], + [ + 9, + 0.00725952023640275 + ], + [ + 10, + 0.020146489376202226 + ], + [ + 13, + 0.0030475526582449675 + ], + [ + 15, + 0.0361496222903952 + ], + [ + 20, + 0.009380030445754528 + ], + [ + 25, + 0.002206234261393547 + ], + [ + 35, + -0.00058283272664994 + ], + [ + 45, + 0.014510783948935568 + ], + [ + 55, + -0.004783019423484802 + ], + [ + 65, + -0.004751493455842137 + ], + [ + 75, + 0.016444321256130934 + ], + [ + 85, + 0.010288935154676437 + ], + [ + 95, + -0.008311591343954206 + ], + [ + 100, + 0.007094032131135464 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7033998784337714 + ], + [ + 7, + 0.7033910169918016 + ], + [ + 8, + 0.7034136526142997 + ], + [ + 9, + 0.7034070206506373 + ], + [ + 10, + 0.7034160177763678 + ], + [ + 11, + 0.7034197747927642 + ], + [ + 12, + 0.7034154987241014 + ], + [ + 13, + 0.7033991506334835 + ], + [ + 14, + 0.703421358321397 + ], + [ + 15, + 0.7034235275706476 + ], + [ + 16, + 0.7034026355790705 + ], + [ + 17, + 0.7034197697517156 + ], + [ + 18, + 0.703402643024413 + ], + [ + 19, + 0.7034150378446538 + ], + [ + 20, + 0.7034075672037926 + ], + [ + 21, + 0.7034204166634406 + ], + [ + 22, + 0.7034157228143394 + ], + [ + 23, + 0.7033968356284199 + ], + [ + 24, + 0.7034031630736975 + ], + [ + 25, + 0.703410156103346 + ], + [ + 26, + 0.7034086456799321 + ], + [ + 27, + 0.7034100013254312 + ], + [ + 28, + 0.7034054126837145 + ], + [ + 29, + 0.7034168842721602 + ], + [ + 30, + 0.7034103727050093 + ], + [ + 31, + 0.7034181687044258 + ], + [ + 32, + 0.7034211239913891 + ], + [ + 33, + 0.7034040598767372 + ], + [ + 34, + 0.7034267895463847 + ], + [ + 35, + 0.7034200785590842 + ], + [ + 36, + 0.7034173722446537 + ], + [ + 37, + 0.703416780973294 + ], + [ + 38, + 0.703422458432895 + ], + [ + 39, + 0.7034195678835375 + ], + [ + 40, + 0.703400933023945 + ], + [ + 41, + 0.7034118368760235 + ], + [ + 42, + 0.7034002693410815 + ], + [ + 43, + 0.7034194315555959 + ], + [ + 44, + 0.7034286038136975 + ], + [ + 45, + 0.7034134317802809 + ], + [ + 46, + 0.7034242729654911 + ], + [ + 47, + 0.7034045125390909 + ], + [ + 48, + 0.7034099637821133 + ], + [ + 49, + 0.7033870604822503 + ], + [ + 50, + 0.7033924611643435 + ], + [ + 51, + 0.7034032859922925 + ], + [ + 52, + 0.7034192864606833 + ], + [ + 53, + 0.7034295490822474 + ], + [ + 54, + 0.7034194220300799 + ], + [ + 55, + 0.7034077030469154 + ], + [ + 56, + 0.7034119982005912 + ], + [ + 57, + 0.7034071134317261 + ], + [ + 58, + 0.7034133354428551 + ], + [ + 59, + 0.7034074457932897 + ], + [ + 60, + 0.7034086687185702 + ], + [ + 61, + 0.7034012845059016 + ], + [ + 62, + 0.7034189883647035 + ], + [ + 63, + 0.7034170228577107 + ], + [ + 64, + 0.703410216508625 + ], + [ + 65, + 0.7034202924379496 + ], + [ + 66, + 0.7033994356546907 + ], + [ + 67, + 0.7034228162228883 + ], + [ + 68, + 0.7034097016837918 + ], + [ + 69, + 0.703416189376855 + ], + [ + 70, + 0.7034111950875575 + ], + [ + 71, + 0.7034096783296612 + ], + [ + 72, + 0.7034113716881638 + ], + [ + 73, + 0.7033929757032754 + ], + [ + 74, + 0.7034120626120587 + ], + [ + 75, + 0.7034038837218367 + ], + [ + 76, + 0.7034052191416231 + ], + [ + 77, + 0.7034159421532796 + ], + [ + 78, + 0.7034022329870004 + ], + [ + 79, + 0.7034199248109828 + ], + [ + 80, + 0.7034037609969638 + ], + [ + 81, + 0.7034077383449302 + ], + [ + 82, + 0.7034011513520346 + ], + [ + 83, + 0.7034088498775594 + ], + [ + 84, + 0.7034269061684973 + ], + [ + 85, + 0.7034224866858519 + ], + [ + 86, + 0.7034218087266184 + ], + [ + 87, + 0.703416653940843 + ], + [ + 88, + 0.7034053592518323 + ], + [ + 89, + 0.7034014784604647 + ], + [ + 90, + 0.7034107465506516 + ], + [ + 91, + 0.7034046001342196 + ], + [ + 92, + 0.7034083525557394 + ], + [ + 93, + 0.7034195766688707 + ], + [ + 94, + 0.7034061635552622 + ], + [ + 95, + 0.7034016385768332 + ], + [ + 96, + 0.7034038206996376 + ], + [ + 97, + 0.7034008895165578 + ], + [ + 98, + 0.7034181994324757 + ], + [ + 99, + 0.7034136723166532 + ], + [ + 100, + 0.7034087198421428 + ] + ] + }, + "scaled_DFA_norm_match": { + "test_acc": [ + 0.2799, + 0.3023, + 0.3022, + 0.305, + 0.3031, + 0.3068, + 0.3027, + 0.2964, + 0.2947, + 0.2848, + 0.2912, + 0.2877, + 0.2868, + 0.2984, + 0.3135, + 0.3148, + 0.2928, + 0.3185, + 0.3164, + 0.3051, + 0.2942, + 0.3055, + 0.2997, + 0.3027, + 0.3009, + 0.3046, + 0.2969, + 0.3048, + 0.3112, + 0.3102, + 0.3099, + 0.3145, + 0.3103, + 0.3128, + 0.3031, + 0.3132, + 0.3069, + 0.3117, + 0.3155, + 0.3126, + 0.2991, + 0.304, + 0.3105, + 0.3124, + 0.3024, + 0.3162, + 0.3076, + 0.3111, + 0.3096, + 0.3103, + 0.3153, + 0.313, + 0.303, + 0.3057, + 0.3146, + 0.3083, + 0.3074, + 0.3138, + 0.3108, + 0.3085, + 0.3115, + 0.3079, + 0.3102, + 0.3059, + 0.3105, + 0.3101, + 0.3144, + 0.309, + 0.3064, + 0.3121, + 0.3136, + 0.3122, + 0.3067, + 0.3146, + 0.315, + 0.308, + 0.3117, + 0.3103, + 0.315, + 0.3129, + 0.3114, + 0.3129, + 0.3106, + 0.314, + 0.3098, + 0.3104, + 0.3129, + 0.3083, + 0.3104, + 0.3111, + 0.3112, + 0.3099, + 0.31, + 0.3103, + 0.3103 + ], + "train_loss": [ + 1.9923602294921876, + 1.9890546128845215, + 1.9894204819107055, + 1.989152320098877, + 1.988577550048828, + 1.9859502027130127, + 1.9874351345825196, + 1.986509676132202, + 1.9871239212417602, + 1.9853697342300416, + 1.985647074241638, + 1.985660191116333, + 1.9867867967224122, + 1.9850995402526856, + 1.9839853742218017, + 1.9865364765930176, + 1.9865033807754517, + 1.9884818240356446, + 1.9859886218643188, + 1.985927615699768, + 1.9861562162017823, + 1.9862393185424805, + 1.9836800576400757, + 1.9871808597183227, + 1.984883204612732, + 1.9837886934661866, + 1.984786727218628, + 1.9883024155044555, + 1.986108370513916, + 1.985321258506775, + 1.9894738638305665, + 1.9877986724090577, + 1.9852204217147826, + 1.9860017431640624, + 1.985712166366577, + 1.9874249489593505, + 1.9876427067565918, + 1.9873564577865601, + 1.986385534057617, + 1.9867805167007446, + 1.9849875399017334, + 1.9849051692962647, + 1.9866327854156494, + 1.9845338430023194, + 1.9859189166259765, + 1.9855265950775147, + 1.9854994425201415, + 1.985078913192749, + 1.9875052710342407, + 1.98448387260437, + 1.9849784341430665, + 1.9860004656600951, + 1.985462727622986, + 1.9841788135147094, + 1.9858437190246583, + 1.9838197813415528, + 1.9862801889038086, + 1.9847486730957031, + 1.986294497680664, + 1.9839171840667724, + 1.9854622132873536, + 1.9838967436218262, + 1.986957244606018, + 1.9826673496246339, + 1.9867617028045654, + 1.9846681551742553, + 1.9820888243865966, + 1.9863314709472657, + 1.9857821100616455, + 1.983645559425354, + 1.9855974853897094, + 1.9851708868789673, + 1.9823928085708618, + 1.9847473794937134, + 1.9838309204101563, + 1.9840375453186034, + 1.985171105003357, + 1.983263666305542, + 1.9819131956481935, + 1.9829617855072021, + 1.9849323486328125, + 1.9837079382324219, + 1.9853739337158203, + 1.9829405225372314, + 1.9818017826080323, + 1.98483393283844, + 1.985428338661194, + 1.9848500240707398, + 1.985539596939087, + 1.983101581802368, + 1.980854806137085, + 1.9814058712005616, + 1.9833548774719238, + 1.9822778103637695, + 1.9830925686264038 + ], + "gamma": [ + [ + 6, + 0.08236762369051576 + ], + [ + 7, + 0.08481154637411237 + ], + [ + 8, + 0.08291630423627794 + ], + [ + 9, + 0.08259243832435459 + ], + [ + 10, + 0.08517789037432522 + ], + [ + 13, + 0.08799418865237385 + ], + [ + 15, + 0.08809825091157109 + ], + [ + 20, + 0.09083233081037179 + ], + [ + 25, + 0.09246953902766109 + ], + [ + 35, + 0.09479347959859297 + ], + [ + 45, + 0.09672224917449057 + ], + [ + 55, + 0.09851697343401611 + ], + [ + 65, + 0.09970828366931528 + ], + [ + 75, + 0.10043370386119932 + ], + [ + 85, + 0.10070295282639563 + ], + [ + 95, + 0.10071049875114113 + ], + [ + 100, + 0.10068938741460443 + ] + ], + "rho": [ + [ + 6, + 0.029324434872251004 + ], + [ + 7, + 0.023356831399723887 + ], + [ + 8, + -0.007588486885651946 + ], + [ + 9, + 0.01867034286260605 + ], + [ + 10, + -0.0011366518447175622 + ], + [ + 13, + -0.0065241712145507336 + ], + [ + 15, + 0.022009607404470444 + ], + [ + 20, + 0.008090358693152666 + ], + [ + 25, + 0.004446777165867388 + ], + [ + 35, + 0.005390704143792391 + ], + [ + 45, + 0.0015335289062932134 + ], + [ + 55, + 0.00856107659637928 + ], + [ + 65, + -0.004320075735449791 + ], + [ + 75, + 0.002856543753296137 + ], + [ + 85, + -0.0016379100270569324 + ], + [ + 95, + 0.013521237298846245 + ], + [ + 100, + 0.0017306602094322443 + ] + ], + "alpha_eff": [ + [ + 6, + 0.42857142991858715 + ], + [ + 7, + 0.4285714293646927 + ], + [ + 8, + 0.42857142933129205 + ], + [ + 9, + 0.42857142977663426 + ], + [ + 10, + 0.42857142979055124 + ], + [ + 11, + 0.4285714292422236 + ], + [ + 12, + 0.42857142948159505 + ], + [ + 13, + 0.42857142918098906 + ], + [ + 14, + 0.42857142965973194 + ], + [ + 15, + 0.42857142958736383 + ], + [ + 16, + 0.42857142966808215 + ], + [ + 17, + 0.42857143007167353 + ], + [ + 18, + 0.4285714298545692 + ], + [ + 19, + 0.4285714297042662 + ], + [ + 20, + 0.4285714299519878 + ], + [ + 21, + 0.42857143005218984 + ], + [ + 22, + 0.42857142965416517 + ], + [ + 23, + 0.42857143026094396 + ], + [ + 24, + 0.4285714298684861 + ], + [ + 25, + 0.42857143004383963 + ], + [ + 26, + 0.42857142963746486 + ], + [ + 27, + 0.42857143016352534 + ], + [ + 28, + 0.428571429158722 + ], + [ + 29, + 0.42857143056433333 + ], + [ + 30, + 0.42857143018579247 + ], + [ + 31, + 0.42857142967643225 + ], + [ + 32, + 0.4285714301189911 + ], + [ + 33, + 0.42857143047248153 + ], + [ + 34, + 0.4285714299714715 + ], + [ + 35, + 0.4285714303277453 + ], + [ + 36, + 0.4285714300438397 + ], + [ + 37, + 0.42857142987683633 + ], + [ + 38, + 0.42857143028042766 + ], + [ + 39, + 0.4285714299631213 + ], + [ + 40, + 0.42857143049753205 + ], + [ + 41, + 0.4285714301941427 + ], + [ + 42, + 0.4285714300939406 + ], + [ + 43, + 0.42857143028042766 + ], + [ + 44, + 0.4285714301551752 + ], + [ + 45, + 0.42857143040846357 + ], + [ + 46, + 0.4285714303834131 + ], + [ + 47, + 0.4285714301134243 + ], + [ + 48, + 0.4285714303527958 + ], + [ + 49, + 0.4285714300661067 + ], + [ + 50, + 0.42857143011620774 + ], + [ + 51, + 0.42857142971539974 + ], + [ + 52, + 0.4285714303444456 + ], + [ + 53, + 0.4285714303806297 + ], + [ + 54, + 0.4285714301718755 + ], + [ + 55, + 0.42857143038341305 + ], + [ + 56, + 0.4285714301356915 + ], + [ + 57, + 0.4285714298267353 + ], + [ + 58, + 0.4285714297376668 + ], + [ + 59, + 0.42857143010507415 + ], + [ + 60, + 0.42857142979890134 + ], + [ + 61, + 0.42857143019135924 + ], + [ + 62, + 0.4285714303527958 + ], + [ + 63, + 0.4285714306116509 + ], + [ + 64, + 0.4285714299213705 + ], + [ + 65, + 0.4285714300271393 + ], + [ + 66, + 0.4285714297877678 + ], + [ + 67, + 0.4285714299018868 + ], + [ + 68, + 0.4285714305003154 + ], + [ + 69, + 0.42857143031104494 + ], + [ + 70, + 0.42857143048361507 + ], + [ + 71, + 0.4285714304168138 + ], + [ + 72, + 0.4285714305003154 + ], + [ + 73, + 0.4285714305420662 + ], + [ + 74, + 0.42857143048361507 + ], + [ + 75, + 0.4285714299798216 + ], + [ + 76, + 0.42857142976271734 + ], + [ + 77, + 0.42857143021919314 + ], + [ + 78, + 0.42857142989631997 + ], + [ + 79, + 0.4285714304195971 + ], + [ + 80, + 0.4285714301663087 + ], + [ + 81, + 0.42857143029434464 + ], + [ + 82, + 0.42857143078143767 + ], + [ + 83, + 0.4285714298601359 + ], + [ + 84, + 0.4285714302692941 + ], + [ + 85, + 0.42857143021640975 + ], + [ + 86, + 0.4285714303834131 + ], + [ + 87, + 0.42857143041959717 + ], + [ + 88, + 0.4285714300911572 + ], + [ + 89, + 0.42857143014404164 + ], + [ + 90, + 0.4285714297655008 + ], + [ + 91, + 0.42857143032774525 + ], + [ + 92, + 0.42857143011620774 + ], + [ + 93, + 0.4285714306255679 + ], + [ + 94, + 0.42857143082318855 + ], + [ + 95, + 0.42857143026372735 + ], + [ + 96, + 0.4285714307842211 + ], + [ + 97, + 0.4285714300271393 + ], + [ + 98, + 0.4285714301496084 + ], + [ + 99, + 0.42857143009394066 + ], + [ + 100, + 0.428571430160742 + ] + ] + } +} \ No newline at end of file diff --git a/results/boundary_ablation_deltaL_wr/ablation_a1.0_L4_s42.json b/results/boundary_ablation_deltaL_wr/ablation_a1.0_L4_s42.json new file mode 100644 index 0000000..437dca7 --- /dev/null +++ b/results/boundary_ablation_deltaL_wr/ablation_a1.0_L4_s42.json @@ -0,0 +1,90 @@ +{ + "s_deltaL_tgw1.0_wr0.0": { + "test_acc": 0.29, + "mean_bp_cosine": 0.5333309099078178, + "mean_rho": 0.5133568346500397, + "mean_nudge": -0.06044131517410278, + "bp_cosine_per_layer": [ + 0.2888738811016083, + 0.5792224407196045, + 0.602611780166626, + 0.6626155376434326 + ], + "rho_per_layer": [ + 0.2811542749404907, + 0.5901442170143127, + 0.6039299368858337, + 0.5781989097595215 + ], + "final_value_loss": 0.9101862869262696, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.0 + }, + "s_deltaL_tgw1.0_wr0.05": { + "test_acc": 0.389, + "mean_bp_cosine": 0.7679609805345535, + "mean_rho": 0.6908697336912155, + "mean_nudge": -0.0764562301337719, + "bp_cosine_per_layer": [ + 0.6061833500862122, + 0.8235390186309814, + 0.8219610452651978, + 0.8201605081558228 + ], + "rho_per_layer": [ + 0.6085672974586487, + 0.739956259727478, + 0.7246303558349609, + 0.6903250217437744 + ], + "final_value_loss": 0.7349927394866943, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.05 + }, + "s_deltaL_tgw1.0_wr0.2": { + "test_acc": 0.442, + "mean_bp_cosine": 0.5583586767315865, + "mean_rho": 0.49782785028219223, + "mean_nudge": -0.051266513764858246, + "bp_cosine_per_layer": [ + 0.2746746242046356, + 0.6255925893783569, + 0.6661019921302795, + 0.6670655012130737 + ], + "rho_per_layer": [ + 0.27920976281166077, + 0.5733566284179688, + 0.594862163066864, + 0.5438828468322754 + ], + "final_value_loss": 0.47215704221725463, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_deltaL_tgw1.0_wr0.5": { + "test_acc": 0.6635, + "mean_bp_cosine": 0.34044671431183815, + "mean_rho": 0.39984575659036636, + "mean_nudge": -0.037964228074997663, + "bp_cosine_per_layer": [ + 0.14777149260044098, + 0.3089486062526703, + 0.42195770144462585, + 0.4831090569496155 + ], + "rho_per_layer": [ + 0.15686997771263123, + 0.35711926221847534, + 0.5539429187774658, + 0.5314508676528931 + ], + "final_value_loss": 0.3006336982488632, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.5 + } +} \ No newline at end of file diff --git a/results/boundary_ablation_s123/ablation_a1.0_L4_s123.json b/results/boundary_ablation_s123/ablation_a1.0_L4_s123.json new file mode 100644 index 0000000..47a7fc4 --- /dev/null +++ b/results/boundary_ablation_s123/ablation_a1.0_L4_s123.json @@ -0,0 +1,46 @@ +{ + "s_eT_tgw1.0_wr0.2": { + "test_acc": 0.5135, + "mean_bp_cosine": 0.3966578356921673, + "mean_rho": 0.46284765750169754, + "mean_nudge": -0.03856433369219303, + "bp_cosine_per_layer": [ + 0.1582626849412918, + 0.46924665570259094, + 0.4738205075263977, + 0.48530149459838867 + ], + "rho_per_layer": [ + 0.20893594622612, + 0.5339754819869995, + 0.5519976019859314, + 0.5564815998077393 + ], + "final_value_loss": 0.588364347743988, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_deltaL_tgw1.0_wr0.2": { + "test_acc": 0.422, + "mean_bp_cosine": 0.556720569729805, + "mean_rho": 0.5030678957700729, + "mean_nudge": -0.055364650674164295, + "bp_cosine_per_layer": [ + 0.25414949655532837, + 0.6241912841796875, + 0.6748597621917725, + 0.6736817359924316 + ], + "rho_per_layer": [ + 0.2788790464401245, + 0.5604095458984375, + 0.5989287495613098, + 0.5740542411804199 + ], + "final_value_loss": 0.6335030339241028, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + } +} \ No newline at end of file diff --git a/results/boundary_ablation_s456/ablation_a1.0_L4_s456.json b/results/boundary_ablation_s456/ablation_a1.0_L4_s456.json new file mode 100644 index 0000000..29afee7 --- /dev/null +++ b/results/boundary_ablation_s456/ablation_a1.0_L4_s456.json @@ -0,0 +1,46 @@ +{ + "s_eT_tgw1.0_wr0.2": { + "test_acc": 0.4935, + "mean_bp_cosine": 0.49867621809244156, + "mean_rho": 0.5327592641115189, + "mean_nudge": -0.04268983006477356, + "bp_cosine_per_layer": [ + 0.21021124720573425, + 0.5842739939689636, + 0.5913121700286865, + 0.6089074611663818 + ], + "rho_per_layer": [ + 0.24787980318069458, + 0.6222057342529297, + 0.6273762583732605, + 0.6335752606391907 + ], + "final_value_loss": 0.4651986366271973, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_deltaL_tgw1.0_wr0.2": { + "test_acc": 0.4805, + "mean_bp_cosine": 0.572130560874939, + "mean_rho": 0.5290974006056786, + "mean_nudge": -0.05305152013897896, + "bp_cosine_per_layer": [ + 0.3073272705078125, + 0.6108690500259399, + 0.6810163259506226, + 0.6893095970153809 + ], + "rho_per_layer": [ + 0.33536288142204285, + 0.6113735437393188, + 0.6066526174545288, + 0.5630005598068237 + ], + "final_value_loss": 0.48287113523483277, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + } +} \ No newline at end of file diff --git a/results/boundary_ablation_s_sweep/ablation_a1.0_L4_s42.json b/results/boundary_ablation_s_sweep/ablation_a1.0_L4_s42.json new file mode 100644 index 0000000..62bca79 --- /dev/null +++ b/results/boundary_ablation_s_sweep/ablation_a1.0_L4_s42.json @@ -0,0 +1,90 @@ +{ + "s_eT_tgw1.0_wr0.2": { + "test_acc": 0.5605, + "mean_bp_cosine": 0.46006373316049576, + "mean_rho": 0.5312944203615189, + "mean_nudge": -0.03811332583427429, + "bp_cosine_per_layer": [ + 0.18216726183891296, + 0.5338927507400513, + 0.5597370862960815, + 0.5644578337669373 + ], + "rho_per_layer": [ + 0.2443590760231018, + 0.5769795775413513, + 0.6636242270469666, + 0.6402148008346558 + ], + "final_value_loss": 0.39113953742980956, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_deltaL_tgw1.0_wr0.2": { + "test_acc": 0.442, + "mean_bp_cosine": 0.5583586767315865, + "mean_rho": 0.49782785028219223, + "mean_nudge": -0.051266513764858246, + "bp_cosine_per_layer": [ + 0.2746746242046356, + 0.6255925893783569, + 0.6661019921302795, + 0.6670655012130737 + ], + "rho_per_layer": [ + 0.27920976281166077, + 0.5733566284179688, + 0.594862163066864, + 0.5438828468322754 + ], + "final_value_loss": 0.47215704221725463, + "s_type": "deltaL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_eT_hL_tgw1.0_wr0.2": { + "test_acc": 0.559, + "mean_bp_cosine": 0.0016190913447644562, + "mean_rho": 0.016410242416895926, + "mean_nudge": -0.00021975510026095435, + "bp_cosine_per_layer": [ + -0.004644347354769707, + 0.0010294992243871093, + -0.0010337075218558311, + 0.011124921031296253 + ], + "rho_per_layer": [ + 0.046507176011800766, + 0.007014757487922907, + -0.006595376878976822, + 0.018714413046836853 + ], + "final_value_loss": 0.8668150995254517, + "s_type": "eT_hL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_deltaL_hL_tgw1.0_wr0.2": { + "test_acc": 0.5635, + "mean_bp_cosine": 0.018434561206959188, + "mean_rho": 0.026365829166024923, + "mean_nudge": -0.0017427445782232098, + "bp_cosine_per_layer": [ + 0.013983936980366707, + 0.02003202959895134, + 0.00282791955396533, + 0.036894358694553375 + ], + "rho_per_layer": [ + -0.006572568789124489, + 0.049806319177150726, + 0.020004384219646454, + 0.042225182056427 + ], + "final_value_loss": 0.7973948855400086, + "s_type": "deltaL_hL", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + } +} \ No newline at end of file diff --git a/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json b/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json new file mode 100644 index 0000000..8a70394 --- /dev/null +++ b/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json @@ -0,0 +1,90 @@ +{ + "s_eT_tgw0.0_wr0.2": { + "test_acc": 0.532, + "mean_bp_cosine": 0.11989971622824669, + "mean_rho": 0.16079141944646835, + "mean_nudge": -0.010690351715311408, + "bp_cosine_per_layer": [ + 0.03718709945678711, + 0.1347142904996872, + 0.15199805796146393, + 0.15569941699504852 + ], + "rho_per_layer": [ + 0.08883650600910187, + 0.1502864807844162, + 0.20964613556861877, + 0.19439655542373657 + ], + "final_value_loss": 0.07598549057245255, + "s_type": "eT", + "term_grad_weight": 0.0, + "warmup_ratio": 0.2 + }, + "s_eT_tgw0.25_wr0.2": { + "test_acc": 0.558, + "mean_bp_cosine": 0.22698336280882359, + "mean_rho": 0.2679573856294155, + "mean_nudge": -0.0202574310824275, + "bp_cosine_per_layer": [ + 0.09379873424768448, + 0.2528688311576843, + 0.2722504138946533, + 0.2890154719352722 + ], + "rho_per_layer": [ + 0.13511960208415985, + 0.289243221282959, + 0.33815300464630127, + 0.30931371450424194 + ], + "final_value_loss": 0.16253001551628113, + "s_type": "eT", + "term_grad_weight": 0.25, + "warmup_ratio": 0.2 + }, + "s_eT_tgw1.0_wr0.2": { + "test_acc": 0.558, + "mean_bp_cosine": 0.45794273912906647, + "mean_rho": 0.5322257168591022, + "mean_nudge": -0.038075629621744156, + "bp_cosine_per_layer": [ + 0.17809242010116577, + 0.5349531173706055, + 0.5522423982620239, + 0.5664830207824707 + ], + "rho_per_layer": [ + 0.22843755781650543, + 0.5910820364952087, + 0.6707864999771118, + 0.638596773147583 + ], + "final_value_loss": 0.38718592133522034, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_eT_tgw4.0_wr0.2": { + "test_acc": 0.3935, + "mean_bp_cosine": 0.5738203078508377, + "mean_rho": 0.5946865696460009, + "mean_nudge": -0.04504407802596688, + "bp_cosine_per_layer": [ + 0.07111608982086182, + 0.6408071517944336, + 0.787927508354187, + 0.7954304814338684 + ], + "rho_per_layer": [ + 0.10197217017412186, + 0.6885993480682373, + 0.7956527471542358, + 0.7925220131874084 + ], + "final_value_loss": 1.2652584648132323, + "s_type": "eT", + "term_grad_weight": 4.0, + "warmup_ratio": 0.2 + } +} \ No newline at end of file diff --git a/results/boundary_ablation_wr_sweep/ablation_a1.0_L4_s42.json b/results/boundary_ablation_wr_sweep/ablation_a1.0_L4_s42.json new file mode 100644 index 0000000..e03c56d --- /dev/null +++ b/results/boundary_ablation_wr_sweep/ablation_a1.0_L4_s42.json @@ -0,0 +1,90 @@ +{ + "s_eT_tgw1.0_wr0.0": { + "test_acc": 0.4585, + "mean_bp_cosine": 0.6755405366420746, + "mean_rho": 0.6671112030744553, + "mean_nudge": -0.05872981250286102, + "bp_cosine_per_layer": [ + 0.4783632755279541, + 0.7401086091995239, + 0.7420414686203003, + 0.74164879322052 + ], + "rho_per_layer": [ + 0.49320322275161743, + 0.7312472462654114, + 0.7255045771598816, + 0.7184897661209106 + ], + "final_value_loss": 0.544479172039032, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.0 + }, + "s_eT_tgw1.0_wr0.05": { + "test_acc": 0.4495, + "mean_bp_cosine": 0.45614035055041313, + "mean_rho": 0.5053879581391811, + "mean_nudge": -0.04452316835522652, + "bp_cosine_per_layer": [ + 0.12354414165019989, + 0.5106832385063171, + 0.5928497314453125, + 0.597484290599823 + ], + "rho_per_layer": [ + 0.16242454946041107, + 0.5767663717269897, + 0.6462773084640503, + 0.6360836029052734 + ], + "final_value_loss": 0.6794619485855102, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.05 + }, + "s_eT_tgw1.0_wr0.2": { + "test_acc": 0.558, + "mean_bp_cosine": 0.45794273912906647, + "mean_rho": 0.5322257168591022, + "mean_nudge": -0.038075629621744156, + "bp_cosine_per_layer": [ + 0.17809242010116577, + 0.5349531173706055, + 0.5522423982620239, + 0.5664830207824707 + ], + "rho_per_layer": [ + 0.22843755781650543, + 0.5910820364952087, + 0.6707864999771118, + 0.638596773147583 + ], + "final_value_loss": 0.38718592133522034, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.2 + }, + "s_eT_tgw1.0_wr0.5": { + "test_acc": 0.663, + "mean_bp_cosine": 0.2331971675157547, + "mean_rho": 0.3403939865529537, + "mean_nudge": -0.029925621580332518, + "bp_cosine_per_layer": [ + 0.11287420988082886, + 0.2289769947528839, + 0.2839260697364807, + 0.3070113956928253 + ], + "rho_per_layer": [ + 0.1355699747800827, + 0.3721342980861664, + 0.43592938780784607, + 0.4179422855377197 + ], + "final_value_loss": 0.3164243281364441, + "s_type": "eT", + "term_grad_weight": 1.0, + "warmup_ratio": 0.5 + } +} \ No newline at end of file diff --git a/results/bp_with_penalty_run.log b/results/bp_with_penalty_run.log new file mode 100644 index 0000000..62fe4cb --- /dev/null +++ b/results/bp_with_penalty_run.log @@ -0,0 +1,18 @@ +BP + ‖f‖² penalty: seed=42, lam=0.01, epochs=30 + ep 1: test_acc=0.3621 + ep 5: test_acc=0.4054 + ep 10: test_acc=0.4527 + ep 15: test_acc=0.4872 + ep 20: test_acc=0.5082 + ep 25: test_acc=0.5285 + ep 30: test_acc=0.5303 + +FINAL test acc: 0.5303 +Compare to: + BP-trainable (3-seed mean): 0.609 + Penalized DFA lam=1e-2: 0.363 + DFA-shallow: 0.349 + +Margin vs DFA-shallow baseline: +18.13 pp + → BP+penalty intermediate; partial capacity loss + residual mode 2 +Saved results/bp_with_penalty/bp_pen_lam0.01_s42.json diff --git a/results/checkpointed_handoff/handoff_s42.json b/results/checkpointed_handoff/handoff_s42.json new file mode 100644 index 0000000..3c587e1 --- /dev/null +++ b/results/checkpointed_handoff/handoff_s42.json @@ -0,0 +1,5828 @@ +{ + "t0=1_continue_DFA": { + "t0": 1, + "branch": "continue_DFA", + "credit_mode": "dfa", + "vec_gamma_frozen": 0.09656917676329613, + "vec_rho_frozen": 0.05863579269498587, + "test_acc": [ + 0.2992, + 0.2975, + 0.3174, + 0.3063, + 0.3024, + 0.3003, + 0.3026, + 0.3126, + 0.3016, + 0.3099, + 0.3091, + 0.3011, + 0.3036, + 0.3023, + 0.3082, + 0.2997, + 0.306, + 0.3101, + 0.3107, + 0.3066, + 0.3077, + 0.3185, + 0.3073, + 0.3143, + 0.3011, + 0.2963, + 0.2984, + 0.3025, + 0.312, + 0.3114, + 0.2975, + 0.3027, + 0.3081, + 0.3163, + 0.3096, + 0.3068, + 0.3043, + 0.2993, + 0.3082, + 0.3177, + 0.2952, + 0.3185, + 0.3019, + 0.3166, + 0.3051, + 0.3034, + 0.3135, + 0.3163, + 0.3113, + 0.2949, + 0.306, + 0.3028, + 0.3149, + 0.2981, + 0.3037, + 0.298, + 0.3058, + 0.3096, + 0.305, + 0.3109, + 0.3116, + 0.3077, + 0.308, + 0.2948, + 0.3006, + 0.3, + 0.3113, + 0.3102, + 0.3116, + 0.3198, + 0.3093, + 0.3127, + 0.3114, + 0.3148, + 0.3084, + 0.3079, + 0.309, + 0.312, + 0.3092, + 0.3124, + 0.3127, + 0.3081, + 0.3107, + 0.3129, + 0.3113, + 0.3072, + 0.3129, + 0.3104, + 0.3105, + 0.3127, + 0.3101, + 0.3096, + 0.3097, + 0.3096, + 0.3098, + 0.3105, + 0.3102, + 0.3099, + 0.3099 + ], + "train_loss": [ + 2.005104094390869, + 1.999245828552246, + 1.990717918434143, + 1.9948186715316774, + 1.9878637986755372, + 1.9893593432998657, + 1.9875701547241211, + 1.9883377310943604, + 1.9889778761291503, + 1.9904992935180663, + 1.988277052154541, + 1.9882306117248536, + 1.9872782027816773, + 1.985600216217041, + 1.9860772969818115, + 1.9898460612487794, + 1.9905180142211913, + 1.9860824179077148, + 1.9880974890518188, + 1.9891550038146972, + 1.9879916094970702, + 1.9876963312149047, + 1.9865646858215331, + 1.9875610054779054, + 1.9867460869979858, + 1.9865504845428468, + 1.9887695896148683, + 1.985237215309143, + 1.983262216796875, + 1.9856646533966065, + 1.98726192527771, + 1.986215076828003, + 1.9864962064361573, + 1.9879007104492188, + 1.9856411930084228, + 1.9844791618347168, + 1.985663981590271, + 1.9866812015533448, + 1.9882104327011108, + 1.986241177368164, + 1.987839227027893, + 1.9884029525756837, + 1.9851063582992554, + 1.9873973809814454, + 1.9883398697662353, + 1.9882926291656493, + 1.9878544625854493, + 1.9876278662872315, + 1.986814312057495, + 1.9875123343658447, + 1.9894303966903686, + 1.9896298727416992, + 1.9864508179473876, + 1.9891698278045655, + 1.9884083446502685, + 1.9887369794464111, + 1.9869199591827393, + 1.9856764691543578, + 1.988462228012085, + 1.988183416519165, + 1.986203140182495, + 1.985873547821045, + 1.9887823755645753, + 1.9903624279785157, + 1.9878888959121703, + 1.9861296884918214, + 1.9867054331970215, + 1.9861590448760986, + 1.987158843231201, + 1.9881789891815185, + 1.9856666998672485, + 1.9864538384246826, + 1.9857932313537598, + 1.9855015665435791, + 1.9882590783691407, + 1.985731133995056, + 1.9852981592178345, + 1.9857705572128297, + 1.985713699913025, + 1.985548313446045, + 1.986746173248291, + 1.986178836288452, + 1.9855894580459594, + 1.987165645980835, + 1.984333198928833, + 1.9847857676696776, + 1.9848962052154542, + 1.985673169631958, + 1.9849330069732667, + 1.9860302136611938, + 1.9846637627410888, + 1.9842699263763428, + 1.9867480223083496, + 1.9843860877990722, + 1.9850193544006347, + 1.9854852320098877, + 1.986603337097168, + 1.98447160446167, + 1.9859222885131835 + ], + "gamma": [ + [ + 2, + 0.08365460828645155 + ], + [ + 3, + 0.0838756044395268 + ], + [ + 4, + 0.08642448589671403 + ], + [ + 5, + 0.08631917362799868 + ], + [ + 6, + 0.08794902882073075 + ], + [ + 10, + 0.08498848279123195 + ], + [ + 15, + 0.08810723858186975 + ], + [ + 20, + 0.08898510690778494 + ], + [ + 25, + 0.09006544196745381 + ], + [ + 30, + 0.09117551462259144 + ], + [ + 35, + 0.09306339762406424 + ], + [ + 40, + 0.09325595473637804 + ], + [ + 45, + 0.09583467012271285 + ], + [ + 50, + 0.09658780478639528 + ], + [ + 55, + 0.09793511401221622 + ], + [ + 60, + 0.0987178310751915 + ], + [ + 65, + 0.09876266792707611 + ], + [ + 70, + 0.09971006825799122 + ], + [ + 75, + 0.09984865269507281 + ], + [ + 80, + 0.09999703618814237 + ], + [ + 85, + 0.10003893816610798 + ], + [ + 90, + 0.10005248506786302 + ], + [ + 95, + 0.10013895700103603 + ], + [ + 100, + 0.10013917449396104 + ] + ], + "rho": [ + [ + 2, + 0.023623208981007338 + ], + [ + 3, + 0.031059461180120707 + ], + [ + 4, + 0.007820640923455358 + ], + [ + 5, + 0.007515952922403812 + ], + [ + 6, + 0.026527911657467484 + ], + [ + 10, + 0.012991047464311123 + ], + [ + 15, + -0.005115614854730666 + ], + [ + 20, + 0.009924503974616528 + ], + [ + 25, + -0.0037195844342932105 + ], + [ + 30, + 0.006601060973480344 + ], + [ + 35, + 0.0018748474540188909 + ], + [ + 40, + -0.00871655740775168 + ], + [ + 45, + 0.00834443885833025 + ], + [ + 50, + -0.002292913617566228 + ], + [ + 55, + 0.0025207558646798134 + ], + [ + 60, + 0.002179012168198824 + ], + [ + 65, + 0.0020641330629587173 + ], + [ + 70, + 0.005590236629359424 + ], + [ + 75, + 0.016159044578671455 + ], + [ + 80, + -0.013107148231938481 + ], + [ + 85, + 0.009786740876734257 + ], + [ + 90, + -0.0008740962948650122 + ], + [ + 95, + 0.000459164846688509 + ], + [ + 100, + 0.003254909534007311 + ] + ] + }, + "t0=1_handoff_to_Vec": { + "t0": 1, + "branch": "handoff_to_Vec", + "credit_mode": "vec", + "vec_gamma_frozen": 0.09656917676329613, + "vec_rho_frozen": 0.05863579269498587, + "test_acc": [ + 0.2955, + 0.2782, + 0.2784, + 0.284, + 0.2814, + 0.2775, + 0.2776, + 0.2642, + 0.2763, + 0.2874, + 0.2822, + 0.2847, + 0.2816, + 0.2739, + 0.2718, + 0.2833, + 0.2914, + 0.2842, + 0.2728, + 0.2859, + 0.2878, + 0.2853, + 0.2797, + 0.2865, + 0.2736, + 0.2932, + 0.2818, + 0.2931, + 0.2861, + 0.2999, + 0.2925, + 0.2911, + 0.2873, + 0.296, + 0.2953, + 0.2985, + 0.2992, + 0.2898, + 0.2864, + 0.2994, + 0.2975, + 0.2969, + 0.2929, + 0.2861, + 0.2932, + 0.3, + 0.2995, + 0.3002, + 0.2885, + 0.2882, + 0.2825, + 0.2756, + 0.2816, + 0.2808, + 0.2696, + 0.2753, + 0.2645, + 0.2737, + 0.2722, + 0.2798, + 0.2799, + 0.2829, + 0.2821, + 0.2815, + 0.2843, + 0.2844, + 0.2836, + 0.2905, + 0.2833, + 0.2843, + 0.2853, + 0.2869, + 0.2936, + 0.2873, + 0.2871, + 0.2893, + 0.2881, + 0.2892, + 0.288, + 0.2878, + 0.2831, + 0.2881, + 0.2877, + 0.2879, + 0.2889, + 0.2877, + 0.2881, + 0.2875, + 0.2885, + 0.2885, + 0.2899, + 0.2876, + 0.2878, + 0.2878, + 0.2878, + 0.2878, + 0.2877, + 0.2879, + 0.2879 + ], + "train_loss": [ + 2.015945917510986, + 2.031215166893005, + 2.0368634999084474, + 2.0477696321105956, + 2.054421726951599, + 2.0483808721923826, + 2.05320213470459, + 2.0556341265869142, + 2.058164549179077, + 2.0555249584197997, + 2.0498539701080323, + 2.048066238670349, + 2.053440905456543, + 2.0512889804840087, + 2.054679793930054, + 2.0598641773986817, + 2.057493388595581, + 2.0601788735198974, + 2.056555284423828, + 2.051032764129639, + 2.0525693659210207, + 2.0453330043029787, + 2.0461127487945556, + 2.047214804916382, + 2.0442636833953856, + 2.045948752670288, + 2.0369925126647948, + 2.0333812905502318, + 2.033120552749634, + 2.031175687828064, + 2.0306918560409546, + 2.026498753967285, + 2.0220600573348997, + 2.023093720741272, + 2.0173547603607176, + 2.015150221710205, + 2.0117789109039306, + 2.0088074950408936, + 2.0061517330932617, + 2.009935451011658, + 2.006004488182068, + 2.004825442237854, + 2.0023602933502196, + 2.000458836746216, + 2.004193814163208, + 2.0054830549621583, + 2.002757899093628, + 2.0051502709960936, + 2.0092752606964113, + 2.019751435394287, + 2.025835816116333, + 2.039621664581299, + 2.0485558793640135, + 2.0460470599365235, + 2.0490744052886964, + 2.046350567779541, + 2.048276037979126, + 2.0485092347717284, + 2.0470163821792604, + 2.0446103648376464, + 2.044947638206482, + 2.04646453125, + 2.04499529045105, + 2.0435341911315916, + 2.043754483680725, + 2.0412174251937865, + 2.0414371580505373, + 2.039103049697876, + 2.0424850984954834, + 2.037294840545654, + 2.038373082923889, + 2.040944115943909, + 2.039581598815918, + 2.0386644300842285, + 2.0361406172943117, + 2.0376198292541505, + 2.036687510910034, + 2.038670269317627, + 2.035312682189941, + 2.034039740829468, + 2.036844966278076, + 2.0356181509399414, + 2.0358072791290285, + 2.036061419219971, + 2.0355172812652587, + 2.0355146361541747, + 2.035239947242737, + 2.0346506198883056, + 2.0338744622802736, + 2.035136474304199, + 2.0350362033843994, + 2.036776700363159, + 2.03147145111084, + 2.0319668660736085, + 2.0320254293823243, + 2.033486301231384, + 2.0317889405059812, + 2.0344483298492433, + 2.036302082977295 + ], + "gamma": [ + [ + 2, + 0.08047902956604958 + ], + [ + 3, + 0.07857133075594902 + ], + [ + 4, + 0.07546431943774223 + ], + [ + 5, + 0.08395727723836899 + ], + [ + 6, + 0.05610836483538151 + ], + [ + 10, + 0.04730626195669174 + ], + [ + 15, + 0.025737784802913666 + ], + [ + 20, + 0.0345981465652585 + ], + [ + 25, + 0.045754930935800076 + ], + [ + 30, + 0.04951832536607981 + ], + [ + 35, + 0.026294309180229902 + ], + [ + 40, + 0.0595368966460228 + ], + [ + 45, + 0.046594537794589996 + ], + [ + 50, + 0.033051918260753155 + ], + [ + 55, + 0.02544371667318046 + ], + [ + 60, + 0.020283427322283387 + ], + [ + 65, + 0.012271790998056531 + ], + [ + 70, + 0.013303825166076422 + ], + [ + 75, + 0.01240244135260582 + ], + [ + 80, + 0.019197688903659582 + ], + [ + 85, + 0.025835730601102114 + ], + [ + 90, + 0.014533155597746372 + ], + [ + 95, + 0.010510357329621911 + ], + [ + 100, + 0.03327144589275122 + ] + ], + "rho": [ + [ + 2, + 0.0523966820910573 + ], + [ + 3, + 0.035237337462604046 + ], + [ + 4, + 0.02739660767838359 + ], + [ + 5, + 0.02595712710171938 + ], + [ + 6, + 0.01324984265374951 + ], + [ + 10, + 0.0034468388184905052 + ], + [ + 15, + 0.02876631636172533 + ], + [ + 20, + 0.014511071029119194 + ], + [ + 25, + 0.018587190308608115 + ], + [ + 30, + 0.017810289282351732 + ], + [ + 35, + -0.00010454491712152958 + ], + [ + 40, + 0.03750455845147371 + ], + [ + 45, + 0.0221580620855093 + ], + [ + 50, + 0.016393208876252174 + ], + [ + 55, + 0.024259520694613457 + ], + [ + 60, + 0.0006769530009478331 + ], + [ + 65, + 0.004339074715971947 + ], + [ + 70, + -0.014295346569269896 + ], + [ + 75, + 0.006795731722377241 + ], + [ + 80, + 0.004815738648176193 + ], + [ + 85, + 0.01747259055264294 + ], + [ + 90, + 0.008213724358938634 + ], + [ + 95, + 0.0064226004760712385 + ], + [ + 100, + -0.011937383911572397 + ] + ] + }, + "t0=1_handoff_blend_025": { + "t0": 1, + "branch": "handoff_blend_025", + "credit_mode": "0.25", + "vec_gamma_frozen": 0.09656917676329613, + "vec_rho_frozen": 0.05863579269498587, + "test_acc": [ + 0.3111, + 0.3053, + 0.3102, + 0.296, + 0.2996, + 0.3021, + 0.3028, + 0.3078, + 0.3244, + 0.3001, + 0.3014, + 0.3089, + 0.3036, + 0.3074, + 0.2926, + 0.3058, + 0.2992, + 0.3037, + 0.313, + 0.3021, + 0.3029, + 0.3, + 0.2896, + 0.3085, + 0.3151, + 0.3089, + 0.2984, + 0.3209, + 0.2974, + 0.3025, + 0.3092, + 0.2992, + 0.2943, + 0.3076, + 0.308, + 0.2943, + 0.3121, + 0.3064, + 0.3032, + 0.3053, + 0.3022, + 0.3028, + 0.3145, + 0.2974, + 0.2874, + 0.3106, + 0.314, + 0.2995, + 0.3134, + 0.3098, + 0.314, + 0.3063, + 0.2977, + 0.3034, + 0.2948, + 0.3037, + 0.3012, + 0.3031, + 0.305, + 0.3157, + 0.3155, + 0.3111, + 0.3079, + 0.3132, + 0.3093, + 0.3094, + 0.3016, + 0.3061, + 0.3103, + 0.3033, + 0.3069, + 0.3034, + 0.3061, + 0.3106, + 0.3118, + 0.3016, + 0.3042, + 0.3055, + 0.3076, + 0.303, + 0.3139, + 0.3142, + 0.3073, + 0.3095, + 0.3104, + 0.307, + 0.3113, + 0.3082, + 0.3082, + 0.3114, + 0.3088, + 0.3082, + 0.3105, + 0.3084, + 0.3088, + 0.3085, + 0.3087, + 0.3085, + 0.3086 + ], + "train_loss": [ + 2.0022245991516114, + 1.9935898416900635, + 1.9875775625610352, + 1.9858978401184082, + 1.9874549602508544, + 1.986268791809082, + 1.98443969581604, + 1.9838888143920899, + 1.983516501235962, + 1.984957610244751, + 1.9847360565948486, + 1.9854843878936768, + 1.9889900983428954, + 1.9892487187957764, + 1.986811499862671, + 1.9856256427764893, + 1.9893547413635253, + 1.9828974528503418, + 1.986581955718994, + 1.9878245291137695, + 1.9864517379760742, + 1.9873112936019897, + 1.9876939282226562, + 1.9883113063049316, + 1.9865273703384398, + 1.9862786171722413, + 1.9892862311553956, + 1.9884720623397827, + 1.9870043449401855, + 1.9874348849487304, + 1.990588033065796, + 1.9881115494155883, + 1.9887018839263917, + 1.9879537491226196, + 1.9903549543762207, + 1.9885931634521485, + 1.9875886775207519, + 1.9906563118743896, + 1.9887426946258544, + 1.9884200235366822, + 1.9906145004272462, + 1.9910429104232787, + 1.9885761791229248, + 1.9890102088928223, + 1.9905473038482666, + 1.9892784567260742, + 1.989883409576416, + 1.9908014490127564, + 1.98919737739563, + 1.9889136992645264, + 1.9883604386138916, + 1.9884866456604005, + 1.9879132501602172, + 1.9889593492126465, + 1.9869321535873412, + 1.9885730269622803, + 1.991215665359497, + 1.9891708112335205, + 1.9890033248519898, + 1.9874444742584227, + 1.9906505158996581, + 1.986556499633789, + 1.9876996881866456, + 1.9885468618011475, + 1.9893393377304076, + 1.9888792642974853, + 1.9877725827789308, + 1.9870013921356202, + 1.987901944580078, + 1.9878336889266968, + 1.9885768801498414, + 1.9894254553222657, + 1.9879446279144286, + 1.988163232269287, + 1.9871198620605468, + 1.9874201794433595, + 1.9874488901519776, + 1.9859690590667725, + 1.9852127573394776, + 1.988850376739502, + 1.9867211999511718, + 1.9882648557281495, + 1.9882584195709228, + 1.9879279172134399, + 1.9870988179779052, + 1.9880465350341796, + 1.9854906230163574, + 1.9872620104599, + 1.984942267112732, + 1.9865179452514647, + 1.9890154412841796, + 1.9864197870254516, + 1.9873270251464843, + 1.984911873626709, + 1.985314598083496, + 1.9849051734924317, + 1.9861649570465087, + 1.9855684439086914, + 1.9856900079345703 + ], + "gamma": [ + [ + 2, + 0.08755725051742047 + ], + [ + 3, + 0.08835660142358392 + ], + [ + 4, + 0.09044992318376899 + ], + [ + 5, + 0.0912612872198224 + ], + [ + 6, + 0.08909219017368741 + ], + [ + 10, + 0.09415691878530197 + ], + [ + 15, + 0.09399708660203032 + ], + [ + 20, + 0.09649969436577521 + ], + [ + 25, + 0.09672255971236154 + ], + [ + 30, + 0.09725288115441799 + ], + [ + 35, + 0.09698972932528704 + ], + [ + 40, + 0.09553188434801996 + ], + [ + 45, + 0.09639296727254987 + ], + [ + 50, + 0.09763344551902264 + ], + [ + 55, + 0.09868537378497422 + ], + [ + 60, + 0.0996450218372047 + ], + [ + 65, + 0.09987909882329404 + ], + [ + 70, + 0.10013037058524787 + ], + [ + 75, + 0.1004320508800447 + ], + [ + 80, + 0.1006945266854018 + ], + [ + 85, + 0.10076600266620517 + ], + [ + 90, + 0.1008826564066112 + ], + [ + 95, + 0.10086964559741318 + ], + [ + 100, + 0.10083653079345822 + ] + ], + "rho": [ + [ + 2, + 0.04362574522383511 + ], + [ + 3, + 0.018613046035170555 + ], + [ + 4, + 0.03438749210909009 + ], + [ + 5, + 0.012654631165787578 + ], + [ + 6, + 0.024472361663356423 + ], + [ + 10, + 0.023966667242348194 + ], + [ + 15, + 0.01459161564707756 + ], + [ + 20, + 0.007110691978596151 + ], + [ + 25, + -0.00921933469362557 + ], + [ + 30, + -0.0029747774824500084 + ], + [ + 35, + 0.0010375240817666054 + ], + [ + 40, + -0.02443948434665799 + ], + [ + 45, + 0.019922912120819092 + ], + [ + 50, + 0.00852518086321652 + ], + [ + 55, + 0.012839498929679394 + ], + [ + 60, + 0.014052851125597954 + ], + [ + 65, + 0.004162493161857128 + ], + [ + 70, + 0.009675031527876854 + ], + [ + 75, + -0.0009063638281077147 + ], + [ + 80, + -0.007764752488583326 + ], + [ + 85, + 0.007670489139854908 + ], + [ + 90, + 0.006271053454838693 + ], + [ + 95, + 0.0010284053860232234 + ], + [ + 100, + 0.011300223181024194 + ] + ] + }, + "t0=1_handoff_blend_05": { + "t0": 1, + "branch": "handoff_blend_05", + "credit_mode": "0.5", + "vec_gamma_frozen": 0.09656917676329613, + "vec_rho_frozen": 0.05863579269498587, + "test_acc": [ + 0.2998, + 0.2995, + 0.3061, + 0.3097, + 0.2982, + 0.3039, + 0.3034, + 0.3137, + 0.319, + 0.3051, + 0.3111, + 0.3024, + 0.3178, + 0.3052, + 0.3125, + 0.3095, + 0.2925, + 0.3163, + 0.3181, + 0.3107, + 0.3188, + 0.3122, + 0.3111, + 0.3192, + 0.315, + 0.3186, + 0.326, + 0.3084, + 0.3176, + 0.3248, + 0.3144, + 0.3108, + 0.3046, + 0.3055, + 0.3033, + 0.3203, + 0.2965, + 0.3188, + 0.3115, + 0.3089, + 0.3195, + 0.3079, + 0.3168, + 0.3177, + 0.3036, + 0.3127, + 0.323, + 0.3197, + 0.3194, + 0.3151, + 0.3139, + 0.3075, + 0.3064, + 0.3135, + 0.3102, + 0.3175, + 0.3182, + 0.3164, + 0.3158, + 0.3192, + 0.3119, + 0.3203, + 0.3215, + 0.3178, + 0.3146, + 0.3153, + 0.3114, + 0.3195, + 0.3221, + 0.3218, + 0.3173, + 0.318, + 0.3144, + 0.3176, + 0.3238, + 0.3123, + 0.3239, + 0.3117, + 0.3221, + 0.3174, + 0.3165, + 0.3134, + 0.3211, + 0.3096, + 0.3203, + 0.3141, + 0.3188, + 0.3172, + 0.3188, + 0.3194, + 0.3191, + 0.3183, + 0.3192, + 0.3184, + 0.3197, + 0.3192, + 0.3193, + 0.3194, + 0.3193 + ], + "train_loss": [ + 1.9964759397125245, + 1.986522459487915, + 1.9889211281585693, + 1.9849028786468506, + 1.9856864283752442, + 1.9870827670669555, + 1.9844132846069336, + 1.9864352696990968, + 1.9838863813781737, + 1.9818759115982056, + 1.9820441235351562, + 1.9810762729263305, + 1.9795643308258057, + 1.9780980207061767, + 1.977905396270752, + 1.978753300552368, + 1.9777276525115968, + 1.9766205754852295, + 1.9777377243423462, + 1.9798491777801515, + 1.9769015805053711, + 1.9804970788574219, + 1.9793168542480468, + 1.977575127105713, + 1.9770600776672362, + 1.9771426824188232, + 1.9763531399536134, + 1.977475728492737, + 1.9750000988388061, + 1.975525735168457, + 1.9758171199035643, + 1.974286738510132, + 1.9785872597503662, + 1.9767009394073487, + 1.9724377210998536, + 1.9768052847290039, + 1.975557327041626, + 1.9760462573242188, + 1.977154655532837, + 1.978235277862549, + 1.9766063391113282, + 1.9764202359771728, + 1.973938695526123, + 1.9763149166488647, + 1.976523175201416, + 1.978896485519409, + 1.9763345267486572, + 1.9742885404968262, + 1.9735685025787353, + 1.9737253631591798, + 1.9754708728027344, + 1.973962202835083, + 1.976864084815979, + 1.9740761524200439, + 1.9715926027679442, + 1.973404716873169, + 1.9737475647354126, + 1.9745283292388915, + 1.971100970916748, + 1.973395662765503, + 1.9691142282485963, + 1.9740757447052002, + 1.9709492151260375, + 1.9731487519073487, + 1.973130091934204, + 1.9727552867889404, + 1.9702830828475952, + 1.9701461628723145, + 1.9707595698547364, + 1.9722970157241821, + 1.9729449915313721, + 1.9734750841522217, + 1.9717456188201905, + 1.9711427689361571, + 1.9695089659881593, + 1.970119482688904, + 1.970220106048584, + 1.9718244704818726, + 1.9723210890197753, + 1.971758684692383, + 1.9695239351654052, + 1.9687840794372558, + 1.972842834701538, + 1.9699950525665284, + 1.970986016921997, + 1.9703039749908446, + 1.969877626953125, + 1.969045710144043, + 1.9671956343078614, + 1.9715656520080567, + 1.970316907119751, + 1.9676782611846924, + 1.969870410232544, + 1.9710947259521485, + 1.9689072478866576, + 1.968521340637207, + 1.970043116760254, + 1.9692224349975587, + 1.9709827098083497 + ], + "gamma": [ + [ + 2, + 0.026154235936701298 + ], + [ + 3, + 0.020070078317075968 + ], + [ + 4, + 0.01762574864551425 + ], + [ + 5, + 0.0008397532510571182 + ], + [ + 6, + 0.006103275518398732 + ], + [ + 10, + -0.003356293927936349 + ], + [ + 15, + 0.0013201967813074589 + ], + [ + 20, + 0.001530651847133413 + ], + [ + 25, + 0.005929780309088528 + ], + [ + 30, + 0.004774399858433753 + ], + [ + 35, + -0.006621059263125062 + ], + [ + 40, + 0.00380888202926144 + ], + [ + 45, + 0.0010936335020232946 + ], + [ + 50, + 0.004796426190296188 + ], + [ + 55, + 0.005293689668178558 + ], + [ + 60, + 0.005288513260893524 + ], + [ + 65, + 0.0058356927474960685 + ], + [ + 70, + -0.0037194571923464537 + ], + [ + 75, + -0.0013957229093648493 + ], + [ + 80, + -0.0023256471613422036 + ], + [ + 85, + 0.0007315699476748705 + ], + [ + 90, + 0.005473496858030558 + ], + [ + 95, + -0.001862971083028242 + ], + [ + 100, + -0.005210198578424752 + ] + ], + "rho": [ + [ + 2, + 0.02363818814046681 + ], + [ + 3, + -0.003841649042442441 + ], + [ + 4, + 0.0038465188117697835 + ], + [ + 5, + -0.007402543909847736 + ], + [ + 6, + -0.009222022956237197 + ], + [ + 10, + -0.006807031808421016 + ], + [ + 15, + 0.005405803909525275 + ], + [ + 20, + 0.00024111219681799412 + ], + [ + 25, + 0.007579304627142847 + ], + [ + 30, + -0.008540671231457964 + ], + [ + 35, + -0.015692403772845864 + ], + [ + 40, + 0.006019875523634255 + ], + [ + 45, + -0.017327272333204746 + ], + [ + 50, + 0.006294254271779209 + ], + [ + 55, + -0.006749727763235569 + ], + [ + 60, + -0.026353304274380207 + ], + [ + 65, + -0.005721054505556822 + ], + [ + 70, + 0.009690426988527179 + ], + [ + 75, + 0.019502819515764713 + ], + [ + 80, + 0.005438428255729377 + ], + [ + 85, + 0.0001830030232667923 + ], + [ + 90, + 0.006266675773076713 + ], + [ + 95, + 0.01847551402170211 + ], + [ + 100, + 0.0018311627209186554 + ] + ] + }, + "t0=1_handoff_blend_075": { + "t0": 1, + "branch": "handoff_blend_075", + "credit_mode": "0.75", + "vec_gamma_frozen": 0.09656917676329613, + "vec_rho_frozen": 0.05863579269498587, + "test_acc": [ + 0.2977, + 0.305, + 0.2969, + 0.3109, + 0.2979, + 0.2928, + 0.3066, + 0.3099, + 0.3142, + 0.3105, + 0.3106, + 0.3048, + 0.3076, + 0.3091, + 0.318, + 0.3129, + 0.3093, + 0.3041, + 0.3055, + 0.3115, + 0.3052, + 0.3136, + 0.3118, + 0.3102, + 0.3118, + 0.3081, + 0.307, + 0.2984, + 0.3087, + 0.313, + 0.3133, + 0.2993, + 0.317, + 0.3144, + 0.3119, + 0.3078, + 0.3066, + 0.3069, + 0.317, + 0.3064, + 0.3104, + 0.3167, + 0.3101, + 0.3134, + 0.3162, + 0.3087, + 0.3094, + 0.3043, + 0.3077, + 0.307, + 0.3117, + 0.3143, + 0.3099, + 0.315, + 0.3135, + 0.3124, + 0.3093, + 0.3053, + 0.3055, + 0.3158, + 0.3143, + 0.3098, + 0.3093, + 0.3148, + 0.3153, + 0.3127, + 0.3125, + 0.3131, + 0.3129, + 0.3091, + 0.3118, + 0.3116, + 0.3118, + 0.3139, + 0.3125, + 0.3124, + 0.3133, + 0.3156, + 0.3101, + 0.3147, + 0.3129, + 0.3151, + 0.3132, + 0.3134, + 0.3101, + 0.3127, + 0.3116, + 0.3141, + 0.3141, + 0.3144, + 0.3125, + 0.3128, + 0.3129, + 0.3139, + 0.3134, + 0.3131, + 0.313, + 0.3129, + 0.3129 + ], + "train_loss": [ + 2.002244232940674, + 1.9951775869750976, + 1.9918160665130615, + 1.9940172212982177, + 1.9916485752105713, + 1.9921171990966797, + 1.9883098573303222, + 1.9892685530853271, + 1.9849425873184203, + 1.9915643294906615, + 1.9951231976699828, + 1.992038464126587, + 1.9917635531997682, + 1.9923094696044923, + 1.9920373969268799, + 1.9935483200073243, + 1.9923310842132569, + 1.991506326599121, + 1.9918861209869385, + 1.9921872561645508, + 1.990366029281616, + 1.9843111011505128, + 1.9868859357452393, + 1.9840549843597413, + 1.9850743936538697, + 1.9839836559677124, + 1.9826338681030273, + 1.9822956439590453, + 1.9856928828430176, + 1.9857296188354492, + 1.9837195449829101, + 1.9857995317840575, + 1.9845319289398193, + 1.984692417640686, + 1.9811759020614623, + 1.9817139127349854, + 1.980710191307068, + 1.9814997412109374, + 1.9822780115509033, + 1.9804564181137085, + 1.977652523651123, + 1.9795805383300782, + 1.980954542617798, + 1.978486502380371, + 1.9791298051452637, + 1.9800936795043946, + 1.9805563346099853, + 1.9785936288452148, + 1.980796855392456, + 1.9780987171936035, + 1.9748391804504395, + 1.9757625882720948, + 1.976084370689392, + 1.9784486378479005, + 1.9737589139556886, + 1.9767526709747314, + 1.9767190921020508, + 1.9780089361953734, + 1.9759229090118409, + 1.9766665428924561, + 1.9769705713653565, + 1.978578275756836, + 1.9803025625228883, + 1.9753058197784423, + 1.9762325865936279, + 1.9765951169586182, + 1.97721080078125, + 1.9758360475158692, + 1.97510467918396, + 1.975154207611084, + 1.9767314224243164, + 1.9760272202301026, + 1.9717421292877197, + 1.974777950820923, + 1.9745227828598022, + 1.972256569480896, + 1.9772344808197022, + 1.9736685093688966, + 1.9746162140655517, + 1.9726906596374512, + 1.9713606758880615, + 1.974294290161133, + 1.972399390335083, + 1.972963998260498, + 1.97328719291687, + 1.9742246744537353, + 1.9722734257507324, + 1.9737086239242554, + 1.9756339550018311, + 1.9758233905792237, + 1.9724433166503905, + 1.9736129235839843, + 1.9720692176055907, + 1.9757880128479004, + 1.974402798538208, + 1.9715344583129883, + 1.9708433507537841, + 1.9731714196777344, + 1.9710566232299804 + ], + "gamma": [ + [ + 2, + 0.052353628911077976 + ], + [ + 3, + 0.034367543179541826 + ], + [ + 4, + 0.024552959483116865 + ], + [ + 5, + 0.02667293418198824 + ], + [ + 6, + 0.023417511023581028 + ], + [ + 10, + 0.0010976618505083025 + ], + [ + 15, + 0.000705889193341136 + ], + [ + 20, + 0.002806061034789309 + ], + [ + 25, + 0.004039550432935357 + ], + [ + 30, + -0.0011348283442202955 + ], + [ + 35, + 0.0009491801902186126 + ], + [ + 40, + 0.0009468548669246957 + ], + [ + 45, + 0.0053506477270275354 + ], + [ + 50, + 0.0007167482108343393 + ], + [ + 55, + 0.012037382461130619 + ], + [ + 60, + -0.0031005641794763505 + ], + [ + 65, + -0.006883909518364817 + ], + [ + 70, + 0.0009665123070590198 + ], + [ + 75, + -0.0019836243882309645 + ], + [ + 80, + 0.00025643024127930403 + ], + [ + 85, + 0.0018020248680841178 + ], + [ + 90, + 0.00039675203152000904 + ], + [ + 95, + 0.0029509408050216734 + ], + [ + 100, + 0.002882578322896734 + ] + ], + "rho": [ + [ + 2, + 0.015290866955183446 + ], + [ + 3, + -0.004411513218656182 + ], + [ + 4, + 0.010378057137131691 + ], + [ + 5, + 0.0035153937060385942 + ], + [ + 6, + 0.03270322363823652 + ], + [ + 10, + 0.013274953002110124 + ], + [ + 15, + 0.007313696900382638 + ], + [ + 20, + 0.0014700493775308132 + ], + [ + 25, + 0.02754763583652675 + ], + [ + 30, + -0.009145653806626797 + ], + [ + 35, + -0.02248904900625348 + ], + [ + 40, + 0.0035426513059064746 + ], + [ + 45, + -0.019286202965304255 + ], + [ + 50, + 0.001962615526281297 + ], + [ + 55, + -0.006869069766253233 + ], + [ + 60, + -0.002172804670408368 + ], + [ + 65, + -0.016067678690887988 + ], + [ + 70, + 0.009328338550403714 + ], + [ + 75, + 0.002936127595603466 + ], + [ + 80, + 0.007801508414559066 + ], + [ + 85, + -0.010142600862309337 + ], + [ + 90, + 0.022333773435093462 + ], + [ + 95, + 0.027533504646271467 + ], + [ + 100, + 0.007295530114788562 + ] + ] + }, + "t0=5_continue_DFA": { + "t0": 5, + "branch": "continue_DFA", + "credit_mode": "dfa", + "vec_gamma_frozen": -0.0011670500971376896, + "vec_rho_frozen": -0.0008091113995760679, + "test_acc": [ + 0.286, + 0.2864, + 0.3127, + 0.3129, + 0.303, + 0.31, + 0.3079, + 0.303, + 0.3037, + 0.2946, + 0.3018, + 0.3081, + 0.3082, + 0.3141, + 0.2962, + 0.3041, + 0.3069, + 0.3011, + 0.2941, + 0.3159, + 0.3023, + 0.3, + 0.3151, + 0.3031, + 0.3017, + 0.3004, + 0.3014, + 0.3056, + 0.31, + 0.2991, + 0.3019, + 0.3082, + 0.3095, + 0.3154, + 0.309, + 0.3099, + 0.3151, + 0.3132, + 0.31, + 0.3055, + 0.315, + 0.3119, + 0.3122, + 0.3081, + 0.2984, + 0.3005, + 0.2993, + 0.3104, + 0.3013, + 0.3184, + 0.3114, + 0.3148, + 0.3147, + 0.3212, + 0.3041, + 0.3067, + 0.3154, + 0.3153, + 0.3039, + 0.3071, + 0.3027, + 0.3065, + 0.306, + 0.3054, + 0.3101, + 0.3134, + 0.3153, + 0.3114, + 0.3126, + 0.3107, + 0.3098, + 0.3094, + 0.3175, + 0.3083, + 0.314, + 0.3086, + 0.3157, + 0.3117, + 0.3112, + 0.308, + 0.3121, + 0.3116, + 0.3105, + 0.3102, + 0.3116, + 0.3079, + 0.3116, + 0.3107, + 0.3101, + 0.3107, + 0.3102, + 0.3106, + 0.3102, + 0.3103, + 0.3103 + ], + "train_loss": [ + 1.9945657642364503, + 1.9892032089233398, + 1.989667843170166, + 1.9889540602111817, + 1.9877084450912477, + 1.9906675277328492, + 1.9864669036483764, + 1.9867150240325928, + 1.9877397603988647, + 1.9864815524291992, + 1.9863448078918458, + 1.9870365029144288, + 1.9845438903045654, + 1.986594946975708, + 1.9863773782348633, + 1.9880121642684936, + 1.9844076459503175, + 1.9840656581115723, + 1.985374744529724, + 1.9861069692993165, + 1.9889161559295654, + 1.9823769841766357, + 1.9831642793273925, + 1.9848684078216552, + 1.9829382559967041, + 1.9855777975463866, + 1.9854941162490845, + 1.9845333672714234, + 1.9839171437072753, + 1.9880839752197266, + 1.9847318223571777, + 1.984719175720215, + 1.9868058791732788, + 1.9847546783065797, + 1.9858031771087647, + 1.9850444971084595, + 1.9849619479370118, + 1.9860688787841796, + 1.9873581707000731, + 1.9846882070541383, + 1.9853530577850342, + 1.9865586192321778, + 1.9831706686782837, + 1.9880626383209228, + 1.98433695602417, + 1.9854192114257811, + 1.9873864656829834, + 1.9847075728607178, + 1.9848620285797118, + 1.9850804802703856, + 1.986241734085083, + 1.9842840629577636, + 1.9846623175811768, + 1.9837202432250975, + 1.9833905213165284, + 1.98507500831604, + 1.9852062008666993, + 1.9849481295013427, + 1.9852164017486573, + 1.9842260655212403, + 1.9830121032714845, + 1.9843900450897216, + 1.985827170753479, + 1.9848842519378662, + 1.9841410041809082, + 1.983917918395996, + 1.983969561920166, + 1.9836610689544678, + 1.9818206084823609, + 1.985752599143982, + 1.9869396998596192, + 1.9837494311523438, + 1.9854834408187867, + 1.9834301959991456, + 1.9836588149261474, + 1.9832239440536499, + 1.98726832157135, + 1.9839551043319703, + 1.9846663961410522, + 1.984481372642517, + 1.982844881439209, + 1.98507500125885, + 1.983243388671875, + 1.9826328707885743, + 1.9851836437988282, + 1.9820660934448242, + 1.9849612855529786, + 1.9845160094833374, + 1.9832502113342285, + 1.9836221703338623, + 1.9820610466003419, + 1.9824563201141356, + 1.9836898809814454, + 1.984211915359497, + 1.9812234192276001 + ], + "gamma": [ + [ + 6, + 0.08068505953997374 + ], + [ + 7, + 0.08144430501852185 + ], + [ + 8, + 0.08350347669329494 + ], + [ + 9, + 0.08311534579843283 + ], + [ + 10, + 0.08463118376675993 + ], + [ + 15, + 0.08571162971202284 + ], + [ + 20, + 0.08807254146086052 + ], + [ + 25, + 0.08991092321230099 + ], + [ + 30, + 0.0921339783235453 + ], + [ + 35, + 0.09160169487586245 + ], + [ + 40, + 0.09465893157175742 + ], + [ + 45, + 0.096345643280074 + ], + [ + 50, + 0.0977244143577991 + ], + [ + 55, + 0.09827914473135024 + ], + [ + 60, + 0.0987607302959077 + ], + [ + 65, + 0.09956814988981932 + ], + [ + 70, + 0.09977925471321214 + ], + [ + 75, + 0.09998935088515282 + ], + [ + 80, + 0.10024463618174195 + ], + [ + 85, + 0.10021435595990624 + ], + [ + 90, + 0.10016857067239471 + ], + [ + 95, + 0.10026378170005046 + ], + [ + 100, + 0.10024830840120558 + ] + ], + "rho": [ + [ + 6, + 0.01574710663408041 + ], + [ + 7, + 0.006062062457203865 + ], + [ + 8, + 0.016018295427784324 + ], + [ + 9, + 0.015312008908949792 + ], + [ + 10, + 0.028855220298282802 + ], + [ + 15, + -0.002411970403045416 + ], + [ + 20, + -0.014547059312462807 + ], + [ + 25, + -0.0001543508842587471 + ], + [ + 30, + 0.007254098542034626 + ], + [ + 35, + -0.002188083017244935 + ], + [ + 40, + 0.0022464566864073277 + ], + [ + 45, + -0.002664287807419896 + ], + [ + 50, + 0.0016106266994029284 + ], + [ + 55, + -0.005183202214539051 + ], + [ + 60, + -0.00018570874817669392 + ], + [ + 65, + -0.006523153744637966 + ], + [ + 70, + 0.0007113250903785229 + ], + [ + 75, + 0.003613469423726201 + ], + [ + 80, + -0.001357327913865447 + ], + [ + 85, + 0.005128338932991028 + ], + [ + 90, + 0.0064690024591982365 + ], + [ + 95, + 0.006112658418715 + ], + [ + 100, + -0.0015342006227001548 + ] + ] + }, + "t0=5_handoff_to_Vec": { + "t0": 5, + "branch": "handoff_to_Vec", + "credit_mode": "vec", + "vec_gamma_frozen": -0.0011670500971376896, + "vec_rho_frozen": -0.0008091113995760679, + "test_acc": [ + 0.3101, + 0.2999, + 0.3149, + 0.3139, + 0.3006, + 0.3141, + 0.3142, + 0.2974, + 0.3111, + 0.3089, + 0.3121, + 0.3166, + 0.322, + 0.318, + 0.3157, + 0.3099, + 0.3205, + 0.3181, + 0.3027, + 0.3025, + 0.2954, + 0.3054, + 0.3062, + 0.2937, + 0.2964, + 0.2991, + 0.3017, + 0.2947, + 0.2916, + 0.2873, + 0.2905, + 0.2995, + 0.2949, + 0.2956, + 0.294, + 0.3013, + 0.2997, + 0.298, + 0.2871, + 0.2955, + 0.2911, + 0.3015, + 0.3048, + 0.3008, + 0.3004, + 0.2984, + 0.2967, + 0.3011, + 0.2986, + 0.3011, + 0.3006, + 0.3004, + 0.2958, + 0.2959, + 0.2998, + 0.3019, + 0.3035, + 0.2956, + 0.3013, + 0.2971, + 0.2991, + 0.3015, + 0.3004, + 0.3036, + 0.3026, + 0.3017, + 0.3051, + 0.306, + 0.3011, + 0.3029, + 0.3002, + 0.3008, + 0.3016, + 0.3013, + 0.3038, + 0.3005, + 0.3016, + 0.3008, + 0.3012, + 0.3036, + 0.3024, + 0.303, + 0.3006, + 0.302, + 0.3012, + 0.3019, + 0.3027, + 0.3009, + 0.3016, + 0.3015, + 0.3019, + 0.3018, + 0.3014, + 0.3015, + 0.3015 + ], + "train_loss": [ + 1.98885035697937, + 1.9834733580780028, + 1.981598624267578, + 1.9747283523559571, + 1.9707511127090453, + 1.9739490607452392, + 1.9759334008789062, + 1.9722962183380126, + 1.969624571609497, + 1.970889538192749, + 1.9678439852142333, + 1.965836248550415, + 1.969429095993042, + 1.9667920967864991, + 1.9675887169647217, + 1.9696137982559203, + 1.9648815822601318, + 1.9641471920776368, + 1.9694185340881347, + 1.9674127616882324, + 1.9701248693847657, + 1.968683921661377, + 1.9691599715423584, + 1.971469653930664, + 1.9735202487182617, + 1.9709416125488282, + 1.9693266723251344, + 1.9711621636199952, + 1.9731029653549195, + 1.9722007320404054, + 1.9766441119003295, + 1.9791824002456666, + 1.980170124053955, + 1.9817060145568848, + 1.9830878174591065, + 1.9799753763198853, + 1.9815638799285888, + 1.9794073379516601, + 1.980983480911255, + 1.981872991294861, + 1.9820363941192627, + 1.9837005889511108, + 1.984742343788147, + 1.9826304132461547, + 1.9830743347549438, + 1.9853464989471437, + 1.9872392234039307, + 1.9889681858062744, + 1.9864943215560913, + 1.9846966150665284, + 1.9865829640960693, + 1.9905489418029785, + 1.9874937824249268, + 1.989253215866089, + 1.9904289415740968, + 1.9927669877624512, + 1.990568099708557, + 1.9897481592559814, + 1.992023238067627, + 1.9895323735046386, + 1.993159462814331, + 1.9899572118377686, + 1.9872143391418458, + 1.9883589829254151, + 1.989579504470825, + 1.9907801698303222, + 1.9910909828948975, + 1.9903339798355102, + 1.9899965377426148, + 1.9899286922836303, + 1.9903258807754516, + 1.9883497542572022, + 1.9908707794952392, + 1.9920183470916748, + 1.9884405541992187, + 1.9887260723114013, + 1.9880731015777588, + 1.9888823722076416, + 1.9922956163787842, + 1.9894610665893555, + 1.9864570722198487, + 1.9915890454864502, + 1.9884616263580321, + 1.9895376153945923, + 1.987952762145996, + 1.9885796316528321, + 1.9864410493469238, + 1.988354708404541, + 1.9899560904693603, + 1.9896160398101808, + 1.9880389366912843, + 1.9887718877792357, + 1.9906292826080323, + 1.9877384049224853, + 1.9911569009017944 + ], + "gamma": [ + [ + 6, + 0.005619358271360397 + ], + [ + 7, + 0.0035822700010612607 + ], + [ + 8, + -0.0029355929873418063 + ], + [ + 9, + 0.006172257591970265 + ], + [ + 10, + -0.004561105743050575 + ], + [ + 15, + -0.010032707592472434 + ], + [ + 20, + -0.0037149503914406523 + ], + [ + 25, + 0.007247599656693637 + ], + [ + 30, + -0.0050241799908690155 + ], + [ + 35, + 0.015613792231306434 + ], + [ + 40, + 0.025709006004035473 + ], + [ + 45, + 0.0002260007313452661 + ], + [ + 50, + 0.0014361715875566006 + ], + [ + 55, + -0.011857346049509943 + ], + [ + 60, + -0.005695054976968095 + ], + [ + 65, + -0.005439719301648438 + ], + [ + 70, + 0.0009671060252003372 + ], + [ + 75, + -0.016561364755034447 + ], + [ + 80, + -0.0004842726048082113 + ], + [ + 85, + 0.0014199530705809593 + ], + [ + 90, + 0.01024728428456001 + ], + [ + 95, + 0.0046352153294719756 + ], + [ + 100, + -0.002752471948042512 + ] + ], + "rho": [ + [ + 6, + 0.003488943912088871 + ], + [ + 7, + 0.001728452043607831 + ], + [ + 8, + 0.00367677363101393 + ], + [ + 9, + 0.008639804320409894 + ], + [ + 10, + -0.001072778832167387 + ], + [ + 15, + -0.00901060551404953 + ], + [ + 20, + -0.005643368232995272 + ], + [ + 25, + -0.02103308727964759 + ], + [ + 30, + 0.0036174810957163572 + ], + [ + 35, + 0.000864740926772356 + ], + [ + 40, + 0.006006992422044277 + ], + [ + 45, + 0.020154819823801517 + ], + [ + 50, + -0.0033918266417458653 + ], + [ + 55, + 0.0006412133807316422 + ], + [ + 60, + -0.00839216262102127 + ], + [ + 65, + 0.012077370309270918 + ], + [ + 70, + -0.0074131840374320745 + ], + [ + 75, + 0.016973318299278617 + ], + [ + 80, + 0.0036046612076461315 + ], + [ + 85, + -0.0015375642105937004 + ], + [ + 90, + -0.00948665989562869 + ], + [ + 95, + -0.013291625306010246 + ], + [ + 100, + 0.0005498486571013927 + ] + ] + }, + "t0=5_handoff_blend_025": { + "t0": 5, + "branch": "handoff_blend_025", + "credit_mode": "0.25", + "vec_gamma_frozen": -0.0011670500971376896, + "vec_rho_frozen": -0.0008091113995760679, + "test_acc": [ + 0.3063, + 0.308, + 0.3149, + 0.3063, + 0.3135, + 0.2986, + 0.2898, + 0.2885, + 0.2977, + 0.3044, + 0.3098, + 0.3095, + 0.3128, + 0.3035, + 0.3068, + 0.2941, + 0.3203, + 0.3105, + 0.3065, + 0.3087, + 0.2912, + 0.304, + 0.3148, + 0.306, + 0.2943, + 0.3101, + 0.3007, + 0.3147, + 0.3186, + 0.309, + 0.2981, + 0.3112, + 0.3092, + 0.3053, + 0.3077, + 0.2914, + 0.3036, + 0.3021, + 0.3074, + 0.3137, + 0.3048, + 0.2981, + 0.3129, + 0.3148, + 0.3003, + 0.3029, + 0.3108, + 0.3148, + 0.2984, + 0.314, + 0.3058, + 0.3086, + 0.3067, + 0.3159, + 0.3045, + 0.3026, + 0.3092, + 0.3024, + 0.3048, + 0.3068, + 0.3132, + 0.3156, + 0.3041, + 0.3096, + 0.3129, + 0.3085, + 0.306, + 0.3075, + 0.3041, + 0.3166, + 0.3122, + 0.3133, + 0.3132, + 0.3098, + 0.3106, + 0.3144, + 0.3119, + 0.3099, + 0.3116, + 0.3101, + 0.3101, + 0.3092, + 0.3125, + 0.3126, + 0.312, + 0.3121, + 0.3103, + 0.3118, + 0.312, + 0.3117, + 0.3116, + 0.3119, + 0.3121, + 0.3121, + 0.3121 + ], + "train_loss": [ + 1.991063755493164, + 1.9891048667907716, + 1.9863166485595702, + 1.985428505859375, + 1.9845469324493408, + 1.9856898361968993, + 1.9859479013061523, + 1.9861413344955445, + 1.987729702606201, + 1.9837639855957032, + 1.9841289485931397, + 1.9848187063980103, + 1.9860578922271728, + 1.985988610458374, + 1.9876202394104003, + 1.9866319847106935, + 1.9875208644866944, + 1.987033146095276, + 1.9867303422546387, + 1.9879651712799071, + 1.9859774648284911, + 1.987113154144287, + 1.9862299811553956, + 1.9857690775299073, + 1.988408780822754, + 1.9880884175872802, + 1.9875518899917604, + 1.988998243789673, + 1.989372254257202, + 1.9874613111877442, + 1.9886616062164306, + 1.9855735210418701, + 1.9848130255126952, + 1.987750488586426, + 1.9888636597061158, + 1.987453981628418, + 1.9868767975234984, + 1.9858004119110106, + 1.9872028504180907, + 1.98767549369812, + 1.9877946385955811, + 1.9850490479278564, + 1.9870550692749023, + 1.9855170317077637, + 1.9866968719863891, + 1.986244729537964, + 1.9856399948883057, + 1.9851934980773926, + 1.987251290550232, + 1.9848943976593019, + 1.9856630751037598, + 1.9835738152313231, + 1.9850466170501708, + 1.9853938566589355, + 1.9854372603988648, + 1.9848404151916503, + 1.9842564939880372, + 1.984966632232666, + 1.9862527949523925, + 1.9858872723770142, + 1.9870590911102295, + 1.9838753735351562, + 1.9845243627929687, + 1.9838003320693969, + 1.9846255307388305, + 1.9837014434051514, + 1.9841858550262452, + 1.9833481007385254, + 1.9850787268829346, + 1.983225867614746, + 1.9865360502624512, + 1.9847832034683228, + 1.9826461749267579, + 1.9844200134277343, + 1.9813355867767335, + 1.984790707244873, + 1.982914197998047, + 1.9847005506134032, + 1.9827604949569702, + 1.9835056610107422, + 1.9856193158721924, + 1.9832022803497313, + 1.983253235168457, + 1.9844388064956664, + 1.9839341816711427, + 1.9846962734985352, + 1.9845728868865966, + 1.984046629714966, + 1.9824064780044555, + 1.9842023155212403, + 1.9807324981307983, + 1.9825623114013673, + 1.9840583863067627, + 1.981500357284546, + 1.982737907409668 + ], + "gamma": [ + [ + 6, + 0.08110687113367021 + ], + [ + 7, + 0.08583660633303225 + ], + [ + 8, + 0.0866433356422931 + ], + [ + 9, + 0.0874824351631105 + ], + [ + 10, + 0.08917368366383016 + ], + [ + 15, + 0.0921399628277868 + ], + [ + 20, + 0.09438218630384654 + ], + [ + 25, + 0.09332562319468707 + ], + [ + 30, + 0.09237831912469119 + ], + [ + 35, + 0.09489014593418688 + ], + [ + 40, + 0.09572238114196807 + ], + [ + 45, + 0.09763896185904741 + ], + [ + 50, + 0.099001151509583 + ], + [ + 55, + 0.10060104553122073 + ], + [ + 60, + 0.10066475439816713 + ], + [ + 65, + 0.1013602283783257 + ], + [ + 70, + 0.1013283513020724 + ], + [ + 75, + 0.10205963579937816 + ], + [ + 80, + 0.10181845515035093 + ], + [ + 85, + 0.1020878148265183 + ], + [ + 90, + 0.10206597857177258 + ], + [ + 95, + 0.10202388069592416 + ], + [ + 100, + 0.10202996502630413 + ] + ], + "rho": [ + [ + 6, + 0.029335655737668276 + ], + [ + 7, + 0.003754556179046631 + ], + [ + 8, + 0.03516152314841747 + ], + [ + 9, + -0.005450671538710594 + ], + [ + 10, + 0.03606446529738605 + ], + [ + 15, + 0.00365481834160164 + ], + [ + 20, + 0.012497917516157031 + ], + [ + 25, + -0.011625229148194194 + ], + [ + 30, + 0.013168673729524016 + ], + [ + 35, + 0.002954811556264758 + ], + [ + 40, + -0.00015860568964853883 + ], + [ + 45, + -0.0018259281641803682 + ], + [ + 50, + -0.0024563749320805073 + ], + [ + 55, + 0.0037257722578942776 + ], + [ + 60, + 0.003340904542710632 + ], + [ + 65, + 0.008623109199106693 + ], + [ + 70, + -0.0010987441055476665 + ], + [ + 75, + 0.0020438041538000107 + ], + [ + 80, + 0.009311038942541927 + ], + [ + 85, + 0.000543791800737381 + ], + [ + 90, + -0.011298802681267262 + ], + [ + 95, + -0.0026983938878402114 + ], + [ + 100, + -0.0008281976915895939 + ] + ] + }, + "t0=5_handoff_blend_05": { + "t0": 5, + "branch": "handoff_blend_05", + "credit_mode": "0.5", + "vec_gamma_frozen": -0.0011670500971376896, + "vec_rho_frozen": -0.0008091113995760679, + "test_acc": [ + 0.3037, + 0.2939, + 0.3123, + 0.3131, + 0.3005, + 0.3028, + 0.3001, + 0.3062, + 0.3167, + 0.3174, + 0.3019, + 0.3094, + 0.3115, + 0.3157, + 0.3087, + 0.3161, + 0.3065, + 0.3059, + 0.3011, + 0.3135, + 0.3084, + 0.3149, + 0.3074, + 0.3079, + 0.3221, + 0.3171, + 0.3081, + 0.3259, + 0.3131, + 0.3187, + 0.3131, + 0.3089, + 0.3071, + 0.3107, + 0.3166, + 0.3218, + 0.3108, + 0.3106, + 0.3029, + 0.3114, + 0.3087, + 0.3226, + 0.311, + 0.3085, + 0.3111, + 0.3194, + 0.313, + 0.3169, + 0.31, + 0.312, + 0.318, + 0.3094, + 0.3147, + 0.3168, + 0.3131, + 0.3093, + 0.3124, + 0.3144, + 0.3135, + 0.3131, + 0.3161, + 0.3122, + 0.3237, + 0.3101, + 0.3172, + 0.3069, + 0.3184, + 0.3131, + 0.3056, + 0.3185, + 0.3204, + 0.317, + 0.3136, + 0.3156, + 0.3178, + 0.3163, + 0.316, + 0.3167, + 0.3139, + 0.3171, + 0.3159, + 0.3177, + 0.3146, + 0.3166, + 0.3164, + 0.3165, + 0.3168, + 0.3166, + 0.3164, + 0.3171, + 0.3168, + 0.3169, + 0.3169, + 0.3169, + 0.3166 + ], + "train_loss": [ + 1.989920323486328, + 1.9814545530700685, + 1.9797040303802491, + 1.977913288345337, + 1.9804364520645141, + 1.9774842262268066, + 1.9772156427383423, + 1.9809386281585692, + 1.9747767695617675, + 1.9781757772827149, + 1.9787077528381347, + 1.978690902786255, + 1.9772437986755371, + 1.9765710025024414, + 1.9750249889373779, + 1.9749383535003662, + 1.9780638354492188, + 1.9763352072906495, + 1.9787582021331787, + 1.9784047212219238, + 1.9771386277008056, + 1.9769252400970458, + 1.976383394241333, + 1.9784637090301513, + 1.9788820373916627, + 1.9782504370117187, + 1.9749387907409668, + 1.9747097717285156, + 1.975444818878174, + 1.9766639586639405, + 1.9724876895523071, + 1.9725531145477295, + 1.976385212020874, + 1.9782319937896728, + 1.9737711849975585, + 1.973644761390686, + 1.9728259078979493, + 1.976724259262085, + 1.9733991305541991, + 1.975024061050415, + 1.9750342240142822, + 1.976791547164917, + 1.9721737294769288, + 1.9757624352264405, + 1.9740187911987304, + 1.9715763872528076, + 1.974257389678955, + 1.9742160180664063, + 1.9752464599227906, + 1.9712771053314209, + 1.9748193713378905, + 1.9749141446685792, + 1.9720298815155028, + 1.971592350769043, + 1.9715159897613526, + 1.9740276614379884, + 1.974955996131897, + 1.9737971368408203, + 1.9721809567642212, + 1.972617737388611, + 1.973553286895752, + 1.9727391172027589, + 1.9711793769836425, + 1.97289596408844, + 1.9729657166290284, + 1.9724417525482179, + 1.9734269491958618, + 1.9736238091278075, + 1.9729384266662597, + 1.9715021076202393, + 1.9715961434173583, + 1.971838274269104, + 1.970664451675415, + 1.9723946903991698, + 1.9681628646469116, + 1.9713885641098023, + 1.9714233623886108, + 1.9704941757965089, + 1.9717961227416991, + 1.9709891326141358, + 1.9698141984558106, + 1.9694300765228272, + 1.9674521529769897, + 1.968568952293396, + 1.9684835869979858, + 1.968900461807251, + 1.9713853565979005, + 1.969524931640625, + 1.9704243312835694, + 1.9714735486602784, + 1.9711184131622315, + 1.9691432343292237, + 1.9701531174087525, + 1.96900106716156, + 1.969152776222229 + ], + "gamma": [ + [ + 6, + -0.006406156346201897 + ], + [ + 7, + 0.005549430090468377 + ], + [ + 8, + -0.014852836960926652 + ], + [ + 9, + 0.004497126807109453 + ], + [ + 10, + 0.008979676757007837 + ], + [ + 15, + -0.0022616543574258685 + ], + [ + 20, + -0.0017912940820679069 + ], + [ + 25, + -0.0005058745155110955 + ], + [ + 30, + -0.006743058795109391 + ], + [ + 35, + -0.003928700694814324 + ], + [ + 40, + -0.0038105265703052282 + ], + [ + 45, + 0.0034737606765702367 + ], + [ + 50, + 0.0012252477463334799 + ], + [ + 55, + 4.656023520510644e-05 + ], + [ + 60, + -0.001994765450945124 + ], + [ + 65, + -0.0032054060138761997 + ], + [ + 70, + -0.00046937276783864945 + ], + [ + 75, + -0.0027389351453166455 + ], + [ + 80, + -0.004259559675119817 + ], + [ + 85, + 0.003984946117270738 + ], + [ + 90, + 0.0023324156063608825 + ], + [ + 95, + 0.010914091719314456 + ], + [ + 100, + 0.0012247695412952453 + ] + ], + "rho": [ + [ + 6, + 0.0013132079038769007 + ], + [ + 7, + -0.006549160461872816 + ], + [ + 8, + 0.0023524018470197916 + ], + [ + 9, + 0.002624807762913406 + ], + [ + 10, + 0.017818652791902423 + ], + [ + 15, + -0.006970469374209642 + ], + [ + 20, + -0.003616457339376211 + ], + [ + 25, + -0.010600036010146141 + ], + [ + 30, + 0.006578520638868213 + ], + [ + 35, + 0.00021186470985412598 + ], + [ + 40, + -0.006158043164759874 + ], + [ + 45, + 0.009233269607648253 + ], + [ + 50, + 0.02198852994479239 + ], + [ + 55, + 0.003516675438731909 + ], + [ + 60, + 0.0034372663940303028 + ], + [ + 65, + -0.005627294420264661 + ], + [ + 70, + -0.0006588770775124431 + ], + [ + 75, + -0.004699242126662284 + ], + [ + 80, + -0.010308766330126673 + ], + [ + 85, + -0.007724274415522814 + ], + [ + 90, + 0.010630680772010237 + ], + [ + 95, + -0.003774375654757023 + ], + [ + 100, + 0.008449196349829435 + ] + ] + }, + "t0=5_handoff_blend_075": { + "t0": 5, + "branch": "handoff_blend_075", + "credit_mode": "0.75", + "vec_gamma_frozen": -0.0011670500971376896, + "vec_rho_frozen": -0.0008091113995760679, + "test_acc": [ + 0.3141, + 0.2998, + 0.305, + 0.3127, + 0.3138, + 0.3116, + 0.3125, + 0.3157, + 0.3145, + 0.326, + 0.3126, + 0.3183, + 0.3161, + 0.321, + 0.3054, + 0.3167, + 0.3186, + 0.3105, + 0.3058, + 0.3176, + 0.3146, + 0.3219, + 0.3311, + 0.3264, + 0.3087, + 0.322, + 0.3197, + 0.3244, + 0.3293, + 0.3179, + 0.322, + 0.3233, + 0.3317, + 0.3234, + 0.3126, + 0.3182, + 0.3203, + 0.3185, + 0.3165, + 0.3262, + 0.3171, + 0.3258, + 0.3143, + 0.3088, + 0.3264, + 0.3181, + 0.3235, + 0.3198, + 0.3222, + 0.3245, + 0.3244, + 0.3225, + 0.3196, + 0.3167, + 0.3277, + 0.3177, + 0.3168, + 0.3256, + 0.3247, + 0.3252, + 0.3224, + 0.3202, + 0.3253, + 0.3221, + 0.3219, + 0.3239, + 0.3218, + 0.3258, + 0.3281, + 0.3257, + 0.3234, + 0.3273, + 0.3263, + 0.3227, + 0.3221, + 0.3246, + 0.3253, + 0.324, + 0.3259, + 0.3235, + 0.3239, + 0.3224, + 0.3269, + 0.3249, + 0.3262, + 0.325, + 0.3243, + 0.324, + 0.3242, + 0.3249, + 0.325, + 0.3254, + 0.3253, + 0.3254, + 0.3255 + ], + "train_loss": [ + 1.9887806289672851, + 1.9798492393493652, + 1.9770838994979858, + 1.974819222793579, + 1.972799209213257, + 1.9724265090942383, + 1.9691669107055665, + 1.969123511581421, + 1.9685189966583252, + 1.969195809249878, + 1.9682516871643065, + 1.9669985847473144, + 1.9701892945861816, + 1.967657275466919, + 1.967640663986206, + 1.9675346103286744, + 1.9673507315444947, + 1.96461721534729, + 1.9646919076538085, + 1.9671023194122315, + 1.9669487468719482, + 1.9686367099380493, + 1.9653930168914795, + 1.9673711193466186, + 1.9633510193634034, + 1.9649822988510133, + 1.964322645263672, + 1.9612459350585938, + 1.965179051437378, + 1.9655230182647705, + 1.964747555770874, + 1.9657264164733887, + 1.965226427268982, + 1.9668125988769531, + 1.963646941795349, + 1.963662981300354, + 1.9665489539337158, + 1.9637163995742797, + 1.9635050727081298, + 1.9627389594268798, + 1.9650295120620727, + 1.9620897372817994, + 1.9611733522033692, + 1.964628535308838, + 1.9642805702972412, + 1.964224110069275, + 1.9608901892852784, + 1.9634879403305054, + 1.96202836063385, + 1.961953832244873, + 1.962700569114685, + 1.9636967702484132, + 1.9646112118148804, + 1.9632205015563964, + 1.961768946838379, + 1.960234896697998, + 1.9627824864959718, + 1.9588261922836303, + 1.9607146656036376, + 1.9624977801132202, + 1.9624813533782959, + 1.9629455206680297, + 1.958997371826172, + 1.9598133665466309, + 1.9610961584854125, + 1.9587416419219972, + 1.9598756586456298, + 1.9617953030395507, + 1.962351581878662, + 1.960147843322754, + 1.962101521835327, + 1.9590696320343017, + 1.9597472089004517, + 1.9596738564682006, + 1.9596313110733032, + 1.9605814127349854, + 1.9622519910049439, + 1.9600993612670898, + 1.956996003189087, + 1.9584874711608886, + 1.9579721714019775, + 1.9598075309753418, + 1.9577328550720214, + 1.9582674449920654, + 1.9587023457336425, + 1.958327255783081, + 1.9579892782592774, + 1.9576218103027343, + 1.9604835634613038, + 1.9595883728027343, + 1.9593276914215088, + 1.9566011611938476, + 1.9574530683898925, + 1.9586209949493407, + 1.9584272537231446 + ], + "gamma": [ + [ + 6, + 0.011505375849083066 + ], + [ + 7, + -0.004328439070377499 + ], + [ + 8, + 0.0035834669251926243 + ], + [ + 9, + -0.004052334581501782 + ], + [ + 10, + 0.013710617553442717 + ], + [ + 15, + -0.003643441421445459 + ], + [ + 20, + -0.0021449794294312596 + ], + [ + 25, + -0.0036328031856101006 + ], + [ + 30, + -0.0012953793921042234 + ], + [ + 35, + 0.005909526313189417 + ], + [ + 40, + 0.016804294427856803 + ], + [ + 45, + 0.0032158615067601204 + ], + [ + 50, + -0.006744181155227125 + ], + [ + 55, + 0.0038794619031250477 + ], + [ + 60, + -0.005895215319469571 + ], + [ + 65, + 0.005237550707533956 + ], + [ + 70, + -0.0034871078096330166 + ], + [ + 75, + 0.001894826884381473 + ], + [ + 80, + -0.004059363855049014 + ], + [ + 85, + -0.00168273359304294 + ], + [ + 90, + 0.005555906856898218 + ], + [ + 95, + 0.0004772244283230975 + ], + [ + 100, + -0.001725059817545116 + ] + ], + "rho": [ + [ + 6, + 0.012261858209967613 + ], + [ + 7, + 0.0036515695974230766 + ], + [ + 8, + -0.012208035914227366 + ], + [ + 9, + -0.009903644444420934 + ], + [ + 10, + -0.0031967777758836746 + ], + [ + 15, + 0.0049271658062934875 + ], + [ + 20, + -0.012986334972083569 + ], + [ + 25, + -0.005337987095117569 + ], + [ + 30, + -0.0004181895637884736 + ], + [ + 35, + -0.005065932986326516 + ], + [ + 40, + -0.02178479335270822 + ], + [ + 45, + -0.014644806389696896 + ], + [ + 50, + 0.00805065780878067 + ], + [ + 55, + 0.008234395296312869 + ], + [ + 60, + -0.006709430832415819 + ], + [ + 65, + -0.006348557129967958 + ], + [ + 70, + 0.0009087740909308195 + ], + [ + 75, + -0.013001261162571609 + ], + [ + 80, + -0.01535764615982771 + ], + [ + 85, + 0.00408406846690923 + ], + [ + 90, + 0.007417078013531864 + ], + [ + 95, + -0.010641217231750488 + ], + [ + 100, + -0.01683203224092722 + ] + ] + }, + "t0=10_continue_DFA": { + "t0": 10, + "branch": "continue_DFA", + "credit_mode": "dfa", + "vec_gamma_frozen": 0.0042067440517712384, + "vec_rho_frozen": 0.0038935517659410834, + "test_acc": [ + 0.3114, + 0.3054, + 0.298, + 0.2924, + 0.3038, + 0.3041, + 0.3029, + 0.2963, + 0.3077, + 0.3122, + 0.3064, + 0.3095, + 0.2972, + 0.3051, + 0.316, + 0.2902, + 0.3071, + 0.2993, + 0.3074, + 0.2859, + 0.3065, + 0.3043, + 0.3118, + 0.3022, + 0.3142, + 0.3177, + 0.2984, + 0.2954, + 0.3089, + 0.3047, + 0.3033, + 0.3038, + 0.3063, + 0.2929, + 0.3073, + 0.3094, + 0.3043, + 0.3091, + 0.3107, + 0.3075, + 0.3051, + 0.3198, + 0.3147, + 0.3188, + 0.295, + 0.3082, + 0.3073, + 0.3049, + 0.2987, + 0.3112, + 0.3017, + 0.3015, + 0.3075, + 0.3108, + 0.3167, + 0.3147, + 0.305, + 0.3118, + 0.3119, + 0.3048, + 0.3099, + 0.3117, + 0.3097, + 0.311, + 0.3119, + 0.3065, + 0.3139, + 0.309, + 0.3092, + 0.3086, + 0.3125, + 0.3109, + 0.3063, + 0.3118, + 0.3046, + 0.3101, + 0.3114, + 0.3103, + 0.3096, + 0.3133, + 0.3092, + 0.3115, + 0.3115, + 0.3109, + 0.3111, + 0.3105, + 0.3106, + 0.3102, + 0.3102, + 0.3103 + ], + "train_loss": [ + 1.9875320287704468, + 1.9891177563476563, + 1.9865943518066407, + 1.9904258282470704, + 1.9874406365585326, + 1.9873190088653565, + 1.9885692932891845, + 1.988010051574707, + 1.9869099227142335, + 1.9894244235229492, + 1.9876407884979248, + 1.9897507932281495, + 1.9887112911224365, + 1.9864059360122681, + 1.9881148773956299, + 1.9869364385986328, + 1.988127936668396, + 1.990114035873413, + 1.986607758216858, + 1.9885956006240846, + 1.9870170391845703, + 1.98955090675354, + 1.9890418215560912, + 1.9895443496704102, + 1.9886660667419434, + 1.9854677661895752, + 1.9864808071136475, + 1.9883289696502686, + 1.9876732089996338, + 1.9876765283203126, + 1.9878952088928223, + 1.9894333304214478, + 1.9865212602233886, + 1.9859716952896118, + 1.9869049006652832, + 1.987617547683716, + 1.9880057638549804, + 1.987460345840454, + 1.9877301689147948, + 1.9870423724365234, + 1.9876786922836305, + 1.9868367038345336, + 1.9879550299835205, + 1.9884745108795165, + 1.9880395782089233, + 1.9850390566253662, + 1.9869491412353515, + 1.9868434957122802, + 1.988668685836792, + 1.9864980206680298, + 1.9862751343536378, + 1.9873612005233765, + 1.986293578262329, + 1.9846468793487548, + 1.9868420107269287, + 1.9848728201675414, + 1.9856274399566651, + 1.9876766166687012, + 1.9855491283416749, + 1.9856539597320557, + 1.9859953440093994, + 1.9868049453735352, + 1.983933601989746, + 1.9855083358001708, + 1.9851877621841432, + 1.9846026678085327, + 1.9831799187850951, + 1.9833928588104248, + 1.9852891273498534, + 1.984254077835083, + 1.9818164873504638, + 1.983409195175171, + 1.983656044883728, + 1.9843665660858154, + 1.9844557377624512, + 1.9834174674987792, + 1.9829292294311522, + 1.9844586798858643, + 1.9849174486923218, + 1.9825584698486327, + 1.9820008834457397, + 1.9833803461456299, + 1.9823364935302734, + 1.9831650439453126, + 1.983894295425415, + 1.9838459788513183, + 1.9835173099517822, + 1.983146858253479, + 1.9846808233261108, + 1.9830649966812133 + ], + "gamma": [ + [ + 11, + 0.0847038640640676 + ], + [ + 12, + 0.08449943130835891 + ], + [ + 13, + 0.08560229558497667 + ], + [ + 14, + 0.0849406763445586 + ], + [ + 15, + 0.08678498375229537 + ], + [ + 20, + 0.08858749852515757 + ], + [ + 25, + 0.09002651006449014 + ], + [ + 30, + 0.09209231153363362 + ], + [ + 35, + 0.09397269494365901 + ], + [ + 40, + 0.0946828828600701 + ], + [ + 45, + 0.0959556256129872 + ], + [ + 50, + 0.09717596844711807 + ], + [ + 55, + 0.09897968024597503 + ], + [ + 60, + 0.09992457224871032 + ], + [ + 65, + 0.09955423115752637 + ], + [ + 70, + 0.09959435404743999 + ], + [ + 75, + 0.10014662385219708 + ], + [ + 80, + 0.10013154963962734 + ], + [ + 85, + 0.10005534396623261 + ], + [ + 90, + 0.10045824624830857 + ], + [ + 95, + 0.10026703868061304 + ], + [ + 100, + 0.10031358560081571 + ] + ], + "rho": [ + [ + 11, + 0.002421351382508874 + ], + [ + 12, + -0.020076005719602108 + ], + [ + 13, + 0.00905256497208029 + ], + [ + 14, + 0.026296202559024096 + ], + [ + 15, + 0.019721826422028244 + ], + [ + 20, + 0.017800879169953987 + ], + [ + 25, + -0.003079839516431093 + ], + [ + 30, + 0.004590018652379513 + ], + [ + 35, + 0.0004936892073601484 + ], + [ + 40, + 0.007190009579062462 + ], + [ + 45, + 0.00793769839219749 + ], + [ + 50, + 0.0011359832715243101 + ], + [ + 55, + 0.0012366813607513905 + ], + [ + 60, + -0.011631682515144348 + ], + [ + 65, + 0.00852967519313097 + ], + [ + 70, + -0.012241421965882182 + ], + [ + 75, + -0.012332477606832981 + ], + [ + 80, + 0.012475105933845043 + ], + [ + 85, + -0.0027559904847294092 + ], + [ + 90, + -0.008937430568039417 + ], + [ + 95, + -0.008499621413648129 + ], + [ + 100, + 0.0026798928156495094 + ] + ] + }, + "t0=10_handoff_to_Vec": { + "t0": 10, + "branch": "handoff_to_Vec", + "credit_mode": "vec", + "vec_gamma_frozen": 0.0042067440517712384, + "vec_rho_frozen": 0.0038935517659410834, + "test_acc": [ + 0.3044, + 0.2993, + 0.3131, + 0.3245, + 0.3137, + 0.298, + 0.3213, + 0.3135, + 0.2985, + 0.3038, + 0.3002, + 0.3126, + 0.3013, + 0.2997, + 0.3072, + 0.3069, + 0.3002, + 0.3091, + 0.3067, + 0.2967, + 0.306, + 0.2967, + 0.3161, + 0.3121, + 0.3129, + 0.2983, + 0.3111, + 0.3063, + 0.3121, + 0.3096, + 0.3064, + 0.3012, + 0.3127, + 0.3055, + 0.3133, + 0.3005, + 0.3065, + 0.3032, + 0.3034, + 0.3051, + 0.3042, + 0.3099, + 0.3107, + 0.3087, + 0.3078, + 0.3137, + 0.302, + 0.3104, + 0.3101, + 0.3073, + 0.3034, + 0.3077, + 0.3025, + 0.3104, + 0.3104, + 0.3044, + 0.3058, + 0.3063, + 0.3061, + 0.3073, + 0.306, + 0.306, + 0.3066, + 0.3072, + 0.3022, + 0.3075, + 0.307, + 0.3049, + 0.3006, + 0.3046, + 0.3028, + 0.3052, + 0.3042, + 0.3041, + 0.3074, + 0.3068, + 0.3063, + 0.3072, + 0.3071, + 0.3073, + 0.3074, + 0.3069, + 0.3073, + 0.3068, + 0.3059, + 0.3068, + 0.3068, + 0.3071, + 0.3072, + 0.3072 + ], + "train_loss": [ + 1.9866068698120116, + 1.9822053937530517, + 1.9804531171035766, + 1.9769810823059082, + 1.977052113609314, + 1.9752359896469116, + 1.9722654714584351, + 1.9719278221130372, + 1.970822947731018, + 1.9717840911483764, + 1.9682231511688233, + 1.968495904006958, + 1.96760017868042, + 1.9701581380462647, + 1.9675142916488648, + 1.9680279364776612, + 1.9666622930145263, + 1.9654243109893799, + 1.9659241844940185, + 1.9667544781112671, + 1.9654184175109863, + 1.9682446677398682, + 1.9665645470809936, + 1.962704022254944, + 1.9667242764282227, + 1.9651664418029786, + 1.96742610080719, + 1.9632605270385741, + 1.965363286743164, + 1.967875340270996, + 1.9658809958267212, + 1.9652816242218019, + 1.9644886882019044, + 1.9643921794891357, + 1.9656528813171388, + 1.9628269485473633, + 1.9645728551483155, + 1.9642161107635498, + 1.9638631564331055, + 1.9666428575897217, + 1.9680908479309083, + 1.9663742835235596, + 1.9642835456085206, + 1.9627088230133056, + 1.963959354248047, + 1.9639146718978882, + 1.9634665188598632, + 1.964948549194336, + 1.9620582075500488, + 1.9650217700576782, + 1.9627274538803101, + 1.9650206172943114, + 1.9632625915908815, + 1.9611075479888915, + 1.9657896464538573, + 1.961214722213745, + 1.9627577758407593, + 1.9625123359680177, + 1.9633644173431397, + 1.9626851040649413, + 1.959757084350586, + 1.9622343629455565, + 1.9648383917999268, + 1.962337583694458, + 1.9636648812103272, + 1.9621018824005128, + 1.9638115926361084, + 1.9647201615905763, + 1.96513031829834, + 1.9660897815322875, + 1.9630526079559327, + 1.9641853886413574, + 1.9618755170440674, + 1.961919069480896, + 1.9624179935455321, + 1.960745535507202, + 1.9640649700164794, + 1.9637301733779908, + 1.9630452741241455, + 1.96104790309906, + 1.9639451459503174, + 1.9629601496124267, + 1.9628581218719483, + 1.964691388282776, + 1.9644895922088623, + 1.9644148468017577, + 1.9623606049346924, + 1.9623322786712647, + 1.9616047958374023, + 1.9641540831756592 + ], + "gamma": [ + [ + 11, + -0.004042641550768167 + ], + [ + 12, + 0.010617796564474702 + ], + [ + 13, + 0.012645653099752963 + ], + [ + 14, + 0.009190087672322989 + ], + [ + 15, + -0.0031805136532057077 + ], + [ + 20, + -0.006982525228522718 + ], + [ + 25, + 0.007745365088339895 + ], + [ + 30, + 0.0010499480413272977 + ], + [ + 35, + 0.002336127159651369 + ], + [ + 40, + 0.00398875743849203 + ], + [ + 45, + -0.005754569137934595 + ], + [ + 50, + -0.0032395682064816356 + ], + [ + 55, + -0.013786613941192627 + ], + [ + 60, + -0.0024626134036225267 + ], + [ + 65, + 0.0008561888244003057 + ], + [ + 70, + 0.01141710695810616 + ], + [ + 75, + 0.008856949862092733 + ], + [ + 80, + 0.012243610108271241 + ], + [ + 85, + 0.00931936502456665 + ], + [ + 90, + 0.008772111963480711 + ], + [ + 95, + -0.004374492971692234 + ], + [ + 100, + 0.002082181628793478 + ] + ], + "rho": [ + [ + 11, + 0.02106075780466199 + ], + [ + 12, + 0.006604651396628469 + ], + [ + 13, + 0.009807938942685723 + ], + [ + 14, + 0.02017845318187028 + ], + [ + 15, + -0.0014247590443119407 + ], + [ + 20, + 0.00818872411036864 + ], + [ + 25, + 0.007353978231549263 + ], + [ + 30, + -0.007289526052772999 + ], + [ + 35, + -0.028255917131900787 + ], + [ + 40, + -0.004728848347440362 + ], + [ + 45, + 0.014037816552445292 + ], + [ + 50, + -0.005819418700411916 + ], + [ + 55, + -0.0016381022869609296 + ], + [ + 60, + -0.007356879650615156 + ], + [ + 65, + 0.009376309579238296 + ], + [ + 70, + -0.016099544009193778 + ], + [ + 75, + -0.004943012027069926 + ], + [ + 80, + 0.007042828015983105 + ], + [ + 85, + -0.00042343116365373135 + ], + [ + 90, + -0.016734275268390775 + ], + [ + 95, + -0.0006720859091728926 + ], + [ + 100, + 0.008259820868261158 + ] + ] + }, + "t0=10_handoff_blend_025": { + "t0": 10, + "branch": "handoff_blend_025", + "credit_mode": "0.25", + "vec_gamma_frozen": 0.0042067440517712384, + "vec_rho_frozen": 0.0038935517659410834, + "test_acc": [ + 0.2938, + 0.2897, + 0.3007, + 0.3175, + 0.3098, + 0.3088, + 0.3094, + 0.3167, + 0.301, + 0.3052, + 0.3195, + 0.3092, + 0.2997, + 0.3157, + 0.3054, + 0.3154, + 0.306, + 0.3143, + 0.3158, + 0.298, + 0.3069, + 0.2918, + 0.3074, + 0.312, + 0.3124, + 0.3162, + 0.3206, + 0.3123, + 0.3074, + 0.3144, + 0.3123, + 0.3122, + 0.3188, + 0.3175, + 0.3158, + 0.316, + 0.3144, + 0.304, + 0.3082, + 0.2964, + 0.293, + 0.3095, + 0.306, + 0.3053, + 0.3097, + 0.313, + 0.3042, + 0.3075, + 0.3138, + 0.3018, + 0.3122, + 0.3059, + 0.3097, + 0.3022, + 0.3156, + 0.3145, + 0.3089, + 0.3111, + 0.3064, + 0.3054, + 0.3068, + 0.313, + 0.3196, + 0.3176, + 0.3092, + 0.307, + 0.3158, + 0.314, + 0.3169, + 0.3126, + 0.3102, + 0.3125, + 0.3105, + 0.3132, + 0.3103, + 0.3091, + 0.3097, + 0.3132, + 0.3122, + 0.3099, + 0.3127, + 0.3114, + 0.3129, + 0.3123, + 0.3119, + 0.3119, + 0.3119, + 0.3122, + 0.3121, + 0.312 + ], + "train_loss": [ + 1.989478285598755, + 1.9868447759246826, + 1.9876150262832641, + 1.9858550075531005, + 1.9833146737289429, + 1.985652213973999, + 1.9831381234359742, + 1.9834452158355713, + 1.9825294380187988, + 1.9874132528305053, + 1.9871378646850586, + 1.9839914614105225, + 1.9840993252182006, + 1.9814335080718994, + 1.9815850207519532, + 1.9850090422821045, + 1.985265905380249, + 1.9841137189102174, + 1.9826534753417968, + 1.9812066304779052, + 1.9828772528076173, + 1.98269517578125, + 1.984909154586792, + 1.9837005503845215, + 1.9842012789535521, + 1.9811075918579102, + 1.9811774273300171, + 1.9820292532348633, + 1.9851325442504884, + 1.9831501845932007, + 1.9847520957946778, + 1.983698173866272, + 1.9826594636535644, + 1.9831600260925293, + 1.9819660359191895, + 1.9834444214630127, + 1.9822623685073852, + 1.9827716506576538, + 1.9826187271881104, + 1.9849012186050414, + 1.9839086280822753, + 1.9825999378967285, + 1.981730891571045, + 1.982155584754944, + 1.9843205583953858, + 1.9827571130752564, + 1.9833940881347656, + 1.9835176082992554, + 1.9838816494750977, + 1.9830150816345216, + 1.9806758447647095, + 1.981820216293335, + 1.9821692760849, + 1.9804246088027955, + 1.9804472206878663, + 1.982804430809021, + 1.9837173638534547, + 1.984720592956543, + 1.9828333145141601, + 1.9820240353775025, + 1.9822105483245849, + 1.9838723239135743, + 1.9806797274398804, + 1.9809212255859374, + 1.9826797536849976, + 1.9829638636779785, + 1.9802171006011964, + 1.9812134786605835, + 1.9817558652496339, + 1.9808594998550415, + 1.9826035800170898, + 1.9826281146621705, + 1.979410721435547, + 1.9823534533691407, + 1.9809793517303467, + 1.9805086376953125, + 1.9803655435562133, + 1.978996251182556, + 1.980624110069275, + 1.9790157104492188, + 1.9797257055664061, + 1.9816278476333617, + 1.980231456451416, + 1.9801238049316405, + 1.9815326901626586, + 1.9793833974456787, + 1.9792350862884522, + 1.9807127814483643, + 1.9803146588516236, + 1.9807132862854004 + ], + "gamma": [ + [ + 11, + 0.0843387390486896 + ], + [ + 12, + 0.08346948947291821 + ], + [ + 13, + 0.08525195316178724 + ], + [ + 14, + 0.08714305562898517 + ], + [ + 15, + 0.08630326110869646 + ], + [ + 20, + 0.08899839816149324 + ], + [ + 25, + 0.09083676844602451 + ], + [ + 30, + 0.08932982292026281 + ], + [ + 35, + 0.09085761086316779 + ], + [ + 40, + 0.09201906819362193 + ], + [ + 45, + 0.09160545861232094 + ], + [ + 50, + 0.0932986771222204 + ], + [ + 55, + 0.09416521346429363 + ], + [ + 60, + 0.09465667745098472 + ], + [ + 65, + 0.09539491019677371 + ], + [ + 70, + 0.09575836511794478 + ], + [ + 75, + 0.09669694234617054 + ], + [ + 80, + 0.09700643667019904 + ], + [ + 85, + 0.09706368180923164 + ], + [ + 90, + 0.09690045518800616 + ], + [ + 95, + 0.09702154714614153 + ], + [ + 100, + 0.0969982537208125 + ] + ], + "rho": [ + [ + 11, + 0.0063589331693947315 + ], + [ + 12, + 0.024797477293759584 + ], + [ + 13, + 0.018316544490517117 + ], + [ + 14, + -0.0036471225321292877 + ], + [ + 15, + 0.004702381091192365 + ], + [ + 20, + -0.018541559227742255 + ], + [ + 25, + 0.0007382262265309691 + ], + [ + 30, + 0.014796937932260334 + ], + [ + 35, + 0.018859683419577777 + ], + [ + 40, + 0.004127278691157699 + ], + [ + 45, + 0.004332367796450853 + ], + [ + 50, + 0.005462064524181187 + ], + [ + 55, + 0.0007683481089770794 + ], + [ + 60, + 0.007523805135861039 + ], + [ + 65, + 0.0036167651414871216 + ], + [ + 70, + -0.0057612257078289986 + ], + [ + 75, + 0.005442411871626973 + ], + [ + 80, + -0.008708719164133072 + ], + [ + 85, + 0.0015424963785335422 + ], + [ + 90, + -0.0008635269477963448 + ], + [ + 95, + -0.007743132300674915 + ], + [ + 100, + -0.012928523123264313 + ] + ] + }, + "t0=10_handoff_blend_05": { + "t0": 10, + "branch": "handoff_blend_05", + "credit_mode": "0.5", + "vec_gamma_frozen": 0.0042067440517712384, + "vec_rho_frozen": 0.0038935517659410834, + "test_acc": [ + 0.3107, + 0.3069, + 0.3178, + 0.3074, + 0.3105, + 0.3078, + 0.3055, + 0.3022, + 0.3127, + 0.3075, + 0.3179, + 0.3154, + 0.3124, + 0.3118, + 0.3171, + 0.2973, + 0.3058, + 0.309, + 0.3099, + 0.3205, + 0.3011, + 0.3109, + 0.3115, + 0.3081, + 0.3109, + 0.316, + 0.3075, + 0.3189, + 0.3147, + 0.3134, + 0.3188, + 0.3134, + 0.3206, + 0.3121, + 0.3206, + 0.316, + 0.3051, + 0.3085, + 0.3201, + 0.3113, + 0.3185, + 0.3194, + 0.3163, + 0.3126, + 0.315, + 0.3141, + 0.3087, + 0.3112, + 0.2993, + 0.3225, + 0.3196, + 0.3178, + 0.3152, + 0.3216, + 0.3141, + 0.316, + 0.3198, + 0.3185, + 0.3181, + 0.3108, + 0.316, + 0.3187, + 0.3096, + 0.3168, + 0.3211, + 0.317, + 0.3191, + 0.3149, + 0.3131, + 0.3104, + 0.3101, + 0.3199, + 0.3171, + 0.3174, + 0.3165, + 0.3183, + 0.3156, + 0.3146, + 0.3177, + 0.3168, + 0.3146, + 0.3177, + 0.3188, + 0.318, + 0.3179, + 0.3186, + 0.3178, + 0.3177, + 0.3178, + 0.3177 + ], + "train_loss": [ + 1.988869067993164, + 1.9845831605529785, + 1.9853724942016602, + 1.9788412484741211, + 1.9795959680938722, + 1.978823126296997, + 1.9802506366348267, + 1.9784362533187867, + 1.9762019078063964, + 1.9746749285888672, + 1.9741735333251953, + 1.9746440016937257, + 1.975217692489624, + 1.976247932434082, + 1.9756203607940674, + 1.9737033957290648, + 1.9758937371444703, + 1.9722264950180053, + 1.9748607511138916, + 1.9720990928649902, + 1.977367167892456, + 1.9720380249023437, + 1.9738850479125976, + 1.9752985586166383, + 1.9738832075500488, + 1.9757071376037598, + 1.9718886584472657, + 1.9740739653015136, + 1.9749583083343505, + 1.973467418899536, + 1.973932978515625, + 1.973497041091919, + 1.9737253588867187, + 1.971032596511841, + 1.9755067537689208, + 1.9737163492584229, + 1.9727142861938476, + 1.9743528587341308, + 1.9701210864639283, + 1.9694558350372315, + 1.9700019970703124, + 1.970854245376587, + 1.971451057434082, + 1.9691312657165527, + 1.9712557052612305, + 1.9721587106323242, + 1.9694245384979248, + 1.9688617358398437, + 1.971903282699585, + 1.97263688911438, + 1.9709516286849975, + 1.9710711121368407, + 1.968572710494995, + 1.969881056137085, + 1.9684886044311523, + 1.9685047689819335, + 1.9687362952041625, + 1.9716000007629395, + 1.9706510061645508, + 1.9688725923156738, + 1.9700345636749268, + 1.970209267539978, + 1.9703309046936035, + 1.9708261836242675, + 1.9692469010162355, + 1.9700154656600952, + 1.9684070959472657, + 1.9679225051116944, + 1.969794107093811, + 1.967144956588745, + 1.9679356328582764, + 1.9668708432006836, + 1.9686791171646119, + 1.9661260284423827, + 1.9700672862243653, + 1.9676780422973632, + 1.9701103863906861, + 1.969267603225708, + 1.968710355758667, + 1.9687487289428711, + 1.966826369781494, + 1.967273148727417, + 1.9668864069366454, + 1.967294078063965, + 1.9671314589691162, + 1.9698059977722169, + 1.9670280086517333, + 1.9667310697174072, + 1.9649179275894164, + 1.9662872632598878 + ], + "gamma": [ + [ + 11, + 0.005040839430876076 + ], + [ + 12, + 0.006231138599105179 + ], + [ + 13, + -0.0030368249281309545 + ], + [ + 14, + 0.0067162682535126805 + ], + [ + 15, + 0.002636920806253329 + ], + [ + 20, + 0.005144889175426215 + ], + [ + 25, + 0.006085717934183776 + ], + [ + 30, + -0.0007032401044853032 + ], + [ + 35, + 0.002966892789117992 + ], + [ + 40, + -0.006012294325046241 + ], + [ + 45, + 0.007054211804643273 + ], + [ + 50, + 0.0023782282951287925 + ], + [ + 55, + 0.002206481178291142 + ], + [ + 60, + 0.0008678719314048067 + ], + [ + 65, + -0.0032794239814393222 + ], + [ + 70, + -0.0032538210580241866 + ], + [ + 75, + -0.0023977016971912235 + ], + [ + 80, + 0.005701849120669067 + ], + [ + 85, + -0.0027998359873890877 + ], + [ + 90, + -0.002594916499219835 + ], + [ + 95, + -0.00027929351199418306 + ], + [ + 100, + -0.003620500734541565 + ] + ], + "rho": [ + [ + 11, + -0.008984365151263773 + ], + [ + 12, + 0.016045914497226477 + ], + [ + 13, + 0.020033088629134 + ], + [ + 14, + -0.0027512782253324986 + ], + [ + 15, + -0.022611984983086586 + ], + [ + 20, + 0.004838105174712837 + ], + [ + 25, + 0.005988906603306532 + ], + [ + 30, + -0.003986725118011236 + ], + [ + 35, + 0.01905521471053362 + ], + [ + 40, + -0.005017005110858008 + ], + [ + 45, + 0.0032180151902139187 + ], + [ + 50, + 0.010202619945630431 + ], + [ + 55, + 0.00630239536985755 + ], + [ + 60, + -0.011329676839523017 + ], + [ + 65, + -0.012603579787537456 + ], + [ + 70, + -0.0014488683082163334 + ], + [ + 75, + -0.011644262121990323 + ], + [ + 80, + -0.0017293521668761969 + ], + [ + 85, + -0.006097985926317051 + ], + [ + 90, + 0.0025850951205939054 + ], + [ + 95, + -0.005077496636658907 + ], + [ + 100, + -0.0019108050037175417 + ] + ] + }, + "t0=10_handoff_blend_075": { + "t0": 10, + "branch": "handoff_blend_075", + "credit_mode": "0.75", + "vec_gamma_frozen": 0.0042067440517712384, + "vec_rho_frozen": 0.0038935517659410834, + "test_acc": [ + 0.3222, + 0.3223, + 0.3032, + 0.3142, + 0.3092, + 0.3019, + 0.3233, + 0.3144, + 0.3195, + 0.3171, + 0.3159, + 0.3172, + 0.3017, + 0.3117, + 0.3089, + 0.3174, + 0.3009, + 0.3269, + 0.3226, + 0.3177, + 0.3199, + 0.3052, + 0.3152, + 0.3104, + 0.3246, + 0.323, + 0.31, + 0.3223, + 0.3217, + 0.3177, + 0.3167, + 0.3179, + 0.3136, + 0.312, + 0.3174, + 0.3228, + 0.3192, + 0.3106, + 0.3276, + 0.3135, + 0.3179, + 0.3201, + 0.3267, + 0.3173, + 0.3255, + 0.317, + 0.3209, + 0.3196, + 0.3199, + 0.3262, + 0.3205, + 0.3224, + 0.3197, + 0.3241, + 0.3185, + 0.3228, + 0.3252, + 0.3166, + 0.3175, + 0.3222, + 0.3195, + 0.3171, + 0.3151, + 0.3221, + 0.3235, + 0.3242, + 0.3233, + 0.3276, + 0.3243, + 0.3198, + 0.323, + 0.3246, + 0.3273, + 0.3254, + 0.321, + 0.324, + 0.3248, + 0.3226, + 0.3245, + 0.3254, + 0.3248, + 0.3255, + 0.3244, + 0.3236, + 0.3242, + 0.3244, + 0.3242, + 0.3247, + 0.3246, + 0.3245 + ], + "train_loss": [ + 1.9853151974868775, + 1.9779540844726562, + 1.976351653060913, + 1.9757407247543335, + 1.9750776460266113, + 1.971900207862854, + 1.9714685012435913, + 1.968988427581787, + 1.9705463257598876, + 1.9726191318511963, + 1.9720882730102538, + 1.9695369549942017, + 1.969402609024048, + 1.9666985021209717, + 1.966377460784912, + 1.9654915356445313, + 1.9680337253189086, + 1.9667737590789796, + 1.9653948320770265, + 1.9655801219177247, + 1.9665559098052978, + 1.965029079322815, + 1.9641189581298828, + 1.9654726974487304, + 1.9643710608291627, + 1.9620441046905517, + 1.9647027013397216, + 1.964224019317627, + 1.9637281811904908, + 1.9642600621795654, + 1.962255348968506, + 1.965959539489746, + 1.9661672568511963, + 1.964241234817505, + 1.9639819019317626, + 1.963460948448181, + 1.961119805870056, + 1.9617840161132813, + 1.9627312831878663, + 1.9620910082244873, + 1.9600660537338257, + 1.9605730410766602, + 1.9604247958755494, + 1.960695573348999, + 1.9619682940673828, + 1.960375007247925, + 1.9624817748641967, + 1.9609252223205567, + 1.9611583375549317, + 1.9605066580963135, + 1.9610357287216187, + 1.9620044408416748, + 1.9608555350494385, + 1.9589478369903564, + 1.9598016510009766, + 1.9613045867156982, + 1.9589987204360961, + 1.9592427587509156, + 1.9570969534301759, + 1.9574322660064698, + 1.9600443893432618, + 1.9599411028289795, + 1.9616032498931886, + 1.9596367269134523, + 1.9583338011169433, + 1.959767865638733, + 1.9593639748382568, + 1.9587717581176758, + 1.960190855102539, + 1.9604558444595337, + 1.9605646094512938, + 1.9579826686096191, + 1.958512364501953, + 1.9592011234283446, + 1.95956085231781, + 1.956600224647522, + 1.9561384924316407, + 1.9609758742904664, + 1.959275781288147, + 1.9571418167114258, + 1.9607560622406006, + 1.9598481244659425, + 1.9565918572998047, + 1.9561568305206298, + 1.9588905561828613, + 1.958674913368225, + 1.9579413537979127, + 1.958909477081299, + 1.9573396010589599, + 1.9593311087417602 + ], + "gamma": [ + [ + 11, + 0.014960728585720062 + ], + [ + 12, + 0.009227815549820662 + ], + [ + 13, + 0.0007640749681740999 + ], + [ + 14, + -0.004959427751600742 + ], + [ + 15, + 0.006078387959860265 + ], + [ + 20, + 0.005380313203204423 + ], + [ + 25, + 0.0031420112936757505 + ], + [ + 30, + 0.003277134121162817 + ], + [ + 35, + 0.0022802076127845794 + ], + [ + 40, + 0.0024955139379017055 + ], + [ + 45, + -0.0029354651924222708 + ], + [ + 50, + -0.0011411391897127032 + ], + [ + 55, + -0.004323135945014656 + ], + [ + 60, + -0.008762454148381948 + ], + [ + 65, + -0.0003843858721666038 + ], + [ + 70, + -0.003346499928738922 + ], + [ + 75, + 0.001878025766927749 + ], + [ + 80, + -0.0057985419407486916 + ], + [ + 85, + -0.0015874637756496668 + ], + [ + 90, + 0.002085449988953769 + ], + [ + 95, + -0.00530237628845498 + ], + [ + 100, + 0.010076196165755391 + ] + ], + "rho": [ + [ + 11, + 0.010401577688753605 + ], + [ + 12, + 0.0012026397744193673 + ], + [ + 13, + 0.002180876152124256 + ], + [ + 14, + 0.0010479262564331293 + ], + [ + 15, + -0.007734984726994298 + ], + [ + 20, + -0.011412379331886768 + ], + [ + 25, + 0.009992486098781228 + ], + [ + 30, + 0.009496938291704282 + ], + [ + 35, + 0.0015284090768545866 + ], + [ + 40, + -0.006484974641352892 + ], + [ + 45, + -0.002899596467614174 + ], + [ + 50, + -0.033241343684494495 + ], + [ + 55, + 0.0027693638112396 + ], + [ + 60, + -0.01847140514291823 + ], + [ + 65, + -0.0011339893680997193 + ], + [ + 70, + 0.019210411817766726 + ], + [ + 75, + 0.003856189548969269 + ], + [ + 80, + -0.009710555663332343 + ], + [ + 85, + 0.0024136375286616385 + ], + [ + 90, + 0.015115916496142745 + ], + [ + 95, + -0.0043041663011536 + ], + [ + 100, + -0.007703886600211263 + ] + ] + }, + "dfa_final_acc": 0.3102 +} \ No newline at end of file diff --git a/results/cifar100_protocol_validation.log b/results/cifar100_protocol_validation.log new file mode 100644 index 0000000..150e850 --- /dev/null +++ b/results/cifar100_protocol_validation.log @@ -0,0 +1,371 @@ +=== CIFAR-100 PROTOCOL VALIDATION === +Start: Wed Apr 29 09:24:37 PM CDT 2026 + +--- BP + FA + DFA on CIFAR-100 --- +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=3.9752, train=0.0983, test=0.1432 + [BP] Epoch 10: loss=3.0848, train=0.2424, test=0.2492 + [BP] Epoch 20: loss=2.8041, train=0.2935, test=0.2883 + [BP] Epoch 30: loss=2.6019, train=0.3352, test=0.3078 + [BP] Epoch 40: loss=2.4193, train=0.3727, test=0.3158 + [BP] Epoch 50: loss=2.2631, train=0.4053, test=0.3160 + [BP] Epoch 60: loss=2.1134, train=0.4371, test=0.3223 + [BP] Epoch 70: loss=1.9686, train=0.4729, test=0.3207 + [BP] Epoch 80: loss=1.8724, train=0.4941, test=0.3197 + [BP] Epoch 90: loss=1.8161, train=0.5069, test=0.3197 + [BP] Epoch 100: loss=1.7897, train=0.5126, test=0.3192 + Final test acc: 0.3192 + +--- DFA --- + [DFA] Epoch 1: loss=4.1736, train=0.0679, test=0.0775 + [DFA] Epoch 10: loss=4.0844, train=0.0798, test=0.0819 + [DFA] Epoch 20: loss=4.0627, train=0.0840, test=0.0759 + [DFA] Epoch 30: loss=4.0466, train=0.0876, test=0.0840 + [DFA] Epoch 40: loss=4.0357, train=0.0896, test=0.0862 + [DFA] Epoch 50: loss=4.0347, train=0.0909, test=0.0879 + [DFA] Epoch 60: loss=4.0298, train=0.0933, test=0.0879 + [DFA] Epoch 70: loss=4.0244, train=0.0958, test=0.0883 + [DFA] Epoch 80: loss=4.0232, train=0.0939, test=0.0871 + [DFA] Epoch 90: loss=4.0219, train=0.0962, test=0.0870 + [DFA] Epoch 100: loss=4.0244, train=0.0949, test=0.0875 + Final test acc: 0.0875 + +--- FA --- + [FA] Epoch 1: loss=4.1842, train=0.0639, test=0.0598 + [FA] Epoch 10: loss=3.9551, train=0.0978, test=0.0949 + [FA] Epoch 20: loss=3.8745, train=0.1103, test=0.1101 + [FA] Epoch 30: loss=3.8457, train=0.1160, test=0.1212 + [FA] Epoch 40: loss=3.7975, train=0.1235, test=0.1247 + [FA] Epoch 50: loss=3.7623, train=0.1290, test=0.1332 + [FA] Epoch 60: loss=3.7338, train=0.1341, test=0.1397 + [FA] Epoch 70: loss=3.7109, train=0.1404, test=0.1400 + [FA] Epoch 80: loss=3.6910, train=0.1426, test=0.1457 + [FA] Epoch 90: loss=3.6844, train=0.1436, test=0.1455 + [FA] Epoch 100: loss=3.6859, train=0.1440, test=0.1464 + Final test acc: 0.1464 + +============================================================ +Seed 123 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=3.9679, train=0.0986, test=0.1439 + [BP] Epoch 10: loss=3.0754, train=0.2440, test=0.2501 + [BP] Epoch 20: loss=2.8025, train=0.2938, test=0.2812 + [BP] Epoch 30: loss=2.5874, train=0.3376, test=0.3021 + [BP] Epoch 40: loss=2.4113, train=0.3699, test=0.3104 + [BP] Epoch 50: loss=2.2468, train=0.4084, test=0.3160 + [BP] Epoch 60: loss=2.1034, train=0.4373, test=0.3209 + [BP] Epoch 70: loss=1.9664, train=0.4711, test=0.3212 + [BP] Epoch 80: loss=1.8659, train=0.4913, test=0.3208 + [BP] Epoch 90: loss=1.8143, train=0.5098, test=0.3201 + [BP] Epoch 100: loss=1.7758, train=0.5158, test=0.3218 + Final test acc: 0.3218 + +--- DFA --- + [DFA] Epoch 1: loss=4.1790, train=0.0644, test=0.0808 + [DFA] Epoch 10: loss=4.1013, train=0.0738, test=0.0764 + [DFA] Epoch 20: loss=4.0720, train=0.0808, test=0.0803 + [DFA] Epoch 30: loss=4.0493, train=0.0865, test=0.0845 + [DFA] Epoch 40: loss=4.0403, train=0.0866, test=0.0855 + [DFA] Epoch 50: loss=4.0321, train=0.0897, test=0.0852 + [DFA] Epoch 60: loss=4.0243, train=0.0921, test=0.0856 + [DFA] Epoch 70: loss=4.0213, train=0.0924, test=0.0868 + [DFA] Epoch 80: loss=4.0207, train=0.0933, test=0.0867 + [DFA] Epoch 90: loss=4.0178, train=0.0948, test=0.0875 + [DFA] Epoch 100: loss=4.0181, train=0.0932, test=0.0872 + Final test acc: 0.0872 + +--- FA --- + [FA] Epoch 1: loss=4.1971, train=0.0632, test=0.0708 + [FA] Epoch 10: loss=4.0477, train=0.0854, test=0.0847 + [FA] Epoch 20: loss=3.9867, train=0.0968, test=0.0997 + [FA] Epoch 30: loss=3.9504, train=0.1036, test=0.1037 + [FA] Epoch 40: loss=3.9204, train=0.1070, test=0.1068 + [FA] Epoch 50: loss=3.8915, train=0.1107, test=0.1091 + [FA] Epoch 60: loss=3.8680, train=0.1147, test=0.1135 + [FA] Epoch 70: loss=3.8517, train=0.1166, test=0.1156 + [FA] Epoch 80: loss=3.8433, train=0.1188, test=0.1182 + [FA] Epoch 90: loss=3.8342, train=0.1202, test=0.1215 + [FA] Epoch 100: loss=3.8330, train=0.1228, test=0.1208 + Final test acc: 0.1208 + +============================================================ +Seed 456 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=3.9722, train=0.0978, test=0.1436 + [BP] Epoch 10: loss=3.0679, train=0.2433, test=0.2496 + [BP] Epoch 20: loss=2.7902, train=0.2983, test=0.2857 + [BP] Epoch 30: loss=2.5920, train=0.3374, test=0.3018 + [BP] Epoch 40: loss=2.4046, train=0.3747, test=0.3166 + [BP] Epoch 50: loss=2.2421, train=0.4090, test=0.3165 + [BP] Epoch 60: loss=2.0908, train=0.4420, test=0.3204 + [BP] Epoch 70: loss=1.9548, train=0.4750, test=0.3202 + [BP] Epoch 80: loss=1.8580, train=0.4973, test=0.3177 + [BP] Epoch 90: loss=1.8029, train=0.5128, test=0.3217 + [BP] Epoch 100: loss=1.7769, train=0.5179, test=0.3219 + Final test acc: 0.3219 + +--- DFA --- + [DFA] Epoch 1: loss=4.1619, train=0.0684, test=0.0832 + [DFA] Epoch 10: loss=4.0780, train=0.0790, test=0.0777 + [DFA] Epoch 20: loss=4.0602, train=0.0848, test=0.0813 + [DFA] Epoch 30: loss=4.0430, train=0.0885, test=0.0878 + [DFA] Epoch 40: loss=4.0391, train=0.0893, test=0.0872 + [DFA] Epoch 50: loss=4.0372, train=0.0914, test=0.0834 + [DFA] Epoch 60: loss=4.0358, train=0.0919, test=0.0884 + [DFA] Epoch 70: loss=4.0340, train=0.0928, test=0.0906 + [DFA] Epoch 80: loss=4.0334, train=0.0926, test=0.0879 + [DFA] Epoch 90: loss=4.0325, train=0.0935, test=0.0898 + [DFA] Epoch 100: loss=4.0329, train=0.0929, test=0.0894 + Final test acc: 0.0894 + +--- FA --- + [FA] Epoch 1: loss=4.2178, train=0.0611, test=0.0534 + [FA] Epoch 10: loss=3.9339, train=0.1008, test=0.0999 + [FA] Epoch 20: loss=3.8903, train=0.1079, test=0.1125 + [FA] Epoch 30: loss=3.8439, train=0.1169, test=0.1138 + [FA] Epoch 40: loss=3.8094, train=0.1220, test=0.1228 + [FA] Epoch 50: loss=3.7933, train=0.1252, test=0.1240 + [FA] Epoch 60: loss=3.7808, train=0.1273, test=0.1275 + [FA] Epoch 70: loss=3.7675, train=0.1281, test=0.1252 + [FA] Epoch 80: loss=3.7592, train=0.1312, test=0.1307 + [FA] Epoch 90: loss=3.7554, train=0.1333, test=0.1311 + [FA] Epoch 100: loss=3.7508, train=0.1319, test=0.1310 + Final test acc: 0.1310 + +All results saved to results/cifar100_protocol_validation/results_cifar100.json + +--- Frozen baseline on CIFAR-100 --- + Frozen baseline seed=42 (Wed Apr 29 10:19:56 PM CDT 2026) +Device: cuda:0, seed=42, epochs=100, dataset=cifar100 + +=== BP shallow (ResMLP num_blocks=0), seed=42 === + n_params: 812900 (812900 trainable) + [BP-shallow] ep 1: test_acc=0.1119 + [BP-shallow] ep 10: test_acc=0.1320 + [BP-shallow] ep 20: test_acc=0.1286 + [BP-shallow] ep 30: test_acc=0.1324 + [BP-shallow] ep 40: test_acc=0.1407 + [BP-shallow] ep 50: test_acc=0.1555 + [BP-shallow] ep 60: test_acc=0.1599 + [BP-shallow] ep 70: test_acc=0.1706 + [BP-shallow] ep 80: test_acc=0.1738 + [BP-shallow] ep 90: test_acc=0.1780 + [BP-shallow] ep 100: test_acc=0.1787 +FINAL BP-shallow: 0.1787 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=42 === + n_params: 1341284 (812900 trainable) + [BP-frozen] ep 1: test_acc=0.1109 + [BP-frozen] ep 10: test_acc=0.1313 + [BP-frozen] ep 20: test_acc=0.1252 + [BP-frozen] ep 30: test_acc=0.1271 + [BP-frozen] ep 40: test_acc=0.1338 + [BP-frozen] ep 50: test_acc=0.1557 + [BP-frozen] ep 60: test_acc=0.1613 + [BP-frozen] ep 70: test_acc=0.1713 + [BP-frozen] ep 80: test_acc=0.1751 + [BP-frozen] ep 90: test_acc=0.1764 + [BP-frozen] ep 100: test_acc=0.1770 +FINAL BP-frozen-blocks: 0.1770 + +=== DFA shallow (ResMLP num_blocks=0), seed=42 === + n_params: 812900 (812900 trainable) + [DFA-shallow] ep 1: test_acc=0.0914 + [DFA-shallow] ep 10: test_acc=0.1120 + [DFA-shallow] ep 20: test_acc=0.1130 + [DFA-shallow] ep 30: test_acc=0.1198 + [DFA-shallow] ep 40: test_acc=0.1170 + [DFA-shallow] ep 50: test_acc=0.1211 + [DFA-shallow] ep 60: test_acc=0.1248 + [DFA-shallow] ep 70: test_acc=0.1203 + [DFA-shallow] ep 80: test_acc=0.1248 + [DFA-shallow] ep 90: test_acc=0.1254 + [DFA-shallow] ep 100: test_acc=0.1255 +FINAL DFA-shallow: 0.1255 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=42 === + n_params: 1341284 (812900 trainable) + [DFA-frozen] ep 1: test_acc=0.0920 + [DFA-frozen] ep 10: test_acc=0.1004 + [DFA-frozen] ep 20: test_acc=0.1171 + [DFA-frozen] ep 30: test_acc=0.1141 + [DFA-frozen] ep 40: test_acc=0.1207 + [DFA-frozen] ep 50: test_acc=0.1208 + [DFA-frozen] ep 60: test_acc=0.1204 + [DFA-frozen] ep 70: test_acc=0.1235 + [DFA-frozen] ep 80: test_acc=0.1243 + [DFA-frozen] ep 90: test_acc=0.1262 + [DFA-frozen] ep 100: test_acc=0.1256 +FINAL DFA-frozen-blocks: 0.1256 + +=== ResMLP frozen/shallow baseline summary, seed=42 === + BP-shallow: 0.1787 + BP-frozen: 0.1770 + DFA-shallow: 0.1255 + DFA-frozen: 0.1256 + +Compare to trainable 4-block ResMLP (3-seed): BP=0.6147 100ep / 0.585 30ep, DFA=0.306 100ep / 0.301 30ep + +Interpretation: + If DFA-frozen ≈ DFA-trainable: blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) + Frozen baseline seed=123 (Wed Apr 29 10:59:17 PM CDT 2026) +Device: cuda:0, seed=123, epochs=100, dataset=cifar100 + +=== BP shallow (ResMLP num_blocks=0), seed=123 === + n_params: 812900 (812900 trainable) + [BP-shallow] ep 1: test_acc=0.1098 + [BP-shallow] ep 10: test_acc=0.1309 + [BP-shallow] ep 20: test_acc=0.1203 + [BP-shallow] ep 30: test_acc=0.1262 + [BP-shallow] ep 40: test_acc=0.1415 + [BP-shallow] ep 50: test_acc=0.1532 + [BP-shallow] ep 60: test_acc=0.1622 + [BP-shallow] ep 70: test_acc=0.1725 + [BP-shallow] ep 80: test_acc=0.1751 + [BP-shallow] ep 90: test_acc=0.1745 + [BP-shallow] ep 100: test_acc=0.1756 +FINAL BP-shallow: 0.1756 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=123 === + n_params: 1341284 (812900 trainable) + [BP-frozen] ep 1: test_acc=0.1100 + [BP-frozen] ep 10: test_acc=0.1328 + [BP-frozen] ep 20: test_acc=0.1256 + [BP-frozen] ep 30: test_acc=0.1333 + [BP-frozen] ep 40: test_acc=0.1411 + [BP-frozen] ep 50: test_acc=0.1596 + [BP-frozen] ep 60: test_acc=0.1638 + [BP-frozen] ep 70: test_acc=0.1720 + [BP-frozen] ep 80: test_acc=0.1737 + [BP-frozen] ep 90: test_acc=0.1769 + [BP-frozen] ep 100: test_acc=0.1777 +FINAL BP-frozen-blocks: 0.1777 + +=== DFA shallow (ResMLP num_blocks=0), seed=123 === + n_params: 812900 (812900 trainable) + [DFA-shallow] ep 1: test_acc=0.0928 + [DFA-shallow] ep 10: test_acc=0.1025 + [DFA-shallow] ep 20: test_acc=0.1146 + [DFA-shallow] ep 30: test_acc=0.1180 + [DFA-shallow] ep 40: test_acc=0.1239 + [DFA-shallow] ep 50: test_acc=0.1283 + [DFA-shallow] ep 60: test_acc=0.1204 + [DFA-shallow] ep 70: test_acc=0.1237 + [DFA-shallow] ep 80: test_acc=0.1261 + [DFA-shallow] ep 90: test_acc=0.1261 + [DFA-shallow] ep 100: test_acc=0.1269 +FINAL DFA-shallow: 0.1269 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=123 === + n_params: 1341284 (812900 trainable) + [DFA-frozen] ep 1: test_acc=0.0916 + [DFA-frozen] ep 10: test_acc=0.1060 + [DFA-frozen] ep 20: test_acc=0.1167 + [DFA-frozen] ep 30: test_acc=0.1125 + [DFA-frozen] ep 40: test_acc=0.1153 + [DFA-frozen] ep 50: test_acc=0.1237 + [DFA-frozen] ep 60: test_acc=0.1217 + [DFA-frozen] ep 70: test_acc=0.1254 + [DFA-frozen] ep 80: test_acc=0.1239 + [DFA-frozen] ep 90: test_acc=0.1254 + [DFA-frozen] ep 100: test_acc=0.1257 +FINAL DFA-frozen-blocks: 0.1257 + +=== ResMLP frozen/shallow baseline summary, seed=123 === + BP-shallow: 0.1756 + BP-frozen: 0.1777 + DFA-shallow: 0.1269 + DFA-frozen: 0.1257 + +Compare to trainable 4-block ResMLP (3-seed): BP=0.6147 100ep / 0.585 30ep, DFA=0.306 100ep / 0.301 30ep + +Interpretation: + If DFA-frozen ≈ DFA-trainable: blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) + Frozen baseline seed=456 (Wed Apr 29 11:38:34 PM CDT 2026) +Device: cuda:0, seed=456, epochs=100, dataset=cifar100 + +=== BP shallow (ResMLP num_blocks=0), seed=456 === + n_params: 812900 (812900 trainable) + [BP-shallow] ep 1: test_acc=0.1073 + [BP-shallow] ep 10: test_acc=0.1327 + [BP-shallow] ep 20: test_acc=0.1250 + [BP-shallow] ep 30: test_acc=0.1303 + [BP-shallow] ep 40: test_acc=0.1411 + [BP-shallow] ep 50: test_acc=0.1529 + [BP-shallow] ep 60: test_acc=0.1651 + [BP-shallow] ep 70: test_acc=0.1724 + [BP-shallow] ep 80: test_acc=0.1743 + [BP-shallow] ep 90: test_acc=0.1757 + [BP-shallow] ep 100: test_acc=0.1776 +FINAL BP-shallow: 0.1776 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=456 === + n_params: 1341284 (812900 trainable) + [BP-frozen] ep 1: test_acc=0.1073 + [BP-frozen] ep 10: test_acc=0.1326 + [BP-frozen] ep 20: test_acc=0.1226 + [BP-frozen] ep 30: test_acc=0.1276 + [BP-frozen] ep 40: test_acc=0.1495 + [BP-frozen] ep 50: test_acc=0.1535 + [BP-frozen] ep 60: test_acc=0.1645 + [BP-frozen] ep 70: test_acc=0.1685 + [BP-frozen] ep 80: test_acc=0.1773 + [BP-frozen] ep 90: test_acc=0.1777 + [BP-frozen] ep 100: test_acc=0.1794 +FINAL BP-frozen-blocks: 0.1794 + +=== DFA shallow (ResMLP num_blocks=0), seed=456 === + n_params: 812900 (812900 trainable) + [DFA-shallow] ep 1: test_acc=0.0913 + [DFA-shallow] ep 10: test_acc=0.1150 + [DFA-shallow] ep 20: test_acc=0.1153 + [DFA-shallow] ep 30: test_acc=0.1161 + [DFA-shallow] ep 40: test_acc=0.1140 + [DFA-shallow] ep 50: test_acc=0.1202 + [DFA-shallow] ep 60: test_acc=0.1229 + [DFA-shallow] ep 70: test_acc=0.1243 + [DFA-shallow] ep 80: test_acc=0.1240 + [DFA-shallow] ep 90: test_acc=0.1237 + [DFA-shallow] ep 100: test_acc=0.1235 +FINAL DFA-shallow: 0.1235 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=456 === + n_params: 1341284 (812900 trainable) + [DFA-frozen] ep 1: test_acc=0.0862 + [DFA-frozen] ep 10: test_acc=0.1059 + [DFA-frozen] ep 20: test_acc=0.1130 + [DFA-frozen] ep 30: test_acc=0.1200 + [DFA-frozen] ep 40: test_acc=0.1227 + [DFA-frozen] ep 50: test_acc=0.1177 + [DFA-frozen] ep 60: test_acc=0.1229 + [DFA-frozen] ep 70: test_acc=0.1232 + [DFA-frozen] ep 80: test_acc=0.1240 + [DFA-frozen] ep 90: test_acc=0.1237 + [DFA-frozen] ep 100: test_acc=0.1236 +FINAL DFA-frozen-blocks: 0.1236 + +=== ResMLP frozen/shallow baseline summary, seed=456 === + BP-shallow: 0.1776 + BP-frozen: 0.1794 + DFA-shallow: 0.1235 + DFA-frozen: 0.1236 + +Compare to trainable 4-block ResMLP (3-seed): BP=0.6147 100ep / 0.585 30ep, DFA=0.306 100ep / 0.301 30ep + +Interpretation: + If DFA-frozen ≈ DFA-trainable: blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) + +=== CIFAR-100 VALIDATION DONE (Thu Apr 30 12:17:41 AM CDT 2026) === diff --git a/results/cifar100_protocol_validation/results_cifar100.json b/results/cifar100_protocol_validation/results_cifar100.json new file mode 100644 index 0000000..c26cc59 --- /dev/null +++ b/results/cifar100_protocol_validation/results_cifar100.json @@ -0,0 +1,3467 @@ +{ + "42": { + "bp": { + "log": { + "train_loss": [ + 3.975249941253662, + 3.6423986249542235, + 3.4934494227600097, + 3.3944045304870607, + 3.3128096391296387, + 3.249527327423096, + 3.202136681060791, + 3.1545809954071045, + 3.118299830780029, + 3.08477955947876, + 3.05101420211792, + 3.014707311477661, + 2.9815688012695314, + 2.9542644719696045, + 2.917737830657959, + 2.8987481777954103, + 2.877259644317627, + 2.8476891691589357, + 2.826910527801514, + 2.8041292054748537, + 2.7817903074645995, + 2.7624645190429686, + 2.736394059448242, + 2.7153989936065672, + 2.6938070545959474, + 2.6722896592712404, + 2.656808620452881, + 2.6342206648254396, + 2.6130940935516356, + 2.601909016876221, + 2.5847591175842286, + 2.5616293630218507, + 2.540946982421875, + 2.528531006851196, + 2.508262563323975, + 2.494774736251831, + 2.471127844619751, + 2.455823439178467, + 2.443439641647339, + 2.419278503417969, + 2.409900106124878, + 2.3866433473205566, + 2.3731185454559327, + 2.348314314727783, + 2.336296524658203, + 2.3228698544311523, + 2.299138896865845, + 2.2919679093933105, + 2.271020979156494, + 2.263141948699951, + 2.242116179199219, + 2.2228171809387205, + 2.210650175628662, + 2.1947706311798094, + 2.1783614316558837, + 2.1615723634338377, + 2.152301993675232, + 2.139739892730713, + 2.11690347366333, + 2.1134400886535643, + 2.0890519944000245, + 2.076347621765137, + 2.067469055480957, + 2.0518165933990478, + 2.041287666015625, + 2.027727124786377, + 2.0111099968719484, + 1.9989793057250977, + 1.991382496948242, + 1.9685791171264648, + 1.966265661239624, + 1.9562527508544922, + 1.942470475769043, + 1.9250774355316163, + 1.9187585319137572, + 1.9093894129943847, + 1.9017769010162353, + 1.8909222549438476, + 1.8789906490707398, + 1.87238977394104, + 1.876755567703247, + 1.8579993398284913, + 1.8549057474517823, + 1.8437388555145264, + 1.83396729637146, + 1.8345417359161378, + 1.83224958152771, + 1.8185578295516969, + 1.8260858072280883, + 1.8161109666442872, + 1.8139908428573608, + 1.8139760601043702, + 1.8037351627349854, + 1.8002028354644775, + 1.8035412215423583, + 1.8000410940933227, + 1.7957222201156615, + 1.79567547290802, + 1.7953530138397218, + 1.7897127409744262 + ], + "train_acc": [ + 0.09828, + 0.14442, + 0.16788, + 0.18412, + 0.1995, + 0.21148, + 0.21652, + 0.2278, + 0.23422, + 0.24242, + 0.24772, + 0.25402, + 0.26126, + 0.2639, + 0.27258, + 0.27642, + 0.2808, + 0.28564, + 0.2893, + 0.29352, + 0.29922, + 0.3014, + 0.30794, + 0.31222, + 0.31722, + 0.322, + 0.32392, + 0.32726, + 0.33092, + 0.3352, + 0.33782, + 0.34382, + 0.34482, + 0.34966, + 0.3531, + 0.35308, + 0.36068, + 0.36312, + 0.36942, + 0.37268, + 0.3705, + 0.3762, + 0.38242, + 0.38778, + 0.38854, + 0.39198, + 0.3985, + 0.39664, + 0.4058, + 0.40534, + 0.40916, + 0.41304, + 0.41528, + 0.42002, + 0.42598, + 0.4278, + 0.42834, + 0.43244, + 0.43612, + 0.43712, + 0.4414, + 0.44592, + 0.44574, + 0.44904, + 0.4551, + 0.45958, + 0.46296, + 0.4616, + 0.46646, + 0.47288, + 0.4693, + 0.47354, + 0.47626, + 0.48042, + 0.4848, + 0.48688, + 0.4857, + 0.4874, + 0.49078, + 0.49406, + 0.49478, + 0.49768, + 0.49744, + 0.50144, + 0.50262, + 0.5014, + 0.50426, + 0.5064, + 0.5074, + 0.50692, + 0.50832, + 0.50964, + 0.5119, + 0.51018, + 0.5099, + 0.51064, + 0.51258, + 0.515, + 0.51522, + 0.5126 + ], + "test_acc": [ + 0.1432, + 0.181, + 0.1871, + 0.212, + 0.2185, + 0.2122, + 0.2368, + 0.2466, + 0.241, + 0.2492, + 0.2563, + 0.2629, + 0.2656, + 0.2695, + 0.2731, + 0.2753, + 0.2737, + 0.2823, + 0.2832, + 0.2883, + 0.2946, + 0.2915, + 0.2957, + 0.2922, + 0.2981, + 0.294, + 0.2961, + 0.301, + 0.3015, + 0.3078, + 0.3127, + 0.3097, + 0.308, + 0.3058, + 0.3138, + 0.3098, + 0.3114, + 0.3129, + 0.3126, + 0.3158, + 0.3146, + 0.3119, + 0.313, + 0.3137, + 0.3127, + 0.3167, + 0.3186, + 0.3181, + 0.3165, + 0.316, + 0.3222, + 0.3188, + 0.3228, + 0.3173, + 0.3178, + 0.3174, + 0.3217, + 0.3173, + 0.3196, + 0.3223, + 0.3181, + 0.3186, + 0.3196, + 0.3161, + 0.3202, + 0.314, + 0.3178, + 0.3172, + 0.3174, + 0.3207, + 0.3193, + 0.3214, + 0.3213, + 0.3175, + 0.3228, + 0.3207, + 0.3208, + 0.3213, + 0.3187, + 0.3197, + 0.3226, + 0.32, + 0.3205, + 0.3213, + 0.3217, + 0.3192, + 0.3203, + 0.3207, + 0.3209, + 0.3197, + 0.3207, + 0.3195, + 0.3192, + 0.3186, + 0.3178, + 0.3191, + 0.3189, + 0.3193, + 0.3189, + 0.3192 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.9980340600013733, + 0.9982945919036865, + 0.9984437227249146, + 0.9987074136734009 + ], + "nudging": { + "0.001": [ + -0.0022835906129330397, + -0.0023387258406728506, + -0.002373999450355768, + -0.002260879147797823 + ], + "0.003": [ + -0.006846790201961994, + -0.007012245710939169, + -0.007117925677448511, + -0.006779024377465248 + ], + "0.01": [ + -0.022776642814278603, + -0.02332628145813942, + -0.023679494857788086, + -0.02255532145500183 + ] + }, + "hidden_norms_per_layer": [ + 236.57855224609375, + 217.48927307128906, + 197.1617889404297, + 187.24839782714844, + 191.277587890625 + ], + "bp_grad_norms_per_layer": [ + 0.0010384325869381428, + 0.0010872395941987634, + 0.0011213896796107292, + 0.001103188842535019, + 0.0009315301431342959 + ] + }, + "drift": { + "embed.weight": 7.433656905137662, + "embed.bias": 13.602162006682997, + "blocks.0.ln.weight": 0.14788760244846344, + "blocks.0.w1.weight": 3.605816897627063, + "blocks.0.w1.bias": 5.290238058535016, + "blocks.0.w2.weight": 13.310045077395138, + "blocks.1.ln.weight": 0.2914122939109802, + "blocks.1.w1.weight": 3.997572101972956, + "blocks.1.w1.bias": 4.732854205627193, + "blocks.1.w2.weight": 14.921397012401421, + "blocks.2.ln.weight": 0.35930144786834717, + "blocks.2.w1.weight": 4.149029664687284, + "blocks.2.w1.bias": 3.8845074849434162, + "blocks.2.w2.weight": 16.00171210299565, + "blocks.3.ln.weight": 0.5467617511749268, + "blocks.3.w1.weight": 4.475958556672767, + "blocks.3.w1.bias": 3.7954587976923664, + "blocks.3.w2.weight": 17.52879838948756, + "out_ln.weight": 0.1443399339914322, + "out_head.weight": 2.871805586504566, + "out_head.bias": 3.1293217686796893 + } + }, + "dfa": { + "log": { + "train_loss": [ + 4.17356710144043, + 4.045213865203857, + 4.0394830491638185, + 4.052726871032715, + 4.062585520324707, + 4.077131650848389, + 4.081288940353393, + 4.082902023620606, + 4.082292946929932, + 4.084377682189942, + 4.082009593811035, + 4.078371176147461, + 4.0787283967590335, + 4.0781014080810545, + 4.071053223266602, + 4.073739369049072, + 4.070565816497803, + 4.068224396362305, + 4.064294567718506, + 4.062663984680176, + 4.060789375686645, + 4.060499965057373, + 4.05942348953247, + 4.05340063583374, + 4.054450568389893, + 4.051036394500732, + 4.052292782592773, + 4.04923277923584, + 4.047891028900146, + 4.046583199005127, + 4.046011067352295, + 4.0444303074646, + 4.045907030334472, + 4.044839619445801, + 4.03859343673706, + 4.043664588165283, + 4.0400294355773925, + 4.035496199493408, + 4.038207025909424, + 4.035675854187012, + 4.037980937347412, + 4.038932502746582, + 4.036024468383789, + 4.037031109313965, + 4.034120268630981, + 4.036895367584228, + 4.037431150054932, + 4.033238902282715, + 4.036427326049805, + 4.03467604888916, + 4.03339782157898, + 4.0328554144287105, + 4.031013775024414, + 4.031612381286621, + 4.0287201686096195, + 4.031132036132813, + 4.029230642242432, + 4.029863064575196, + 4.03147859588623, + 4.029825403366089, + 4.030359633789063, + 4.028107041168213, + 4.02976943069458, + 4.029035094909668, + 4.028509668731689, + 4.0304917379760745, + 4.030941032562255, + 4.026340734710693, + 4.027734536590576, + 4.024428620147705, + 4.025526253967286, + 4.025494504394532, + 4.026692573547363, + 4.0229616456604, + 4.026408356018067, + 4.024612335662842, + 4.023342019500732, + 4.024318858337402, + 4.023249450683593, + 4.023151823806763, + 4.026289680709839, + 4.023877305831909, + 4.023189326248169, + 4.022549798278809, + 4.024784528045655, + 4.022774189758301, + 4.024208254547119, + 4.023730496368408, + 4.02367640625, + 4.021903743209839, + 4.02390080947876, + 4.022859935150146, + 4.023393632354736, + 4.021766328201294, + 4.02325630645752, + 4.023518178710938, + 4.021166778717041, + 4.023976897583008, + 4.023609465179443, + 4.024444749069214 + ], + "train_acc": [ + 0.06788, + 0.08332, + 0.08406, + 0.0818, + 0.08046, + 0.08148, + 0.07862, + 0.07956, + 0.08038, + 0.07976, + 0.08042, + 0.0808, + 0.08058, + 0.08086, + 0.08006, + 0.08136, + 0.08244, + 0.08388, + 0.08354, + 0.084, + 0.08448, + 0.08518, + 0.08594, + 0.08624, + 0.08568, + 0.08764, + 0.08492, + 0.08604, + 0.08814, + 0.0876, + 0.08836, + 0.08956, + 0.08702, + 0.08854, + 0.08976, + 0.08954, + 0.0895, + 0.09006, + 0.0894, + 0.08964, + 0.09064, + 0.09034, + 0.09288, + 0.0913, + 0.0914, + 0.09116, + 0.09094, + 0.09192, + 0.09044, + 0.0909, + 0.09252, + 0.09214, + 0.09332, + 0.0931, + 0.09364, + 0.09176, + 0.09246, + 0.09302, + 0.09276, + 0.09334, + 0.09404, + 0.0942, + 0.09392, + 0.09358, + 0.09336, + 0.09392, + 0.09252, + 0.0949, + 0.09444, + 0.0958, + 0.09542, + 0.0949, + 0.0954, + 0.09438, + 0.09338, + 0.0958, + 0.09376, + 0.0959, + 0.09448, + 0.09388, + 0.09458, + 0.09422, + 0.09542, + 0.09522, + 0.09468, + 0.0951, + 0.09564, + 0.09586, + 0.09536, + 0.09624, + 0.09588, + 0.09594, + 0.09642, + 0.09588, + 0.09496, + 0.09496, + 0.096, + 0.09454, + 0.09542, + 0.09488 + ], + "test_acc": [ + 0.0775, + 0.0794, + 0.0808, + 0.0828, + 0.0742, + 0.0795, + 0.0788, + 0.0855, + 0.0809, + 0.0819, + 0.0767, + 0.0826, + 0.0854, + 0.0752, + 0.0798, + 0.0796, + 0.0813, + 0.0771, + 0.0823, + 0.0759, + 0.0814, + 0.0772, + 0.0826, + 0.079, + 0.0803, + 0.0815, + 0.0818, + 0.0819, + 0.0818, + 0.084, + 0.0853, + 0.0855, + 0.0875, + 0.0818, + 0.0861, + 0.0827, + 0.0847, + 0.0825, + 0.0853, + 0.0862, + 0.0841, + 0.0857, + 0.0852, + 0.0852, + 0.0827, + 0.0863, + 0.0878, + 0.0858, + 0.0857, + 0.0879, + 0.0888, + 0.088, + 0.0878, + 0.0871, + 0.0878, + 0.0845, + 0.0863, + 0.0852, + 0.0872, + 0.0879, + 0.086, + 0.0878, + 0.0851, + 0.0863, + 0.0877, + 0.0861, + 0.0889, + 0.0839, + 0.0893, + 0.0883, + 0.0867, + 0.0855, + 0.0878, + 0.086, + 0.0876, + 0.0882, + 0.0895, + 0.0877, + 0.0876, + 0.0871, + 0.088, + 0.0876, + 0.088, + 0.0885, + 0.0879, + 0.0888, + 0.0882, + 0.0876, + 0.0882, + 0.087, + 0.0873, + 0.0877, + 0.0876, + 0.0882, + 0.0878, + 0.0876, + 0.0877, + 0.0876, + 0.0875, + 0.0875 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.14061881601810455, + 0.0022556069307029247, + -0.009000124409794807, + -0.013949227519333363 + ], + "perturbation_rho": [ + 0.04333949834108353, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -5.513429641723633e-07, + 0.0, + 0.0, + -3.725290298461914e-09 + ], + "0.003": [ + -1.7480924725532532e-06, + -1.4901161193847656e-08, + 0.0, + -1.862645149230957e-09 + ], + "0.01": [ + -5.760230123996735e-06, + 2.3283064365386963e-08, + -1.862645149230957e-09, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 20187.3125, + 13252251.0, + 93144488.0, + 163952208.0, + 202900624.0 + ], + "bp_grad_norms_per_layer": [ + 1.3867399957234738e-06, + 9.786202070927175e-09, + 9.394233835280374e-09, + 9.39475075512064e-09, + 9.382485899323001e-09 + ] + }, + "drift": { + "embed.weight": 164.5243882671684, + "embed.bias": 86.31975598233767, + "blocks.0.ln.weight": 9.94965648651123, + "blocks.0.w1.weight": 116.60864500939675, + "blocks.0.w1.bias": 119.5896283256837, + "blocks.0.w2.weight": 139.89574047116318, + "blocks.1.ln.weight": 6.952559471130371, + "blocks.1.w1.weight": 171.01066211955538, + "blocks.1.w1.bias": 184.66872276388008, + "blocks.1.w2.weight": 113.70390206644275, + "blocks.2.ln.weight": 8.037435531616211, + "blocks.2.w1.weight": 204.0534914689403, + "blocks.2.w1.bias": 205.1741516813065, + "blocks.2.w2.weight": 112.9529550385935, + "blocks.3.ln.weight": 7.489717483520508, + "blocks.3.w1.weight": 199.12470243900225, + "blocks.3.w1.bias": 198.81992912624156, + "blocks.3.w2.weight": 104.7339169635497, + "out_ln.weight": 1.6446622610092163, + "out_head.weight": 8.633984180685534, + "out_head.bias": 0.8233496742420285 + } + }, + "fa": { + "log": { + "train_loss": [ + 4.184186522827148, + 4.179929753265381, + 4.089846964416504, + 4.048904882202148, + 4.019415323638916, + 4.003474291839599, + 3.9891197368621825, + 3.9800468362426757, + 3.9685846406555174, + 3.9551162309265138, + 3.942166231536865, + 3.9271056993865967, + 3.915979294891357, + 3.9063652964782714, + 3.8933532473754884, + 3.892304434890747, + 3.8851386541748045, + 3.880706764526367, + 3.8791183966064455, + 3.874532577972412, + 3.870268273162842, + 3.8705162049865725, + 3.8667305128479006, + 3.8626690478515626, + 3.8593408808898926, + 3.8570751000213623, + 3.858237083206177, + 3.8517847180938722, + 3.8476831745910642, + 3.8457262559509275, + 3.840909554901123, + 3.835939132537842, + 3.834127527542114, + 3.830621910324097, + 3.8192956964874267, + 3.8194126902770997, + 3.8129332183074953, + 3.803470793991089, + 3.8037892980194092, + 3.7975124457550047, + 3.7967339707946777, + 3.7944636122131348, + 3.786077890625, + 3.7846675917053223, + 3.7791504066467283, + 3.7762106622314455, + 3.777709127731323, + 3.7638775648498535, + 3.765332045440674, + 3.7623159846496583, + 3.761364775314331, + 3.7529254064178468, + 3.749479592971802, + 3.744997635345459, + 3.7406992932128906, + 3.74050118598938, + 3.740082041091919, + 3.7403511964416505, + 3.7391156189727783, + 3.7338412855529786, + 3.733470021286011, + 3.726227327346802, + 3.7261299742889404, + 3.722200173187256, + 3.7222453344726563, + 3.7236415620422365, + 3.720610160598755, + 3.71873546585083, + 3.7171892735290526, + 3.710947210006714, + 3.7083427098846435, + 3.7072678149414062, + 3.70656751663208, + 3.704509799041748, + 3.7028028456115725, + 3.7015775603485106, + 3.7001070789337156, + 3.6981460167694093, + 3.696165197067261, + 3.6909815367889403, + 3.6975155518341065, + 3.693085638427734, + 3.6924814643096924, + 3.6891826426696777, + 3.688821280517578, + 3.689004655685425, + 3.6925391107177736, + 3.6897733489990236, + 3.687680895843506, + 3.6844489430236815, + 3.688553215789795, + 3.6839564624023438, + 3.685328346557617, + 3.6844889741516114, + 3.682617470626831, + 3.685823777923584, + 3.6817508575439453, + 3.6835061328125, + 3.683719411773682, + 3.685913360671997 + ], + "train_acc": [ + 0.06392, + 0.06052, + 0.07254, + 0.0799, + 0.0863, + 0.08926, + 0.09172, + 0.09366, + 0.0967, + 0.09784, + 0.10026, + 0.10226, + 0.10344, + 0.10226, + 0.10548, + 0.10614, + 0.10576, + 0.1094, + 0.10852, + 0.11026, + 0.1109, + 0.1113, + 0.11464, + 0.11204, + 0.114, + 0.11382, + 0.11484, + 0.11308, + 0.11652, + 0.116, + 0.11544, + 0.11934, + 0.1164, + 0.11756, + 0.12118, + 0.12098, + 0.1208, + 0.1226, + 0.12196, + 0.12346, + 0.1241, + 0.12418, + 0.12376, + 0.12556, + 0.12682, + 0.12578, + 0.12646, + 0.12802, + 0.12834, + 0.12896, + 0.1285, + 0.13022, + 0.13064, + 0.13266, + 0.132, + 0.13304, + 0.13302, + 0.13274, + 0.13234, + 0.13406, + 0.1352, + 0.1352, + 0.13452, + 0.13546, + 0.1378, + 0.1353, + 0.13576, + 0.13548, + 0.13744, + 0.1404, + 0.13826, + 0.13848, + 0.14008, + 0.13914, + 0.13812, + 0.14022, + 0.14048, + 0.14066, + 0.14008, + 0.1426, + 0.1408, + 0.1407, + 0.1429, + 0.14204, + 0.14294, + 0.14272, + 0.14102, + 0.14226, + 0.14414, + 0.1436, + 0.14408, + 0.14312, + 0.1434, + 0.14338, + 0.14488, + 0.14448, + 0.14394, + 0.1426, + 0.14502, + 0.14398 + ], + "test_acc": [ + 0.0598, + 0.0694, + 0.069, + 0.0805, + 0.086, + 0.0911, + 0.0953, + 0.0986, + 0.0954, + 0.0949, + 0.0993, + 0.1051, + 0.1069, + 0.1004, + 0.1066, + 0.11, + 0.1087, + 0.1039, + 0.1151, + 0.1101, + 0.1136, + 0.1096, + 0.1118, + 0.1138, + 0.1155, + 0.1151, + 0.1171, + 0.1197, + 0.1188, + 0.1212, + 0.1182, + 0.1194, + 0.12, + 0.122, + 0.1259, + 0.1204, + 0.1205, + 0.1259, + 0.1231, + 0.1247, + 0.1263, + 0.1294, + 0.1233, + 0.1265, + 0.1299, + 0.1267, + 0.1297, + 0.1338, + 0.1276, + 0.1332, + 0.1337, + 0.1302, + 0.1399, + 0.1354, + 0.1322, + 0.1382, + 0.1372, + 0.1363, + 0.1369, + 0.1397, + 0.1357, + 0.1394, + 0.144, + 0.1395, + 0.1448, + 0.1373, + 0.1435, + 0.1417, + 0.1398, + 0.14, + 0.1409, + 0.1409, + 0.1408, + 0.141, + 0.145, + 0.1425, + 0.1425, + 0.1452, + 0.1449, + 0.1457, + 0.1432, + 0.1449, + 0.1446, + 0.1486, + 0.1429, + 0.1477, + 0.1458, + 0.146, + 0.1449, + 0.1455, + 0.1442, + 0.1453, + 0.1458, + 0.1462, + 0.1468, + 0.1456, + 0.1462, + 0.1464, + 0.1465, + 0.1464 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.032749101519584656, + -0.02806573174893856, + -0.13188865780830383, + 0.9981366395950317 + ], + "perturbation_rho": [ + 0.023128217086195946, + -0.033153705298900604, + -0.03114410489797592, + -0.04209538549184799 + ], + "nudging": { + "0.001": [ + -3.4319236874580383e-07, + 3.664754331111908e-07, + 2.3958273231983185e-07, + -1.4158431440591812e-06 + ], + "0.003": [ + -1.9101426005363464e-06, + 6.353948265314102e-07, + 1.5594996511936188e-06, + -8.973991498351097e-06 + ], + "0.01": [ + -6.851274520158768e-06, + 8.617062121629715e-07, + 6.175599992275238e-06, + -3.897189162671566e-05 + ] + }, + "hidden_norms_per_layer": [ + 10709.3916015625, + 183619.875, + 1852831.0, + 3034211.25, + 169794.0625 + ], + "bp_grad_norms_per_layer": [ + 1.2192158465040848e-05, + 2.159640871468582e-06, + 1.9386970961932093e-06, + 1.93888718058588e-06, + 1.940315996762365e-06 + ] + }, + "drift": { + "embed.weight": 97.51059845469358, + "embed.bias": 45.31500470139968, + "blocks.0.ln.weight": 2.126800775527954, + "blocks.0.w1.weight": 24.113425166766486, + "blocks.0.w1.bias": 25.534244327420822, + "blocks.0.w2.weight": 69.8748433766199, + "blocks.1.ln.weight": 1.5964641571044922, + "blocks.1.w1.weight": 35.519098992915914, + "blocks.1.w1.bias": 42.27561830539123, + "blocks.1.w2.weight": 61.05750225415427, + "blocks.2.ln.weight": 1.4540088176727295, + "blocks.2.w1.weight": 41.92037705190106, + "blocks.2.w1.bias": 47.8882125375433, + "blocks.2.w2.weight": 47.86373297818362, + "blocks.3.ln.weight": 1.6165372133255005, + "blocks.3.w1.weight": 47.10451321088829, + "blocks.3.w1.bias": 53.07025310766248, + "blocks.3.w2.weight": 48.00579573400754, + "out_ln.weight": 0.49529579281806946, + "out_head.weight": 4.173857948425521, + "out_head.bias": 3.4238911704789996 + } + } + }, + "123": { + "bp": { + "log": { + "train_loss": [ + 3.967920153274536, + 3.643245764923096, + 3.486677552947998, + 3.389170970993042, + 3.3176012518310545, + 3.2524516577148437, + 3.196259712524414, + 3.152468095245361, + 3.116606701889038, + 3.0753799269104003, + 3.0412558711242674, + 3.0103372289276122, + 2.9851040869140624, + 2.9536216430664064, + 2.919733713989258, + 2.8960993688964844, + 2.872693371734619, + 2.84370941696167, + 2.8186388218688965, + 2.802537234954834, + 2.775104519882202, + 2.752585594329834, + 2.7324084952545165, + 2.7153604712677004, + 2.6842776251220704, + 2.667392734527588, + 2.6493602058410644, + 2.6304399774932863, + 2.6058559870910645, + 2.5874294744110107, + 2.5774721023559573, + 2.560277436981201, + 2.5345041821289063, + 2.5185300437927247, + 2.5040577131652832, + 2.4822867348480226, + 2.4557650662994384, + 2.4456021406555175, + 2.4341802147674563, + 2.4113426206207276, + 2.401808072052002, + 2.3768489891052247, + 2.3607859144592287, + 2.3446667034912108, + 2.329873125, + 2.3144486641693116, + 2.297909416656494, + 2.2798938914489746, + 2.266936881713867, + 2.2467652272033694, + 2.2354507537841797, + 2.2205448300933837, + 2.2017585570526124, + 2.1915560935974123, + 2.1722356983947755, + 2.1580420698547362, + 2.138712609024048, + 2.1268783713531496, + 2.1147646588897704, + 2.1034324825286865, + 2.088131596069336, + 2.0740757128143312, + 2.049090367126465, + 2.0376090378570555, + 2.0276603718566895, + 2.0167199254989625, + 2.0046445736694336, + 1.9935844805145264, + 1.9779361727905274, + 1.9663786093521118, + 1.9583420275497436, + 1.94067984375, + 1.929230265197754, + 1.9221224881362915, + 1.912958982810974, + 1.9034557625579833, + 1.8937049017715455, + 1.8790358535003662, + 1.876692020301819, + 1.8658557400512696, + 1.8551803729629517, + 1.8528358583831788, + 1.8547788270568848, + 1.83579787399292, + 1.825839135055542, + 1.8247737094116212, + 1.8170814221191407, + 1.8188595218658448, + 1.815419641456604, + 1.8142681406402588, + 1.8094764706802369, + 1.7942750823593139, + 1.7980619449615478, + 1.7933076245498658, + 1.7883917538452148, + 1.7867490985870362, + 1.7903605484771727, + 1.79024905128479, + 1.7870432864379884, + 1.7758308526611328 + ], + "train_acc": [ + 0.0986, + 0.14448, + 0.17068, + 0.18832, + 0.20038, + 0.21186, + 0.22002, + 0.22894, + 0.23506, + 0.24404, + 0.24964, + 0.25374, + 0.25782, + 0.26606, + 0.2711, + 0.27704, + 0.28214, + 0.2849, + 0.29088, + 0.2938, + 0.29992, + 0.3054, + 0.3096, + 0.30988, + 0.3165, + 0.3225, + 0.32436, + 0.32574, + 0.33332, + 0.33762, + 0.33924, + 0.343, + 0.34878, + 0.3505, + 0.35344, + 0.35974, + 0.36384, + 0.36348, + 0.3704, + 0.36994, + 0.37362, + 0.38144, + 0.38266, + 0.3852, + 0.3905, + 0.3918, + 0.39726, + 0.40046, + 0.40264, + 0.40842, + 0.40998, + 0.41106, + 0.4151, + 0.4193, + 0.4234, + 0.42538, + 0.43214, + 0.43326, + 0.43584, + 0.4373, + 0.44392, + 0.4447, + 0.44954, + 0.45406, + 0.45662, + 0.45958, + 0.46094, + 0.46528, + 0.46588, + 0.47114, + 0.47258, + 0.47772, + 0.47956, + 0.48164, + 0.48602, + 0.48696, + 0.48908, + 0.49296, + 0.49344, + 0.49132, + 0.49576, + 0.49762, + 0.49882, + 0.49984, + 0.50594, + 0.5048, + 0.50622, + 0.50504, + 0.50664, + 0.50984, + 0.50942, + 0.5116, + 0.5117, + 0.51286, + 0.51336, + 0.51602, + 0.5143, + 0.51562, + 0.51416, + 0.51578 + ], + "test_acc": [ + 0.1439, + 0.1786, + 0.2007, + 0.208, + 0.2165, + 0.2315, + 0.2325, + 0.2385, + 0.2483, + 0.2501, + 0.254, + 0.2585, + 0.2634, + 0.2702, + 0.2749, + 0.2758, + 0.2809, + 0.2848, + 0.2814, + 0.2812, + 0.2857, + 0.2915, + 0.2921, + 0.2923, + 0.2939, + 0.295, + 0.302, + 0.2965, + 0.3039, + 0.3021, + 0.3035, + 0.3055, + 0.3095, + 0.3052, + 0.3129, + 0.3112, + 0.3097, + 0.308, + 0.3123, + 0.3104, + 0.3135, + 0.3145, + 0.3105, + 0.3173, + 0.3165, + 0.3154, + 0.315, + 0.3172, + 0.3154, + 0.316, + 0.3159, + 0.3184, + 0.316, + 0.3219, + 0.3177, + 0.3206, + 0.3164, + 0.3151, + 0.3233, + 0.3209, + 0.3224, + 0.3239, + 0.3212, + 0.318, + 0.3248, + 0.3255, + 0.324, + 0.3217, + 0.323, + 0.3212, + 0.323, + 0.3249, + 0.3196, + 0.3215, + 0.3217, + 0.3204, + 0.3211, + 0.3238, + 0.3237, + 0.3208, + 0.3243, + 0.3225, + 0.3216, + 0.3233, + 0.3208, + 0.3198, + 0.3185, + 0.319, + 0.3196, + 0.3201, + 0.3197, + 0.3214, + 0.3217, + 0.3219, + 0.3217, + 0.3221, + 0.3217, + 0.3217, + 0.3218, + 0.3218 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.9976038932800293, + 0.9983073472976685, + 0.9986611604690552, + 0.9987543821334839 + ], + "nudging": { + "0.001": [ + -0.002336513716727495, + -0.0024050232023000717, + -0.002418666612356901, + -0.0022877217270433903 + ], + "0.003": [ + -0.007005014922469854, + -0.007211083546280861, + -0.007251948118209839, + -0.006859402172267437 + ], + "0.01": [ + -0.023301422595977783, + -0.02398984506726265, + -0.024125652387738228, + -0.022821901366114616 + ] + }, + "hidden_norms_per_layer": [ + 228.35731506347656, + 216.70431518554688, + 197.1549835205078, + 189.50289916992188, + 193.0804901123047 + ], + "bp_grad_norms_per_layer": [ + 0.0011750052217394114, + 0.0012150296242907643, + 0.00123639649245888, + 0.0011825052788481116, + 0.0009545879438519478 + ] + }, + "drift": { + "embed.weight": 7.3996956607158415, + "embed.bias": 13.278713687472328, + "blocks.0.ln.weight": 0.15684440732002258, + "blocks.0.w1.weight": 3.6258136635529388, + "blocks.0.w1.bias": 5.57490288506498, + "blocks.0.w2.weight": 13.211600071846687, + "blocks.1.ln.weight": 0.26902759075164795, + "blocks.1.w1.weight": 3.9457858088997937, + "blocks.1.w1.bias": 4.8656985397285295, + "blocks.1.w2.weight": 14.784374975769294, + "blocks.2.ln.weight": 0.37451720237731934, + "blocks.2.w1.weight": 4.11706460399454, + "blocks.2.w1.bias": 4.146142198756796, + "blocks.2.w2.weight": 15.840220385160595, + "blocks.3.ln.weight": 0.5431011319160461, + "blocks.3.w1.weight": 4.464837126822249, + "blocks.3.w1.bias": 3.6144859875754407, + "blocks.3.w2.weight": 17.545783297025896, + "out_ln.weight": 0.14564843475818634, + "out_head.weight": 2.8817944671871123, + "out_head.bias": 3.056171448565604 + } + }, + "dfa": { + "log": { + "train_loss": [ + 4.179048243713379, + 4.067725786132812, + 4.071110060424805, + 4.091065592956543, + 4.10388401260376, + 4.1050505090332035, + 4.10725640045166, + 4.107924006652832, + 4.103042182159424, + 4.101259585266114, + 4.0994670211791995, + 4.092466098937988, + 4.091690199432373, + 4.088890562286377, + 4.083471063919068, + 4.082734613113403, + 4.079294251174927, + 4.074109273834228, + 4.072821339111328, + 4.072047854766845, + 4.068868335876465, + 4.064674437255859, + 4.064519798278808, + 4.062208421783447, + 4.059947501296997, + 4.0568214564514165, + 4.0578119854736325, + 4.05678455657959, + 4.054043687744141, + 4.04934491607666, + 4.049620868835449, + 4.048787186126709, + 4.041555746765137, + 4.046662612380981, + 4.043773061065674, + 4.0444277174377445, + 4.043180988922119, + 4.040115342483521, + 4.041283304138184, + 4.040324337005615, + 4.03773109161377, + 4.037001483154297, + 4.036031613235473, + 4.035188417053223, + 4.035520594024658, + 4.031777966766358, + 4.036043049621582, + 4.0324571522521975, + 4.032010763549804, + 4.032135240783691, + 4.028632532043457, + 4.028738806915284, + 4.029276781768798, + 4.030177063598633, + 4.027558575515747, + 4.0295089608764645, + 4.02790505935669, + 4.0268916735076905, + 4.025881996612549, + 4.024340693664551, + 4.024784558410644, + 4.022587103195191, + 4.023770975189209, + 4.024697297668457, + 4.023757594070434, + 4.025282996749878, + 4.020828542404175, + 4.02296846206665, + 4.021536037902832, + 4.021342518310547, + 4.023781976318359, + 4.020269456634521, + 4.019074986038208, + 4.020880366287232, + 4.02205199508667, + 4.019182727050781, + 4.019642067718506, + 4.019440497131348, + 4.018397001342773, + 4.020665705871582, + 4.020597035064697, + 4.019291881713867, + 4.019497079620361, + 4.018186092681884, + 4.018166368408203, + 4.017542911529541, + 4.018283336334228, + 4.015659646606445, + 4.0151326177978515, + 4.017795926361084, + 4.016853940124512, + 4.018234666442871, + 4.015345659790039, + 4.017251117095947, + 4.018545875244141, + 4.017435375213623, + 4.015963760681152, + 4.015863068695069, + 4.015675266418457, + 4.018068486938477 + ], + "train_acc": [ + 0.06442, + 0.07788, + 0.07748, + 0.07344, + 0.07334, + 0.0722, + 0.07326, + 0.07414, + 0.07376, + 0.07382, + 0.07452, + 0.07688, + 0.07534, + 0.07782, + 0.08016, + 0.07796, + 0.08084, + 0.0805, + 0.0801, + 0.08082, + 0.08118, + 0.08206, + 0.08406, + 0.08258, + 0.08372, + 0.08414, + 0.08464, + 0.08358, + 0.0859, + 0.08652, + 0.08582, + 0.08718, + 0.08834, + 0.08784, + 0.08652, + 0.08678, + 0.08714, + 0.08734, + 0.0885, + 0.08662, + 0.08978, + 0.08958, + 0.08816, + 0.08956, + 0.08942, + 0.09074, + 0.08972, + 0.08778, + 0.08952, + 0.08974, + 0.09166, + 0.08992, + 0.0922, + 0.09098, + 0.09182, + 0.092, + 0.09068, + 0.09088, + 0.09264, + 0.09206, + 0.09184, + 0.09252, + 0.09102, + 0.09206, + 0.09348, + 0.09252, + 0.09214, + 0.09232, + 0.09276, + 0.09236, + 0.0915, + 0.09298, + 0.09236, + 0.0928, + 0.09326, + 0.09264, + 0.09282, + 0.0924, + 0.0927, + 0.09328, + 0.09474, + 0.09338, + 0.09336, + 0.09342, + 0.09358, + 0.09408, + 0.09404, + 0.09384, + 0.09388, + 0.09484, + 0.09448, + 0.09396, + 0.09364, + 0.09346, + 0.09286, + 0.09446, + 0.0944, + 0.094, + 0.0935, + 0.09318 + ], + "test_acc": [ + 0.0808, + 0.0776, + 0.0759, + 0.0747, + 0.0703, + 0.0777, + 0.0773, + 0.0701, + 0.0792, + 0.0764, + 0.0753, + 0.0743, + 0.0772, + 0.0824, + 0.0807, + 0.081, + 0.0784, + 0.0813, + 0.0774, + 0.0803, + 0.0826, + 0.0865, + 0.0793, + 0.0798, + 0.0821, + 0.082, + 0.0822, + 0.0812, + 0.0812, + 0.0845, + 0.0808, + 0.087, + 0.0849, + 0.0823, + 0.0861, + 0.0851, + 0.0873, + 0.0833, + 0.0826, + 0.0855, + 0.0843, + 0.0861, + 0.0904, + 0.0866, + 0.0882, + 0.0861, + 0.0875, + 0.0871, + 0.0843, + 0.0852, + 0.0874, + 0.0892, + 0.0868, + 0.0887, + 0.0882, + 0.0874, + 0.0816, + 0.0865, + 0.0861, + 0.0856, + 0.0874, + 0.0869, + 0.0905, + 0.0844, + 0.0838, + 0.0898, + 0.0881, + 0.0865, + 0.0891, + 0.0868, + 0.0861, + 0.0874, + 0.0909, + 0.0889, + 0.0856, + 0.0875, + 0.088, + 0.0864, + 0.0889, + 0.0867, + 0.0852, + 0.0869, + 0.0879, + 0.0875, + 0.0872, + 0.0883, + 0.0897, + 0.0879, + 0.0875, + 0.0875, + 0.0868, + 0.087, + 0.0869, + 0.0868, + 0.0875, + 0.0873, + 0.0871, + 0.0872, + 0.0872, + 0.0872 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.14216047525405884, + -0.000992744229733944, + -0.008401205763220787, + -0.018219897523522377 + ], + "perturbation_rho": [ + 0.053201157599687576, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -6.109476089477539e-07, + 3.725290298461914e-09, + 0.0, + 0.0 + ], + "0.003": [ + -1.6260892152786255e-06, + 3.725290298461914e-09, + 3.725290298461914e-09, + 0.0 + ], + "0.01": [ + -5.261041224002838e-06, + -1.4901161193847656e-08, + 5.587935447692871e-09, + 5.587935447692871e-09 + ] + }, + "hidden_norms_per_layer": [ + 19441.8984375, + 14779116.0, + 143599776.0, + 226312160.0, + 280974592.0 + ], + "bp_grad_norms_per_layer": [ + 1.4361885405378416e-06, + 8.184267485944474e-09, + 7.640669430486469e-09, + 7.643201627161034e-09, + 7.633985887878225e-09 + ] + }, + "drift": { + "embed.weight": 162.24755066692174, + "embed.bias": 87.51431369480697, + "blocks.0.ln.weight": 10.42286205291748, + "blocks.0.w1.weight": 122.86975821758014, + "blocks.0.w1.bias": 127.51968896872295, + "blocks.0.w2.weight": 144.60590878787062, + "blocks.1.ln.weight": 7.615029811859131, + "blocks.1.w1.weight": 201.6705191292493, + "blocks.1.w1.bias": 211.79976689727667, + "blocks.1.w2.weight": 125.73570047362797, + "blocks.2.ln.weight": 8.678234100341797, + "blocks.2.w1.weight": 226.59101485856874, + "blocks.2.w1.bias": 218.5035230014578, + "blocks.2.w2.weight": 132.07798132121874, + "blocks.3.ln.weight": 8.401058197021484, + "blocks.3.w1.weight": 221.76508002622688, + "blocks.3.w1.bias": 204.23780375800553, + "blocks.3.w2.weight": 123.66583688447245, + "out_ln.weight": 1.673746943473816, + "out_head.weight": 9.550233758399107, + "out_head.bias": 0.9096587370527971 + } + }, + "fa": { + "log": { + "train_loss": [ + 4.1970798970031735, + 4.170009743804932, + 4.130948940124512, + 4.094561860961914, + 4.050638759155273, + 4.024049156494141, + 4.013653193511963, + 4.014947728729248, + 4.032731681671143, + 4.047689598388672, + 4.044174816589355, + 4.0340768909454345, + 4.026809699783326, + 4.0191610552215575, + 4.009859062652588, + 4.004589066696167, + 4.000014752273559, + 3.9934563516235353, + 3.989729327392578, + 3.9867174030303953, + 3.980116393737793, + 3.979052162322998, + 3.976570917816162, + 3.972892049102783, + 3.9706854679870607, + 3.964727850341797, + 3.9669337309265136, + 3.962656950378418, + 3.959514749221802, + 3.950425816116333, + 3.9518183033752443, + 3.944525026168823, + 3.9370513851928712, + 3.9401658685302734, + 3.9340728694152833, + 3.933683126220703, + 3.929854642791748, + 3.9251790898132324, + 3.925471938934326, + 3.920428736419678, + 3.9194086865997315, + 3.916180799026489, + 3.910477230758667, + 3.9091271575164797, + 3.9079003392791747, + 3.9009140887451172, + 3.903854856109619, + 3.896608190765381, + 3.8983821444702147, + 3.8914879888153076, + 3.8876359399414064, + 3.8866743579101564, + 3.886013005371094, + 3.8823793061065675, + 3.8820696644592285, + 3.8807897300720215, + 3.8792161915588377, + 3.873366918258667, + 3.872225737609863, + 3.867956961669922, + 3.8688921507263183, + 3.864798822555542, + 3.8635835083770753, + 3.8616594306182863, + 3.86274955078125, + 3.8615631605529783, + 3.855813476715088, + 3.8575434510040285, + 3.8537498898315428, + 3.8516512804412844, + 3.853169044036865, + 3.848847638626099, + 3.8501204053497315, + 3.8475019567871094, + 3.8478130152130126, + 3.841899245147705, + 3.8445189476776123, + 3.8427941259002685, + 3.841190276489258, + 3.8432645402526857, + 3.840385712738037, + 3.841228730545044, + 3.8406887775421144, + 3.838410483932495, + 3.8366693685913087, + 3.8328694233703615, + 3.8348467766571046, + 3.8281507495880125, + 3.8312854344177247, + 3.8341920923614503, + 3.832209959793091, + 3.832971982574463, + 3.827496012649536, + 3.832459149017334, + 3.8320746698760986, + 3.833449503631592, + 3.8311014671325685, + 3.828391033859253, + 3.8309260621643064, + 3.832998709869385 + ], + "train_acc": [ + 0.06318, + 0.06262, + 0.06896, + 0.07402, + 0.08474, + 0.0894, + 0.09134, + 0.0919, + 0.08782, + 0.08538, + 0.08668, + 0.0868, + 0.08842, + 0.0918, + 0.09218, + 0.09394, + 0.09588, + 0.09596, + 0.09472, + 0.09676, + 0.09782, + 0.09964, + 0.10034, + 0.09964, + 0.09956, + 0.10158, + 0.10016, + 0.10198, + 0.10194, + 0.1036, + 0.10318, + 0.10394, + 0.1047, + 0.1039, + 0.10536, + 0.10528, + 0.10612, + 0.10692, + 0.10644, + 0.10704, + 0.10844, + 0.1082, + 0.10744, + 0.10862, + 0.10826, + 0.11176, + 0.10998, + 0.10964, + 0.11052, + 0.1107, + 0.11298, + 0.11352, + 0.11398, + 0.11322, + 0.11342, + 0.11344, + 0.11324, + 0.11226, + 0.11314, + 0.11472, + 0.11338, + 0.11524, + 0.11458, + 0.11598, + 0.11536, + 0.11664, + 0.11622, + 0.11714, + 0.1169, + 0.11656, + 0.11594, + 0.11838, + 0.1178, + 0.11898, + 0.1183, + 0.11852, + 0.11904, + 0.11914, + 0.1193, + 0.11876, + 0.11858, + 0.12086, + 0.11934, + 0.11944, + 0.12044, + 0.1214, + 0.12184, + 0.12008, + 0.12106, + 0.12018, + 0.12146, + 0.12004, + 0.12064, + 0.11986, + 0.12106, + 0.12248, + 0.12166, + 0.12014, + 0.12266, + 0.12278 + ], + "test_acc": [ + 0.0708, + 0.0659, + 0.0746, + 0.0752, + 0.0902, + 0.0946, + 0.0937, + 0.0824, + 0.0936, + 0.0847, + 0.095, + 0.084, + 0.0884, + 0.0959, + 0.0927, + 0.0944, + 0.101, + 0.0972, + 0.098, + 0.0997, + 0.095, + 0.1032, + 0.0977, + 0.0949, + 0.1003, + 0.1004, + 0.0969, + 0.101, + 0.1019, + 0.1037, + 0.0979, + 0.103, + 0.1047, + 0.1026, + 0.1092, + 0.1071, + 0.1062, + 0.1024, + 0.1051, + 0.1068, + 0.1088, + 0.105, + 0.108, + 0.1068, + 0.1092, + 0.1112, + 0.1096, + 0.1084, + 0.108, + 0.1091, + 0.1102, + 0.1141, + 0.1109, + 0.1138, + 0.1085, + 0.1143, + 0.1107, + 0.1135, + 0.1153, + 0.1135, + 0.1181, + 0.1159, + 0.1171, + 0.1126, + 0.1165, + 0.1193, + 0.1206, + 0.113, + 0.1139, + 0.1156, + 0.1152, + 0.1201, + 0.1239, + 0.1171, + 0.1187, + 0.1197, + 0.1187, + 0.1212, + 0.1187, + 0.1182, + 0.1187, + 0.1203, + 0.1195, + 0.1212, + 0.122, + 0.1207, + 0.1192, + 0.1205, + 0.1205, + 0.1215, + 0.12, + 0.1201, + 0.1203, + 0.1203, + 0.1213, + 0.1208, + 0.1209, + 0.1209, + 0.1209, + 0.1208 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.017588060349225998, + -0.016497433185577393, + -0.053346455097198486, + 0.9986427426338196 + ], + "perturbation_rho": [ + 0.02255980297923088, + 0.005564957857131958, + -0.049259480088949203, + -0.011541965417563915 + ], + "nudging": { + "0.001": [ + 1.280568540096283e-07, + 1.62515789270401e-07, + 7.82310962677002e-08, + -5.41098415851593e-07 + ], + "0.003": [ + 1.0710209608078003e-07, + 2.7334317564964294e-07, + 1.1641532182693481e-07, + -2.648215740919113e-06 + ], + "0.01": [ + 3.57162207365036e-07, + 2.039596438407898e-07, + 8.307397365570068e-07, + -1.1221971362829208e-05 + ] + }, + "hidden_norms_per_layer": [ + 19381.54296875, + 312615.90625, + 2321965.25, + 3640082.0, + 692179.875 + ], + "bp_grad_norms_per_layer": [ + 5.805031378258718e-06, + 6.129388907538669e-07, + 5.996270147079485e-07, + 6.020890737090667e-07, + 6.002287022965902e-07 + ] + }, + "drift": { + "embed.weight": 160.52406007787414, + "embed.bias": 24.62414456524661, + "blocks.0.ln.weight": 2.7208244800567627, + "blocks.0.w1.weight": 31.32931103808957, + "blocks.0.w1.bias": 24.578464288381767, + "blocks.0.w2.weight": 76.69986787657376, + "blocks.1.ln.weight": 2.1396796703338623, + "blocks.1.w1.weight": 41.923375948001016, + "blocks.1.w1.bias": 42.687481681423954, + "blocks.1.w2.weight": 41.924463722510936, + "blocks.2.ln.weight": 1.8985017538070679, + "blocks.2.w1.weight": 49.16152213344094, + "blocks.2.w1.bias": 49.20711111001434, + "blocks.2.w2.weight": 40.28985166850181, + "blocks.3.ln.weight": 1.8008719682693481, + "blocks.3.w1.weight": 48.175959456780525, + "blocks.3.w1.bias": 46.53396040604286, + "blocks.3.w2.weight": 50.22310178120013, + "out_ln.weight": 0.6654373407363892, + "out_head.weight": 4.396233728367674, + "out_head.bias": 1.1577362249288412 + } + } + }, + "456": { + "bp": { + "log": { + "train_loss": [ + 3.9721967333221437, + 3.6422341596221925, + 3.48317311088562, + 3.384400603027344, + 3.3024317309570312, + 3.244081290435791, + 3.1941285145568847, + 3.1515661222839357, + 3.110703917541504, + 3.0678702397155764, + 3.0385052178955076, + 3.0125491227722168, + 2.9755833444976805, + 2.9489572755432127, + 2.922896576004028, + 2.8952785552215574, + 2.8644921349334718, + 2.837543485031128, + 2.815750347290039, + 2.7902291624450686, + 2.7643565017700196, + 2.749027015914917, + 2.7195132698059084, + 2.7054608350372313, + 2.678812169647217, + 2.655367773590088, + 2.6455082903289795, + 2.621019700469971, + 2.6011389213562013, + 2.592018772201538, + 2.563096626586914, + 2.5475857734680174, + 2.5312666052246096, + 2.507406205291748, + 2.4910193432617187, + 2.4760341359710694, + 2.463254167022705, + 2.443411533126831, + 2.4220050102996824, + 2.4045714128875733, + 2.3885920139312744, + 2.3683135289001465, + 2.35701943649292, + 2.339880431365967, + 2.3229517127990724, + 2.307848415145874, + 2.2967623091125486, + 2.277586201171875, + 2.2599157135009764, + 2.2420585137939453, + 2.2226363661193846, + 2.211539700012207, + 2.1965325047302247, + 2.181053132362366, + 2.1636188303375246, + 2.148667406234741, + 2.1403865797424317, + 2.118398011932373, + 2.1047801040649414, + 2.090780695877075, + 2.0796419092178344, + 2.0641602599716187, + 2.046349721298218, + 2.034338469238281, + 2.0246941263580323, + 2.010717328338623, + 1.9879577135848998, + 1.9908112752532958, + 1.9648436877822877, + 1.9547819673156739, + 1.942468291015625, + 1.9376066028594972, + 1.9182865232086181, + 1.9184452313232423, + 1.9024611935424804, + 1.8942070873641967, + 1.8815567203521728, + 1.8690018142318725, + 1.8623281653213501, + 1.8579870316314697, + 1.8522963430404662, + 1.836771893234253, + 1.8371977347564696, + 1.8297668377685548, + 1.822632707901001, + 1.8128088718032838, + 1.8157146021270751, + 1.8022041482162476, + 1.8005397263336183, + 1.80292332862854, + 1.7940929901504516, + 1.7858528171539307, + 1.7898485187149047, + 1.7881443228149414, + 1.7818482210540771, + 1.776848041419983, + 1.7760994798278809, + 1.7772335396957397, + 1.7761591400146484, + 1.7769086535644532 + ], + "train_acc": [ + 0.09778, + 0.1434, + 0.17072, + 0.18902, + 0.20188, + 0.21248, + 0.22264, + 0.22896, + 0.23846, + 0.24332, + 0.2513, + 0.25484, + 0.26372, + 0.26734, + 0.27242, + 0.27908, + 0.2835, + 0.28882, + 0.29154, + 0.29834, + 0.30224, + 0.30392, + 0.31194, + 0.3125, + 0.31934, + 0.32328, + 0.32578, + 0.3307, + 0.33552, + 0.33738, + 0.34074, + 0.34822, + 0.3489, + 0.35476, + 0.35714, + 0.3598, + 0.36264, + 0.3679, + 0.373, + 0.37474, + 0.37926, + 0.38364, + 0.38482, + 0.38824, + 0.3921, + 0.39568, + 0.39682, + 0.4015, + 0.4051, + 0.40902, + 0.41356, + 0.41618, + 0.42064, + 0.4233, + 0.42546, + 0.42778, + 0.43316, + 0.4337, + 0.4397, + 0.442, + 0.44436, + 0.45016, + 0.4521, + 0.45792, + 0.45892, + 0.4619, + 0.46716, + 0.46476, + 0.47062, + 0.475, + 0.4752, + 0.47938, + 0.48198, + 0.48142, + 0.48788, + 0.49032, + 0.49212, + 0.49664, + 0.49638, + 0.4973, + 0.4982, + 0.5018, + 0.5012, + 0.50402, + 0.50828, + 0.512, + 0.50698, + 0.51086, + 0.51272, + 0.5128, + 0.51364, + 0.5147, + 0.51322, + 0.51572, + 0.51924, + 0.51582, + 0.52014, + 0.51688, + 0.519, + 0.51792 + ], + "test_acc": [ + 0.1436, + 0.1724, + 0.1976, + 0.2161, + 0.2193, + 0.2286, + 0.2386, + 0.2425, + 0.2508, + 0.2496, + 0.2572, + 0.2667, + 0.2678, + 0.266, + 0.2744, + 0.2762, + 0.278, + 0.277, + 0.2819, + 0.2857, + 0.2884, + 0.2924, + 0.2971, + 0.2938, + 0.2967, + 0.2984, + 0.2994, + 0.2987, + 0.3023, + 0.3018, + 0.3005, + 0.3058, + 0.3086, + 0.3118, + 0.3122, + 0.317, + 0.3139, + 0.3083, + 0.3131, + 0.3166, + 0.3193, + 0.3185, + 0.318, + 0.3176, + 0.319, + 0.3176, + 0.3157, + 0.3158, + 0.3241, + 0.3165, + 0.3253, + 0.3217, + 0.3224, + 0.3244, + 0.3217, + 0.3181, + 0.3206, + 0.3261, + 0.3208, + 0.3204, + 0.3198, + 0.324, + 0.322, + 0.3227, + 0.3184, + 0.3193, + 0.323, + 0.3233, + 0.3254, + 0.3202, + 0.3196, + 0.3251, + 0.3243, + 0.3247, + 0.3209, + 0.3245, + 0.3267, + 0.322, + 0.3224, + 0.3177, + 0.3213, + 0.3196, + 0.3218, + 0.3207, + 0.3219, + 0.3223, + 0.3244, + 0.3202, + 0.3248, + 0.3217, + 0.3236, + 0.3228, + 0.3211, + 0.3231, + 0.3222, + 0.3215, + 0.3217, + 0.3216, + 0.3217, + 0.3219 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.9977043271064758, + 0.9984360337257385, + 0.9986849427223206, + 0.998687744140625 + ], + "nudging": { + "0.001": [ + -0.0023326585069298744, + -0.0024166624061763287, + -0.002438523806631565, + -0.002317411359399557 + ], + "0.003": [ + -0.006994417868554592, + -0.007245808374136686, + -0.007311580237001181, + -0.0069488403387367725 + ], + "0.01": [ + -0.023275790736079216, + -0.024107107892632484, + -0.02432604506611824, + -0.023123476654291153 + ] + }, + "hidden_norms_per_layer": [ + 233.81195068359375, + 216.790283203125, + 197.1819305419922, + 192.0648956298828, + 192.4108123779297 + ], + "bp_grad_norms_per_layer": [ + 0.0011535885278135538, + 0.0012452645460143685, + 0.0012428142363205552, + 0.0011899643577635288, + 0.0009729627054184675 + ] + }, + "drift": { + "embed.weight": 7.39398977590873, + "embed.bias": 12.21138556118351, + "blocks.0.ln.weight": 0.14770954847335815, + "blocks.0.w1.weight": 3.60408439890455, + "blocks.0.w1.bias": 5.22994684696013, + "blocks.0.w2.weight": 13.053238719433654, + "blocks.1.ln.weight": 0.2946910560131073, + "blocks.1.w1.weight": 4.020628252632815, + "blocks.1.w1.bias": 4.08986730586542, + "blocks.1.w2.weight": 14.948894323523715, + "blocks.2.ln.weight": 0.3565492630004883, + "blocks.2.w1.weight": 4.131160512042399, + "blocks.2.w1.bias": 4.003626979292673, + "blocks.2.w2.weight": 15.902707284756408, + "blocks.3.ln.weight": 0.5485884547233582, + "blocks.3.w1.weight": 4.454943236812576, + "blocks.3.w1.bias": 3.7282169522367608, + "blocks.3.w2.weight": 17.516109303089266, + "out_ln.weight": 0.14718063175678253, + "out_head.weight": 2.8761547030079035, + "out_head.bias": 2.9449926838807814 + } + }, + "dfa": { + "log": { + "train_loss": [ + 4.161876879730225, + 4.0187293235778805, + 4.006406578216553, + 4.022609137268066, + 4.043629914093017, + 4.065061766357422, + 4.069896491699219, + 4.078123603668213, + 4.078062142028808, + 4.077979364929199, + 4.076888464050293, + 4.075497508239746, + 4.072547879943848, + 4.0701713494110106, + 4.069026535797119, + 4.064811604537964, + 4.061763154296875, + 4.060759606628418, + 4.057107001800537, + 4.0601828897094725, + 4.055534585723877, + 4.054944921569824, + 4.051256662597656, + 4.050451954650879, + 4.050393276824951, + 4.046223313903808, + 4.047258992919922, + 4.047048767089843, + 4.044600559692383, + 4.0430317344665525, + 4.043368485031128, + 4.043571725158691, + 4.04141174987793, + 4.0433316299438475, + 4.041590490188598, + 4.042222282104492, + 4.039775361480713, + 4.0390912678527835, + 4.040217839660644, + 4.039096583099365, + 4.040037224197388, + 4.037792987365723, + 4.037555375213623, + 4.0370241506958005, + 4.036846955261231, + 4.037261250762939, + 4.036293372497559, + 4.036143635406495, + 4.036682392578125, + 4.037161629333496, + 4.033746524200439, + 4.0374753099060054, + 4.035349784240722, + 4.037173667144775, + 4.0371518122863765, + 4.035486927947998, + 4.036137412185669, + 4.036821200714112, + 4.035519530792237, + 4.035781366424561, + 4.034954352722168, + 4.03612970993042, + 4.036103559722901, + 4.03622392074585, + 4.035975666046142, + 4.036468890686035, + 4.0351540557861325, + 4.035398180618286, + 4.034821971435547, + 4.0340077725219725, + 4.0375495939636235, + 4.034684106140137, + 4.034154214782715, + 4.032997749557495, + 4.033953489532471, + 4.034259751586914, + 4.034655684280396, + 4.0341955810546875, + 4.032625467605591, + 4.033415794677734, + 4.0320995791625975, + 4.034218223724365, + 4.033138923187256, + 4.03524599899292, + 4.03208328704834, + 4.032160759277343, + 4.034070838088989, + 4.030838821868897, + 4.031133236694336, + 4.032454485397339, + 4.0351671361541745, + 4.032833539428711, + 4.03182988456726, + 4.035511425170898, + 4.034130640563965, + 4.030528937072754, + 4.031213985443115, + 4.02996834274292, + 4.034611818542481, + 4.032926365203857 + ], + "train_acc": [ + 0.06838, + 0.08666, + 0.08636, + 0.08428, + 0.08436, + 0.08, + 0.07998, + 0.0795, + 0.08026, + 0.07902, + 0.08168, + 0.08248, + 0.08128, + 0.08158, + 0.0824, + 0.08262, + 0.08376, + 0.08384, + 0.08508, + 0.08482, + 0.0866, + 0.08544, + 0.08676, + 0.08688, + 0.08632, + 0.08594, + 0.0864, + 0.08776, + 0.08736, + 0.0885, + 0.08856, + 0.08896, + 0.08866, + 0.08886, + 0.08898, + 0.09026, + 0.08896, + 0.09028, + 0.09104, + 0.08926, + 0.08906, + 0.08948, + 0.09216, + 0.09092, + 0.0916, + 0.09188, + 0.09304, + 0.09212, + 0.09048, + 0.0914, + 0.09228, + 0.09146, + 0.09234, + 0.09168, + 0.09086, + 0.09146, + 0.09152, + 0.0926, + 0.0927, + 0.09192, + 0.09064, + 0.09282, + 0.09188, + 0.09342, + 0.09134, + 0.09174, + 0.09164, + 0.09388, + 0.09276, + 0.0928, + 0.09378, + 0.0937, + 0.09332, + 0.09394, + 0.09278, + 0.09276, + 0.09362, + 0.09378, + 0.0931, + 0.09256, + 0.09352, + 0.0925, + 0.09258, + 0.0933, + 0.09242, + 0.09364, + 0.09322, + 0.09358, + 0.09406, + 0.09348, + 0.09254, + 0.09332, + 0.09516, + 0.09486, + 0.09452, + 0.09486, + 0.09398, + 0.09486, + 0.0926, + 0.09292 + ], + "test_acc": [ + 0.0832, + 0.0875, + 0.0896, + 0.0827, + 0.0848, + 0.0809, + 0.0756, + 0.0769, + 0.0809, + 0.0777, + 0.0775, + 0.0751, + 0.0835, + 0.0804, + 0.0776, + 0.0805, + 0.0857, + 0.0753, + 0.0811, + 0.0813, + 0.0813, + 0.0786, + 0.0812, + 0.0834, + 0.0862, + 0.0883, + 0.0863, + 0.0861, + 0.0853, + 0.0878, + 0.0835, + 0.087, + 0.0873, + 0.0833, + 0.087, + 0.0834, + 0.08, + 0.0867, + 0.0897, + 0.0872, + 0.0834, + 0.0871, + 0.0804, + 0.084, + 0.0892, + 0.0908, + 0.0851, + 0.0891, + 0.0889, + 0.0834, + 0.0892, + 0.0905, + 0.0915, + 0.0885, + 0.09, + 0.0895, + 0.0863, + 0.0889, + 0.0923, + 0.0884, + 0.0901, + 0.087, + 0.0912, + 0.0893, + 0.0901, + 0.0868, + 0.09, + 0.0877, + 0.09, + 0.0906, + 0.0895, + 0.0902, + 0.0864, + 0.0878, + 0.0914, + 0.0888, + 0.0878, + 0.0886, + 0.089, + 0.0879, + 0.0894, + 0.0902, + 0.0885, + 0.0887, + 0.0886, + 0.089, + 0.0897, + 0.0892, + 0.09, + 0.0898, + 0.0898, + 0.089, + 0.0898, + 0.0896, + 0.0895, + 0.0893, + 0.0895, + 0.0894, + 0.0895, + 0.0894 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.1401812732219696, + -0.0036733129527419806, + -0.012468342669308186, + -0.005749615840613842 + ], + "perturbation_rho": [ + -0.006108707282692194, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -6.239861249923706e-07, + 0.0, + -7.450580596923828e-09, + 0.0 + ], + "0.003": [ + -1.9390136003494263e-06, + -1.862645149230957e-09, + -5.587935447692871e-09, + -9.313225746154785e-10 + ], + "0.01": [ + -6.262678653001785e-06, + 7.450580596923828e-09, + -9.313225746154785e-09, + -9.313225746154785e-10 + ] + }, + "hidden_norms_per_layer": [ + 18858.84765625, + 30104360.0, + 115109720.0, + 142242432.0, + 189834320.0 + ], + "bp_grad_norms_per_layer": [ + 1.6800353250800981e-06, + 1.0384521687001325e-08, + 1.0259526561640087e-08, + 1.025457141423658e-08, + 1.027041474088719e-08 + ] + }, + "drift": { + "embed.weight": 159.1972472218232, + "embed.bias": 106.18499737865416, + "blocks.0.ln.weight": 8.374361991882324, + "blocks.0.w1.weight": 130.25292802776573, + "blocks.0.w1.bias": 147.17751025342662, + "blocks.0.w2.weight": 140.99980409584657, + "blocks.1.ln.weight": 7.522654056549072, + "blocks.1.w1.weight": 183.9407903471226, + "blocks.1.w1.bias": 180.51106512410223, + "blocks.1.w2.weight": 111.67829579527385, + "blocks.2.ln.weight": 7.498361110687256, + "blocks.2.w1.weight": 174.07305808153814, + "blocks.2.w1.bias": 174.07821632973472, + "blocks.2.w2.weight": 98.850301691257, + "blocks.3.ln.weight": 7.616756439208984, + "blocks.3.w1.weight": 196.59852287605085, + "blocks.3.w1.bias": 194.4284525943356, + "blocks.3.w2.weight": 107.54506697831434, + "out_ln.weight": 1.6382553577423096, + "out_head.weight": 8.655421610551045, + "out_head.bias": 0.8148936743952768 + } + }, + "fa": { + "log": { + "train_loss": [ + 4.217838704376221, + 4.173818229370117, + 4.116404933776855, + 4.05976043182373, + 4.010950881347656, + 3.9877797143554687, + 3.9654394758605958, + 3.9516948413085937, + 3.9414562885284425, + 3.933943572845459, + 3.9315726831054687, + 3.9283136461639403, + 3.918033894042969, + 3.912524202957153, + 3.9111721415710448, + 3.9033537468719484, + 3.898933872528076, + 3.8940574435424806, + 3.888040324020386, + 3.8902594078826906, + 3.881309941253662, + 3.879018879852295, + 3.874496072845459, + 3.871587658691406, + 3.867957287750244, + 3.8586695248413085, + 3.858678229446411, + 3.8550938296508788, + 3.848460863571167, + 3.843934544219971, + 3.841355255813599, + 3.838310421142578, + 3.832888546218872, + 3.8317080396270753, + 3.8244371617126465, + 3.826680388870239, + 3.820091895675659, + 3.8168691710662843, + 3.8143892570495606, + 3.8094303827667235, + 3.811340135421753, + 3.808084242401123, + 3.8061284660339356, + 3.8042135272979736, + 3.803864609298706, + 3.8014156354522703, + 3.796123163604736, + 3.7960259418487547, + 3.794198034515381, + 3.793316494140625, + 3.7887488148498534, + 3.7955673222351076, + 3.787652738494873, + 3.789291185760498, + 3.7856833452606202, + 3.7837219773864748, + 3.7850829206848147, + 3.7822190380859375, + 3.780595345993042, + 3.780773038482666, + 3.7798492553710936, + 3.777712000579834, + 3.77948525390625, + 3.7754471015930178, + 3.7783823108673094, + 3.7751461651611327, + 3.7731632305908205, + 3.7698883753204346, + 3.7678470989227293, + 3.7675471087646484, + 3.768726477050781, + 3.7664906182861326, + 3.7642928605651855, + 3.7634823627471925, + 3.7624606089782713, + 3.7626713751983645, + 3.76369431892395, + 3.7644162739562987, + 3.759299655914307, + 3.759175650482178, + 3.758095093460083, + 3.758687426223755, + 3.7558257189941404, + 3.758380405960083, + 3.7552133833312986, + 3.7560367737579345, + 3.757290748748779, + 3.7513376335144044, + 3.7552056824493407, + 3.7553686474609376, + 3.754800821685791, + 3.752587652511597, + 3.7521287742614744, + 3.754502056884766, + 3.7546933338928223, + 3.750953895263672, + 3.749489372558594, + 3.7477175559997558, + 3.753209332885742, + 3.75081868347168 + ], + "train_acc": [ + 0.06112, + 0.06028, + 0.0684, + 0.07838, + 0.08954, + 0.09232, + 0.0962, + 0.09766, + 0.099, + 0.10078, + 0.1022, + 0.10314, + 0.10234, + 0.1031, + 0.10412, + 0.10498, + 0.10776, + 0.10782, + 0.109, + 0.10792, + 0.10914, + 0.11072, + 0.10982, + 0.11022, + 0.11282, + 0.11262, + 0.11402, + 0.11302, + 0.11302, + 0.11694, + 0.11542, + 0.11602, + 0.11642, + 0.1175, + 0.11876, + 0.12074, + 0.11926, + 0.11816, + 0.12184, + 0.12202, + 0.12178, + 0.12238, + 0.1222, + 0.12238, + 0.12092, + 0.12362, + 0.12338, + 0.12428, + 0.1248, + 0.12516, + 0.12588, + 0.12532, + 0.12592, + 0.12498, + 0.12348, + 0.1247, + 0.12646, + 0.12716, + 0.12708, + 0.1273, + 0.12668, + 0.12754, + 0.1268, + 0.1288, + 0.12586, + 0.12914, + 0.12678, + 0.12832, + 0.1304, + 0.12808, + 0.12922, + 0.13104, + 0.12964, + 0.13008, + 0.13144, + 0.1314, + 0.12958, + 0.1298, + 0.1312, + 0.13116, + 0.13188, + 0.1315, + 0.1315, + 0.13028, + 0.13222, + 0.1339, + 0.13118, + 0.13218, + 0.13354, + 0.1333, + 0.13136, + 0.13216, + 0.13268, + 0.13262, + 0.13292, + 0.13426, + 0.13368, + 0.13344, + 0.13306, + 0.13192 + ], + "test_acc": [ + 0.0534, + 0.0616, + 0.0812, + 0.0837, + 0.0888, + 0.0944, + 0.0942, + 0.0981, + 0.1007, + 0.0999, + 0.1021, + 0.0988, + 0.1083, + 0.1019, + 0.1073, + 0.1051, + 0.1085, + 0.107, + 0.1044, + 0.1125, + 0.1066, + 0.1037, + 0.1053, + 0.1129, + 0.1129, + 0.1183, + 0.1149, + 0.1188, + 0.1188, + 0.1138, + 0.114, + 0.1201, + 0.1229, + 0.1223, + 0.1169, + 0.1239, + 0.1156, + 0.1221, + 0.1195, + 0.1228, + 0.1275, + 0.1226, + 0.1232, + 0.1264, + 0.1312, + 0.1262, + 0.126, + 0.1266, + 0.126, + 0.124, + 0.1272, + 0.1229, + 0.1293, + 0.1247, + 0.125, + 0.1265, + 0.1232, + 0.1295, + 0.1274, + 0.1275, + 0.1273, + 0.1276, + 0.1285, + 0.1266, + 0.1285, + 0.128, + 0.1299, + 0.1295, + 0.1308, + 0.1252, + 0.1315, + 0.1292, + 0.1291, + 0.1296, + 0.1298, + 0.1308, + 0.1314, + 0.1297, + 0.1304, + 0.1307, + 0.13, + 0.1335, + 0.1296, + 0.1302, + 0.1329, + 0.1303, + 0.1313, + 0.1315, + 0.132, + 0.1311, + 0.1311, + 0.1322, + 0.1311, + 0.1317, + 0.1308, + 0.1309, + 0.1306, + 0.1308, + 0.1311, + 0.131 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.08354228734970093, + 0.008694879710674286, + -0.10087701678276062, + 0.9982630610466003 + ], + "perturbation_rho": [ + -0.00011634547263383865, + 0.02022995427250862, + -0.014473065733909607, + -0.005974383093416691 + ], + "nudging": { + "0.001": [ + -1.8016435205936432e-06, + -6.216578185558319e-08, + 9.220093488693237e-08, + -1.9045546650886536e-06 + ], + "0.003": [ + -5.271751433610916e-06, + -1.3830140233039856e-07, + 7.264316082000732e-07, + -7.401220500469208e-06 + ], + "0.01": [ + -1.7585232853889465e-05, + -5.245674401521683e-07, + 3.0526425689458847e-06, + -2.642977051436901e-05 + ] + }, + "hidden_norms_per_layer": [ + 11478.736328125, + 155429.828125, + 870084.3125, + 1247755.625, + 225384.953125 + ], + "bp_grad_norms_per_layer": [ + 9.544731256028172e-06, + 1.3853283462594845e-06, + 1.3375421303862822e-06, + 1.3386792261371738e-06, + 1.3382986026044819e-06 + ] + }, + "drift": { + "embed.weight": 105.03852710133908, + "embed.bias": 26.837405563994206, + "blocks.0.ln.weight": 2.3730220794677734, + "blocks.0.w1.weight": 28.170015713455946, + "blocks.0.w1.bias": 23.197896445244968, + "blocks.0.w2.weight": 73.04463083219117, + "blocks.1.ln.weight": 1.476442575454712, + "blocks.1.w1.weight": 29.314224337417265, + "blocks.1.w1.bias": 28.13876609135274, + "blocks.1.w2.weight": 39.8446977611363, + "blocks.2.ln.weight": 1.1785210371017456, + "blocks.2.w1.weight": 29.01006529023273, + "blocks.2.w1.bias": 32.13611131919081, + "blocks.2.w2.weight": 31.240416399097963, + "blocks.3.ln.weight": 1.4267656803131104, + "blocks.3.w1.weight": 32.92178917188402, + "blocks.3.w1.bias": 34.64484336575641, + "blocks.3.w2.weight": 31.82487883605455, + "out_ln.weight": 0.5113871097564697, + "out_head.weight": 3.9161050246024547, + "out_head.bias": 2.224345965208238 + } + } + }, + "config": { + "dataset": "cifar100", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42, + 123, + 456 + ], + "gpu": 0, + "output_dir": "results/cifar100_protocol_validation", + "methods": [ + "bp", + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 100 + } +} \ No newline at end of file diff --git a/results/cifar100_scan.log b/results/cifar100_scan.log index 637893f..15d1d46 100644 --- a/results/cifar100_scan.log +++ b/results/cifar100_scan.log @@ -113,7 +113,180 @@ FINAL BP-frozen-blocks: 0.1777 n_params: 812900 (812900 trainable) [DFA-shallow] ep 1: test_acc=0.0928 [DFA-shallow] ep 10: test_acc=0.1025 -st=0.2812 + [DFA-shallow] ep 20: test_acc=0.1146 + [DFA-shallow] ep 30: test_acc=0.1180 + [DFA-shallow] ep 40: test_acc=0.1239 + [DFA-shallow] ep 50: test_acc=0.1283 + [DFA-shallow] ep 60: test_acc=0.1204 + [DFA-shallow] ep 70: test_acc=0.1237 + [DFA-shallow] ep 80: test_acc=0.1261 + [DFA-shallow] ep 90: test_acc=0.1261 + [DFA-shallow] ep 100: test_acc=0.1269 +FINAL DFA-shallow: 0.1269 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=123 === + n_params: 1341284 (812900 trainable) + [DFA-frozen] ep 1: test_acc=0.0916 + [DFA-frozen] ep 10: test_acc=0.1060 + [DFA-frozen] ep 20: test_acc=0.1167 + [DFA-frozen] ep 30: test_acc=0.1125 + [DFA-frozen] ep 40: test_acc=0.1153 + [DFA-frozen] ep 50: test_acc=0.1237 + [DFA-frozen] ep 60: test_acc=0.1217 + [DFA-frozen] ep 70: test_acc=0.1254 + [DFA-frozen] ep 80: test_acc=0.1239 + [DFA-frozen] ep 90: test_acc=0.1254 + [DFA-frozen] ep 100: test_acc=0.1257 +FINAL DFA-frozen-blocks: 0.1257 + +=== ResMLP frozen/shallow baseline summary, seed=123 === + BP-shallow: 0.1756 + BP-frozen: 0.1777 + DFA-shallow: 0.1269 + DFA-frozen: 0.1257 + +Compare to trainable 4-block ResMLP (3-seed): BP=0.6147 100ep / 0.585 30ep, DFA=0.306 100ep / 0.301 30ep + +Interpretation: + If DFA-frozen ≈ DFA-trainable: blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) + frozen s=456 (Sun Apr 26 10:35:07 AM CDT 2026) +Device: cuda:0, seed=456, epochs=100, dataset=cifar100 + +=== BP shallow (ResMLP num_blocks=0), seed=456 === + n_params: 812900 (812900 trainable) + [BP-shallow] ep 1: test_acc=0.1073 + [BP-shallow] ep 10: test_acc=0.1327 + [BP-shallow] ep 20: test_acc=0.1250 + [BP-shallow] ep 30: test_acc=0.1303 + [BP-shallow] ep 40: test_acc=0.1411 + [BP-shallow] ep 50: test_acc=0.1529 + [BP-shallow] ep 60: test_acc=0.1651 + [BP-shallow] ep 70: test_acc=0.1724 + [BP-shallow] ep 80: test_acc=0.1743 + [BP-shallow] ep 90: test_acc=0.1757 + [BP-shallow] ep 100: test_acc=0.1776 +FINAL BP-shallow: 0.1776 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=456 === + n_params: 1341284 (812900 trainable) + [BP-frozen] ep 1: test_acc=0.1073 + [BP-frozen] ep 10: test_acc=0.1326 + [BP-frozen] ep 20: test_acc=0.1226 + [BP-frozen] ep 30: test_acc=0.1276 + [BP-frozen] ep 40: test_acc=0.1495 + [BP-frozen] ep 50: test_acc=0.1535 + [BP-frozen] ep 60: test_acc=0.1645 + [BP-frozen] ep 70: test_acc=0.1685 + [BP-frozen] ep 80: test_acc=0.1773 + [BP-frozen] ep 90: test_acc=0.1777 + [BP-frozen] ep 100: test_acc=0.1794 +FINAL BP-frozen-blocks: 0.1794 + +=== DFA shallow (ResMLP num_blocks=0), seed=456 === + n_params: 812900 (812900 trainable) + [DFA-shallow] ep 1: test_acc=0.0913 + [DFA-shallow] ep 10: test_acc=0.1150 + [DFA-shallow] ep 20: test_acc=0.1153 + [DFA-shallow] ep 30: test_acc=0.1161 + [DFA-shallow] ep 40: test_acc=0.1140 + [DFA-shallow] ep 50: test_acc=0.1202 + [DFA-shallow] ep 60: test_acc=0.1229 + [DFA-shallow] ep 70: test_acc=0.1243 + [DFA-shallow] ep 80: test_acc=0.1240 + [DFA-shallow] ep 90: test_acc=0.1237 + [DFA-shallow] ep 100: test_acc=0.1235 +FINAL DFA-shallow: 0.1235 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=456 === + n_params: 1341284 (812900 trainable) + [DFA-frozen] ep 1: test_acc=0.0862 + [DFA-frozen] ep 10: test_acc=0.1059 + [DFA-frozen] ep 20: test_acc=0.1130 + [DFA-frozen] ep 30: test_acc=0.1200 + [DFA-frozen] ep 40: test_acc=0.1227 + [DFA-frozen] ep 50: test_acc=0.1177 + [DFA-frozen] ep 60: test_acc=0.1229 + [DFA-frozen] ep 70: test_acc=0.1232 + [DFA-frozen] ep 80: test_acc=0.1240 + [DFA-frozen] ep 90: test_acc=0.1237 + [DFA-frozen] ep 100: test_acc=0.1236 +FINAL DFA-frozen-blocks: 0.1236 + +=== ResMLP frozen/shallow baseline summary, seed=456 === + BP-shallow: 0.1776 + BP-frozen: 0.1794 + DFA-shallow: 0.1235 + DFA-frozen: 0.1236 + +Compare to trainable 4-block ResMLP (3-seed): BP=0.6147 100ep / 0.585 30ep, DFA=0.306 100ep / 0.301 30ep + +Interpretation: + If DFA-frozen ≈ DFA-trainable: blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) + +--- FA + DFA + BP --- + s=42 (Sun Apr 26 11:16:00 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=3.9752, train=0.0983, test=0.1432 + [BP] Epoch 10: loss=3.0848, train=0.2424, test=0.2492 + [BP] Epoch 20: loss=2.8041, train=0.2935, test=0.2883 + [BP] Epoch 30: loss=2.6019, train=0.3352, test=0.3078 + [BP] Epoch 40: loss=2.4193, train=0.3727, test=0.3158 + [BP] Epoch 50: loss=2.2631, train=0.4053, test=0.3160 + [BP] Epoch 60: loss=2.1134, train=0.4371, test=0.3223 + [BP] Epoch 70: loss=1.9686, train=0.4729, test=0.3207 + [BP] Epoch 80: loss=1.8724, train=0.4941, test=0.3197 + [BP] Epoch 90: loss=1.8161, train=0.5069, test=0.3197 + [BP] Epoch 100: loss=1.7897, train=0.5126, test=0.3192 + Final test acc: 0.3192 + +--- DFA --- + [DFA] Epoch 1: loss=4.1736, train=0.0679, test=0.0775 + [DFA] Epoch 10: loss=4.0844, train=0.0798, test=0.0819 + [DFA] Epoch 20: loss=4.0627, train=0.0840, test=0.0759 + [DFA] Epoch 30: loss=4.0466, train=0.0876, test=0.0840 + [DFA] Epoch 40: loss=4.0357, train=0.0896, test=0.0862 + [DFA] Epoch 50: loss=4.0347, train=0.0909, test=0.0879 + [DFA] Epoch 60: loss=4.0298, train=0.0933, test=0.0879 + [DFA] Epoch 70: loss=4.0244, train=0.0958, test=0.0883 + [DFA] Epoch 80: loss=4.0232, train=0.0939, test=0.0871 + [DFA] Epoch 90: loss=4.0219, train=0.0962, test=0.0870 + [DFA] Epoch 100: loss=4.0244, train=0.0949, test=0.0875 + Final test acc: 0.0875 + +--- FA --- + [FA] Epoch 1: loss=4.1842, train=0.0639, test=0.0598 + [FA] Epoch 10: loss=3.9551, train=0.0978, test=0.0949 + [FA] Epoch 20: loss=3.8745, train=0.1103, test=0.1101 + [FA] Epoch 30: loss=3.8457, train=0.1160, test=0.1212 + [FA] Epoch 40: loss=3.7975, train=0.1235, test=0.1247 + [FA] Epoch 50: loss=3.7623, train=0.1290, test=0.1332 + [FA] Epoch 60: loss=3.7338, train=0.1341, test=0.1397 + [FA] Epoch 70: loss=3.7109, train=0.1404, test=0.1400 + [FA] Epoch 80: loss=3.6910, train=0.1426, test=0.1457 + [FA] Epoch 90: loss=3.6844, train=0.1436, test=0.1455 + [FA] Epoch 100: loss=3.6859, train=0.1440, test=0.1464 + Final test acc: 0.1464 + +All results saved to results/cifar100_d256_L4/results_cifar100.json + s=123 (Sun Apr 26 11:35:15 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 123 +============================================================ + +--- BP --- + [BP] Epoch 1: loss=3.9679, train=0.0986, test=0.1439 + [BP] Epoch 10: loss=3.0754, train=0.2440, test=0.2501 + [BP] Epoch 20: loss=2.8025, train=0.2938, test=0.2812 [BP] Epoch 30: loss=2.5874, train=0.3376, test=0.3021 [BP] Epoch 40: loss=2.4113, train=0.3699, test=0.3104 [BP] Epoch 50: loss=2.2468, train=0.4084, test=0.3160 @@ -153,7 +326,7 @@ st=0.2812 Final test acc: 0.1208 All results saved to results/cifar100_d256_L4/results_cifar100.json - methods s=456 (Sun Apr 26 09:51:41 AM CDT 2026) + s=456 (Sun Apr 26 11:55:24 AM CDT 2026) Using device: cuda:0 ============================================================ @@ -204,4 +377,4 @@ Seed 456 All results saved to results/cifar100_d256_L4/results_cifar100.json -=== CIFAR-100 SCAN DONE (Sun Apr 26 10:11:18 AM CDT 2026) === +=== CIFAR-100 DONE (Sun Apr 26 12:15:42 PM CDT 2026) === diff --git a/results/cifar_deltaL/cb_deltaL_d512_L4_s42.json b/results/cifar_deltaL/cb_deltaL_d512_L4_s42.json new file mode 100644 index 0000000..78966f7 --- /dev/null +++ b/results/cifar_deltaL/cb_deltaL_d512_L4_s42.json @@ -0,0 +1,428 @@ +{ + "test_acc": 0.1717, + "mean_gamma": -0.00046299276073114015, + "mean_rho": 0.0012461934238672256, + "mean_nudge": 4.773028194904327e-09, + "gamma_per_layer": [ + -0.0023594852536916733, + 0.0009741284884512424, + 4.115530464332551e-05, + -0.0005077695823274553 + ], + "rho_per_layer": [ + 0.004984773695468903, + 0.0, + 0.0, + 0.0 + ], + "log": { + "train_loss": [ + 2.0444039750671386, + 2.0249123254776, + 2.0189146698760987, + 2.0144716346740723, + 2.007473691558838, + 2.0051053838729858, + 2.006714312667847, + 2.0036455520629883, + 2.0023505293273924, + 2.0000714305114746, + 1.9993012132263184, + 1.9970802461242676, + 1.995211095352173, + 1.9947504391860962, + 1.9972148755264283, + 1.9986877463531494, + 1.9952667998886109, + 1.9928774863433838, + 1.9940253998184203, + 1.9955561303710938, + 1.9948335401153565, + 1.998514718055725, + 2.0032336281967162, + 2.0081826359558104, + 2.0130954586791994, + 2.0154034085845947, + 2.0223417203140257, + 2.0345401898956297, + 2.046992734832764, + 2.061535261764526, + 2.0764444414520264, + 2.0923677632141113, + 2.1082171977233886, + 2.1213150553894042, + 2.1289831489562987, + 2.1352404473876954, + 2.135588712615967, + 2.1505063746643067, + 2.1559543489837645, + 2.1559944111633302, + 2.156506446609497, + 2.1627962405395507, + 2.1623581884765626, + 2.157731541137695, + 2.1567544932556153, + 2.161283037261963, + 2.1659480712890624, + 2.165219133605957, + 2.1676781672668457, + 2.168010374298096, + 2.170241591796875, + 2.1681420809936522, + 2.1678991339874267, + 2.1717238208770753, + 2.169441184158325, + 2.17231173286438, + 2.1697757583618165, + 2.165332278289795, + 2.1648404447937013, + 2.162443913421631, + 2.163502599334717, + 2.166408346405029, + 2.16804390083313, + 2.1689177021026613, + 2.1651865095520018, + 2.163989846191406, + 2.1641754064941408, + 2.165077611541748, + 2.166705653839111, + 2.167564101715088, + 2.1710278340911864, + 2.1769975834655764, + 2.1826982949829103, + 2.1865540245056154, + 2.1911163873291017, + 2.1955129777526854, + 2.200497989349365, + 2.2021149839782717, + 2.2051946167755125, + 2.2077737213134765, + 2.2073872657775877, + 2.2054029051208497, + 2.202284111480713, + 2.203277819747925, + 2.2013303881072996, + 2.198281947479248, + 2.1976117317962647, + 2.1977084674835203, + 2.1950897843933106, + 2.194660401611328, + 2.192600202255249, + 2.1936425202178955, + 2.1910581676483156, + 2.1923243353271484, + 2.193233468551636, + 2.1907765885925294, + 2.190179352416992, + 2.1911171742248534, + 2.190001749725342, + 2.192826342468262 + ], + "train_acc": [ + 0.24654, + 0.25888, + 0.26084, + 0.26342, + 0.26736, + 0.26766, + 0.27072, + 0.26988, + 0.2689, + 0.27084, + 0.27104, + 0.27648, + 0.27528, + 0.27486, + 0.27226, + 0.2722, + 0.27294, + 0.27544, + 0.27466, + 0.27426, + 0.27326, + 0.27362, + 0.27122, + 0.27092, + 0.26646, + 0.26598, + 0.26664, + 0.25898, + 0.25328, + 0.24918, + 0.24344, + 0.23666, + 0.22862, + 0.221, + 0.21902, + 0.2138, + 0.21294, + 0.20364, + 0.19536, + 0.19486, + 0.198, + 0.19404, + 0.19518, + 0.18816, + 0.18668, + 0.1857, + 0.1859, + 0.18318, + 0.18076, + 0.18372, + 0.1812, + 0.18038, + 0.18282, + 0.18026, + 0.18034, + 0.18116, + 0.18096, + 0.18402, + 0.18362, + 0.1836, + 0.18128, + 0.18144, + 0.18048, + 0.18196, + 0.18358, + 0.18372, + 0.18174, + 0.18188, + 0.18088, + 0.17936, + 0.1797, + 0.17762, + 0.17326, + 0.16934, + 0.17002, + 0.1682, + 0.16828, + 0.16984, + 0.16748, + 0.16712, + 0.1678, + 0.16924, + 0.17316, + 0.16976, + 0.1735, + 0.1744, + 0.17464, + 0.17778, + 0.18032, + 0.18102, + 0.18016, + 0.18154, + 0.1833, + 0.18726, + 0.18486, + 0.18794, + 0.18796, + 0.18886, + 0.19076, + 0.18784 + ], + "test_acc": [ + 0.2946, + 0.2788, + 0.2693, + 0.2902, + 0.283, + 0.2822, + 0.2855, + 0.304, + 0.3036, + 0.2924, + 0.2837, + 0.3045, + 0.3041, + 0.3089, + 0.3047, + 0.3046, + 0.308, + 0.2885, + 0.2916, + 0.3075, + 0.3108, + 0.2899, + 0.3075, + 0.2907, + 0.3007, + 0.2876, + 0.2914, + 0.291, + 0.2743, + 0.266, + 0.2565, + 0.2491, + 0.2279, + 0.2496, + 0.215, + 0.2361, + 0.2407, + 0.1966, + 0.1912, + 0.1959, + 0.1969, + 0.2094, + 0.2005, + 0.1898, + 0.2025, + 0.2021, + 0.2028, + 0.1906, + 0.198, + 0.1903, + 0.1939, + 0.2039, + 0.1939, + 0.1918, + 0.1967, + 0.2025, + 0.1895, + 0.1988, + 0.1975, + 0.1868, + 0.1938, + 0.1829, + 0.1763, + 0.1954, + 0.1943, + 0.2005, + 0.1717, + 0.199, + 0.1796, + 0.1758, + 0.1857, + 0.186, + 0.17, + 0.1769, + 0.1563, + 0.1484, + 0.1597, + 0.1476, + 0.153, + 0.1491, + 0.157, + 0.1616, + 0.1614, + 0.168, + 0.1528, + 0.1645, + 0.1585, + 0.1612, + 0.1583, + 0.1609, + 0.1617, + 0.1711, + 0.1739, + 0.1698, + 0.1705, + 0.1682, + 0.1704, + 0.1696, + 0.1707, + 0.1717 + ], + "value_loss": [ + 0.6843515609264373, + 0.4836954481315613, + 0.49060195610046387, + 0.482502464427948, + 0.4724110138607025, + 0.47196283916473386, + 0.4722852735424042, + 0.47474509954452515, + 0.47920079902648927, + 0.4653218937301636, + 0.4708782638549805, + 0.4721875062274933, + 0.46917473793029785, + 0.4662531480121613, + 0.4700366088104248, + 0.46397935678482055, + 0.4631014201927185, + 0.4610643830871582, + 0.46284970180511475, + 0.46170863552093505, + 0.47011133566856383, + 0.47193270978927615, + 0.4646204328250885, + 0.467099391117096, + 0.4621818755531311, + 0.4425638478469849, + 0.42111622163772583, + 0.3994237916183472, + 0.37747854212760923, + 0.3546357834625244, + 0.33539585664749144, + 0.3129578005027771, + 0.2981300315666199, + 0.282984656662941, + 0.26991029960632323, + 0.2535946504974365, + 0.27314576332092283, + 2.4199648852539064, + 2.493552964782715, + 0.7517320976638794, + 0.4001072905731201, + 0.3338989479637146, + 0.4265604039001465, + 0.6514868779945373, + 0.36797485956192016, + 0.2637787111091614, + 0.29417893881320956, + 0.28382857972621917, + 0.28800895755290984, + 0.25106282708644867, + 0.21279508100032807, + 0.22448700638771057, + 0.23670673545837403, + 0.25310671283721925, + 0.2424251132106781, + 0.23667334317684174, + 0.2266401306438446, + 0.22766124735355378, + 0.22233413058280946, + 0.21773689158439635, + 0.22565684715270995, + 0.23761135723114013, + 0.23149112558364868, + 0.23285244408607483, + 0.22737021198272706, + 0.23226782833099366, + 0.2398809409046173, + 0.2550660298633575, + 0.24118843837738038, + 0.23774260456085206, + 0.24037814396858215, + 0.2305371964597702, + 0.21118572751522063, + 0.1980142738342285, + 0.18865261703968048, + 0.18505996946573258, + 0.1821361440181732, + 0.16658801609516144, + 0.16734248275279998, + 0.1691108640861511, + 0.17054776992797852, + 0.17163910236358643, + 0.16854004856586458, + 0.17512820116758346, + 0.1776979324054718, + 0.18071853521347045, + 0.18127825408935547, + 0.1877873701763153, + 0.17884414254665373, + 0.18034058660030364, + 0.17787896811008452, + 0.17911501332044602, + 0.17415666017055512, + 0.17281464380860329, + 0.17541839653730393, + 0.1780324169397354, + 0.17434879955768584, + 0.175187377910614, + 0.17379322323322297, + 0.17982573692560197 + ] + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_multiseed.log b/results/cifar_depth_scan_multiseed.log new file mode 100644 index 0000000..e732776 --- /dev/null +++ b/results/cifar_depth_scan_multiseed.log @@ -0,0 +1,81 @@ +Device: cuda:0 +Depths: [4], Widths: [512] +Seeds: [123, 456], BP seeds: [99999] + +============================================================ +Config: d512_L4_s123, methods: ['dfa', 'credit_bridge'] +============================================================ + + d=512, L=4, seed=123, method=dfa + [DFA] Ep 1: loss=2.0624 train=0.2399 test=0.2780 + [DFA] Ep 10: loss=1.9937 train=0.2692 test=0.2896 + [DFA] Ep 20: loss=1.9914 train=0.2763 test=0.2907 + [DFA] Ep 30: loss=1.9863 train=0.2793 test=0.3103 + [DFA] Ep 40: loss=1.9821 train=0.2795 test=0.2838 + [DFA] Ep 50: loss=1.9797 train=0.2815 test=0.3044 + [DFA] Ep 60: loss=1.9779 train=0.2836 test=0.3078 + [DFA] Ep 70: loss=1.9746 train=0.2853 test=0.3045 + [DFA] Ep 80: loss=1.9749 train=0.2850 test=0.3127 + [DFA] Ep 90: loss=1.9713 train=0.2850 test=0.3100 + [DFA] Ep 100: loss=1.9721 train=0.2881 test=0.3094 + Done in 934s: acc=0.3094 Gamma=0.1070 rho=0.0024 + + d=512, L=4, seed=123, method=credit_bridge + [CB] Ep 1 (warmup): loss=2.0474 train=0.2498 test=0.2708 vloss=0.570750 + [CB] Ep 10 (warmup): loss=1.9885 train=0.2744 test=0.2904 vloss=0.072501 + [CB] Ep 20 (warmup): loss=1.9826 train=0.2787 test=0.3163 vloss=0.044637 + [CB] Ep 30 (blend=0.50): loss=1.9813 train=0.2803 test=0.2957 vloss=0.034919 + [CB] Ep 40 (blend=1.00): loss=1.9706 train=0.2851 test=0.2988 vloss=0.024587 + [CB] Ep 50 (blend=1.00): loss=1.9926 train=0.2667 test=0.2809 vloss=0.023065 + [CB] Ep 60 (blend=1.00): loss=1.9741 train=0.2725 test=0.2772 vloss=0.019018 + [CB] Ep 70 (blend=1.00): loss=1.9646 train=0.2812 test=0.2917 vloss=0.011482 + [CB] Ep 80 (blend=1.00): loss=1.9559 train=0.2854 test=0.3062 vloss=0.005063 + [CB] Ep 90 (blend=1.00): loss=1.9517 train=0.2901 test=0.3151 vloss=0.002326 + [CB] Ep 100 (blend=1.00): loss=1.9479 train=0.2907 test=0.3091 vloss=0.001450 + Done in 1572s: acc=0.3091 Gamma=0.1319 rho=0.0010 + +============================================================ +Config: d512_L4_s456, methods: ['dfa', 'credit_bridge'] +============================================================ + + d=512, L=4, seed=456, method=dfa + [DFA] Ep 1: loss=2.0361 train=0.2552 test=0.2764 + [DFA] Ep 10: loss=1.9941 train=0.2756 test=0.2900 + [DFA] Ep 20: loss=1.9883 train=0.2767 test=0.2958 + [DFA] Ep 30: loss=1.9867 train=0.2788 test=0.3011 + [DFA] Ep 40: loss=1.9829 train=0.2834 test=0.3067 + [DFA] Ep 50: loss=1.9822 train=0.2800 test=0.2991 + [DFA] Ep 60: loss=1.9784 train=0.2827 test=0.2979 + [DFA] Ep 70: loss=1.9806 train=0.2869 test=0.3041 + [DFA] Ep 80: loss=1.9778 train=0.2845 test=0.3078 + [DFA] Ep 90: loss=1.9771 train=0.2875 test=0.3110 + [DFA] Ep 100: loss=1.9766 train=0.2863 test=0.3092 + Done in 1075s: acc=0.3092 Gamma=0.1012 rho=0.0045 + + d=512, L=4, seed=456, method=credit_bridge + [CB] Ep 1 (warmup): loss=2.0472 train=0.2499 test=0.2680 vloss=0.491338 + [CB] Ep 10 (warmup): loss=1.9976 train=0.2715 test=0.2905 vloss=0.067081 + [CB] Ep 20 (warmup): loss=1.9967 train=0.2732 test=0.2852 vloss=0.044847 + [CB] Ep 30 (blend=0.50): loss=1.9887 train=0.2796 test=0.2918 vloss=0.025167 + [CB] Ep 40 (blend=1.00): loss=1.9825 train=0.2789 test=0.3019 vloss=0.023611 + [CB] Ep 50 (blend=1.00): loss=1.9632 train=0.2860 test=0.3026 vloss=0.028265 + [CB] Ep 60 (blend=1.00): loss=1.9739 train=0.2757 test=0.2977 vloss=0.021634 + [CB] Ep 70 (blend=1.00): loss=1.9594 train=0.2854 test=0.2976 vloss=0.011156 + [CB] Ep 80 (blend=1.00): loss=1.9557 train=0.2895 test=0.3066 vloss=0.004731 + [CB] Ep 90 (blend=1.00): loss=1.9549 train=0.2912 test=0.3087 vloss=0.001627 + [CB] Ep 100 (blend=1.00): loss=1.9500 train=0.2922 test=0.3082 vloss=0.000972 + Done in 8663s: acc=0.3082 Gamma=0.1447 rho=0.0076 + +Summary saved to results/cifar_depth_scan_multiseed/summary.json + +========================================================================================== +CIFAR-10 DEPTH SCAN SUMMARY +========================================================================================== +Config Method Acc Gamma rho nudge +------------------------------------------------------------------------------------------ +d512_L4_s123 credit_bridge 0.3091 0.1319 0.0010 -0.000002 +d512_L4_s123 dfa 0.3094 0.1070 0.0024 -0.000001 + +d512_L4_s456 credit_bridge 0.3082 0.1447 0.0076 -0.000002 +d512_L4_s456 dfa 0.3092 0.1012 0.0045 -0.000001 + diff --git a/results/cifar_depth_scan_multiseed/d512_L4_s123.json b/results/cifar_depth_scan_multiseed/d512_L4_s123.json new file mode 100644 index 0000000..65a54a8 --- /dev/null +++ b/results/cifar_depth_scan_multiseed/d512_L4_s123.json @@ -0,0 +1,838 @@ +{ + "dfa": { + "log": { + "train_loss": [ + 2.0624400663757325, + 2.0397126093292237, + 2.030224827308655, + 2.019537830963135, + 2.0098417961883546, + 2.0099143604278566, + 2.001345584373474, + 1.997260925064087, + 1.9985963092803956, + 1.993651236228943, + 1.9917502028656007, + 1.9918365036010741, + 1.9975997705841064, + 1.9904954579925538, + 1.9898213328552246, + 1.9904397552490234, + 1.9868707651519775, + 1.9902398801422119, + 1.9854657730484009, + 1.9914187986755372, + 1.985543049468994, + 1.988907001800537, + 1.9854262001800538, + 1.985992236480713, + 1.986677961502075, + 1.9851684880065918, + 1.9878835204315186, + 1.9870538790893555, + 1.984294542236328, + 1.9862867044067383, + 1.9819232828140259, + 1.98281076171875, + 1.9850609212493897, + 1.9814563494873048, + 1.9814497323989868, + 1.985917557067871, + 1.9854490676498413, + 1.9831627449798583, + 1.9817213195037842, + 1.9821227896118163, + 1.983226878051758, + 1.9835711795043944, + 1.9833458575057983, + 1.9817056420516967, + 1.9815308977890014, + 1.9825032497406005, + 1.9806674496459962, + 1.9796993829345704, + 1.9813827806091309, + 1.9796657073974608, + 1.9811469369506836, + 1.9779993580627442, + 1.9808807947540283, + 1.9770961724853515, + 1.9780911437225341, + 1.977968225440979, + 1.9786042345428467, + 1.9761781659698487, + 1.9768042601013183, + 1.9778708429718017, + 1.9789468997192383, + 1.977910756225586, + 1.9747010653686523, + 1.9750921910858155, + 1.978596909751892, + 1.9746475157928467, + 1.9765909009552003, + 1.9770333652114869, + 1.973500870285034, + 1.9746166478729248, + 1.9764599881362914, + 1.9757590785217285, + 1.9747783449554444, + 1.9717445582580566, + 1.9745237543487548, + 1.9730215407562255, + 1.973571043701172, + 1.9736142820739746, + 1.9728294008636476, + 1.974929390296936, + 1.9747015952301026, + 1.9722450610733033, + 1.9724271701049805, + 1.9719529797363282, + 1.9742696553039552, + 1.9725008160018922, + 1.9723811784362792, + 1.9741300776672364, + 1.973212038269043, + 1.971276873435974, + 1.9703804751205445, + 1.970821933631897, + 1.9726865364074706, + 1.9739636318588256, + 1.9740656425476075, + 1.9727160183334351, + 1.9740542842102051, + 1.971614676208496, + 1.971007470932007, + 1.9721037426757813 + ], + "train_acc": [ + 0.23992, + 0.24876, + 0.25324, + 0.25864, + 0.26564, + 0.2615, + 0.26848, + 0.27098, + 0.26694, + 0.26916, + 0.27382, + 0.27204, + 0.27188, + 0.2717, + 0.2728, + 0.27254, + 0.27468, + 0.27354, + 0.27584, + 0.27626, + 0.27632, + 0.2744, + 0.27728, + 0.2785, + 0.27958, + 0.27762, + 0.27576, + 0.27726, + 0.27874, + 0.27928, + 0.28054, + 0.27888, + 0.27832, + 0.27914, + 0.27884, + 0.27718, + 0.27824, + 0.2804, + 0.27976, + 0.27946, + 0.28172, + 0.2795, + 0.28108, + 0.28218, + 0.27982, + 0.27774, + 0.28186, + 0.28412, + 0.28204, + 0.2815, + 0.28198, + 0.28554, + 0.2811, + 0.28404, + 0.28402, + 0.28164, + 0.28256, + 0.2828, + 0.28234, + 0.28364, + 0.28262, + 0.28518, + 0.28496, + 0.28426, + 0.28172, + 0.28612, + 0.28492, + 0.28286, + 0.28482, + 0.28532, + 0.28536, + 0.28336, + 0.28372, + 0.28758, + 0.28676, + 0.28552, + 0.28688, + 0.28368, + 0.28704, + 0.28502, + 0.28718, + 0.2875, + 0.28606, + 0.2879, + 0.28476, + 0.28654, + 0.28584, + 0.28448, + 0.2866, + 0.285, + 0.28856, + 0.28764, + 0.28518, + 0.28624, + 0.28576, + 0.28584, + 0.28608, + 0.28572, + 0.28552, + 0.28808 + ], + "test_acc": [ + 0.278, + 0.2691, + 0.2704, + 0.2679, + 0.2967, + 0.277, + 0.2844, + 0.2727, + 0.2956, + 0.2896, + 0.2868, + 0.3071, + 0.2921, + 0.2959, + 0.2702, + 0.2866, + 0.2803, + 0.3031, + 0.2824, + 0.2907, + 0.3033, + 0.2871, + 0.299, + 0.2951, + 0.2985, + 0.286, + 0.2974, + 0.2932, + 0.2974, + 0.3103, + 0.289, + 0.3118, + 0.3113, + 0.3008, + 0.2943, + 0.2927, + 0.3043, + 0.3027, + 0.303, + 0.2838, + 0.291, + 0.3025, + 0.3031, + 0.3022, + 0.3058, + 0.3064, + 0.3029, + 0.2923, + 0.2905, + 0.3044, + 0.3046, + 0.3085, + 0.3098, + 0.3073, + 0.2895, + 0.3096, + 0.3094, + 0.2988, + 0.2985, + 0.3078, + 0.3008, + 0.3075, + 0.3094, + 0.3081, + 0.305, + 0.2999, + 0.311, + 0.3039, + 0.305, + 0.3045, + 0.3106, + 0.3084, + 0.3096, + 0.3111, + 0.3133, + 0.3093, + 0.3035, + 0.3052, + 0.3052, + 0.3127, + 0.3085, + 0.3042, + 0.3093, + 0.3092, + 0.3111, + 0.3122, + 0.3093, + 0.3087, + 0.308, + 0.31, + 0.3088, + 0.3101, + 0.3083, + 0.3106, + 0.3082, + 0.3098, + 0.3092, + 0.309, + 0.3094, + 0.3094 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4263063073158264, + 0.0001657301909290254, + 0.0015438150148838758, + -0.00019233977945987135 + ], + "perturbation_rho": [ + 0.009619573131203651, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -5.541369318962097e-07, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.4677643775939941e-06, + 1.862645149230957e-09, + 0.0, + 0.0 + ], + "0.01": [ + -4.9551017582416534e-06, + 5.587935447692871e-09, + 0.0, + -9.313225746154785e-10 + ] + } + }, + "drift": { + "embed.weight": 309.23071938279907, + "embed.bias": 237.22614756651578, + "blocks.0.ln.weight": 8.168762727821633, + "blocks.0.w1.weight": 195.29175323586153, + "blocks.0.w1.bias": 144.58261416253544, + "blocks.0.w2.weight": 309.9917799247131, + "blocks.1.ln.weight": 7.339870422040846, + "blocks.1.w1.weight": 295.9775177425126, + "blocks.1.w1.bias": 264.8927251390922, + "blocks.1.w2.weight": 245.06528152841986, + "blocks.2.ln.weight": 5.568128485175647, + "blocks.2.w1.weight": 190.7912001656625, + "blocks.2.w1.bias": 151.63622211328425, + "blocks.2.w2.weight": 148.49851386877077, + "blocks.3.ln.weight": 6.179513040361593, + "blocks.3.w1.weight": 205.73090318196944, + "blocks.3.w1.bias": 165.1061911212938, + "blocks.3.w2.weight": 158.15418176798514, + "out_ln.weight": 0.501473453849158, + "out_head.weight": 8.012264954942612, + "out_head.bias": 1.9789555595618953 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.047448694076538, + 2.0313234769439696, + 2.020185037612915, + 2.010881477203369, + 2.0009254308319093, + 1.996725665550232, + 1.9918568433380126, + 1.9913989479064942, + 1.9935748266220092, + 1.9885124765396118, + 1.9861768546295167, + 1.9848651294326782, + 1.9840049396514892, + 1.983628706588745, + 1.9854573066711425, + 1.9872153559875487, + 1.9828620668029786, + 1.9831350064849853, + 1.9787096114730836, + 1.9825948291397095, + 1.982805096092224, + 1.9789331387710571, + 1.9828052577972413, + 1.9828253454589844, + 1.9806131177520752, + 1.9788864892578124, + 1.9819215051651, + 1.980471068572998, + 1.9807338523101807, + 1.9813471894073487, + 1.9765760861968995, + 1.9785934501647948, + 1.9759084671783447, + 1.9761677234649657, + 1.9766588953399657, + 1.9750333673095704, + 1.9727988452911378, + 1.976060122756958, + 1.9735999352264404, + 1.9706104679870606, + 1.9753494220733643, + 1.9759558032989502, + 1.9787567910766601, + 1.9837647161483765, + 1.9871420777893067, + 1.987115750579834, + 1.9864891412734986, + 1.9884751352310182, + 1.9899889309310914, + 1.9925686660385131, + 1.9907978774261474, + 1.9877149448013305, + 1.9817013835906983, + 1.980732074661255, + 1.9820370742034912, + 1.9818651236724854, + 1.9819183142089845, + 1.983378551673889, + 1.9774607040023804, + 1.9741114377593993, + 1.9718304233551025, + 1.9683720745849609, + 1.9687809296417236, + 1.9646731536102295, + 1.966298240814209, + 1.9667856047821044, + 1.9649899264526367, + 1.9666670780181885, + 1.967674755706787, + 1.9645581008148194, + 1.9643389911651612, + 1.9642895327377319, + 1.9622753365707397, + 1.9615250595855713, + 1.958518320388794, + 1.959536176071167, + 1.956633321876526, + 1.955765027809143, + 1.955853212966919, + 1.9559229345321656, + 1.9547552616882324, + 1.9537322317886352, + 1.955186512069702, + 1.9555984322357178, + 1.9526400441741942, + 1.9539651677703858, + 1.9541091006469726, + 1.9521852050018311, + 1.9506305475616454, + 1.9516619800567627, + 1.9523800668716431, + 1.9526127795410155, + 1.9500486698150634, + 1.9506466804504394, + 1.950422335205078, + 1.9492678187561034, + 1.951801809387207, + 1.9492061517333985, + 1.9487847713470459, + 1.9479388536834716 + ], + "train_acc": [ + 0.24982, + 0.25432, + 0.25988, + 0.26398, + 0.26826, + 0.27072, + 0.2736, + 0.27368, + 0.27026, + 0.2744, + 0.27562, + 0.2762, + 0.27898, + 0.27752, + 0.27714, + 0.27558, + 0.27794, + 0.27886, + 0.27944, + 0.27866, + 0.27782, + 0.2802, + 0.27774, + 0.2782, + 0.27834, + 0.28176, + 0.27964, + 0.28122, + 0.28302, + 0.2803, + 0.28168, + 0.28492, + 0.28662, + 0.28498, + 0.28398, + 0.28418, + 0.28436, + 0.28406, + 0.285, + 0.28506, + 0.2853, + 0.28632, + 0.2816, + 0.27674, + 0.27452, + 0.2762, + 0.27286, + 0.27104, + 0.26842, + 0.26674, + 0.2682, + 0.27086, + 0.2721, + 0.27334, + 0.26858, + 0.26754, + 0.2682, + 0.26736, + 0.27326, + 0.2725, + 0.27848, + 0.2799, + 0.2766, + 0.27852, + 0.27936, + 0.27878, + 0.27724, + 0.27918, + 0.27932, + 0.28118, + 0.28126, + 0.28392, + 0.2803, + 0.28266, + 0.286, + 0.28438, + 0.28684, + 0.28472, + 0.28482, + 0.28542, + 0.2862, + 0.2881, + 0.28612, + 0.2846, + 0.28796, + 0.28742, + 0.2881, + 0.28934, + 0.28792, + 0.2901, + 0.28916, + 0.28972, + 0.28884, + 0.28898, + 0.29152, + 0.2882, + 0.28858, + 0.28908, + 0.28988, + 0.2907 + ], + "test_acc": [ + 0.2708, + 0.2877, + 0.2844, + 0.3019, + 0.2856, + 0.2682, + 0.2969, + 0.2967, + 0.3046, + 0.2904, + 0.3, + 0.301, + 0.3127, + 0.3024, + 0.3016, + 0.2968, + 0.2932, + 0.2853, + 0.2994, + 0.3163, + 0.3043, + 0.3064, + 0.3019, + 0.3067, + 0.3108, + 0.2873, + 0.313, + 0.294, + 0.2992, + 0.2957, + 0.3138, + 0.2825, + 0.3008, + 0.313, + 0.2963, + 0.2933, + 0.2959, + 0.302, + 0.3025, + 0.2988, + 0.2862, + 0.2898, + 0.288, + 0.2864, + 0.2839, + 0.2921, + 0.2735, + 0.2758, + 0.2837, + 0.2809, + 0.2859, + 0.2985, + 0.2934, + 0.2953, + 0.2901, + 0.2936, + 0.2736, + 0.2867, + 0.2944, + 0.2772, + 0.2934, + 0.2907, + 0.2657, + 0.2904, + 0.2948, + 0.2986, + 0.295, + 0.2922, + 0.2922, + 0.2917, + 0.3014, + 0.2951, + 0.3037, + 0.2992, + 0.2986, + 0.3016, + 0.2992, + 0.2954, + 0.3074, + 0.3062, + 0.3064, + 0.3057, + 0.303, + 0.3132, + 0.3005, + 0.3005, + 0.3063, + 0.3046, + 0.3109, + 0.3151, + 0.3084, + 0.3104, + 0.3085, + 0.3095, + 0.3074, + 0.3073, + 0.3089, + 0.3099, + 0.3091, + 0.3091 + ], + "value_loss": [ + 0.5707502987289429, + 0.21804388338804245, + 0.15581646837711335, + 0.12560613882541657, + 0.09998264230251312, + 0.0933005502653122, + 0.07152107969522477, + 0.0807156308054924, + 0.0758870889377594, + 0.0725011654818058, + 0.06433650768041611, + 0.0583218602848053, + 0.05447098765850067, + 0.05356317266821861, + 0.051104292290210726, + 0.04830431792974472, + 0.04666164525568485, + 0.04492894763946533, + 0.03697128227233887, + 0.044636598999500274, + 0.038840959733724596, + 0.03668111073076725, + 0.04674931382536888, + 0.03399278607428074, + 0.03293712543725968, + 0.031108056619167327, + 0.0359199301469326, + 0.032191682063341144, + 0.030914719166755675, + 0.034918713810443876, + 0.027279326229095457, + 0.028772687133550644, + 0.026532491153478624, + 0.03022626201868057, + 0.02425762990474701, + 0.021495298286676408, + 0.02340421486377716, + 0.02494628700852394, + 0.02157571573317051, + 0.02458729513168335, + 0.030457366015315054, + 0.028464497868418693, + 0.03454268118262291, + 0.033964355611801146, + 0.03478494201660156, + 0.03390908203601837, + 0.03329608275532722, + 0.02784320188641548, + 0.02793454117655754, + 0.023065205497145653, + 0.029398028488755227, + 0.024307609224021434, + 0.021599815479516983, + 0.022070472690463066, + 0.022135936530828477, + 0.02179758728504181, + 0.022954062497019766, + 0.022859104943275452, + 0.024180895167589186, + 0.019018265507221223, + 0.01852666168630123, + 0.015004176079034806, + 0.017163365394473076, + 0.0168545845746994, + 0.01648236249387264, + 0.016145528084635735, + 0.015413791033029556, + 0.015835543455481528, + 0.013550898374915124, + 0.011481919240653515, + 0.011319914956986903, + 0.011722228462398052, + 0.010268688924312592, + 0.01009241207242012, + 0.008388303059637546, + 0.00844380562722683, + 0.006402937684953213, + 0.006658818064033985, + 0.005926967875659466, + 0.005063385500609875, + 0.0050483594045042995, + 0.004696262401491403, + 0.0043795296615362165, + 0.003987229224145412, + 0.0035997102437913416, + 0.0031672756604850293, + 0.002853435079678893, + 0.0022479154869914056, + 0.0024048341078311206, + 0.002326442019492388, + 0.0018791391399502755, + 0.0019763806109130383, + 0.001660491597019136, + 0.001620488502755761, + 0.0015598841778188945, + 0.0014834263022989035, + 0.0016181138510629534, + 0.001651853753849864, + 0.0013820433163642884, + 0.0014498794532939792 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4222239851951599, + 0.024459093809127808, + 0.03995171934366226, + 0.04084722697734833 + ], + "perturbation_rho": [ + 0.0041291676461696625, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -9.620562195777893e-07, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -2.819579094648361e-06, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -9.313225746154785e-06, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 169.77199532845293, + "embed.bias": 94.39731873768694, + "blocks.0.ln.weight": 7.473003215045953, + "blocks.0.w1.weight": 145.00989153500845, + "blocks.0.w1.bias": 73.71991188904822, + "blocks.0.w2.weight": 216.26672683471344, + "blocks.1.ln.weight": 5.6302704740332, + "blocks.1.w1.weight": 287.6493822307464, + "blocks.1.w1.bias": 275.5944088792273, + "blocks.1.w2.weight": 219.66609078475946, + "blocks.2.ln.weight": 5.395047896943873, + "blocks.2.w1.weight": 191.14272489250746, + "blocks.2.w1.bias": 161.75927742876627, + "blocks.2.w2.weight": 145.48860169566208, + "blocks.3.ln.weight": 5.19878957620753, + "blocks.3.w1.weight": 200.1583978400427, + "blocks.3.w1.bias": 170.38103589953525, + "blocks.3.w2.weight": 151.26043219994418, + "out_ln.weight": 0.33097813227586326, + "out_head.weight": 5.511603241177177, + "out_head.bias": 1.1054650448531782 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_multiseed/d512_L4_s456.json b/results/cifar_depth_scan_multiseed/d512_L4_s456.json new file mode 100644 index 0000000..d65e1d7 --- /dev/null +++ b/results/cifar_depth_scan_multiseed/d512_L4_s456.json @@ -0,0 +1,838 @@ +{ + "dfa": { + "log": { + "train_loss": [ + 2.036063042526245, + 2.021697966270447, + 2.0175282815551756, + 2.0099474266815185, + 2.0023637646484373, + 1.9997982411193849, + 1.994500837135315, + 1.9948944988250732, + 1.9934745358657837, + 1.9940558145904541, + 1.989395669708252, + 1.9907533937835693, + 1.9909110592269899, + 1.9884686621856689, + 1.9896867315673827, + 1.9894394902038575, + 1.9898611724472046, + 1.9885188024139404, + 1.987230980796814, + 1.9882823168945312, + 1.989858097000122, + 1.9871241819763183, + 1.9898512621307374, + 1.9869138607788086, + 1.989206803970337, + 1.988134487876892, + 1.986097745704651, + 1.9872820987701416, + 1.9868804365539552, + 1.9866938884735108, + 1.985588796081543, + 1.986480817642212, + 1.9833618145370484, + 1.9839750741958617, + 1.9829646868133546, + 1.9850209189605712, + 1.9842300912857056, + 1.9849878060150146, + 1.9847687102508544, + 1.9829170959854125, + 1.984829327354431, + 1.9833095259094238, + 1.9831390253067016, + 1.9819875910186768, + 1.9806521664810182, + 1.9821762627410888, + 1.9833445807647705, + 1.9825785246276855, + 1.9821733226013183, + 1.9822086193847657, + 1.9808910798645019, + 1.9806908596801758, + 1.9812886644744874, + 1.9800793671417236, + 1.9819620014953614, + 1.9800292537689208, + 1.979716037750244, + 1.978658859024048, + 1.9786357926940918, + 1.9784277129745484, + 1.9790855308532715, + 1.9804114780426025, + 1.9788293676757813, + 1.9797553412628175, + 1.9789648551940917, + 1.9809454851913453, + 1.9784064822006227, + 1.9783699047851562, + 1.9753275060272217, + 1.980608378677368, + 1.9775778076553345, + 1.9774704048919678, + 1.9763223318481444, + 1.978011087913513, + 1.97850968624115, + 1.9783587040710449, + 1.9769906464385987, + 1.9791353679656982, + 1.97542318939209, + 1.9777735634613036, + 1.975693401260376, + 1.9773611065673828, + 1.9757630486679076, + 1.9765492203521728, + 1.975723260231018, + 1.9762512990951537, + 1.9754029594421387, + 1.9746607822418214, + 1.9762510384368897, + 1.9770903870391845, + 1.9748862505340576, + 1.976749499130249, + 1.976892409286499, + 1.9757273367309571, + 1.972305432357788, + 1.9770755380630494, + 1.9764292287445069, + 1.9747362934875488, + 1.975049077911377, + 1.976587531967163 + ], + "train_acc": [ + 0.25522, + 0.26076, + 0.26296, + 0.26702, + 0.2714, + 0.27334, + 0.27538, + 0.27482, + 0.27362, + 0.27556, + 0.2766, + 0.27682, + 0.27788, + 0.27572, + 0.2761, + 0.28036, + 0.2788, + 0.2774, + 0.27756, + 0.27672, + 0.2781, + 0.27916, + 0.27804, + 0.2809, + 0.27756, + 0.28, + 0.28036, + 0.2806, + 0.27974, + 0.27884, + 0.28096, + 0.28062, + 0.28074, + 0.2811, + 0.27964, + 0.28086, + 0.2816, + 0.27984, + 0.28018, + 0.28336, + 0.28218, + 0.28254, + 0.28162, + 0.2826, + 0.28312, + 0.2808, + 0.28174, + 0.28084, + 0.28134, + 0.28002, + 0.28486, + 0.28302, + 0.28208, + 0.28486, + 0.28308, + 0.2868, + 0.28404, + 0.28324, + 0.28522, + 0.28274, + 0.28296, + 0.2849, + 0.28348, + 0.28502, + 0.2858, + 0.28408, + 0.28474, + 0.28406, + 0.28494, + 0.28688, + 0.28452, + 0.2866, + 0.28644, + 0.28752, + 0.2848, + 0.2847, + 0.28528, + 0.28742, + 0.28474, + 0.28446, + 0.28554, + 0.28544, + 0.2885, + 0.28666, + 0.28764, + 0.28658, + 0.28774, + 0.2877, + 0.2864, + 0.28752, + 0.28678, + 0.28682, + 0.28516, + 0.28676, + 0.28974, + 0.2863, + 0.28726, + 0.28506, + 0.2869, + 0.28632 + ], + "test_acc": [ + 0.2764, + 0.2831, + 0.2553, + 0.2822, + 0.2726, + 0.3049, + 0.2889, + 0.2915, + 0.2919, + 0.29, + 0.2917, + 0.3012, + 0.3024, + 0.2861, + 0.2951, + 0.2962, + 0.2897, + 0.3072, + 0.3078, + 0.2958, + 0.3093, + 0.3003, + 0.3061, + 0.2877, + 0.2989, + 0.3088, + 0.2985, + 0.3014, + 0.2986, + 0.3011, + 0.2905, + 0.2903, + 0.3073, + 0.3026, + 0.2959, + 0.3046, + 0.2985, + 0.2826, + 0.3078, + 0.3067, + 0.311, + 0.2923, + 0.3024, + 0.2948, + 0.3099, + 0.3032, + 0.3032, + 0.2891, + 0.3125, + 0.2991, + 0.3019, + 0.3096, + 0.3008, + 0.3084, + 0.3091, + 0.3074, + 0.3035, + 0.3102, + 0.3007, + 0.2979, + 0.306, + 0.309, + 0.3073, + 0.2987, + 0.3052, + 0.2988, + 0.306, + 0.2997, + 0.3018, + 0.3041, + 0.3108, + 0.3085, + 0.3074, + 0.2964, + 0.3099, + 0.3028, + 0.3144, + 0.3079, + 0.3112, + 0.3078, + 0.307, + 0.3066, + 0.3091, + 0.312, + 0.3103, + 0.3094, + 0.3098, + 0.3109, + 0.3078, + 0.311, + 0.3066, + 0.3075, + 0.31, + 0.3083, + 0.3101, + 0.3094, + 0.3091, + 0.3094, + 0.3093, + 0.3092 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4088655710220337, + -0.002644116524606943, + -0.0004242559662088752, + -0.0010030616540461779 + ], + "perturbation_rho": [ + 0.017800072208046913, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -5.755573511123657e-07, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.5613622963428497e-06, + 0.0, + 3.725290298461914e-09, + 0.0 + ], + "0.01": [ + -4.863366484642029e-06, + 8.381903171539307e-09, + 3.725290298461914e-09, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 315.7518315228289, + "embed.bias": 267.4648316812159, + "blocks.0.ln.weight": 8.951174139569966, + "blocks.0.w1.weight": 192.5650439107619, + "blocks.0.w1.bias": 171.4174148721031, + "blocks.0.w2.weight": 313.89070882314047, + "blocks.1.ln.weight": 6.8925622022167055, + "blocks.1.w1.weight": 194.8736554676167, + "blocks.1.w1.bias": 185.61167242903338, + "blocks.1.w2.weight": 199.17952398047407, + "blocks.2.ln.weight": 8.397539871551576, + "blocks.2.w1.weight": 312.5130188038433, + "blocks.2.w1.bias": 283.112828695419, + "blocks.2.w2.weight": 249.32467631496087, + "blocks.3.ln.weight": 6.76367039376874, + "blocks.3.w1.weight": 241.46568621944522, + "blocks.3.w1.bias": 203.66496160187438, + "blocks.3.w2.weight": 186.01939293630215, + "out_ln.weight": 0.5298360495994237, + "out_head.weight": 8.435630315194661, + "out_head.bias": 0.7630893123248244 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.047214571609497, + 2.0258394496154786, + 2.014380089035034, + 2.0146764693450927, + 2.002668328704834, + 2.000372503089905, + 2.001418789329529, + 1.998143268814087, + 1.9978233530426026, + 1.9975765690612792, + 1.9943444046783447, + 1.9969068594741821, + 1.9981716201019286, + 1.9975472425842284, + 1.9952556930541991, + 1.995059373474121, + 1.995745087661743, + 1.9953922092437744, + 1.9958506728363037, + 1.9966995294189454, + 1.9936217088317871, + 1.9977384044647217, + 1.9900378979492188, + 1.995351834487915, + 1.9918289903259276, + 1.9904872145843506, + 1.9942275651550292, + 1.989791995162964, + 1.9887557349014282, + 1.988693539352417, + 1.9892886767959594, + 1.9865470782089234, + 1.9907586919784546, + 1.9870898510742188, + 1.9892321113586426, + 1.98550331451416, + 1.9859091914367675, + 1.9834753859710694, + 1.98342726020813, + 1.9825064794158935, + 1.975549033241272, + 1.9788008226776124, + 1.9745526809692382, + 1.9800522961425782, + 1.9824256409454346, + 1.9816255992126466, + 1.978651096534729, + 1.9725130395507813, + 1.9663972332000732, + 1.9632064117050172, + 1.9650584650421143, + 1.9675109244537354, + 1.9645280550765991, + 1.9664162315368652, + 1.9687347400665283, + 1.9710959251403808, + 1.9732261672210694, + 1.974084882888794, + 1.9758672645568847, + 1.9739485864257813, + 1.9705300562286376, + 1.9686042825317382, + 1.965795273361206, + 1.9660617874908448, + 1.9628826525115968, + 1.9620544732666017, + 1.9629843045043944, + 1.9600788848114015, + 1.9614591297912598, + 1.959416093711853, + 1.9595416427993775, + 1.9580717747497558, + 1.9569868729400635, + 1.9550456240081786, + 1.9526267935180663, + 1.9543473984146118, + 1.9556241884994507, + 1.953918418045044, + 1.9537964162445067, + 1.9556760054779052, + 1.954758342666626, + 1.954609064102173, + 1.9536275988006593, + 1.9515601125717164, + 1.9516277051544189, + 1.9505773259735106, + 1.9528203700256348, + 1.9523416848754882, + 1.9502265241241454, + 1.9548965677642822, + 1.9504040404510499, + 1.9516542065048217, + 1.9515247675323486, + 1.9528300396347047, + 1.9510270280456543, + 1.9527411913299562, + 1.9511454486465454, + 1.9502003860092163, + 1.9522995095825195, + 1.9499988179779053 + ], + "train_acc": [ + 0.2499, + 0.25788, + 0.26494, + 0.26084, + 0.26878, + 0.2712, + 0.27118, + 0.27266, + 0.27206, + 0.27154, + 0.27462, + 0.27238, + 0.27458, + 0.27032, + 0.27216, + 0.27462, + 0.27516, + 0.27298, + 0.27476, + 0.27324, + 0.27506, + 0.274, + 0.27674, + 0.27228, + 0.27442, + 0.27654, + 0.27692, + 0.27454, + 0.2804, + 0.27958, + 0.27752, + 0.27736, + 0.27586, + 0.2782, + 0.27726, + 0.28116, + 0.2789, + 0.27918, + 0.27974, + 0.27888, + 0.28152, + 0.28328, + 0.28688, + 0.28546, + 0.28702, + 0.28784, + 0.28384, + 0.2859, + 0.28622, + 0.28602, + 0.28538, + 0.28386, + 0.2856, + 0.28078, + 0.28262, + 0.28218, + 0.27848, + 0.27654, + 0.27756, + 0.2757, + 0.2768, + 0.27826, + 0.27982, + 0.2823, + 0.2833, + 0.28266, + 0.28444, + 0.28494, + 0.28888, + 0.28544, + 0.28652, + 0.28844, + 0.28944, + 0.2881, + 0.28956, + 0.2906, + 0.29176, + 0.28834, + 0.2891, + 0.28948, + 0.29038, + 0.29102, + 0.29088, + 0.2909, + 0.29376, + 0.29154, + 0.29132, + 0.29376, + 0.29256, + 0.29118, + 0.29196, + 0.2941, + 0.29126, + 0.29016, + 0.2928, + 0.29118, + 0.29464, + 0.29172, + 0.29392, + 0.29224 + ], + "test_acc": [ + 0.268, + 0.2814, + 0.2568, + 0.292, + 0.2886, + 0.2937, + 0.2938, + 0.2863, + 0.2814, + 0.2905, + 0.275, + 0.3008, + 0.2934, + 0.2729, + 0.2989, + 0.2943, + 0.3016, + 0.3044, + 0.2873, + 0.2852, + 0.2866, + 0.2992, + 0.2724, + 0.2684, + 0.2827, + 0.304, + 0.2923, + 0.2958, + 0.2981, + 0.2918, + 0.2992, + 0.2875, + 0.2948, + 0.2875, + 0.3111, + 0.2978, + 0.3045, + 0.2924, + 0.2877, + 0.3019, + 0.2913, + 0.2895, + 0.2916, + 0.3021, + 0.3003, + 0.3099, + 0.3144, + 0.3095, + 0.3134, + 0.3026, + 0.3103, + 0.313, + 0.3017, + 0.2915, + 0.3025, + 0.3131, + 0.3051, + 0.2965, + 0.2797, + 0.2977, + 0.297, + 0.2923, + 0.3018, + 0.3011, + 0.2965, + 0.2952, + 0.3104, + 0.3054, + 0.3027, + 0.2976, + 0.3061, + 0.3103, + 0.2906, + 0.3087, + 0.3045, + 0.3048, + 0.3059, + 0.3052, + 0.3091, + 0.3066, + 0.3069, + 0.302, + 0.3095, + 0.3084, + 0.3047, + 0.3052, + 0.3046, + 0.312, + 0.3046, + 0.3087, + 0.3074, + 0.3071, + 0.3084, + 0.3055, + 0.3087, + 0.306, + 0.3077, + 0.3083, + 0.3083, + 0.3082 + ], + "value_loss": [ + 0.4913383872461319, + 0.22707418837547302, + 0.13916742013454436, + 0.13212530642986298, + 0.10880221369981766, + 0.08938120811700821, + 0.08285075999736786, + 0.07436370565414428, + 0.0646062517285347, + 0.06708085874557496, + 0.06273384610176086, + 0.064812075984478, + 0.049855572044849396, + 0.05398712279319763, + 0.052991126668453216, + 0.050567634534835815, + 0.04312473271250725, + 0.04782974468231201, + 0.04543443771123886, + 0.04484746047854424, + 0.035203484983444215, + 0.04272815336585045, + 0.03375269600868225, + 0.03881277943253517, + 0.034244361296892165, + 0.027195509301424028, + 0.030852211108207704, + 0.028148308331370355, + 0.02536116129040718, + 0.02516651110470295, + 0.025302239354252815, + 0.024717796894311906, + 0.026331115382909775, + 0.02268559746146202, + 0.021856163937449456, + 0.02109427482008934, + 0.01978621674835682, + 0.020399272651076317, + 0.019002752946615218, + 0.023610892441272735, + 0.023741913932561875, + 0.027797962927818297, + 0.027950212181806565, + 0.03767011716604233, + 0.03873864560246468, + 0.04052356805562973, + 0.037897691878676414, + 0.03509879319190979, + 0.0298798540186882, + 0.02826528010547161, + 0.025150670776367186, + 0.023189803918004036, + 0.02258694800913334, + 0.0227879896363616, + 0.018950610594153403, + 0.02115175976037979, + 0.018137221140265464, + 0.019522321037650107, + 0.020110222578048707, + 0.021634354048967363, + 0.015847989951372148, + 0.015064587514996529, + 0.015048437801599503, + 0.016566245526373386, + 0.012935848025679588, + 0.013470480437874794, + 0.012650928798913956, + 0.012831412743330002, + 0.011072860435843468, + 0.011155749862790108, + 0.010086000168919564, + 0.009089389600753783, + 0.008566578444838524, + 0.008092092015594243, + 0.006333343644291163, + 0.006346363427191973, + 0.006376809701025486, + 0.005647175543010235, + 0.0053406619898974895, + 0.0047307779046893116, + 0.00445646613240242, + 0.004058126023709774, + 0.0036959357082098723, + 0.003506302860453725, + 0.0027707107151299713, + 0.002242106978483498, + 0.0019543161161243916, + 0.0018740397913753987, + 0.0018142502733692527, + 0.0016265417851135135, + 0.001198948476240039, + 0.0011920882830768825, + 0.0015300761497579515, + 0.0010724398448318244, + 0.0010545289165526629, + 0.001005428223758936, + 0.000948510251417756, + 0.0011458344962261618, + 0.0009775474201142787, + 0.0009718504769355059 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4191405475139618, + 0.03466985002160072, + 0.062135644257068634, + 0.06281301379203796 + ], + "perturbation_rho": [ + 0.030575327575206757, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -8.246861398220062e-07, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -2.357177436351776e-06, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -7.648952305316925e-06, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 175.57738575537255, + "embed.bias": 86.00449885806607, + "blocks.0.ln.weight": 7.688942765674561, + "blocks.0.w1.weight": 144.41266674735652, + "blocks.0.w1.bias": 74.01994211256735, + "blocks.0.w2.weight": 210.53383192058863, + "blocks.1.ln.weight": 4.915474746745905, + "blocks.1.w1.weight": 180.17962097603296, + "blocks.1.w1.bias": 190.87101630029008, + "blocks.1.w2.weight": 184.55972367569038, + "blocks.2.ln.weight": 6.248608922167667, + "blocks.2.w1.weight": 243.67136564327112, + "blocks.2.w1.bias": 181.912146435998, + "blocks.2.w2.weight": 169.06723472537846, + "blocks.3.ln.weight": 5.300882057690101, + "blocks.3.w1.weight": 226.17127443307106, + "blocks.3.w1.bias": 188.5014277153452, + "blocks.3.w2.weight": 160.55519875984788, + "out_ln.weight": 0.3450086076510187, + "out_head.weight": 5.754048046839396, + "out_head.bias": 2.9997445042071984 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_multiseed/summary.json b/results/cifar_depth_scan_multiseed/summary.json new file mode 100644 index 0000000..0bbb673 --- /dev/null +++ b/results/cifar_depth_scan_multiseed/summary.json @@ -0,0 +1,78 @@ +{ + "d512_L4_s123": { + "dfa": { + "test_acc": 0.3094, + "mean_bp_cosine": 0.10695587818554486, + "mean_rho": 0.002404893282800913, + "mean_nudge_01": -1.237611286342144e-06, + "bp_cosine_per_layer": [ + 0.4263063073158264, + 0.0001657301909290254, + 0.0015438150148838758, + -0.00019233977945987135 + ], + "rho_per_layer": [ + 0.009619573131203651, + 0.0, + 0.0, + 0.0 + ] + }, + "credit_bridge": { + "test_acc": 0.3091, + "mean_bp_cosine": 0.13187050633132458, + "mean_rho": 0.0010322919115424156, + "mean_nudge_01": -2.3283064365386963e-06, + "bp_cosine_per_layer": [ + 0.4222239851951599, + 0.024459093809127808, + 0.03995171934366226, + 0.04084722697734833 + ], + "rho_per_layer": [ + 0.0041291676461696625, + 0.0, + 0.0, + 0.0 + ] + } + }, + "d512_L4_s456": { + "dfa": { + "test_acc": 0.3092, + "mean_bp_cosine": 0.10119853421929292, + "mean_rho": 0.004450018052011728, + "mean_nudge_01": -1.212814822793007e-06, + "bp_cosine_per_layer": [ + 0.4088655710220337, + -0.002644116524606943, + -0.0004242559662088752, + -0.0010030616540461779 + ], + "rho_per_layer": [ + 0.017800072208046913, + 0.0, + 0.0, + 0.0 + ] + }, + "credit_bridge": { + "test_acc": 0.3082, + "mean_bp_cosine": 0.14468976389616728, + "mean_rho": 0.007643831893801689, + "mean_nudge_01": -1.9122380763292313e-06, + "bp_cosine_per_layer": [ + 0.4191405475139618, + 0.03466985002160072, + 0.062135644257068634, + 0.06281301379203796 + ], + "rho_per_layer": [ + 0.030575327575206757, + 0.0, + 0.0, + 0.0 + ] + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_s42/d512_L12_s42.json b/results/cifar_depth_scan_s42/d512_L12_s42.json new file mode 100644 index 0000000..e551271 --- /dev/null +++ b/results/cifar_depth_scan_s42/d512_L12_s42.json @@ -0,0 +1,1421 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.9159408319854736, + 1.6833457696151732, + 1.5935267736053467, + 1.5389775912475585, + 1.4867800998687744, + 1.4524269732284545, + 1.4178237664794922, + 1.3897597776794433, + 1.3664597565460206, + 1.342870984840393, + 1.3235610486221314, + 1.301216788482666, + 1.279724592475891, + 1.2618738833999634, + 1.2407353455352783, + 1.22462412940979, + 1.2109693797302246, + 1.1892420639038086, + 1.1723702849578856, + 1.1557361126327514, + 1.1423172385787963, + 1.1261568475341797, + 1.1062135691070556, + 1.0966129437637329, + 1.0756375621795655, + 1.0581538507270813, + 1.0487863679885865, + 1.0285031553268433, + 1.0112163684082032, + 0.9978593858337402, + 0.9784134501266479, + 0.9645692346191406, + 0.9500791883468628, + 0.9311204533195495, + 0.9137258143806457, + 0.8955737284660339, + 0.8760775566101074, + 0.8636410433959961, + 0.8472155108451843, + 0.8257175942802429, + 0.8081484350395203, + 0.7949162258720398, + 0.7682366105842591, + 0.7535309395217895, + 0.7374585538101196, + 0.7163707330703736, + 0.7002532124710082, + 0.6810121598052978, + 0.6590044124794007, + 0.6416365943050385, + 0.6245126323890686, + 0.6053193593788146, + 0.5843256318569183, + 0.5672504850196839, + 0.5574265190124512, + 0.5282080096054077, + 0.5124851553916931, + 0.49809444856643675, + 0.4815664218711853, + 0.46325312936782836, + 0.44530024614334107, + 0.4232256102848053, + 0.41155227093696595, + 0.3951142164516449, + 0.3779419419193268, + 0.36394513979434967, + 0.3495154238319397, + 0.33435829617500307, + 0.3247876634025574, + 0.31244264134407046, + 0.30034732496261596, + 0.2886586371707916, + 0.2739575230407715, + 0.26273826862812044, + 0.25702780318260193, + 0.23921729731559754, + 0.2356625511932373, + 0.23087995275020598, + 0.21462623807907105, + 0.21162452461242676, + 0.20137000153541565, + 0.1957099277973175, + 0.19024162811279297, + 0.1820225635457039, + 0.17860664487838745, + 0.17204254170417785, + 0.1648883514738083, + 0.1611987146615982, + 0.15891523240566255, + 0.15874515238285064, + 0.15378751336574553, + 0.15460485486030578, + 0.1495811799764633, + 0.14360208065509797, + 0.14562011506080627, + 0.14506465085983275, + 0.1431816494703293, + 0.1397772234392166, + 0.14342590034008026, + 0.142473215675354 + ], + "train_acc": [ + 0.31126, + 0.39118, + 0.41882, + 0.44388, + 0.4617, + 0.4731, + 0.48828, + 0.49882, + 0.50712, + 0.51646, + 0.5211, + 0.53098, + 0.53964, + 0.54616, + 0.55448, + 0.55806, + 0.56566, + 0.57324, + 0.57908, + 0.58582, + 0.58824, + 0.59418, + 0.60314, + 0.60678, + 0.61408, + 0.62094, + 0.62264, + 0.63056, + 0.63836, + 0.64046, + 0.64822, + 0.65186, + 0.65832, + 0.66298, + 0.67222, + 0.67798, + 0.686, + 0.688, + 0.695, + 0.7014, + 0.709, + 0.71344, + 0.7245, + 0.72892, + 0.73524, + 0.7426, + 0.74692, + 0.75382, + 0.76378, + 0.76914, + 0.77694, + 0.78392, + 0.78984, + 0.79764, + 0.79948, + 0.81182, + 0.81536, + 0.82284, + 0.82968, + 0.83584, + 0.84158, + 0.8514, + 0.85392, + 0.86052, + 0.86604, + 0.87092, + 0.87644, + 0.88364, + 0.88486, + 0.88988, + 0.89316, + 0.89914, + 0.9048, + 0.90892, + 0.90944, + 0.91828, + 0.9189, + 0.92122, + 0.92622, + 0.92784, + 0.93044, + 0.9332, + 0.93514, + 0.93836, + 0.93948, + 0.94166, + 0.94506, + 0.9452, + 0.94606, + 0.94738, + 0.9493, + 0.94928, + 0.94976, + 0.95178, + 0.9521, + 0.95234, + 0.95228, + 0.9543, + 0.95236, + 0.9534 + ], + "test_acc": [ + 0.3908, + 0.433, + 0.4419, + 0.4858, + 0.4871, + 0.4878, + 0.5141, + 0.5211, + 0.5188, + 0.5279, + 0.5296, + 0.5402, + 0.5415, + 0.5584, + 0.5559, + 0.5648, + 0.5531, + 0.5686, + 0.5685, + 0.575, + 0.5694, + 0.5749, + 0.5711, + 0.585, + 0.5778, + 0.5875, + 0.5827, + 0.5876, + 0.5868, + 0.5947, + 0.5903, + 0.6001, + 0.5963, + 0.6013, + 0.5943, + 0.5994, + 0.5879, + 0.5925, + 0.6006, + 0.5978, + 0.6007, + 0.6034, + 0.5914, + 0.5958, + 0.5959, + 0.5959, + 0.5928, + 0.5961, + 0.6013, + 0.5978, + 0.5974, + 0.5998, + 0.5919, + 0.5936, + 0.5958, + 0.6019, + 0.5972, + 0.5927, + 0.5998, + 0.5945, + 0.5942, + 0.5984, + 0.5904, + 0.5907, + 0.595, + 0.5928, + 0.5944, + 0.5973, + 0.5924, + 0.5909, + 0.5976, + 0.5938, + 0.5943, + 0.5926, + 0.5969, + 0.5918, + 0.5943, + 0.5881, + 0.5907, + 0.5921, + 0.5934, + 0.5926, + 0.5919, + 0.5923, + 0.5912, + 0.5908, + 0.5888, + 0.5899, + 0.5904, + 0.5911, + 0.5911, + 0.5905, + 0.5894, + 0.5918, + 0.5926, + 0.5931, + 0.5935, + 0.5936, + 0.5939, + 0.594 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9423961043357849, + 0.9423063397407532, + 0.9428478479385376, + 0.9422410726547241, + 0.9424552917480469, + 0.9417660236358643, + 0.9408372640609741, + 0.9404677152633667, + 0.9403290748596191, + 0.9396632313728333, + 0.935971736907959, + 0.9338305592536926 + ], + "perturbation_rho": [ + 0.987454891204834, + 0.9897942543029785, + 0.990141749382019, + 0.9901803731918335, + 0.9920680522918701, + 0.9906818866729736, + 0.9903223514556885, + 0.9926531910896301, + 0.9914379119873047, + 0.9897843599319458, + 0.9882909059524536, + 0.9869540929794312 + ], + "nudging": { + "0.001": [ + -0.002897711703553796, + -0.002905686851590872, + -0.0029487141873687506, + -0.0030073150992393494, + -0.002988070249557495, + -0.0028954721055924892, + -0.0027900305576622486, + -0.002700705546885729, + -0.0025893584825098515, + -0.0024207504466176033, + -0.002165877493098378, + -0.00189895648509264 + ], + "0.003": [ + -0.008684658445417881, + -0.008708733133971691, + -0.008837150409817696, + -0.009012945927679539, + -0.008955370634794235, + -0.008678246289491653, + -0.008362163789570332, + -0.008094580844044685, + -0.007761792279779911, + -0.007257224526256323, + -0.006493166089057922, + -0.005693747662007809 + ], + "0.01": [ + -0.028850272297859192, + -0.028929298743605614, + -0.029354672878980637, + -0.029939891770482063, + -0.029747068881988525, + -0.028829604387283325, + -0.027784891426563263, + -0.026898572221398354, + -0.025797637179493904, + -0.024130169302225113, + -0.02159387245774269, + -0.018940377980470657 + ] + } + }, + "drift": { + "embed.weight": 8.833701837291958, + "embed.bias": 14.261815769395275, + "blocks.0.ln.weight": 0.34404799666331826, + "blocks.0.w1.weight": 4.175094808562947, + "blocks.0.w1.bias": 6.98398106061982, + "blocks.0.w2.weight": 10.592751719664884, + "blocks.1.ln.weight": 0.2322510556310593, + "blocks.1.w1.weight": 4.523413515316886, + "blocks.1.w1.bias": 4.3749413052218085, + "blocks.1.w2.weight": 11.940958034527862, + "blocks.2.ln.weight": 0.2150404740407862, + "blocks.2.w1.weight": 4.58583359520105, + "blocks.2.w1.bias": 4.159787661269507, + "blocks.2.w2.weight": 12.401201224911981, + "blocks.3.ln.weight": 0.22107801019329978, + "blocks.3.w1.weight": 4.586995215167557, + "blocks.3.w1.bias": 3.881613437324734, + "blocks.3.w2.weight": 12.64024804795375, + "blocks.4.ln.weight": 0.23170407382172373, + "blocks.4.w1.weight": 4.578125313924808, + "blocks.4.w1.bias": 3.7932938751482683, + "blocks.4.w2.weight": 12.963501907885533, + "blocks.5.ln.weight": 0.23628225424614754, + "blocks.5.w1.weight": 4.5240873092186416, + "blocks.5.w1.bias": 3.803760854867017, + "blocks.5.w2.weight": 12.912394584749915, + "blocks.6.ln.weight": 0.2619501911907522, + "blocks.6.w1.weight": 4.461384236716512, + "blocks.6.w1.bias": 3.799496573870174, + "blocks.6.w2.weight": 13.155197671866139, + "blocks.7.ln.weight": 0.2657175505296468, + "blocks.7.w1.weight": 4.422447215896801, + "blocks.7.w1.bias": 3.725743197114046, + "blocks.7.w2.weight": 13.149302405423146, + "blocks.8.ln.weight": 0.28028080422594653, + "blocks.8.w1.weight": 4.320993108213275, + "blocks.8.w1.bias": 3.577600797368634, + "blocks.8.w2.weight": 13.112473965027567, + "blocks.9.ln.weight": 0.3122222575319159, + "blocks.9.w1.weight": 4.3011661234952125, + "blocks.9.w1.bias": 3.5701937101673704, + "blocks.9.w2.weight": 13.20746990540504, + "blocks.10.ln.weight": 0.2907587848995931, + "blocks.10.w1.weight": 4.244185315341837, + "blocks.10.w1.bias": 3.487530574891753, + "blocks.10.w2.weight": 13.342063167376029, + "blocks.11.ln.weight": 0.30672613980463925, + "blocks.11.w1.weight": 4.1911870376224645, + "blocks.11.w1.bias": 3.626239385452188, + "blocks.11.w2.weight": 13.53569165604796, + "out_ln.weight": 0.304987181878743, + "out_head.weight": 3.659824943443211, + "out_head.bias": 0.7848376848440143 + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.057183644256592, + 2.0219752458190916, + 2.014074349899292, + 2.009915184326172, + 2.003742285079956, + 2.0064792041397093, + 2.001210139312744, + 2.0027513356781004, + 1.9994710051727296, + 2.0039267013549806, + 1.9983517964935302, + 1.9981007271575928, + 1.9967711097717284, + 1.9957333689880372, + 1.9961917282485961, + 1.997950509262085, + 1.9958872592163086, + 1.9964322351837158, + 1.9945315238189698, + 1.993023081741333, + 1.9933346648788453, + 1.9943037507629395, + 1.9923084811019898, + 1.9912947034454345, + 1.9911876581573487, + 1.9902342232513428, + 1.9931360609436035, + 1.9907362972640992, + 1.9919358252334596, + 1.9918178892517089, + 1.99015292427063, + 1.9888984406280517, + 1.990421195602417, + 1.9874123781585693, + 1.9881913418197632, + 1.9892149132537842, + 1.9870399390411377, + 1.988616922302246, + 1.9857829595947265, + 1.9879872678375243, + 1.9910465408325195, + 1.9890870415878297, + 1.9886888786315917, + 1.9860569588470458, + 1.9893753149414062, + 1.9879478802490234, + 1.986084238319397, + 1.9871028468322753, + 1.987663519668579, + 1.9854809813690186, + 1.987514366722107, + 1.9865355487442016, + 1.9870760778808594, + 1.9852242317199706, + 1.9868980590438843, + 1.9847661309432982, + 1.9880792671203613, + 1.9864630212402343, + 1.9864557014465332, + 1.9846630696105958, + 1.9851684265518188, + 1.9845601000976563, + 1.984690249786377, + 1.9832856945037842, + 1.9843514255523682, + 1.98395031955719, + 1.9839791688537598, + 1.9839756365203858, + 1.9832659860992432, + 1.985604306640625, + 1.9832666548156739, + 1.983997225265503, + 1.9818758429718017, + 1.9806820659637452, + 1.9815394610595702, + 1.9834156256103515, + 1.9787700980377196, + 1.982170662612915, + 1.9797498672485352, + 1.9827086754608154, + 1.9817713089370728, + 1.9803067615127563, + 1.9819608657073975, + 1.9829605780410766, + 1.9819707880401611, + 1.9838256735229491, + 1.9817811890411376, + 1.9816452063369752, + 1.9808973921203614, + 1.98217180267334, + 1.9815813362884522, + 1.981448392868042, + 1.9818018493652343, + 1.978947674217224, + 1.981713777770996, + 1.9825912845611573, + 1.9784613372421265, + 1.9797205515289307, + 1.9829137060546875, + 1.9835036209869386 + ], + "train_acc": [ + 0.24212, + 0.26076, + 0.26024, + 0.26518, + 0.26958, + 0.26636, + 0.26982, + 0.26922, + 0.27358, + 0.26904, + 0.27336, + 0.27268, + 0.27124, + 0.27456, + 0.27402, + 0.27524, + 0.27538, + 0.27344, + 0.27274, + 0.27408, + 0.27474, + 0.27582, + 0.27818, + 0.27952, + 0.27862, + 0.27686, + 0.27516, + 0.27816, + 0.2769, + 0.27774, + 0.27712, + 0.2764, + 0.27884, + 0.27974, + 0.27744, + 0.27654, + 0.28156, + 0.27792, + 0.28188, + 0.28016, + 0.27916, + 0.27818, + 0.28024, + 0.28084, + 0.27922, + 0.28046, + 0.27866, + 0.2805, + 0.27788, + 0.2798, + 0.27828, + 0.28152, + 0.2793, + 0.28102, + 0.28142, + 0.28174, + 0.2784, + 0.28092, + 0.28108, + 0.2819, + 0.27962, + 0.28176, + 0.2825, + 0.2829, + 0.283, + 0.28336, + 0.28122, + 0.28198, + 0.2826, + 0.2796, + 0.28184, + 0.28408, + 0.28324, + 0.28434, + 0.28316, + 0.28344, + 0.28512, + 0.283, + 0.28622, + 0.28278, + 0.28352, + 0.28448, + 0.28224, + 0.2846, + 0.28276, + 0.28316, + 0.28462, + 0.28342, + 0.28424, + 0.28358, + 0.2832, + 0.28652, + 0.28394, + 0.28506, + 0.2852, + 0.28386, + 0.28612, + 0.28354, + 0.28348, + 0.28488 + ], + "test_acc": [ + 0.2796, + 0.2818, + 0.3016, + 0.2892, + 0.2743, + 0.2847, + 0.2712, + 0.2939, + 0.2897, + 0.2995, + 0.2732, + 0.305, + 0.3018, + 0.3117, + 0.2831, + 0.2864, + 0.3018, + 0.2984, + 0.3147, + 0.298, + 0.2968, + 0.3081, + 0.3062, + 0.305, + 0.2994, + 0.3014, + 0.2985, + 0.315, + 0.3063, + 0.31, + 0.3086, + 0.2951, + 0.3006, + 0.3114, + 0.3053, + 0.3148, + 0.2984, + 0.3013, + 0.3048, + 0.3018, + 0.3083, + 0.2985, + 0.3067, + 0.2993, + 0.3114, + 0.3088, + 0.3051, + 0.3005, + 0.3107, + 0.3014, + 0.3002, + 0.3077, + 0.3098, + 0.3078, + 0.3139, + 0.3013, + 0.3122, + 0.2999, + 0.3094, + 0.3123, + 0.3146, + 0.3057, + 0.309, + 0.3068, + 0.3141, + 0.3044, + 0.3053, + 0.311, + 0.3116, + 0.3115, + 0.3105, + 0.3096, + 0.3132, + 0.3069, + 0.3019, + 0.3068, + 0.3023, + 0.3101, + 0.3091, + 0.3059, + 0.3075, + 0.3129, + 0.3145, + 0.3114, + 0.311, + 0.3123, + 0.307, + 0.3076, + 0.3106, + 0.3098, + 0.3089, + 0.3079, + 0.3111, + 0.3096, + 0.3102, + 0.311, + 0.3088, + 0.3092, + 0.3091, + 0.309 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.38828110694885254, + 0.0037502094637602568, + -0.0013616610085591674, + -0.0004177851078566164, + 0.0008564171148464084, + 0.00033698498737066984, + 0.0006134084542281926, + -0.00040099132456816733, + -0.00013616093201562762, + -0.0008071845513768494, + -0.0019259440014138818, + -0.0014602115843445063 + ], + "perturbation_rho": [ + -0.0468934029340744, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -3.948807716369629e-07, + 0.0, + -1.862645149230957e-09, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + -9.313225746154785e-10, + 0.0, + 0.0 + ], + "0.003": [ + -1.2898817658424377e-06, + -3.725290298461914e-09, + -1.862645149230957e-09, + 0.0, + 0.0, + 0.0, + -9.313225746154785e-10, + 0.0, + 0.0, + -9.313225746154785e-10, + 0.0, + 3.725290298461914e-09 + ], + "0.01": [ + -4.674773663282394e-06, + -3.725290298461914e-09, + -1.862645149230957e-09, + -3.725290298461914e-09, + 0.0, + 9.313225746154785e-10, + -9.313225746154785e-10, + -1.862645149230957e-09, + 0.0, + -9.313225746154785e-10, + 9.313225746154785e-10, + 3.725290298461914e-09 + ] + } + }, + "drift": { + "embed.weight": 319.6256145809284, + "embed.bias": 241.39131706930516, + "blocks.0.ln.weight": 8.451152686823706, + "blocks.0.w1.weight": 198.0653736517787, + "blocks.0.w1.bias": 172.12729591798578, + "blocks.0.w2.weight": 339.00018245731724, + "blocks.1.ln.weight": 7.000199186009471, + "blocks.1.w1.weight": 213.18535798636668, + "blocks.1.w1.bias": 202.05532367109083, + "blocks.1.w2.weight": 208.8135070796582, + "blocks.2.ln.weight": 7.935838334127239, + "blocks.2.w1.weight": 314.5106044563863, + "blocks.2.w1.bias": 271.6455147079551, + "blocks.2.w2.weight": 247.9045165300641, + "blocks.3.ln.weight": 5.795920066983145, + "blocks.3.w1.weight": 182.91564428516534, + "blocks.3.w1.bias": 152.5137308265898, + "blocks.3.w2.weight": 151.050379705954, + "blocks.4.ln.weight": 6.3276885496198645, + "blocks.4.w1.weight": 215.98859872586803, + "blocks.4.w1.bias": 183.97920728444788, + "blocks.4.w2.weight": 165.74279725091483, + "blocks.5.ln.weight": 5.792878750342549, + "blocks.5.w1.weight": 193.44922307145256, + "blocks.5.w1.bias": 172.0595502919292, + "blocks.5.w2.weight": 156.55012054903048, + "blocks.6.ln.weight": 5.98080042430076, + "blocks.6.w1.weight": 182.32068889300982, + "blocks.6.w1.bias": 161.74264639168877, + "blocks.6.w2.weight": 161.51005233041852, + "blocks.7.ln.weight": 6.798251040626781, + "blocks.7.w1.weight": 235.9970011878696, + "blocks.7.w1.bias": 202.73306946131746, + "blocks.7.w2.weight": 176.16251425264502, + "blocks.8.ln.weight": 8.05032468668243, + "blocks.8.w1.weight": 304.9749512658957, + "blocks.8.w1.bias": 254.78399637200565, + "blocks.8.w2.weight": 226.8419755905067, + "blocks.9.ln.weight": 8.324689211241104, + "blocks.9.w1.weight": 304.64714323529006, + "blocks.9.w1.bias": 254.27332736169836, + "blocks.9.w2.weight": 226.94604254635792, + "blocks.10.ln.weight": 5.162597908184438, + "blocks.10.w1.weight": 159.94571322633212, + "blocks.10.w1.bias": 138.12937914272587, + "blocks.10.w2.weight": 129.89821404142262, + "blocks.11.ln.weight": 7.516332199105425, + "blocks.11.w1.weight": 279.9271343014864, + "blocks.11.w1.bias": 236.42300656616862, + "blocks.11.w2.weight": 202.50408675479144, + "out_ln.weight": 0.6271483618826256, + "out_head.weight": 8.718326486393146, + "out_head.bias": 0.5753880166404655 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0568576118469237, + 2.033485134429932, + 2.0218416510772705, + 2.0142132845306397, + 2.0108241705703733, + 2.002156679153442, + 2.0038612014770507, + 1.9997895935821532, + 2.0023641468048097, + 2.0011226501846315, + 1.9980047481536864, + 1.9944430965423583, + 1.9959918328094481, + 1.9943659350585938, + 1.9955686949157714, + 1.9932625021743775, + 1.9940180532073974, + 1.992023607826233, + 1.990704457244873, + 1.9915499368286134, + 1.9944144274139404, + 1.9895493435668945, + 1.9895022438812255, + 1.9851936352157593, + 1.9862560325622558, + 1.9824435089874268, + 1.9816281591796876, + 1.9810021967315674, + 1.9812662688446046, + 1.9824039008331298, + 1.9829267932891845, + 1.9802660181427, + 1.9798483668518065, + 1.979789539527893, + 1.9795299366760253, + 1.9757647130584717, + 1.972223770904541, + 1.9694228728485108, + 1.9702133034896852, + 1.9706256021499633, + 1.9694662646102905, + 1.9712112203979493, + 1.9850462644958495, + 2.002737700653076, + 2.0086276149749756, + 2.0277000471496582, + 2.0281700329589842, + 2.0319336601257323, + 2.023782074584961, + 2.0170300160217285, + 2.0127930587005616, + 2.0128867221832274, + 2.01850300453186, + 2.0133023000335695, + 2.0104183267593383, + 2.0138787005996703, + 2.021632391052246, + 2.029548404159546, + 2.0301968224334717, + 2.0342870476531982, + 2.0400729270172118, + 2.0447248320770264, + 2.0492120973205568, + 2.0500868199157716, + 2.0525983279418947, + 2.053036574554443, + 2.055363027687073, + 2.0557615393066406, + 2.060003659210205, + 2.059733818283081, + 2.063136697921753, + 2.063323797454834, + 2.0652847254180906, + 2.065591119003296, + 2.0690882136535644, + 2.07202782333374, + 2.0749201114654543, + 2.0776294555664063, + 2.079117084503174, + 2.078432328796387, + 2.078386816864014, + 2.076197295227051, + 2.075240274810791, + 2.071873186187744, + 2.0715130477142334, + 2.070623317947388, + 2.0708017208862306, + 2.0684812643432617, + 2.067380738296509, + 2.065728325653076, + 2.0663505850982666, + 2.0655458202362063, + 2.0657374589538575, + 2.0645635641479494, + 2.0653134523010253, + 2.0636908391571045, + 2.063971264190674, + 2.0637667852783204, + 2.064012709197998, + 2.064872869949341 + ], + "train_acc": [ + 0.24184, + 0.2521, + 0.25882, + 0.26394, + 0.26408, + 0.26908, + 0.2699, + 0.2708, + 0.27198, + 0.27044, + 0.27198, + 0.27592, + 0.27358, + 0.27498, + 0.2747, + 0.27506, + 0.2745, + 0.27506, + 0.27742, + 0.2764, + 0.27738, + 0.2759, + 0.2767, + 0.27868, + 0.27842, + 0.27882, + 0.27966, + 0.27812, + 0.2803, + 0.27992, + 0.27782, + 0.28038, + 0.27874, + 0.28038, + 0.28104, + 0.28038, + 0.28444, + 0.28556, + 0.28248, + 0.28622, + 0.2816, + 0.27992, + 0.2709, + 0.26912, + 0.264, + 0.254, + 0.2571, + 0.25402, + 0.25446, + 0.25542, + 0.25666, + 0.25594, + 0.25068, + 0.25624, + 0.2585, + 0.25766, + 0.25522, + 0.24842, + 0.25234, + 0.25176, + 0.24892, + 0.24678, + 0.24418, + 0.24632, + 0.24382, + 0.2433, + 0.24304, + 0.24668, + 0.24448, + 0.24628, + 0.24476, + 0.24558, + 0.2455, + 0.25012, + 0.24546, + 0.24462, + 0.24508, + 0.2428, + 0.23992, + 0.23902, + 0.23556, + 0.23456, + 0.23548, + 0.23628, + 0.2383, + 0.23514, + 0.23668, + 0.2391, + 0.2391, + 0.23886, + 0.24188, + 0.24092, + 0.24206, + 0.24588, + 0.24146, + 0.24336, + 0.24526, + 0.24318, + 0.24306, + 0.241 + ], + "test_acc": [ + 0.2607, + 0.2707, + 0.2859, + 0.3016, + 0.277, + 0.3077, + 0.2813, + 0.309, + 0.3096, + 0.283, + 0.2983, + 0.3135, + 0.2938, + 0.3079, + 0.2923, + 0.3001, + 0.2908, + 0.2904, + 0.3037, + 0.3131, + 0.3022, + 0.3126, + 0.3113, + 0.299, + 0.2999, + 0.304, + 0.2825, + 0.3158, + 0.3181, + 0.3042, + 0.3046, + 0.2901, + 0.3147, + 0.286, + 0.3127, + 0.3144, + 0.3237, + 0.3242, + 0.3072, + 0.2959, + 0.2996, + 0.2938, + 0.2808, + 0.2722, + 0.2706, + 0.2656, + 0.2651, + 0.2755, + 0.2528, + 0.2641, + 0.2557, + 0.27, + 0.2477, + 0.2502, + 0.2324, + 0.2355, + 0.2419, + 0.2416, + 0.2607, + 0.2678, + 0.275, + 0.2598, + 0.262, + 0.2613, + 0.2586, + 0.252, + 0.26, + 0.2567, + 0.2422, + 0.2632, + 0.2589, + 0.2585, + 0.268, + 0.2485, + 0.2499, + 0.2309, + 0.2442, + 0.2451, + 0.2248, + 0.2271, + 0.2286, + 0.2357, + 0.2347, + 0.2262, + 0.2355, + 0.2376, + 0.2363, + 0.2374, + 0.2359, + 0.2392, + 0.2359, + 0.2366, + 0.2387, + 0.2367, + 0.2364, + 0.2389, + 0.2405, + 0.2399, + 0.2392, + 0.239 + ], + "value_loss": [ + 0.45757097380638123, + 0.20398492289066314, + 0.14403926629781724, + 0.12142798287391662, + 0.12356067106246948, + 0.10323704772472382, + 0.09025520797491074, + 0.07278211853384972, + 0.0721493047785759, + 0.07462056404113769, + 0.058030206863880156, + 0.051864567153453826, + 0.05143641318678856, + 0.049471625967025756, + 0.048022189247608184, + 0.04581756822347641, + 0.048392335476875305, + 0.039053659332990646, + 0.03958373228907585, + 0.039008795657157896, + 0.03813901361584664, + 0.03919893253147602, + 0.03719111958146095, + 0.033129610191583635, + 0.03316450059056282, + 0.029290390903949737, + 0.030135655524730683, + 0.03032812103867531, + 0.028851064978837968, + 0.030176216821670532, + 0.027550049550533296, + 0.024665569834709168, + 0.02101791775226593, + 0.025735651454925536, + 0.0251218857216835, + 0.02088318651020527, + 0.019842562421560288, + 0.021842277721762657, + 0.019696957327723502, + 0.039216412217617035, + 0.044192443869113925, + 0.04437062278270722, + 0.10603765468597412, + 0.5277386970996857, + 4.009285344390869, + 23.118207588806154, + 144.34815091796875, + 518.8025195117187, + 1318.1295115625, + 1762.37145984375, + 6916.118271875, + 4658.513114609375, + 2876.65883546875, + 1116.1913117382812, + 672.6694246875, + 704.66234140625, + 552.1133823925782, + 171.6432964111328, + 135.70525376220704, + 134.33308825195311, + 132.31754293945312, + 72.1968391418457, + 41.47797743041992, + 43.47026284912109, + 36.734252014160155, + 25.379087185058594, + 18.40212633392334, + 29.28388342590332, + 10.164241724700927, + 2.897604249019623, + 1.047686642589569, + 0.325347878112793, + 0.14909634278774261, + 0.07973611199140548, + 0.06035885235905647, + 0.04197409330606461, + 0.028365342289209367, + 0.017914904502928257, + 0.01303940503180027, + 0.009001612865626812, + 0.006971689679771661, + 0.005598475634455681, + 0.005475701079368591, + 0.004648658817410469, + 0.0038136353914439676, + 0.0030602712966501713, + 0.0028339786121994257, + 0.0029074203512072564, + 0.0026963330183178186, + 0.0023759404706954956, + 0.002058511268571019, + 0.002492244097441435, + 0.0014459992367774248, + 0.0019114786966145038, + 0.0025138171672821046, + 0.00124135938256979, + 0.0020614514429681003, + 0.0013046426071599126, + 0.0029164830996282398, + 0.0010984712824225426 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.20759254693984985, + 0.005885659717023373, + 0.014463091269135475, + 0.013757804408669472, + 0.01659775897860527, + 0.0177934467792511, + 0.018012138083577156, + 0.019089948385953903, + 0.019284311681985855, + 0.01838410645723343, + 0.01891487091779709, + 0.018453549593687057 + ], + "perturbation_rho": [ + 0.010340061970055103, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -4.516914486885071e-07, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.214444637298584e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -4.189088940620422e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 150.67057498445888, + "embed.bias": 134.41454679929575, + "blocks.0.ln.weight": 5.823816560727751, + "blocks.0.w1.weight": 121.67399642558134, + "blocks.0.w1.bias": 113.51970790036184, + "blocks.0.w2.weight": 204.33462559926585, + "blocks.1.ln.weight": 6.501127217482716, + "blocks.1.w1.weight": 285.45091938635363, + "blocks.1.w1.bias": 289.6326970920111, + "blocks.1.w2.weight": 243.81894015436046, + "blocks.2.ln.weight": 6.326138219917707, + "blocks.2.w1.weight": 324.84264337850595, + "blocks.2.w1.bias": 293.5437947059724, + "blocks.2.w2.weight": 224.099887924036, + "blocks.3.ln.weight": 5.602491317116855, + "blocks.3.w1.weight": 245.36011562278688, + "blocks.3.w1.bias": 220.93326847278095, + "blocks.3.w2.weight": 200.84652256624017, + "blocks.4.ln.weight": 5.329743882869523, + "blocks.4.w1.weight": 182.97700815621855, + "blocks.4.w1.bias": 140.02593230649856, + "blocks.4.w2.weight": 140.60772145327962, + "blocks.5.ln.weight": 5.286696439762922, + "blocks.5.w1.weight": 155.33931234812562, + "blocks.5.w1.bias": 93.8828284250912, + "blocks.5.w2.weight": 133.6255221433454, + "blocks.6.ln.weight": 5.3698026086033686, + "blocks.6.w1.weight": 153.69676226206676, + "blocks.6.w1.bias": 104.50919556116708, + "blocks.6.w2.weight": 146.8099489527109, + "blocks.7.ln.weight": 5.580818732892067, + "blocks.7.w1.weight": 159.38306611743945, + "blocks.7.w1.bias": 101.31052511081181, + "blocks.7.w2.weight": 104.61639494957436, + "blocks.8.ln.weight": 6.117239553334436, + "blocks.8.w1.weight": 351.20193371314235, + "blocks.8.w1.bias": 322.90500949025466, + "blocks.8.w2.weight": 205.93771553542751, + "blocks.9.ln.weight": 5.428160484749458, + "blocks.9.w1.weight": 151.20229062994952, + "blocks.9.w1.bias": 86.27513547236327, + "blocks.9.w2.weight": 119.94171519954084, + "blocks.10.ln.weight": 3.187901359176882, + "blocks.10.w1.weight": 100.37314795265215, + "blocks.10.w1.bias": 86.90571689186352, + "blocks.10.w2.weight": 116.36697077856738, + "blocks.11.ln.weight": 4.855792448009543, + "blocks.11.w1.weight": 290.16810994044624, + "blocks.11.w1.bias": 269.48650679370706, + "blocks.11.w2.weight": 207.9959909476014, + "out_ln.weight": 0.44311953950689703, + "out_head.weight": 7.617038267805974, + "out_head.bias": 2.5026283939923624 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_s42/d512_L2_s42.json b/results/cifar_depth_scan_s42/d512_L2_s42.json new file mode 100644 index 0000000..5b1a950 --- /dev/null +++ b/results/cifar_depth_scan_s42/d512_L2_s42.json @@ -0,0 +1,1151 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.9354850341033936, + 1.7026564234542847, + 1.6196284805679322, + 1.5522706447601318, + 1.5103712742996216, + 1.4760794692230224, + 1.4480401036453248, + 1.4238936393356323, + 1.3998644092941284, + 1.3888274967193603, + 1.370794108505249, + 1.3523651966094972, + 1.3417378455352784, + 1.32940377494812, + 1.3123712255859374, + 1.3025306620025634, + 1.2916712799072265, + 1.277412696762085, + 1.2670877025604248, + 1.2579533868026733, + 1.250452767906189, + 1.2388696469116212, + 1.2288407207870484, + 1.218021198196411, + 1.2081415139007567, + 1.2038527836227417, + 1.1919150150299072, + 1.1843040127944946, + 1.1809553996276856, + 1.1748971781539916, + 1.1629332243728638, + 1.1559197056579589, + 1.1501819496154786, + 1.1386108488464355, + 1.1359955614471435, + 1.1256131409072876, + 1.1200060926818847, + 1.114403334388733, + 1.1042931074905395, + 1.1033966439437866, + 1.0955395514297486, + 1.086461291847229, + 1.076456173362732, + 1.0776306005477905, + 1.0669021976089477, + 1.0603959639167786, + 1.0562950397491455, + 1.0486062710762023, + 1.037363448638916, + 1.0395437144470214, + 1.0320540841293335, + 1.0248265104293823, + 1.0186307384872437, + 1.01219017370224, + 1.0086890588760375, + 1.0036477170944214, + 0.9918886923408509, + 0.9959744847869874, + 0.983810892829895, + 0.9749429069328308, + 0.9761281036186218, + 0.9669857545852661, + 0.9646618202209473, + 0.9585257618713379, + 0.951733235244751, + 0.9470721603393555, + 0.9449367933654785, + 0.9399459014511108, + 0.9332768785476685, + 0.9295426531982421, + 0.9249779984283447, + 0.9206048580551147, + 0.9163932028198242, + 0.9137818552780151, + 0.9054667686653137, + 0.8992140997695923, + 0.8981155136108399, + 0.9007723778915405, + 0.8907698515319824, + 0.8869161108398438, + 0.8879233457946777, + 0.8870189405632019, + 0.8807708535385131, + 0.875256696395874, + 0.8748971775817871, + 0.8757942477035523, + 0.8740769153022766, + 0.8715347571182251, + 0.8681148331069947, + 0.8674819102478027, + 0.863512946510315, + 0.8696056005477906, + 0.8647798666381836, + 0.8631498766708374, + 0.866932133693695, + 0.8609341511917115, + 0.8584218189620971, + 0.8627110484886169, + 0.8589248524093628, + 0.8619690019416809 + ], + "train_acc": [ + 0.31324, + 0.3856, + 0.41254, + 0.43722, + 0.4538, + 0.46698, + 0.47636, + 0.48598, + 0.49418, + 0.49864, + 0.50738, + 0.51122, + 0.51678, + 0.52288, + 0.5272, + 0.53212, + 0.53512, + 0.53952, + 0.5452, + 0.54694, + 0.54924, + 0.55342, + 0.559, + 0.56202, + 0.56542, + 0.56722, + 0.57134, + 0.57538, + 0.57742, + 0.57586, + 0.58118, + 0.58464, + 0.5859, + 0.59246, + 0.59194, + 0.59674, + 0.59898, + 0.60034, + 0.6066, + 0.60422, + 0.60806, + 0.61212, + 0.61618, + 0.61372, + 0.61884, + 0.6198, + 0.62164, + 0.62388, + 0.6294, + 0.62744, + 0.63112, + 0.63436, + 0.63332, + 0.63632, + 0.6381, + 0.6401, + 0.6463, + 0.64188, + 0.64658, + 0.65074, + 0.65084, + 0.65332, + 0.65314, + 0.65706, + 0.65862, + 0.66132, + 0.66338, + 0.66192, + 0.6661, + 0.6698, + 0.66802, + 0.66974, + 0.67114, + 0.67274, + 0.6753, + 0.67902, + 0.6777, + 0.67944, + 0.68172, + 0.68452, + 0.68178, + 0.68314, + 0.68652, + 0.68794, + 0.688, + 0.6866, + 0.68708, + 0.6896, + 0.69086, + 0.69196, + 0.69182, + 0.68984, + 0.69014, + 0.69196, + 0.69008, + 0.69314, + 0.69342, + 0.69112, + 0.6941, + 0.69128 + ], + "test_acc": [ + 0.379, + 0.42, + 0.4414, + 0.468, + 0.4821, + 0.4867, + 0.5048, + 0.5076, + 0.5032, + 0.5071, + 0.5251, + 0.5385, + 0.5339, + 0.5395, + 0.5359, + 0.5373, + 0.5411, + 0.5429, + 0.544, + 0.5558, + 0.5584, + 0.553, + 0.5587, + 0.557, + 0.5617, + 0.5595, + 0.5661, + 0.5732, + 0.5671, + 0.5738, + 0.5715, + 0.5762, + 0.5734, + 0.5772, + 0.5787, + 0.5735, + 0.5753, + 0.5788, + 0.5757, + 0.5779, + 0.5818, + 0.5857, + 0.5877, + 0.5853, + 0.5807, + 0.5926, + 0.5907, + 0.5921, + 0.5863, + 0.5905, + 0.5941, + 0.5959, + 0.5907, + 0.5931, + 0.5922, + 0.5982, + 0.5976, + 0.5888, + 0.595, + 0.5987, + 0.6, + 0.594, + 0.5975, + 0.599, + 0.5987, + 0.5921, + 0.5957, + 0.5921, + 0.5999, + 0.5947, + 0.5996, + 0.5976, + 0.5949, + 0.5992, + 0.5982, + 0.5956, + 0.6015, + 0.6011, + 0.5993, + 0.601, + 0.5974, + 0.5976, + 0.5997, + 0.599, + 0.5988, + 0.6011, + 0.5974, + 0.5985, + 0.6018, + 0.598, + 0.5993, + 0.5991, + 0.599, + 0.5992, + 0.5991, + 0.6004, + 0.5994, + 0.5993, + 0.5994, + 0.5993 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.9868886470794678, + 0.9831097722053528 + ], + "nudging": { + "0.001": [ + -0.0010212662164121866, + -0.0008843992254696786 + ], + "0.003": [ + -0.0030618617311120033, + -0.0026517128571867943 + ], + "0.01": [ + -0.010182719677686691, + -0.008822238072752953 + ] + } + }, + "drift": { + "embed.weight": 8.850352053801725, + "embed.bias": 26.80721203618006, + "blocks.0.ln.weight": 0.20347274443339167, + "blocks.0.w1.weight": 4.629616202784868, + "blocks.0.w1.bias": 7.3007028332357145, + "blocks.0.w2.weight": 12.573673444728787, + "blocks.1.ln.weight": 0.15135983015831284, + "blocks.1.w1.weight": 4.835127700607666, + "blocks.1.w1.bias": 4.074910897523138, + "blocks.1.w2.weight": 15.468163387197967, + "out_ln.weight": 0.43266956541456525, + "out_head.weight": 2.288095707738499, + "out_head.bias": 1.5696642748538316 + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.0506517180633543, + 2.037630374984741, + 2.0375006256103516, + 2.0347165871810913, + 2.0280541705322266, + 2.0247886113739013, + 2.023957159957886, + 2.017765091934204, + 2.013640316925049, + 2.0121789574813844, + 2.012694746131897, + 2.0094316165542603, + 2.010430689163208, + 2.0080650563812257, + 2.004681011276245, + 2.0067793479156495, + 2.002835368652344, + 2.0035605745697023, + 2.005288227157593, + 2.0020996487045286, + 2.0037673551940918, + 2.0026556689453123, + 2.0015291195678713, + 1.9998969723129272, + 2.001053342666626, + 1.9988280670166017, + 1.998517660293579, + 2.000125762634277, + 1.9984248222351073, + 2.0001446187973024, + 1.997779655456543, + 1.9962129680633545, + 1.996638311729431, + 1.9934515882873536, + 1.9944385040664674, + 1.9950137895965576, + 1.9948566608428955, + 1.9947254082489014, + 1.9938683570861817, + 1.993011798019409, + 1.993586630821228, + 1.9928539782333374, + 1.99163732421875, + 1.9935448779296876, + 1.992500286026001, + 1.9926587213134765, + 1.9939856634140014, + 1.9904723690795898, + 1.99148487449646, + 1.989919489364624, + 1.9883176875305175, + 1.9909399053192138, + 1.9917929566955566, + 1.9895172406005859, + 1.9915735732650757, + 1.98892810256958, + 1.9902667702484131, + 1.9884299784851074, + 1.9891859377288819, + 1.9871826519012452, + 1.9888171925354003, + 1.9876050499725342, + 1.9885715426635742, + 1.9879224799346924, + 1.9875414797210693, + 1.9883081774902345, + 1.9874149275970459, + 1.9873363061904907, + 1.9844847861480712, + 1.9853876978302003, + 1.9853303070449828, + 1.986023975753784, + 1.9871168149566651, + 1.9860221238708495, + 1.9863739596176146, + 1.9852040929412842, + 1.9818872883605958, + 1.9874637450408936, + 1.9860291708374023, + 1.9853426343154907, + 1.9848574941253663, + 1.985159556503296, + 1.9853443636322021, + 1.9854941542053222, + 1.9842009844970703, + 1.9843328964614868, + 1.9830964395141601, + 1.9839789056777954, + 1.9838400217437744, + 1.9850177837371825, + 1.9836825035858154, + 1.9848054162597657, + 1.9832133966827392, + 1.9829493893432617, + 1.9810011239242553, + 1.9834887173843383, + 1.9844633283233644, + 1.9830566509628296, + 1.983135018005371, + 1.9840513249969483 + ], + "train_acc": [ + 0.24914, + 0.2591, + 0.25864, + 0.25854, + 0.26322, + 0.26478, + 0.2666, + 0.2671, + 0.27048, + 0.26588, + 0.26632, + 0.27096, + 0.26978, + 0.2698, + 0.27074, + 0.27022, + 0.27292, + 0.27118, + 0.27308, + 0.27424, + 0.27086, + 0.27322, + 0.27464, + 0.2738, + 0.27538, + 0.27228, + 0.2751, + 0.27742, + 0.27544, + 0.2723, + 0.27602, + 0.27634, + 0.27544, + 0.27646, + 0.27732, + 0.27708, + 0.27726, + 0.2762, + 0.27976, + 0.27826, + 0.27656, + 0.2791, + 0.28084, + 0.27786, + 0.27708, + 0.27874, + 0.27834, + 0.28096, + 0.27838, + 0.28342, + 0.27998, + 0.27926, + 0.27846, + 0.2797, + 0.27926, + 0.28266, + 0.2793, + 0.28242, + 0.27896, + 0.27938, + 0.2807, + 0.28146, + 0.27946, + 0.279, + 0.28374, + 0.28138, + 0.28202, + 0.28122, + 0.2837, + 0.28122, + 0.28228, + 0.2817, + 0.27958, + 0.283, + 0.2825, + 0.28446, + 0.28486, + 0.28054, + 0.28292, + 0.28036, + 0.28328, + 0.28302, + 0.28552, + 0.2844, + 0.28334, + 0.28374, + 0.28518, + 0.28306, + 0.2825, + 0.28426, + 0.28316, + 0.28418, + 0.28372, + 0.285, + 0.28484, + 0.2843, + 0.28284, + 0.28358, + 0.28314, + 0.28086 + ], + "test_acc": [ + 0.2818, + 0.2871, + 0.2791, + 0.2853, + 0.2856, + 0.2861, + 0.3039, + 0.2842, + 0.2723, + 0.2875, + 0.2911, + 0.2934, + 0.3073, + 0.3023, + 0.2854, + 0.2884, + 0.3049, + 0.2901, + 0.2934, + 0.3139, + 0.3034, + 0.3021, + 0.321, + 0.2958, + 0.3122, + 0.2967, + 0.3089, + 0.3045, + 0.2876, + 0.2966, + 0.3042, + 0.2978, + 0.3161, + 0.3091, + 0.3033, + 0.3149, + 0.3106, + 0.2978, + 0.3124, + 0.3057, + 0.3115, + 0.2996, + 0.3098, + 0.303, + 0.2889, + 0.3177, + 0.3011, + 0.2992, + 0.3019, + 0.3108, + 0.3212, + 0.3085, + 0.3138, + 0.3106, + 0.296, + 0.3106, + 0.3058, + 0.3123, + 0.3076, + 0.3118, + 0.3063, + 0.3124, + 0.3079, + 0.3077, + 0.3123, + 0.3141, + 0.3109, + 0.319, + 0.3017, + 0.3049, + 0.3113, + 0.318, + 0.3157, + 0.3079, + 0.3101, + 0.3137, + 0.3058, + 0.3153, + 0.3094, + 0.3139, + 0.3087, + 0.3128, + 0.3162, + 0.3133, + 0.3087, + 0.3134, + 0.3167, + 0.3121, + 0.3118, + 0.3111, + 0.3131, + 0.3113, + 0.3128, + 0.3125, + 0.3131, + 0.3123, + 0.3118, + 0.312, + 0.3121, + 0.3122 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.396158367395401, + -0.005014405585825443 + ], + "perturbation_rho": [ + 0.0009753962513059378, + 0.0 + ], + "nudging": { + "0.001": [ + -4.3818727135658264e-07, + 0.0 + ], + "0.003": [ + -1.3783574104309082e-06, + 9.313225746154785e-10 + ], + "0.01": [ + -4.818197339773178e-06, + 3.725290298461914e-09 + ] + } + }, + "drift": { + "embed.weight": 323.8257144939098, + "embed.bias": 248.21108220164808, + "blocks.0.ln.weight": 8.42464670192897, + "blocks.0.w1.weight": 206.7713721666247, + "blocks.0.w1.bias": 171.8292028267183, + "blocks.0.w2.weight": 323.69930361812675, + "blocks.1.ln.weight": 6.518412820464622, + "blocks.1.w1.weight": 229.69399525127193, + "blocks.1.w1.bias": 219.11418017905737, + "blocks.1.w2.weight": 202.46482559231447, + "out_ln.weight": 0.4266951230953523, + "out_head.weight": 6.867727427000321, + "out_head.bias": 3.719577118675905 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0466229999542236, + 2.0390515814208983, + 2.0387567960357664, + 2.035990318336487, + 2.0319369410705566, + 2.0270682551574706, + 2.0257353674316407, + 2.01995243888855, + 2.014456915893555, + 2.014794263648987, + 2.0092950971221923, + 2.0075508432769777, + 2.0089861209869384, + 2.009624204673767, + 2.0054416754150393, + 2.004343302459717, + 2.004835032348633, + 2.004392629699707, + 2.0029932656097413, + 2.002116594848633, + 2.0016485495758056, + 1.9995216164398193, + 1.9959283925628661, + 1.9984067166900634, + 1.9955141537475587, + 1.9943039474105835, + 1.9905847966003418, + 1.9943868572235108, + 1.9933354425811767, + 1.9950886684799194, + 1.9958439822769165, + 1.9941565301132202, + 1.992669308166504, + 1.9904355131530762, + 1.9945945461273193, + 1.9895463079452516, + 1.9893892168807983, + 1.9876361457061769, + 1.9826778482055665, + 1.988116795387268, + 1.9903033963012695, + 1.9945041528320313, + 2.003135726776123, + 2.0090655849838255, + 2.003611517944336, + 1.993031780052185, + 1.9829731557846069, + 1.9795342245483398, + 1.9742745175933838, + 1.9710580517196656, + 1.9662886399841308, + 1.9650878366470337, + 1.9633581380462646, + 1.9602308530426025, + 1.9592647447967528, + 1.9569754809570312, + 1.9564002374267577, + 1.9596573688125611, + 1.9562416759490966, + 1.9577629917907715, + 1.9564975534057618, + 1.9539075463485718, + 1.9531170993804932, + 1.9562737216949464, + 1.9533874069213868, + 1.9565455058288574, + 1.9550479524993896, + 1.9579495740509034, + 1.9561651504898072, + 1.9566914569091798, + 1.9560811403656007, + 1.9559252410888672, + 1.954912179260254, + 1.9543887220001221, + 1.9562247213363648, + 1.9564899509429932, + 1.9564726518249511, + 1.9530779626464845, + 1.954867910079956, + 1.953048494796753, + 1.9528486930084228, + 1.9534204055404663, + 1.9533309042358398, + 1.952870100631714, + 1.9535446406555175, + 1.9520780282592773, + 1.9539363479614258, + 1.9533953338241576, + 1.9520681017303467, + 1.9507475804901122, + 1.9521085049819946, + 1.9542150582122804, + 1.9536484621429444, + 1.9531653139877319, + 1.9510113228988648, + 1.9543765464782714, + 1.9518434842681884, + 1.9509774511337281, + 1.9520590380859375, + 1.9515080471801758 + ], + "train_acc": [ + 0.25224, + 0.25856, + 0.25666, + 0.2584, + 0.26252, + 0.26562, + 0.26418, + 0.2664, + 0.26886, + 0.27, + 0.27072, + 0.27296, + 0.26938, + 0.27142, + 0.27324, + 0.27214, + 0.27118, + 0.27374, + 0.274, + 0.27416, + 0.27408, + 0.27516, + 0.27406, + 0.2768, + 0.27462, + 0.27758, + 0.2832, + 0.27908, + 0.27992, + 0.27762, + 0.27726, + 0.27918, + 0.2775, + 0.2774, + 0.2756, + 0.27898, + 0.27944, + 0.27822, + 0.282, + 0.27834, + 0.28466, + 0.28584, + 0.28626, + 0.28466, + 0.2816, + 0.28212, + 0.28232, + 0.28346, + 0.28134, + 0.28332, + 0.2858, + 0.28386, + 0.28558, + 0.28612, + 0.28698, + 0.28932, + 0.2885, + 0.28432, + 0.2864, + 0.28792, + 0.28548, + 0.28804, + 0.28786, + 0.28798, + 0.2883, + 0.28572, + 0.2894, + 0.28642, + 0.28876, + 0.28766, + 0.28924, + 0.28718, + 0.28808, + 0.28528, + 0.2878, + 0.28852, + 0.2875, + 0.28816, + 0.28838, + 0.28702, + 0.29014, + 0.29108, + 0.28906, + 0.29216, + 0.29062, + 0.28836, + 0.29078, + 0.28994, + 0.28852, + 0.29152, + 0.29096, + 0.29036, + 0.29132, + 0.29078, + 0.29352, + 0.28894, + 0.29248, + 0.2919, + 0.2922, + 0.28814 + ], + "test_acc": [ + 0.2783, + 0.2698, + 0.2993, + 0.282, + 0.3008, + 0.2636, + 0.302, + 0.2948, + 0.2815, + 0.2878, + 0.2823, + 0.3067, + 0.3037, + 0.2988, + 0.2874, + 0.2945, + 0.2916, + 0.2958, + 0.3024, + 0.2933, + 0.2879, + 0.3095, + 0.3108, + 0.3052, + 0.3078, + 0.304, + 0.299, + 0.2887, + 0.2945, + 0.2859, + 0.2947, + 0.3076, + 0.287, + 0.3072, + 0.3058, + 0.3008, + 0.2991, + 0.3036, + 0.3086, + 0.2928, + 0.3031, + 0.3113, + 0.307, + 0.3049, + 0.3033, + 0.3003, + 0.3063, + 0.307, + 0.2942, + 0.312, + 0.3043, + 0.3027, + 0.3029, + 0.3049, + 0.297, + 0.3117, + 0.2993, + 0.3076, + 0.2972, + 0.3089, + 0.3051, + 0.31, + 0.3078, + 0.2928, + 0.3153, + 0.3035, + 0.3138, + 0.3058, + 0.312, + 0.3027, + 0.3098, + 0.3066, + 0.3106, + 0.3118, + 0.3022, + 0.3123, + 0.3051, + 0.3089, + 0.3057, + 0.3095, + 0.3091, + 0.3075, + 0.3085, + 0.3078, + 0.3102, + 0.3103, + 0.3092, + 0.3038, + 0.3111, + 0.31, + 0.3089, + 0.3099, + 0.3095, + 0.3099, + 0.3096, + 0.3092, + 0.3102, + 0.3106, + 0.3106, + 0.3105 + ], + "value_loss": [ + 0.5981157046318054, + 0.23145676259040832, + 0.1629143718481064, + 0.13112473169445993, + 0.1034177236700058, + 0.0916099097251892, + 0.09448877233743667, + 0.07975816262960433, + 0.07028926397323608, + 0.06960906606912613, + 0.0663377025961876, + 0.06277827244520187, + 0.06609309570908546, + 0.05464596090316772, + 0.05347000701904297, + 0.055175553441047666, + 0.05404586620092392, + 0.050111453244686126, + 0.04170590556740761, + 0.042121976542472836, + 0.04078092483282089, + 0.04033791535496712, + 0.041389339334964755, + 0.04141822567462921, + 0.039917332406044004, + 0.036470176842212675, + 0.03570402141869068, + 0.0356453166270256, + 0.0348940605866909, + 0.03294261076688766, + 0.030363075378537177, + 0.031874004955291746, + 0.028748285691142083, + 0.02522519760966301, + 0.025916270488500596, + 0.02379499412894249, + 0.0268276374822855, + 0.021691660759449005, + 0.019947531086206435, + 0.021523804327845574, + 0.02691959607720375, + 0.02570752409338951, + 0.02876643155694008, + 0.0335148137229681, + 0.031904469298124315, + 0.02778498649060726, + 0.02370047950387001, + 0.02384015331029892, + 0.022202999491095544, + 0.02014792114138603, + 0.01951033084630966, + 0.0173978901296854, + 0.015886960296034813, + 0.014518849447965622, + 0.016183216240406036, + 0.016505281180143355, + 0.014820445327758789, + 0.014580657460987568, + 0.012194996480941772, + 0.014215488128364087, + 0.013283061341047286, + 0.011145545057058334, + 0.011805196754932403, + 0.009617018352746963, + 0.01116202095746994, + 0.009037217251360417, + 0.0090115091329813, + 0.011461790952682495, + 0.008820395555198193, + 0.007558346377015114, + 0.00825535637140274, + 0.007499891985356807, + 0.006166567915007472, + 0.006294274886846542, + 0.006129814375638962, + 0.005847277462333441, + 0.004945684289932251, + 0.004713377166241407, + 0.0033198376420140265, + 0.0037709764985740185, + 0.002341279806494713, + 0.002568720788434148, + 0.002159126052595675, + 0.001921226680725813, + 0.0018878655811026693, + 0.0016211944927275181, + 0.0013243718447163702, + 0.001169309064410627, + 0.0010681760500371455, + 0.0008630752410739661, + 0.0008580225262790919, + 0.0008040335815213621, + 0.0007892505507543683, + 0.0006356554404087364, + 0.0006604202647879719, + 0.0006046383780613541, + 0.0006052350796759129, + 0.0005226440225169063, + 0.0005789817444421351, + 0.0006147388235665858 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.33032962679862976, + 0.01970662735402584 + ], + "perturbation_rho": [ + 0.06130741536617279, + 0.0 + ], + "nudging": { + "0.001": [ + -5.778856575489044e-07, + 0.0 + ], + "0.003": [ + -1.7262063920497894e-06, + 0.0 + ], + "0.01": [ + -5.792360752820969e-06, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 175.24499314321244, + "embed.bias": 87.67212401922586, + "blocks.0.ln.weight": 8.05369238852348, + "blocks.0.w1.weight": 157.60363681616167, + "blocks.0.w1.bias": 81.08793311128552, + "blocks.0.w2.weight": 221.88820128646415, + "blocks.1.ln.weight": 5.44449828938583, + "blocks.1.w1.weight": 244.47570610251066, + "blocks.1.w1.bias": 227.1893178317289, + "blocks.1.w2.weight": 212.32680563546222, + "out_ln.weight": 0.33305352742575556, + "out_head.weight": 4.339797161618964, + "out_head.bias": 2.8094622055285003 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_s42/d512_L4_s42.json b/results/cifar_depth_scan_s42/d512_L4_s42.json new file mode 100644 index 0000000..3fb7a64 --- /dev/null +++ b/results/cifar_depth_scan_s42/d512_L4_s42.json @@ -0,0 +1,1205 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.9128315224838257, + 1.6880022193145752, + 1.6019164403533936, + 1.542231183242798, + 1.4950828089141845, + 1.4559073908996583, + 1.4284738327407838, + 1.397783087120056, + 1.3783822360992433, + 1.3537940772247314, + 1.3363390048980712, + 1.3175183240509034, + 1.301716223526001, + 1.286239836654663, + 1.2730019290542602, + 1.2588182968902588, + 1.2396523715209962, + 1.2286129103851318, + 1.216484442100525, + 1.2020161497688293, + 1.191397441482544, + 1.1803369410705566, + 1.1678005861663818, + 1.158150842514038, + 1.1437132249832154, + 1.1321278622055053, + 1.122210889930725, + 1.1123670346450805, + 1.1020959008026123, + 1.0898543254470825, + 1.0772244114494325, + 1.0695367335128785, + 1.0618911952209473, + 1.0524220000839233, + 1.0425953432464599, + 1.0304253259277343, + 1.023384765663147, + 1.0077225874519349, + 0.9960999109649659, + 0.9944095385360717, + 0.983660818862915, + 0.968802798652649, + 0.9584540496826172, + 0.9542556776809692, + 0.9423338845062256, + 0.9271652110481262, + 0.9240609010696411, + 0.9173964101791382, + 0.9032901007080079, + 0.8992292018318176, + 0.8873294083976746, + 0.8718722639083862, + 0.8695090994262695, + 0.858162225074768, + 0.8499397317695617, + 0.8388333418083191, + 0.8261937767410278, + 0.8185464579582215, + 0.810011429862976, + 0.7982917448425293, + 0.7877091710281372, + 0.7813588368415832, + 0.7747608847618103, + 0.7637265836715699, + 0.7545594720649719, + 0.7478000127983093, + 0.7360342462348938, + 0.7309902267074585, + 0.7200408243942261, + 0.7086022729682923, + 0.7048035074615479, + 0.6956654514884949, + 0.6874777590370178, + 0.682139354915619, + 0.6745446991729737, + 0.6719911893653869, + 0.6605463418197632, + 0.6587527468109131, + 0.653552459449768, + 0.6490319774246216, + 0.6399379921340942, + 0.6357991346931458, + 0.6328972053527832, + 0.6210838864898681, + 0.6178263852119446, + 0.615306571187973, + 0.6115417842102051, + 0.6158308602905274, + 0.6098391858100891, + 0.6050217900466919, + 0.6065702855396271, + 0.6006206908416748, + 0.5975759600830078, + 0.5960665979194641, + 0.5940444506263733, + 0.5969071801757813, + 0.5900075828170777, + 0.5945732257270813, + 0.5974702124786377, + 0.590236732711792 + ], + "train_acc": [ + 0.31564, + 0.39178, + 0.42, + 0.44194, + 0.45874, + 0.47242, + 0.48206, + 0.49302, + 0.50368, + 0.5108, + 0.51956, + 0.52752, + 0.531, + 0.5371, + 0.54046, + 0.54568, + 0.55426, + 0.55788, + 0.56382, + 0.56942, + 0.57036, + 0.5758, + 0.5802, + 0.58474, + 0.58888, + 0.5928, + 0.59766, + 0.6015, + 0.60714, + 0.6108, + 0.61308, + 0.61564, + 0.61944, + 0.6234, + 0.62626, + 0.62754, + 0.63226, + 0.63652, + 0.64376, + 0.6433, + 0.64368, + 0.65028, + 0.65508, + 0.65658, + 0.66194, + 0.6674, + 0.6677, + 0.67076, + 0.67436, + 0.67902, + 0.68228, + 0.6872, + 0.68646, + 0.6916, + 0.6952, + 0.69856, + 0.70518, + 0.70516, + 0.7078, + 0.71188, + 0.72018, + 0.71728, + 0.72058, + 0.72528, + 0.72892, + 0.73086, + 0.73516, + 0.73802, + 0.74118, + 0.74528, + 0.7469, + 0.7505, + 0.7517, + 0.75458, + 0.76024, + 0.76044, + 0.76314, + 0.76424, + 0.76568, + 0.76864, + 0.77176, + 0.7746, + 0.7747, + 0.77746, + 0.7786, + 0.77756, + 0.78208, + 0.78172, + 0.78232, + 0.78392, + 0.78542, + 0.78776, + 0.78702, + 0.78846, + 0.78602, + 0.78574, + 0.78886, + 0.78892, + 0.78904, + 0.79178 + ], + "test_acc": [ + 0.3932, + 0.4305, + 0.4599, + 0.4575, + 0.4965, + 0.5052, + 0.5072, + 0.513, + 0.5146, + 0.5331, + 0.5293, + 0.5323, + 0.5389, + 0.545, + 0.5545, + 0.5444, + 0.5494, + 0.5539, + 0.5652, + 0.5702, + 0.5638, + 0.5713, + 0.5729, + 0.5719, + 0.5722, + 0.5763, + 0.5807, + 0.5794, + 0.5855, + 0.5804, + 0.5844, + 0.59, + 0.5892, + 0.59, + 0.5955, + 0.5931, + 0.5877, + 0.5906, + 0.5944, + 0.6001, + 0.5976, + 0.5995, + 0.6036, + 0.6032, + 0.6069, + 0.6, + 0.6025, + 0.6029, + 0.5956, + 0.603, + 0.6055, + 0.6021, + 0.5997, + 0.6045, + 0.608, + 0.6077, + 0.6047, + 0.6033, + 0.6049, + 0.6026, + 0.6064, + 0.6089, + 0.6065, + 0.6025, + 0.6069, + 0.6068, + 0.6032, + 0.6036, + 0.6062, + 0.6023, + 0.6024, + 0.6011, + 0.603, + 0.6052, + 0.602, + 0.6042, + 0.6033, + 0.6026, + 0.6018, + 0.6026, + 0.6035, + 0.6033, + 0.6028, + 0.6044, + 0.6005, + 0.6037, + 0.6018, + 0.6031, + 0.6027, + 0.6043, + 0.604, + 0.6035, + 0.6024, + 0.604, + 0.6038, + 0.6031, + 0.6021, + 0.6027, + 0.603, + 0.6032 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "perturbation_rho": [ + 0.98465895652771, + 0.9885985851287842, + 0.9880813360214233, + 0.9883240461349487 + ], + "nudging": { + "0.001": [ + -0.001627826364710927, + -0.0016166457207873464, + -0.0015995900612324476, + -0.0014260262250900269 + ], + "0.003": [ + -0.004879107233136892, + -0.004846072755753994, + -0.004795195069164038, + -0.004275224171578884 + ], + "0.01": [ + -0.016217362135648727, + -0.01610748842358589, + -0.015940139070153236, + -0.014218071475625038 + ] + } + }, + "drift": { + "embed.weight": 8.8243080894614, + "embed.bias": 16.94096306102109, + "blocks.0.ln.weight": 0.27074600681784294, + "blocks.0.w1.weight": 4.412644958801875, + "blocks.0.w1.bias": 7.117085807367152, + "blocks.0.w2.weight": 11.508053240186102, + "blocks.1.ln.weight": 0.16732973494773748, + "blocks.1.w1.weight": 4.742762067497133, + "blocks.1.w1.bias": 4.5510383530906955, + "blocks.1.w2.weight": 13.171214559405497, + "blocks.2.ln.weight": 0.17887226073929113, + "blocks.2.w1.weight": 4.753555652638221, + "blocks.2.w1.bias": 4.0288582989197055, + "blocks.2.w2.weight": 14.123960280583763, + "blocks.3.ln.weight": 0.19235362588922475, + "blocks.3.w1.weight": 4.831153218839085, + "blocks.3.w1.bias": 3.727898847051419, + "blocks.3.w2.weight": 15.974843151960325, + "out_ln.weight": 0.4103308080908126, + "out_head.weight": 2.6455778192608332, + "out_head.bias": 1.2917860402449406 + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.0458639289093017, + 2.0289766119384764, + 2.020620018005371, + 2.012297201309204, + 2.0094007360076906, + 2.0115105359649657, + 2.0102763877105714, + 2.006047547874451, + 2.0053908419799806, + 2.006039619178772, + 2.0009452716064455, + 2.0004891522216797, + 1.997944189224243, + 1.9965615715026857, + 1.9999804154205323, + 1.9981115759277344, + 1.9969525494766236, + 1.9967278913879394, + 1.9977753674316405, + 1.9970432605361939, + 1.9937860690307616, + 1.9955713275909424, + 1.994003203048706, + 1.9966396224975587, + 1.9941929375457763, + 1.9933527754974365, + 1.9948605881500243, + 1.99625807762146, + 1.9941814679718017, + 1.9941422396850585, + 1.99151097530365, + 1.9934743473052978, + 1.9893354850769043, + 1.989959321861267, + 1.9919966284942627, + 1.9909703044128417, + 1.9899194409179688, + 1.9901701150512696, + 1.9903043267822265, + 1.9902096912384033, + 1.9900437306976317, + 1.9880607610321044, + 1.9873294051742554, + 1.9879234255981446, + 1.9870288726043701, + 1.9906337995910643, + 1.98670257522583, + 1.986429832382202, + 1.9861535691070558, + 1.9875364014053345, + 1.9880395639801025, + 1.9859618353652955, + 1.9838686182403564, + 1.9850774764251709, + 1.984304948348999, + 1.9849093035125733, + 1.9841952557373046, + 1.9846441001129151, + 1.984178702659607, + 1.9851755959320068, + 1.9839427744293212, + 1.9841270837020875, + 1.9833368181991577, + 1.9830518650817872, + 1.9827289093780518, + 1.9815367695617676, + 1.9821726945495606, + 1.9826502087020874, + 1.9826591117858887, + 1.9820565001678467, + 1.9842380196762084, + 1.9824368360137938, + 1.9822880676269532, + 1.9798370397949219, + 1.9824768118286134, + 1.982346687965393, + 1.9822141482543945, + 1.9804879917907714, + 1.9800791321182252, + 1.9813715744018554, + 1.9813639123535156, + 1.9790491080093384, + 1.980683646774292, + 1.9790133563232422, + 1.9805930490112305, + 1.980672128944397, + 1.981869688796997, + 1.9792622634124757, + 1.9801762536239624, + 1.9814309076690675, + 1.9808863278579711, + 1.9783899629211426, + 1.980429323272705, + 1.9808515368652344, + 1.9805352714538573, + 1.978631600112915, + 1.9817959378814698, + 1.9797530443954467, + 1.9781674542999268, + 1.9783192428970338 + ], + "train_acc": [ + 0.2491, + 0.25984, + 0.2652, + 0.26518, + 0.26756, + 0.26822, + 0.26646, + 0.26766, + 0.26952, + 0.26786, + 0.2692, + 0.27078, + 0.2744, + 0.27082, + 0.27058, + 0.26992, + 0.27464, + 0.2732, + 0.2712, + 0.27484, + 0.27366, + 0.27528, + 0.27524, + 0.27466, + 0.2739, + 0.27726, + 0.2754, + 0.27326, + 0.27062, + 0.2751, + 0.27784, + 0.27426, + 0.27818, + 0.28086, + 0.27724, + 0.27694, + 0.27696, + 0.27858, + 0.2784, + 0.27956, + 0.27774, + 0.28002, + 0.28038, + 0.2798, + 0.2806, + 0.27946, + 0.27928, + 0.28056, + 0.28084, + 0.28006, + 0.2811, + 0.28282, + 0.2807, + 0.28176, + 0.2819, + 0.28218, + 0.28188, + 0.28362, + 0.28256, + 0.28266, + 0.28368, + 0.28256, + 0.28366, + 0.28098, + 0.28328, + 0.28394, + 0.28346, + 0.28286, + 0.28388, + 0.28246, + 0.28286, + 0.28164, + 0.28372, + 0.28418, + 0.28458, + 0.28382, + 0.28406, + 0.2839, + 0.28352, + 0.28454, + 0.28204, + 0.28542, + 0.28458, + 0.2855, + 0.28488, + 0.28726, + 0.28564, + 0.2841, + 0.2856, + 0.28356, + 0.2863, + 0.28382, + 0.2859, + 0.28326, + 0.28584, + 0.28438, + 0.28494, + 0.2853, + 0.28502, + 0.28404 + ], + "test_acc": [ + 0.29, + 0.3005, + 0.2688, + 0.2879, + 0.2899, + 0.2866, + 0.2708, + 0.2917, + 0.2939, + 0.2888, + 0.3039, + 0.3014, + 0.2872, + 0.2932, + 0.3039, + 0.2983, + 0.3074, + 0.2815, + 0.3073, + 0.3121, + 0.3117, + 0.2972, + 0.2956, + 0.2898, + 0.3126, + 0.3014, + 0.3087, + 0.2844, + 0.2987, + 0.3162, + 0.2839, + 0.3007, + 0.299, + 0.2998, + 0.2977, + 0.3051, + 0.304, + 0.3093, + 0.3049, + 0.3037, + 0.3143, + 0.3147, + 0.2974, + 0.3146, + 0.3051, + 0.3068, + 0.3035, + 0.3095, + 0.3052, + 0.3107, + 0.3102, + 0.3022, + 0.3059, + 0.315, + 0.3074, + 0.3028, + 0.3144, + 0.3099, + 0.3026, + 0.3032, + 0.3081, + 0.3198, + 0.3133, + 0.3066, + 0.314, + 0.3126, + 0.3091, + 0.3119, + 0.3124, + 0.3184, + 0.3069, + 0.3125, + 0.3005, + 0.3117, + 0.3089, + 0.3089, + 0.3169, + 0.3106, + 0.3187, + 0.3165, + 0.3151, + 0.3145, + 0.3146, + 0.3104, + 0.3147, + 0.3125, + 0.3156, + 0.3169, + 0.3141, + 0.316, + 0.3152, + 0.3129, + 0.3126, + 0.3141, + 0.3143, + 0.3147, + 0.3146, + 0.3142, + 0.314, + 0.314 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4003449082374573, + 0.001211420283652842, + -0.00036704502417705953, + -0.001560344360768795 + ], + "perturbation_rho": [ + 0.011487731710076332, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -4.852190613746643e-07, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.4952383935451508e-06, + -9.313225746154785e-10, + 0.0, + 0.0 + ], + "0.01": [ + -4.9872323870658875e-06, + -3.725290298461914e-09, + 2.3283064365386963e-09, + -1.862645149230957e-09 + ] + } + }, + "drift": { + "embed.weight": 315.1599803678731, + "embed.bias": 244.58720774886493, + "blocks.0.ln.weight": 8.197430677494586, + "blocks.0.w1.weight": 199.45530019449558, + "blocks.0.w1.bias": 169.48912351090533, + "blocks.0.w2.weight": 327.4002685876291, + "blocks.1.ln.weight": 6.599592372532966, + "blocks.1.w1.weight": 229.02521385968495, + "blocks.1.w1.bias": 216.20223057872374, + "blocks.1.w2.weight": 201.88759050630722, + "blocks.2.ln.weight": 7.947358922483768, + "blocks.2.w1.weight": 321.18706085148796, + "blocks.2.w1.bias": 277.92923879713146, + "blocks.2.w2.weight": 246.2703649903627, + "blocks.3.ln.weight": 5.776195341542472, + "blocks.3.w1.weight": 200.0071643423771, + "blocks.3.w1.bias": 167.9311499839471, + "blocks.3.w2.weight": 151.89636822620278, + "out_ln.weight": 0.5328500972285665, + "out_head.weight": 8.52020076404927, + "out_head.bias": 1.2327914968426916 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0418811988830567, + 2.0244707107162476, + 2.015521148300171, + 2.0061337772369385, + 2.0037599030303954, + 2.0030078707885743, + 1.999246537513733, + 1.9986579943847655, + 1.9972485411834717, + 1.9962204788970948, + 1.9977344912338257, + 1.9994980056381226, + 1.9950928838729858, + 1.9959543724060058, + 1.9950839403533935, + 1.995928331451416, + 1.9931118923950195, + 1.9951996542739867, + 1.9903301047134399, + 1.99565612575531, + 1.9905316178131103, + 1.9879318959045411, + 1.9921765214538574, + 1.988416219329834, + 1.988950412826538, + 1.9850122336578369, + 1.9853902856445313, + 1.985061616744995, + 1.9886472620391846, + 1.9883863719940185, + 1.9913309915161133, + 1.9895416070175171, + 1.987194644241333, + 1.9894078858947755, + 1.9878019535827636, + 1.9846340017700195, + 1.9846721477508544, + 1.9833970055389405, + 1.97837587184906, + 1.9834315983581543, + 1.976168726158142, + 1.976138740310669, + 1.9748867916488648, + 1.9714933393096923, + 1.9723309854888915, + 1.9734577295303344, + 1.9773753978729247, + 1.9739041761779785, + 1.9783673559570312, + 1.9767930798339843, + 1.9739136279678344, + 1.970040503616333, + 1.969602509536743, + 1.970613325881958, + 1.9665965628051758, + 1.9671646138763428, + 1.9675314767074585, + 1.9716551809692382, + 1.971007603111267, + 1.976275298461914, + 1.9748961191558838, + 1.9742881618881225, + 1.9736152155303954, + 1.9752269494628907, + 1.973985399093628, + 1.9731344959259034, + 1.9733161668395995, + 1.9738907193756103, + 1.9722116097640991, + 1.9699555205535888, + 1.972003019142151, + 1.9740287133407592, + 1.9716516065979004, + 1.969599935836792, + 1.9734370888900756, + 1.9703946390533447, + 1.9703987968444825, + 1.96968883518219, + 1.969948963279724, + 1.9703090355682373, + 1.969407484512329, + 1.9689243365097047, + 1.9691953955078125, + 1.9695471990966797, + 1.9693656219482423, + 1.9675928352355958, + 1.9688836163711547, + 1.9679821907043458, + 1.9700432720184327, + 1.9663442990493774, + 1.9663598616790772, + 1.9673082627868652, + 1.9678210963439942, + 1.96654816696167, + 1.9666101715087891, + 1.9660805171203612, + 1.966873331642151, + 1.966620960006714, + 1.9675770812606812, + 1.964846303024292 + ], + "train_acc": [ + 0.2533, + 0.2611, + 0.26526, + 0.26344, + 0.26812, + 0.2687, + 0.27104, + 0.27094, + 0.27094, + 0.27538, + 0.27276, + 0.27328, + 0.2756, + 0.27502, + 0.274, + 0.27276, + 0.2765, + 0.275, + 0.27584, + 0.27372, + 0.27766, + 0.27726, + 0.27552, + 0.2776, + 0.27428, + 0.2813, + 0.27736, + 0.2803, + 0.27882, + 0.27776, + 0.27758, + 0.2801, + 0.28084, + 0.27702, + 0.2819, + 0.27934, + 0.28016, + 0.2815, + 0.28464, + 0.2808, + 0.28334, + 0.28568, + 0.2852, + 0.2873, + 0.28756, + 0.287, + 0.29052, + 0.28836, + 0.28402, + 0.28472, + 0.28438, + 0.28548, + 0.28464, + 0.28252, + 0.2821, + 0.27936, + 0.28156, + 0.27808, + 0.27828, + 0.277, + 0.2753, + 0.27688, + 0.27532, + 0.27604, + 0.27414, + 0.27342, + 0.27416, + 0.27398, + 0.2779, + 0.2781, + 0.276, + 0.27548, + 0.2788, + 0.2794, + 0.27964, + 0.28044, + 0.28268, + 0.2817, + 0.28064, + 0.27928, + 0.28, + 0.28164, + 0.28246, + 0.28102, + 0.28358, + 0.28138, + 0.28232, + 0.28474, + 0.28286, + 0.28322, + 0.28316, + 0.28318, + 0.28198, + 0.28422, + 0.28366, + 0.28454, + 0.28538, + 0.2829, + 0.2831, + 0.28552 + ], + "test_acc": [ + 0.2888, + 0.2864, + 0.2858, + 0.2885, + 0.2871, + 0.3073, + 0.2926, + 0.3191, + 0.3113, + 0.3016, + 0.3124, + 0.2995, + 0.3046, + 0.2943, + 0.3111, + 0.2989, + 0.2944, + 0.2888, + 0.3006, + 0.2952, + 0.2985, + 0.3075, + 0.2969, + 0.3113, + 0.3152, + 0.3054, + 0.3137, + 0.3075, + 0.3116, + 0.3207, + 0.3132, + 0.3203, + 0.3138, + 0.2868, + 0.3006, + 0.3085, + 0.3173, + 0.3158, + 0.3112, + 0.3166, + 0.3082, + 0.2936, + 0.3047, + 0.3188, + 0.3158, + 0.3186, + 0.3109, + 0.2969, + 0.3073, + 0.3111, + 0.3051, + 0.2869, + 0.3112, + 0.2917, + 0.282, + 0.2801, + 0.3098, + 0.3097, + 0.2986, + 0.2964, + 0.2884, + 0.2738, + 0.2961, + 0.2958, + 0.2773, + 0.297, + 0.3029, + 0.2907, + 0.2935, + 0.2936, + 0.2939, + 0.2991, + 0.2958, + 0.2873, + 0.2939, + 0.2961, + 0.2942, + 0.2871, + 0.3067, + 0.293, + 0.3001, + 0.2932, + 0.2985, + 0.2896, + 0.3012, + 0.298, + 0.2904, + 0.2971, + 0.3012, + 0.291, + 0.2965, + 0.2961, + 0.2997, + 0.2997, + 0.3002, + 0.2997, + 0.2982, + 0.2984, + 0.2979, + 0.2983 + ], + "value_loss": [ + 0.5735433899068832, + 0.19343321340560912, + 0.1459548154258728, + 0.11554339327573776, + 0.10444803307533264, + 0.09662322332382202, + 0.07835375997543335, + 0.07846195635318756, + 0.07231992372989654, + 0.06300295606732369, + 0.0541220169878006, + 0.061311349160671234, + 0.054080903697013856, + 0.04913855415701866, + 0.053713992041945456, + 0.053991433643102646, + 0.042828602213859555, + 0.04867008077502251, + 0.036165564210414884, + 0.04136963748335838, + 0.03747292908787728, + 0.036461174008846284, + 0.03738185323476791, + 0.036185857799053193, + 0.037782702654600146, + 0.03236810895383358, + 0.028799428634643555, + 0.026735566897988318, + 0.028131072289943694, + 0.025900923478007317, + 0.02817378466963768, + 0.02747203625589609, + 0.022810295909643175, + 0.02715033429145813, + 0.023775706954598425, + 0.024240291431546213, + 0.02618250633716583, + 0.018726080359220503, + 0.019515147968530655, + 0.020435102397203444, + 0.02499964476108551, + 0.025505309803485872, + 0.029445164866447448, + 0.025735821738243105, + 0.02567795764923096, + 0.026399999004602433, + 0.02691687547147274, + 0.029062440598011018, + 0.030562642726898192, + 0.030370158289074897, + 0.030683111140727998, + 0.026187384767532348, + 0.024638052703738214, + 0.023440595749616624, + 0.020625758872032166, + 0.02062276856124401, + 0.01832583192050457, + 0.019966158434748648, + 0.018222353776693345, + 0.01633087551832199, + 0.01604582875967026, + 0.017060256469249725, + 0.016002053155303002, + 0.012738182610273362, + 0.012326533913612365, + 0.011105860123932361, + 0.009771750206947327, + 0.01024535400569439, + 0.009756301180124282, + 0.010442935926914216, + 0.008487312002182007, + 0.007283874700143933, + 0.007183250502049923, + 0.006603042964339256, + 0.006635444448143244, + 0.0059348720067739485, + 0.005370370441824198, + 0.004778812771886587, + 0.004565887214839458, + 0.0041534857338666915, + 0.003742397453635931, + 0.002904790796712041, + 0.0025213647907227276, + 0.002474344636797905, + 0.0021933346104249358, + 0.0016953631690889597, + 0.0015760234126448631, + 0.0016894616746902466, + 0.0012066031998768448, + 0.0011484015756100417, + 0.0009841965650953352, + 0.0010899798352271318, + 0.0011266277173534035, + 0.000903698658272624, + 0.0006944430249370635, + 0.000758418973647058, + 0.0006867282877117396, + 0.0007330659104511142, + 0.0006502793713379652, + 0.0009213672729767859 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4021158814430237, + 0.01842920482158661, + 0.0360899493098259, + 0.03449413180351257 + ], + "perturbation_rho": [ + -0.009267053566873074, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -7.189810276031494e-07, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -2.16485932469368e-06, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -7.1660615503787994e-06, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 172.83875443763608, + "embed.bias": 95.3607064520029, + "blocks.0.ln.weight": 7.63160821502783, + "blocks.0.w1.weight": 152.1378494011768, + "blocks.0.w1.bias": 96.77665305560761, + "blocks.0.w2.weight": 233.87471998777892, + "blocks.1.ln.weight": 5.632208554748294, + "blocks.1.w1.weight": 278.87861207801535, + "blocks.1.w1.bias": 289.80305690116165, + "blocks.1.w2.weight": 229.62867282953147, + "blocks.2.ln.weight": 6.009254605154408, + "blocks.2.w1.weight": 273.52084419582525, + "blocks.2.w1.bias": 229.66597331157521, + "blocks.2.w2.weight": 178.21767131714722, + "blocks.3.ln.weight": 4.147781351924253, + "blocks.3.w1.weight": 131.08945490495597, + "blocks.3.w1.bias": 109.99062036071389, + "blocks.3.w2.weight": 129.72460456542194, + "out_ln.weight": 0.3547089789563311, + "out_head.weight": 5.58566439429333, + "out_head.bias": 2.120221083274003 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_s42/d512_L6_s42.json b/results/cifar_depth_scan_s42/d512_L6_s42.json new file mode 100644 index 0000000..307248f --- /dev/null +++ b/results/cifar_depth_scan_s42/d512_L6_s42.json @@ -0,0 +1,1259 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.9181581103515626, + 1.6830080932235718, + 1.5920702320480347, + 1.5328609270477296, + 1.4799005626678468, + 1.443107092781067, + 1.4138772471618652, + 1.3873612524032592, + 1.3651276648712158, + 1.3390819979095459, + 1.3217692392349243, + 1.305022211074829, + 1.2817235651779175, + 1.2682050260925293, + 1.2521741982269288, + 1.2378110882568358, + 1.215573044204712, + 1.2035384091949464, + 1.1932872578430176, + 1.1754147102737427, + 1.1641269732284545, + 1.1506621165275575, + 1.1339097010803223, + 1.1212864548492432, + 1.1109269207000732, + 1.0991801218032837, + 1.085493840484619, + 1.068724670715332, + 1.0622537975883484, + 1.0497802551078796, + 1.0335843839645387, + 1.0245532283782959, + 1.0139307324409486, + 1.003597820968628, + 0.9886502099990845, + 0.9805063750457763, + 0.9631068154907226, + 0.9566182117843628, + 0.9359624940299988, + 0.9330330731201172, + 0.9160753777313232, + 0.9056328008651734, + 0.8898537806510926, + 0.8787901188278199, + 0.8694718393707276, + 0.8506128107833862, + 0.8468854373931884, + 0.8328564296150207, + 0.8235082776260376, + 0.8091592510604858, + 0.7912276449775696, + 0.7819558120727539, + 0.7648613720703125, + 0.7557380415725709, + 0.7431310074996949, + 0.7325722367095947, + 0.7191381365394592, + 0.7073116994094849, + 0.6935642263793945, + 0.6829617013549805, + 0.6721186479949951, + 0.6607764552879334, + 0.6520131350326538, + 0.6347136948776245, + 0.6286079556655884, + 0.6146584116744995, + 0.6037020747566223, + 0.5897762714195252, + 0.5843867614936828, + 0.57075146068573, + 0.5668514904212951, + 0.5526476261138916, + 0.5426406643104553, + 0.5337510031700134, + 0.524534646692276, + 0.5152219123649597, + 0.508841796541214, + 0.5018864378547668, + 0.49528331829071043, + 0.4755337562465668, + 0.47835412044525144, + 0.47154994369506836, + 0.4639086106681824, + 0.4569279855918884, + 0.45118384454727173, + 0.4504211899662018, + 0.44511490434646606, + 0.44647758895874023, + 0.4362948834133148, + 0.43578986066818237, + 0.42930271067619324, + 0.4292936919593811, + 0.42567773310661317, + 0.4261182806301117, + 0.4239413748073578, + 0.42333943349838254, + 0.42293740759849546, + 0.4217962563323975, + 0.4224112439918518, + 0.41819300340652465 + ], + "train_acc": [ + 0.3148, + 0.3896, + 0.4219, + 0.4456, + 0.4649, + 0.47824, + 0.48992, + 0.49962, + 0.50886, + 0.51698, + 0.5202, + 0.52942, + 0.5382, + 0.5446, + 0.55176, + 0.5529, + 0.56062, + 0.56588, + 0.57028, + 0.577, + 0.58132, + 0.58658, + 0.59166, + 0.5987, + 0.59994, + 0.60574, + 0.6103, + 0.61766, + 0.61624, + 0.62304, + 0.62624, + 0.63198, + 0.63774, + 0.6413, + 0.64644, + 0.64766, + 0.65282, + 0.6553, + 0.66614, + 0.66296, + 0.67122, + 0.67416, + 0.68156, + 0.68518, + 0.6881, + 0.69356, + 0.69534, + 0.70084, + 0.70508, + 0.7084, + 0.71508, + 0.72034, + 0.72434, + 0.72938, + 0.73464, + 0.73592, + 0.7404, + 0.74552, + 0.75048, + 0.75408, + 0.75802, + 0.76272, + 0.76562, + 0.77362, + 0.77548, + 0.77904, + 0.78336, + 0.78934, + 0.79158, + 0.79514, + 0.79768, + 0.80414, + 0.80546, + 0.80986, + 0.81272, + 0.8163, + 0.81728, + 0.82112, + 0.82318, + 0.83366, + 0.83042, + 0.83306, + 0.836, + 0.83884, + 0.84078, + 0.83852, + 0.84302, + 0.8422, + 0.84388, + 0.84512, + 0.84892, + 0.85022, + 0.84986, + 0.85088, + 0.85284, + 0.8506, + 0.85018, + 0.85162, + 0.85258, + 0.85238 + ], + "test_acc": [ + 0.3995, + 0.428, + 0.4626, + 0.4828, + 0.4996, + 0.4961, + 0.5122, + 0.5214, + 0.5273, + 0.5318, + 0.5434, + 0.5431, + 0.5502, + 0.5495, + 0.5558, + 0.561, + 0.5593, + 0.5638, + 0.5727, + 0.5612, + 0.5661, + 0.5729, + 0.5769, + 0.5734, + 0.5798, + 0.5882, + 0.5883, + 0.5755, + 0.5828, + 0.5873, + 0.597, + 0.5833, + 0.5976, + 0.5915, + 0.5937, + 0.5918, + 0.5933, + 0.5934, + 0.5907, + 0.5972, + 0.5938, + 0.5974, + 0.5929, + 0.5938, + 0.6001, + 0.5933, + 0.6036, + 0.5987, + 0.5999, + 0.6037, + 0.594, + 0.5996, + 0.598, + 0.6017, + 0.597, + 0.6042, + 0.6017, + 0.5988, + 0.6004, + 0.6015, + 0.5984, + 0.6042, + 0.6041, + 0.6052, + 0.5989, + 0.605, + 0.6022, + 0.6055, + 0.6057, + 0.6064, + 0.6051, + 0.6055, + 0.6057, + 0.6056, + 0.6008, + 0.6045, + 0.6039, + 0.6033, + 0.6037, + 0.6022, + 0.6002, + 0.6018, + 0.5997, + 0.6029, + 0.6038, + 0.601, + 0.6044, + 0.6028, + 0.603, + 0.6031, + 0.6026, + 0.6029, + 0.6016, + 0.6033, + 0.6014, + 0.6027, + 0.6025, + 0.602, + 0.6014, + 0.6015 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9925569295883179, + 0.9925950765609741, + 0.9925851225852966, + 0.9926368594169617, + 0.992660403251648, + 0.9924540519714355 + ], + "perturbation_rho": [ + 0.9874800443649292, + 0.9890985488891602, + 0.991584300994873, + 0.9924823641777039, + 0.9907411336898804, + 0.9890323877334595 + ], + "nudging": { + "0.001": [ + -0.0019930435810238123, + -0.002028408693149686, + -0.002009383402764797, + -0.001996344421058893, + -0.0018836274975910783, + -0.001594579080119729 + ], + "0.003": [ + -0.00597399240359664, + -0.006079169921576977, + -0.006022875662893057, + -0.005983929615467787, + -0.005646158009767532, + -0.004780753515660763 + ], + "0.01": [ + -0.01984817534685135, + -0.020196668803691864, + -0.020013831555843353, + -0.019886385649442673, + -0.018769418820738792, + -0.015900740399956703 + ] + } + }, + "drift": { + "embed.weight": 8.830199479874222, + "embed.bias": 13.652383066527548, + "blocks.0.ln.weight": 0.3209315667509576, + "blocks.0.w1.weight": 4.304189279431552, + "blocks.0.w1.bias": 6.874941583705022, + "blocks.0.w2.weight": 11.040131085404404, + "blocks.1.ln.weight": 0.19033462322360514, + "blocks.1.w1.weight": 4.611319361803835, + "blocks.1.w1.bias": 4.589828072495789, + "blocks.1.w2.weight": 12.410841455300883, + "blocks.2.ln.weight": 0.17767497411972724, + "blocks.2.w1.weight": 4.66461449969762, + "blocks.2.w1.bias": 4.221528366446113, + "blocks.2.w2.weight": 13.02617784277652, + "blocks.3.ln.weight": 0.18648530933637847, + "blocks.3.w1.weight": 4.703468866414805, + "blocks.3.w1.bias": 3.845782047024037, + "blocks.3.w2.weight": 13.668238845356765, + "blocks.4.ln.weight": 0.20878906370184375, + "blocks.4.w1.weight": 4.6585385757744255, + "blocks.4.w1.bias": 3.740256675221265, + "blocks.4.w2.weight": 14.188102590431034, + "blocks.5.ln.weight": 0.21537598403409916, + "blocks.5.w1.weight": 4.700384882175978, + "blocks.5.w1.bias": 3.7260920466734655, + "blocks.5.w2.weight": 15.8432281824125, + "out_ln.weight": 0.3676580083270373, + "out_head.weight": 2.951732465896682, + "out_head.bias": 1.3797369883266803 + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.0429981646728517, + 2.0311185948181154, + 2.025969026145935, + 2.0156248236846923, + 2.012451182785034, + 2.0101683282852174, + 2.0090535586547853, + 2.0049661489105226, + 2.0042781643676757, + 2.007534557952881, + 2.005720973892212, + 2.0033944567108155, + 2.0026611005401613, + 2.0042629623413086, + 2.0030657132339478, + 2.0019637285614014, + 2.0002238693237304, + 2.0020113787841796, + 2.002593652191162, + 1.999959507446289, + 1.99915257938385, + 1.996764479637146, + 1.99686444190979, + 1.9965196546936035, + 1.9979205041503907, + 1.9956562859344482, + 1.9973748725128173, + 1.9964571334075927, + 1.9960263302993775, + 1.9924271702575684, + 1.992831787261963, + 1.99499480758667, + 1.9891729098892212, + 1.9939897597503662, + 1.9930099172210693, + 1.993308459815979, + 1.9917978497314452, + 1.9914746307754516, + 1.9900447463989257, + 1.992962121963501, + 1.9900524688720702, + 1.9900013018798828, + 1.990018187599182, + 1.9914000466537476, + 1.9891149829864503, + 1.9894212562561036, + 1.99083076171875, + 1.9897665852355957, + 1.98873883934021, + 1.990058041343689, + 1.987586608581543, + 1.987379070777893, + 1.9863710124206544, + 1.988468872642517, + 1.9863781386947632, + 1.9846030602264404, + 1.986063505783081, + 1.9875353760147094, + 1.9865796419525146, + 1.9875003507995606, + 1.9842604379272462, + 1.9855676065444947, + 1.9839949224472047, + 1.985175651473999, + 1.9853779614639282, + 1.9842977197265625, + 1.9852548834228516, + 1.9850790433120729, + 1.983184485321045, + 1.9850950769805908, + 1.9860374071502687, + 1.985449473876953, + 1.986313660736084, + 1.9834488523864746, + 1.9854728340911865, + 1.9834792975616455, + 1.9839858917999267, + 1.983295297241211, + 1.9832000505065919, + 1.9842015452575683, + 1.9817747521209716, + 1.9825036289215088, + 1.983466981277466, + 1.9826897898864746, + 1.9832522836303712, + 1.9837559247589112, + 1.9846134539031983, + 1.980646923828125, + 1.9809106316375733, + 1.9838191221618653, + 1.981862756576538, + 1.9802230101013183, + 1.9814140343475342, + 1.9822363115692139, + 1.982738264541626, + 1.9809983926773072, + 1.9829246353912353, + 1.981134694480896, + 1.9824947088241578, + 1.9818510884094238 + ], + "train_acc": [ + 0.25012, + 0.2569, + 0.25934, + 0.26228, + 0.26296, + 0.26604, + 0.2663, + 0.26786, + 0.26776, + 0.26536, + 0.26794, + 0.2679, + 0.27008, + 0.26912, + 0.27114, + 0.27122, + 0.27314, + 0.27074, + 0.26774, + 0.26882, + 0.2714, + 0.27276, + 0.27218, + 0.2744, + 0.27288, + 0.27368, + 0.27384, + 0.27596, + 0.27198, + 0.27772, + 0.27426, + 0.27528, + 0.27714, + 0.2757, + 0.27328, + 0.27562, + 0.27496, + 0.27752, + 0.27654, + 0.27576, + 0.27678, + 0.2766, + 0.27842, + 0.2765, + 0.28062, + 0.2769, + 0.27744, + 0.27504, + 0.27708, + 0.2794, + 0.27856, + 0.27826, + 0.28152, + 0.2805, + 0.27904, + 0.28034, + 0.28012, + 0.27994, + 0.27844, + 0.27932, + 0.28254, + 0.28096, + 0.28152, + 0.2795, + 0.28278, + 0.28194, + 0.28228, + 0.28134, + 0.28312, + 0.28172, + 0.2811, + 0.28118, + 0.2794, + 0.28338, + 0.2802, + 0.2814, + 0.28282, + 0.28256, + 0.2834, + 0.28248, + 0.28152, + 0.28336, + 0.28338, + 0.28288, + 0.28162, + 0.28292, + 0.28282, + 0.2848, + 0.28472, + 0.28266, + 0.28232, + 0.2875, + 0.28232, + 0.28272, + 0.28286, + 0.28446, + 0.28254, + 0.28228, + 0.28414, + 0.28394 + ], + "test_acc": [ + 0.2768, + 0.2776, + 0.2962, + 0.2815, + 0.2956, + 0.2956, + 0.2961, + 0.2963, + 0.3082, + 0.2895, + 0.2713, + 0.2959, + 0.299, + 0.2984, + 0.2889, + 0.3083, + 0.2967, + 0.2921, + 0.2979, + 0.3049, + 0.2897, + 0.2956, + 0.308, + 0.2866, + 0.2924, + 0.2989, + 0.2996, + 0.3051, + 0.2983, + 0.3066, + 0.2983, + 0.3082, + 0.3046, + 0.2948, + 0.3114, + 0.2894, + 0.3002, + 0.298, + 0.3016, + 0.2936, + 0.3076, + 0.3011, + 0.2884, + 0.2918, + 0.3046, + 0.2889, + 0.3154, + 0.3042, + 0.2921, + 0.3109, + 0.283, + 0.3003, + 0.2988, + 0.3024, + 0.2983, + 0.295, + 0.304, + 0.3112, + 0.3015, + 0.3044, + 0.314, + 0.3058, + 0.3094, + 0.3042, + 0.3112, + 0.3133, + 0.3064, + 0.2975, + 0.2975, + 0.3004, + 0.3054, + 0.3134, + 0.3093, + 0.3082, + 0.3084, + 0.3096, + 0.3041, + 0.3089, + 0.3033, + 0.3073, + 0.311, + 0.3131, + 0.3036, + 0.3127, + 0.3087, + 0.3117, + 0.3102, + 0.3056, + 0.3102, + 0.3087, + 0.3107, + 0.3099, + 0.3092, + 0.3094, + 0.3093, + 0.3102, + 0.3092, + 0.31, + 0.3098, + 0.3098 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.38683176040649414, + 0.0029573289211839437, + -0.0009689683793112636, + -0.0011474918574094772, + 0.0005293102003633976, + -0.0015941932797431946 + ], + "perturbation_rho": [ + -0.0035741720348596573, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -3.972090780735016e-07, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.2861564755439758e-06, + -1.862645149230957e-09, + 3.725290298461914e-09, + 0.0, + 0.0, + -1.862645149230957e-09 + ], + "0.01": [ + -4.382338374853134e-06, + -4.6566128730773926e-09, + 3.725290298461914e-09, + 0.0, + 9.313225746154785e-10, + -1.862645149230957e-09 + ] + } + }, + "drift": { + "embed.weight": 317.7495659655673, + "embed.bias": 246.61272235367505, + "blocks.0.ln.weight": 8.188531285985507, + "blocks.0.w1.weight": 202.7185165753587, + "blocks.0.w1.bias": 170.46943772700087, + "blocks.0.w2.weight": 332.85691144395827, + "blocks.1.ln.weight": 6.620851917635279, + "blocks.1.w1.weight": 230.61620075220995, + "blocks.1.w1.bias": 215.19134278855063, + "blocks.1.w2.weight": 203.35112374907072, + "blocks.2.ln.weight": 7.98453379220575, + "blocks.2.w1.weight": 315.5497282597786, + "blocks.2.w1.bias": 271.50424171303735, + "blocks.2.w2.weight": 248.3335414952481, + "blocks.3.ln.weight": 5.77177430564541, + "blocks.3.w1.weight": 199.54069059972556, + "blocks.3.w1.bias": 166.19848046359377, + "blocks.3.w2.weight": 156.3431036649652, + "blocks.4.ln.weight": 6.358256142081412, + "blocks.4.w1.weight": 230.11944086882187, + "blocks.4.w1.bias": 194.42511513927937, + "blocks.4.w2.weight": 171.6648008658166, + "blocks.5.ln.weight": 5.859230703676208, + "blocks.5.w1.weight": 209.3533985279986, + "blocks.5.w1.bias": 181.2514045255841, + "blocks.5.w2.weight": 161.81010288736894, + "out_ln.weight": 0.520622874797811, + "out_head.weight": 8.076281865086848, + "out_head.bias": 1.2313841339767553 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0568496820831297, + 2.0357495067596436, + 2.0265325052642824, + 2.0255675648498537, + 2.0211820729827883, + 2.0130653564453125, + 2.0164043712615967, + 2.011985154876709, + 2.0152608364868163, + 2.0114740381622314, + 2.0100359706878663, + 2.0067753753662108, + 2.0120022153091432, + 2.009950690765381, + 2.0081368783187865, + 2.012003229904175, + 2.0099324744415283, + 2.010634113998413, + 2.0069234494400026, + 2.003235507774353, + 2.0058242790985106, + 2.0072046648406983, + 2.00108302066803, + 2.0016218561553956, + 1.9978092765045166, + 1.995793134841919, + 1.994058724822998, + 1.9918723776245117, + 1.98977053981781, + 1.989516119003296, + 1.9898863918304444, + 1.9870066958236694, + 1.9896904999160767, + 1.9879004209136963, + 1.9867612840270996, + 1.9895719361877442, + 1.9847314866638184, + 1.9836825936508178, + 1.9799864123535156, + 1.978990509414673, + 1.97883055809021, + 1.9726349740219116, + 1.9712072018432618, + 1.978619043121338, + 1.9836511195373536, + 1.9836528234100341, + 1.9868938672256469, + 1.993108935470581, + 1.9985688564300537, + 2.0061389767074584, + 2.0023673818969727, + 1.9980067819595337, + 1.990028013458252, + 1.9925069525146484, + 1.9965549280548096, + 2.0004678047943116, + 2.0091910595321654, + 2.0153573443603516, + 2.0439902848815916, + 2.087756749229431, + 2.1218214894104004, + 2.133594408798218, + 2.1355165560913085, + 2.1193470074462892, + 2.070676408615112, + 2.0247885906219483, + 2.002980169754028, + 2.001423611793518, + 2.011682106933594, + 2.0117178466796877, + 2.0037788080596926, + 1.9931315280914306, + 1.986942767906189, + 1.9871479096984863, + 1.9841199736785888, + 1.9854342544555663, + 1.984901067276001, + 1.9828116521835326, + 1.987117846031189, + 1.980504002685547, + 1.9845846620178222, + 1.9854082400131225, + 1.9839192948150635, + 1.9855693399429322, + 1.9832484759521485, + 1.9859395289611816, + 1.9864675799942018, + 1.98523220413208, + 1.9856301559066774, + 1.9843646090698241, + 1.983153977355957, + 1.984056966934204, + 1.9850010103607179, + 1.986421587867737, + 1.9846718848037719, + 1.9840921591186524, + 1.9866302879333495, + 1.9842277576065064, + 1.9866961249160766, + 1.9863304554748535 + ], + "train_acc": [ + 0.24782, + 0.25582, + 0.25558, + 0.25876, + 0.2594, + 0.26644, + 0.26466, + 0.2638, + 0.26388, + 0.26448, + 0.26608, + 0.26734, + 0.26408, + 0.26614, + 0.26748, + 0.26298, + 0.2657, + 0.26878, + 0.26736, + 0.27, + 0.26918, + 0.2684, + 0.27234, + 0.27186, + 0.26998, + 0.27096, + 0.27406, + 0.27414, + 0.27628, + 0.27624, + 0.27302, + 0.27606, + 0.27518, + 0.27628, + 0.27844, + 0.27712, + 0.2805, + 0.27752, + 0.27616, + 0.27868, + 0.27654, + 0.28048, + 0.27978, + 0.2762, + 0.26926, + 0.27272, + 0.2737, + 0.26804, + 0.26878, + 0.26534, + 0.26856, + 0.27126, + 0.27694, + 0.28054, + 0.2827, + 0.2824, + 0.28504, + 0.28396, + 0.2755, + 0.26492, + 0.25088, + 0.24706, + 0.24506, + 0.25206, + 0.26578, + 0.27702, + 0.28328, + 0.27956, + 0.26926, + 0.26452, + 0.2656, + 0.27034, + 0.2789, + 0.2823, + 0.28274, + 0.28074, + 0.28288, + 0.28368, + 0.28134, + 0.28298, + 0.28284, + 0.28366, + 0.28172, + 0.28472, + 0.28516, + 0.2844, + 0.2836, + 0.28454, + 0.28676, + 0.28268, + 0.28488, + 0.28714, + 0.28404, + 0.286, + 0.28564, + 0.28672, + 0.28564, + 0.28652, + 0.2853, + 0.28532 + ], + "test_acc": [ + 0.2802, + 0.284, + 0.3008, + 0.2741, + 0.286, + 0.2865, + 0.2852, + 0.2925, + 0.286, + 0.3018, + 0.3012, + 0.2835, + 0.3037, + 0.2877, + 0.3014, + 0.3066, + 0.2908, + 0.2958, + 0.2946, + 0.2903, + 0.2807, + 0.2935, + 0.3134, + 0.3113, + 0.3034, + 0.2931, + 0.3001, + 0.311, + 0.3128, + 0.3116, + 0.3099, + 0.2976, + 0.2893, + 0.291, + 0.2988, + 0.2959, + 0.2992, + 0.3119, + 0.2906, + 0.2967, + 0.3031, + 0.3076, + 0.2874, + 0.282, + 0.289, + 0.2638, + 0.2745, + 0.2872, + 0.2764, + 0.2711, + 0.2732, + 0.2744, + 0.3014, + 0.302, + 0.2931, + 0.3077, + 0.2884, + 0.2883, + 0.2814, + 0.2816, + 0.2618, + 0.2679, + 0.2625, + 0.269, + 0.2844, + 0.2972, + 0.2945, + 0.2752, + 0.276, + 0.2833, + 0.2859, + 0.2809, + 0.3011, + 0.2909, + 0.3046, + 0.3047, + 0.2977, + 0.3012, + 0.3024, + 0.2816, + 0.3022, + 0.2915, + 0.2965, + 0.3004, + 0.3024, + 0.299, + 0.2977, + 0.3026, + 0.295, + 0.3036, + 0.2982, + 0.3023, + 0.2953, + 0.3008, + 0.3, + 0.3001, + 0.299, + 0.2995, + 0.2985, + 0.2989 + ], + "value_loss": [ + 0.5431940293550491, + 0.19173510383605957, + 0.12268259384393693, + 0.10493469659805298, + 0.10201048459529877, + 0.0708414131128788, + 0.06408844601988792, + 0.0720686790394783, + 0.06697397160291672, + 0.06196294789075851, + 0.05502780232191086, + 0.04616951223134994, + 0.05243575494527817, + 0.04471795217871666, + 0.044362507430315015, + 0.045647807506322864, + 0.04227230613827705, + 0.04649371607661247, + 0.037143924347162245, + 0.03761421796441078, + 0.0374193194770813, + 0.03865032393813133, + 0.03604385726451874, + 0.0348061216533184, + 0.034909065720438955, + 0.03548428529679775, + 0.03034081528186798, + 0.030923059933185577, + 0.03219221098482609, + 0.028869735319614412, + 0.02921472702085972, + 0.025344824229478837, + 0.03069723398923874, + 0.023911022167205812, + 0.02546191979944706, + 0.0234756334400177, + 0.021548947972655295, + 0.024292344799041746, + 0.021204249440431595, + 0.023217988926172255, + 0.032371759564876555, + 0.027472765368819235, + 0.03582359938144684, + 0.040054642882347107, + 0.0429941078042984, + 0.04646095623970032, + 0.05297355647087097, + 0.07127084519863129, + 0.0587913763999939, + 0.0855120901298523, + 0.5175958820724488, + 2.393956252441406, + 11.913925989227295, + 21.20466460494995, + 122.39695868041993, + 517.7628999365235, + 530.3028672167969, + 404.2268926171875, + 258.459100078125, + 283.38131254882813, + 102.50320305175781, + 27.287051020507814, + 12.905007503051758, + 4.956491999969482, + 1.5449322800445557, + 0.5012244256973266, + 0.26081433165550233, + 0.14692765646934508, + 0.10439578160524368, + 0.07197002289533615, + 0.05530310579776764, + 0.04514324131727219, + 0.031837492654323576, + 0.024001008454561233, + 0.019366809893846513, + 0.01406323720932007, + 0.010792444348335267, + 0.008763177410960197, + 0.007306897183656693, + 0.009082207316458226, + 0.005549766648113728, + 0.005990845524594187, + 0.004990600987970829, + 0.00429255537956953, + 0.005432345700562001, + 0.003525814834535122, + 0.004226339301913976, + 0.003729854447096586, + 0.004537549587935209, + 0.0023256922054290773, + 0.003219376254081726, + 0.0022955145540088416, + 0.00276749915830791, + 0.003175384805947542, + 0.0025999026219546795, + 0.0021026480976492168, + 0.0022611236164718864, + 0.0022266844733059405, + 0.002546760700196028, + 0.0024256033681333065 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3041490912437439, + 0.03387444466352463, + 0.05120290070772171, + 0.0619620680809021, + 0.06251867115497589, + 0.06249140202999115 + ], + "perturbation_rho": [ + -0.005746336653828621, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -7.874332368373871e-07, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -2.527143806219101e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -8.463859558105469e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 150.13851572417417, + "embed.bias": 128.41508525356625, + "blocks.0.ln.weight": 5.836368229603896, + "blocks.0.w1.weight": 137.83692167652973, + "blocks.0.w1.bias": 120.59820508387907, + "blocks.0.w2.weight": 191.89941055268133, + "blocks.1.ln.weight": 5.7364977300128475, + "blocks.1.w1.weight": 223.49362295122356, + "blocks.1.w1.bias": 194.26884532235184, + "blocks.1.w2.weight": 197.19643675985097, + "blocks.2.ln.weight": 5.407984956609397, + "blocks.2.w1.weight": 224.96419292004586, + "blocks.2.w1.bias": 183.18926393313106, + "blocks.2.w2.weight": 163.77095460658097, + "blocks.3.ln.weight": 3.788219163278833, + "blocks.3.w1.weight": 178.78795349787814, + "blocks.3.w1.bias": 158.67792032092242, + "blocks.3.w2.weight": 127.01894259639586, + "blocks.4.ln.weight": 3.65585411727934, + "blocks.4.w1.weight": 138.57885809433404, + "blocks.4.w1.bias": 99.2214242231741, + "blocks.4.w2.weight": 101.99300788405023, + "blocks.5.ln.weight": 3.409437674208733, + "blocks.5.w1.weight": 110.32921272933086, + "blocks.5.w1.bias": 71.51527802753176, + "blocks.5.w2.weight": 83.53550127994924, + "out_ln.weight": 0.3630675420960623, + "out_head.weight": 5.826911511271652, + "out_head.bias": 3.507322897493987 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_s42/d512_L8_s42.json b/results/cifar_depth_scan_s42/d512_L8_s42.json new file mode 100644 index 0000000..1b9e3ac --- /dev/null +++ b/results/cifar_depth_scan_s42/d512_L8_s42.json @@ -0,0 +1,1313 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.915883038673401, + 1.6826532165908814, + 1.5945291757965088, + 1.5274945846557617, + 1.4820034421539308, + 1.442767191696167, + 1.4153068727493285, + 1.3821979986190795, + 1.3577272303390502, + 1.3394956853485107, + 1.317076534767151, + 1.2955091687774658, + 1.2746722560501098, + 1.2573306383514404, + 1.2403777645874023, + 1.2230817644500733, + 1.2058218476486207, + 1.1939524814605713, + 1.1745232657241822, + 1.157467629776001, + 1.1439746014022827, + 1.1305697510528565, + 1.1148247271347045, + 1.1023933839797975, + 1.086283505592346, + 1.073430366706848, + 1.0622342100524902, + 1.0457359760665894, + 1.0301126390266417, + 1.0175300416183473, + 1.0012673997306825, + 0.9858699301910401, + 0.978185770187378, + 0.9613556467437744, + 0.945394755973816, + 0.9297811899185181, + 0.9155407496261597, + 0.8999193870353699, + 0.883978879852295, + 0.8744391927337647, + 0.8499023978042602, + 0.8385310165596008, + 0.8242085730552673, + 0.8106124278068543, + 0.7989885342788696, + 0.7789599366378784, + 0.7652538424110412, + 0.7498692364501953, + 0.7314479119682312, + 0.7191568143844604, + 0.7038094125175476, + 0.6889407563781739, + 0.6683795366287232, + 0.6543509451675416, + 0.6412768173599244, + 0.6269769005203247, + 0.6097362549209595, + 0.5970014540195465, + 0.5797126161766052, + 0.5652852652168274, + 0.5507066846847534, + 0.5374195718574524, + 0.5179209604072571, + 0.5085140320968627, + 0.49228226098060607, + 0.47772936537742616, + 0.46773862747192385, + 0.4499609982967377, + 0.437783351650238, + 0.4272708469581604, + 0.414694590549469, + 0.40083733788490294, + 0.3944969776344299, + 0.3800938123130798, + 0.3698486288642883, + 0.359144784078598, + 0.35212729773521423, + 0.3423941581821442, + 0.33239298017501834, + 0.32468383754730223, + 0.3140012940311432, + 0.30757560186386107, + 0.306006680727005, + 0.2992121668767929, + 0.2903935454463959, + 0.2856505290937424, + 0.28447353170394896, + 0.27721282821655274, + 0.27670302483081816, + 0.2717075553417206, + 0.26587641248703003, + 0.2625578575849533, + 0.25637605533599855, + 0.26298797123908996, + 0.25818991552352905, + 0.25911176864147184, + 0.2525204331064224, + 0.25532632726669313, + 0.2519308549976349, + 0.25220084325790404 + ], + "train_acc": [ + 0.31264, + 0.39142, + 0.4222, + 0.44868, + 0.46492, + 0.47794, + 0.48996, + 0.50224, + 0.51198, + 0.51518, + 0.52792, + 0.5311, + 0.53912, + 0.54762, + 0.55402, + 0.56126, + 0.56546, + 0.56916, + 0.58018, + 0.58254, + 0.59062, + 0.59414, + 0.59952, + 0.60316, + 0.60978, + 0.6147, + 0.61912, + 0.62562, + 0.63032, + 0.63576, + 0.64308, + 0.64636, + 0.64882, + 0.65384, + 0.6618, + 0.66354, + 0.67342, + 0.67882, + 0.68372, + 0.68614, + 0.69758, + 0.69736, + 0.70374, + 0.70786, + 0.7118, + 0.7184, + 0.72552, + 0.72828, + 0.73742, + 0.74336, + 0.74852, + 0.75294, + 0.76092, + 0.76556, + 0.76962, + 0.77602, + 0.7833, + 0.78558, + 0.7929, + 0.79948, + 0.80264, + 0.80768, + 0.8158, + 0.81734, + 0.82548, + 0.8299, + 0.834, + 0.83984, + 0.8439, + 0.84742, + 0.85312, + 0.85774, + 0.85856, + 0.8659, + 0.8691, + 0.87372, + 0.87712, + 0.88168, + 0.88188, + 0.885, + 0.88966, + 0.89152, + 0.89464, + 0.89494, + 0.8985, + 0.90096, + 0.90124, + 0.9037, + 0.90518, + 0.90646, + 0.9091, + 0.90814, + 0.91108, + 0.91036, + 0.91186, + 0.91076, + 0.91388, + 0.91184, + 0.91348, + 0.91236 + ], + "test_acc": [ + 0.3856, + 0.4346, + 0.4501, + 0.478, + 0.4875, + 0.5022, + 0.5082, + 0.5204, + 0.5286, + 0.526, + 0.5408, + 0.5448, + 0.5497, + 0.554, + 0.5586, + 0.5582, + 0.5704, + 0.5716, + 0.5706, + 0.5786, + 0.5784, + 0.5793, + 0.5749, + 0.5803, + 0.5861, + 0.5853, + 0.5914, + 0.5853, + 0.5857, + 0.5931, + 0.5927, + 0.5896, + 0.5884, + 0.5893, + 0.592, + 0.5967, + 0.596, + 0.5986, + 0.5954, + 0.5947, + 0.5926, + 0.5925, + 0.5975, + 0.5989, + 0.596, + 0.5905, + 0.5967, + 0.5981, + 0.6016, + 0.5987, + 0.5932, + 0.5941, + 0.6009, + 0.5969, + 0.6018, + 0.5988, + 0.5972, + 0.5994, + 0.5961, + 0.6002, + 0.5958, + 0.5927, + 0.5963, + 0.5966, + 0.5983, + 0.5938, + 0.5983, + 0.5933, + 0.5971, + 0.5994, + 0.5915, + 0.5951, + 0.5928, + 0.5914, + 0.595, + 0.5951, + 0.5918, + 0.5922, + 0.594, + 0.5895, + 0.5919, + 0.5959, + 0.5924, + 0.59, + 0.5911, + 0.5889, + 0.5895, + 0.5893, + 0.5895, + 0.5895, + 0.5888, + 0.5889, + 0.5883, + 0.5884, + 0.589, + 0.5886, + 0.5887, + 0.5891, + 0.5891, + 0.5893 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9652402400970459, + 0.9650944471359253, + 0.9653107523918152, + 0.9652330875396729, + 0.9652847051620483, + 0.9657888412475586, + 0.9645384550094604, + 0.9626421928405762 + ], + "perturbation_rho": [ + 0.988792896270752, + 0.9915838837623596, + 0.9924975037574768, + 0.9927228689193726, + 0.9931389093399048, + 0.9920060038566589, + 0.9927037358283997, + 0.9916384816169739 + ], + "nudging": { + "0.001": [ + -0.002859140280634165, + -0.0028454181738197803, + -0.0028910627588629723, + -0.002915592398494482, + -0.002882363274693489, + -0.0027308787684887648, + -0.0025113134179264307, + -0.002093898830935359 + ], + "0.003": [ + -0.008569219149649143, + -0.008527351543307304, + -0.00866447202861309, + -0.008737519383430481, + -0.00863889791071415, + -0.00818516593426466, + -0.007527736481279135, + -0.00627755094319582 + ], + "0.01": [ + -0.028463756665587425, + -0.02832203544676304, + -0.028776202350854874, + -0.02901865355670452, + -0.028697077184915543, + -0.02719692885875702, + -0.025021735578775406, + -0.02087603136897087 + ] + } + }, + "drift": { + "embed.weight": 8.768116164246894, + "embed.bias": 14.842866852450323, + "blocks.0.ln.weight": 0.3243736999277519, + "blocks.0.w1.weight": 4.248609055700286, + "blocks.0.w1.bias": 6.812297519559175, + "blocks.0.w2.weight": 10.91013034026142, + "blocks.1.ln.weight": 0.2264375721290641, + "blocks.1.w1.weight": 4.530696239577078, + "blocks.1.w1.bias": 4.691704909019707, + "blocks.1.w2.weight": 12.033360841473895, + "blocks.2.ln.weight": 0.19514233538894757, + "blocks.2.w1.weight": 4.641536271142397, + "blocks.2.w1.bias": 3.9592492063653415, + "blocks.2.w2.weight": 12.825064196706213, + "blocks.3.ln.weight": 0.20608382603702532, + "blocks.3.w1.weight": 4.675452058260372, + "blocks.3.w1.bias": 3.8959342701768565, + "blocks.3.w2.weight": 13.295810386821595, + "blocks.4.ln.weight": 0.21010986166308263, + "blocks.4.w1.weight": 4.643995186005312, + "blocks.4.w1.bias": 3.768514281224811, + "blocks.4.w2.weight": 13.646370291700444, + "blocks.5.ln.weight": 0.23069735418096324, + "blocks.5.w1.weight": 4.626200002743113, + "blocks.5.w1.bias": 3.8236708931328205, + "blocks.5.w2.weight": 14.086269621793239, + "blocks.6.ln.weight": 0.2603177383528657, + "blocks.6.w1.weight": 4.602646477526439, + "blocks.6.w1.bias": 3.7825134675181187, + "blocks.6.w2.weight": 14.472250927890926, + "blocks.7.ln.weight": 0.261911500383157, + "blocks.7.w1.weight": 4.5487829119704335, + "blocks.7.w1.bias": 3.638463299582741, + "blocks.7.w2.weight": 15.316485617563446, + "out_ln.weight": 0.33173738669135683, + "out_head.weight": 3.2824882859100533, + "out_head.bias": 1.1419967578910684 + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.0608128107070924, + 2.0412321961975097, + 2.0255805563354494, + 2.0184878905487063, + 2.01624364112854, + 2.012751336364746, + 2.013942890319824, + 2.013219351119995, + 2.011828511428833, + 2.0141313094329836, + 2.0115797592163087, + 2.0122245865631103, + 2.0109272706604004, + 2.0090200772476194, + 2.009412646636963, + 2.008880652618408, + 2.0089728942489624, + 2.0055529666900633, + 2.0086945219421386, + 2.0047824951171873, + 2.0031694742202757, + 2.005182927017212, + 2.0044863636779784, + 2.004345258331299, + 2.0049652186584472, + 2.000570617828369, + 2.004866870994568, + 2.0028822119522096, + 2.003401609535217, + 2.001731799697876, + 2.0005709008789063, + 1.9988768460464477, + 1.9997380918884278, + 2.002846463394165, + 1.9990734589385986, + 1.9994710061264038, + 1.9974897908782958, + 1.9986941064453125, + 1.997244268875122, + 1.9990774517822265, + 1.9992041358184816, + 1.998780822906494, + 1.9990862586975098, + 1.9967566333770752, + 1.9988449997329711, + 1.995755309448242, + 1.996486500854492, + 1.9974545507049561, + 1.9962934982681275, + 1.995275443725586, + 1.9972379402923583, + 1.9948255879974366, + 1.994635205116272, + 1.995422209739685, + 1.9959965203857422, + 1.9941707052993773, + 1.9957991414642333, + 1.995743550643921, + 1.9927717569732666, + 1.9928340990829467, + 1.9935791075134277, + 1.9936188889312745, + 1.9914473522949219, + 1.99154779296875, + 1.993619135131836, + 1.9917610000228883, + 1.9916434611511231, + 1.993833284072876, + 1.9928128030395509, + 1.991187938156128, + 1.9918081129455567, + 1.9942408345794678, + 1.9907841648101807, + 1.9906754878234862, + 1.9921169677352906, + 1.990103793334961, + 1.9908813669204712, + 1.9915815322113037, + 1.991861714782715, + 1.9920157837295531, + 1.9913273377227783, + 1.9915946127319335, + 1.9907670964050292, + 1.991461629562378, + 1.9904960403442382, + 1.9905955597686769, + 1.9918609113311767, + 1.991680837097168, + 1.9905535266494752, + 1.9902639037322998, + 1.991429512939453, + 1.9898409436798095, + 1.9906655899047851, + 1.9915429690170288, + 1.98768330619812, + 1.988915832824707, + 1.9896351364135743, + 1.990216370239258, + 1.9885352130889893, + 1.9870271291351318 + ], + "train_acc": [ + 0.243, + 0.25202, + 0.25564, + 0.26482, + 0.26238, + 0.26154, + 0.26364, + 0.26322, + 0.26436, + 0.26482, + 0.2633, + 0.26298, + 0.26476, + 0.2654, + 0.26356, + 0.26538, + 0.26644, + 0.26838, + 0.26656, + 0.26864, + 0.27314, + 0.27042, + 0.26898, + 0.26672, + 0.26908, + 0.2701, + 0.26998, + 0.27056, + 0.26842, + 0.27026, + 0.27222, + 0.27208, + 0.27172, + 0.27086, + 0.27158, + 0.2727, + 0.27244, + 0.27268, + 0.27344, + 0.27336, + 0.27228, + 0.27516, + 0.27298, + 0.2762, + 0.27606, + 0.27508, + 0.27436, + 0.27444, + 0.27638, + 0.27438, + 0.27472, + 0.27788, + 0.27694, + 0.27622, + 0.27612, + 0.2758, + 0.2748, + 0.2753, + 0.27684, + 0.27852, + 0.2789, + 0.27824, + 0.27708, + 0.27816, + 0.27774, + 0.2779, + 0.27866, + 0.27744, + 0.28004, + 0.2772, + 0.27834, + 0.27546, + 0.279, + 0.27854, + 0.27808, + 0.28114, + 0.27966, + 0.27976, + 0.27822, + 0.2767, + 0.28038, + 0.27794, + 0.2817, + 0.27958, + 0.27992, + 0.27988, + 0.28026, + 0.28032, + 0.28058, + 0.27946, + 0.2797, + 0.2796, + 0.28088, + 0.27574, + 0.28058, + 0.27854, + 0.27872, + 0.28038, + 0.28194, + 0.28066 + ], + "test_acc": [ + 0.2682, + 0.2742, + 0.2881, + 0.2861, + 0.2979, + 0.294, + 0.291, + 0.2966, + 0.2988, + 0.2988, + 0.2844, + 0.2888, + 0.2806, + 0.2961, + 0.2761, + 0.2908, + 0.2853, + 0.2763, + 0.2759, + 0.2962, + 0.3049, + 0.2905, + 0.2945, + 0.2803, + 0.2978, + 0.2973, + 0.3048, + 0.2627, + 0.2941, + 0.2926, + 0.3019, + 0.2993, + 0.2753, + 0.2948, + 0.3083, + 0.3031, + 0.2891, + 0.3018, + 0.3049, + 0.2925, + 0.3133, + 0.2912, + 0.3036, + 0.2953, + 0.3011, + 0.2927, + 0.2895, + 0.3024, + 0.3009, + 0.3024, + 0.3012, + 0.3091, + 0.2932, + 0.2974, + 0.2911, + 0.2949, + 0.2978, + 0.3017, + 0.3025, + 0.3032, + 0.3051, + 0.3055, + 0.3024, + 0.3093, + 0.2987, + 0.3004, + 0.2907, + 0.3094, + 0.296, + 0.3036, + 0.302, + 0.3117, + 0.3083, + 0.3012, + 0.3019, + 0.3025, + 0.2994, + 0.3071, + 0.3043, + 0.3032, + 0.3018, + 0.3078, + 0.3044, + 0.3039, + 0.3067, + 0.3035, + 0.3002, + 0.3073, + 0.3035, + 0.3045, + 0.3054, + 0.3075, + 0.3032, + 0.3055, + 0.305, + 0.3059, + 0.3053, + 0.3057, + 0.3058, + 0.3057 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.37686973810195923, + 0.0015315066557377577, + -0.0013667643070220947, + 7.698773697484285e-05, + 5.11965190526098e-05, + -0.0007562801474705338, + -0.00026300083845853806, + -4.065445682499558e-05 + ], + "perturbation_rho": [ + 0.015484973788261414, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -3.7671998143196106e-07, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.1455267667770386e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -3.912951797246933e-06, + -4.6566128730773926e-09, + 0.0, + 0.0, + 1.862645149230957e-09, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 322.7518389055776, + "embed.bias": 247.2993592394181, + "blocks.0.ln.weight": 7.905005047928133, + "blocks.0.w1.weight": 212.9905007399479, + "blocks.0.w1.bias": 182.14933416642216, + "blocks.0.w2.weight": 330.2619044995618, + "blocks.1.ln.weight": 6.755700255991533, + "blocks.1.w1.weight": 232.57652888590908, + "blocks.1.w1.bias": 216.016264679947, + "blocks.1.w2.weight": 201.84872258219994, + "blocks.2.ln.weight": 8.01709273899982, + "blocks.2.w1.weight": 320.8453952706143, + "blocks.2.w1.bias": 276.695608451841, + "blocks.2.w2.weight": 249.60378814337417, + "blocks.3.ln.weight": 5.7943043253709785, + "blocks.3.w1.weight": 199.17683771092914, + "blocks.3.w1.bias": 166.1495411478002, + "blocks.3.w2.weight": 154.7202840885994, + "blocks.4.ln.weight": 6.436414607996792, + "blocks.4.w1.weight": 234.06786452519447, + "blocks.4.w1.bias": 198.33331425257262, + "blocks.4.w2.weight": 172.58039651693562, + "blocks.5.ln.weight": 5.904929352186912, + "blocks.5.w1.weight": 213.62873358910434, + "blocks.5.w1.bias": 184.85933031281215, + "blocks.5.w2.weight": 162.5444110371982, + "blocks.6.ln.weight": 5.922534596873395, + "blocks.6.w1.weight": 212.35774255360528, + "blocks.6.w1.bias": 187.6428413347025, + "blocks.6.w2.weight": 168.7920563845852, + "blocks.7.ln.weight": 6.9752563434590575, + "blocks.7.w1.weight": 251.09533847711697, + "blocks.7.w1.bias": 212.42015960200564, + "blocks.7.w2.weight": 182.17183040015334, + "out_ln.weight": 0.5380156572173149, + "out_head.weight": 8.131814182552638, + "out_head.bias": 0.8699895784813219 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0511436333847044, + 2.0277864767456055, + 2.02313751663208, + 2.0225361193847657, + 2.0088740489196777, + 2.0053706857681273, + 2.0050094537353518, + 2.0043996282196046, + 1.9971280477905273, + 2.0012310653686525, + 1.9964948630142212, + 1.994698377227783, + 1.9948096728134155, + 1.9947182064437867, + 1.9971965953826905, + 1.9937935817718506, + 1.9970728733825684, + 1.9935891329956055, + 1.9934549239730834, + 1.9943741856384278, + 1.9916830521392823, + 1.987718446044922, + 1.9891010809326173, + 1.9910999655532837, + 1.9870087446594238, + 1.9892022339248656, + 1.9874243151855469, + 1.9917996590423583, + 1.9928570490264892, + 1.9904958669281005, + 1.9926761375427247, + 1.9937843286895751, + 1.9929048935317992, + 1.9935734990692138, + 1.9881847104263306, + 1.9887749886322021, + 1.9857899047851562, + 1.9843308640289308, + 1.9787338375091552, + 1.9824666664886474, + 1.978441342086792, + 1.9784807219696046, + 1.975589619178772, + 1.9833358307647706, + 1.9823905195617675, + 2.005378373565674, + 2.044235708847046, + 2.053414641113281, + 2.062485707550049, + 2.082823034057617, + 2.0909555229187013, + 2.080506026992798, + 2.068187072105408, + 2.0602312271881105, + 2.051138618621826, + 2.048516896209717, + 2.0438889092254637, + 2.0391429753875734, + 2.030038472366333, + 2.025220480957031, + 2.0230712211608886, + 2.0209190673828124, + 2.0193369206237795, + 2.016298021621704, + 2.0145631092071534, + 2.007977565994263, + 2.007634442100525, + 2.00878977973938, + 2.0094445184707643, + 2.01266563041687, + 2.017705497894287, + 2.022621645774841, + 2.032514253387451, + 2.0355931142425536, + 2.0368993505859376, + 2.0395946674346925, + 2.0404893283081056, + 2.0423217945861816, + 2.0412329326629637, + 2.037104062347412, + 2.0325731353759764, + 2.0280113526916503, + 2.0226307469177245, + 2.0187665083312987, + 2.0180757246398926, + 2.016418752593994, + 2.013713173828125, + 2.013864770889282, + 2.0139804064941407, + 2.012384439239502, + 2.0120543003082276, + 2.013385525588989, + 2.0126590882873536, + 2.0125275871276855, + 2.0113051068878174, + 2.012384732666016, + 2.0117678832626344, + 2.0116403619766237, + 2.0123612815093996, + 2.0132470719146727 + ], + "train_acc": [ + 0.24252, + 0.25588, + 0.261, + 0.25814, + 0.26604, + 0.26736, + 0.26858, + 0.26616, + 0.27332, + 0.2707, + 0.27226, + 0.27346, + 0.27344, + 0.271, + 0.2724, + 0.27562, + 0.2716, + 0.27578, + 0.27566, + 0.27588, + 0.2756, + 0.2763, + 0.27646, + 0.2747, + 0.2769, + 0.27584, + 0.27532, + 0.27358, + 0.27436, + 0.27466, + 0.2748, + 0.27282, + 0.27324, + 0.2744, + 0.27718, + 0.27714, + 0.27682, + 0.2795, + 0.28304, + 0.28044, + 0.28062, + 0.28496, + 0.2849, + 0.28414, + 0.28304, + 0.27624, + 0.2686, + 0.26552, + 0.26574, + 0.2669, + 0.2667, + 0.26856, + 0.26866, + 0.27098, + 0.2677, + 0.26784, + 0.26828, + 0.2664, + 0.27158, + 0.27212, + 0.26908, + 0.27222, + 0.2712, + 0.27086, + 0.2689, + 0.27072, + 0.26998, + 0.27202, + 0.26646, + 0.26438, + 0.26242, + 0.26064, + 0.25896, + 0.25936, + 0.25754, + 0.26352, + 0.26094, + 0.263, + 0.26368, + 0.26518, + 0.2691, + 0.2693, + 0.26912, + 0.27422, + 0.2738, + 0.27242, + 0.27296, + 0.27486, + 0.27162, + 0.27384, + 0.27526, + 0.27172, + 0.27436, + 0.27512, + 0.27536, + 0.2737, + 0.27316, + 0.27306, + 0.27564, + 0.27502 + ], + "test_acc": [ + 0.2611, + 0.2728, + 0.2907, + 0.2809, + 0.2926, + 0.308, + 0.3005, + 0.3036, + 0.3052, + 0.2847, + 0.2973, + 0.2946, + 0.3093, + 0.2907, + 0.2893, + 0.3111, + 0.3023, + 0.2891, + 0.2992, + 0.295, + 0.2972, + 0.2999, + 0.3136, + 0.305, + 0.2994, + 0.3022, + 0.308, + 0.2936, + 0.2988, + 0.3132, + 0.299, + 0.2989, + 0.2874, + 0.2961, + 0.3114, + 0.3062, + 0.2921, + 0.3129, + 0.2986, + 0.2975, + 0.3083, + 0.2973, + 0.2912, + 0.3022, + 0.294, + 0.2862, + 0.264, + 0.2576, + 0.2455, + 0.2604, + 0.2623, + 0.2694, + 0.2661, + 0.2696, + 0.2726, + 0.265, + 0.2603, + 0.2717, + 0.2617, + 0.2692, + 0.2806, + 0.2848, + 0.2879, + 0.271, + 0.2743, + 0.2673, + 0.279, + 0.2598, + 0.2612, + 0.2694, + 0.2531, + 0.2553, + 0.254, + 0.2426, + 0.2479, + 0.2594, + 0.2546, + 0.2605, + 0.2661, + 0.27, + 0.2717, + 0.2842, + 0.2891, + 0.2864, + 0.2804, + 0.2904, + 0.2905, + 0.2865, + 0.2837, + 0.2868, + 0.2888, + 0.2865, + 0.2922, + 0.2874, + 0.2855, + 0.2892, + 0.2892, + 0.2887, + 0.2881, + 0.2881 + ], + "value_loss": [ + 0.42954374360084535, + 0.15756836537361146, + 0.12134378553867341, + 0.11469457547187806, + 0.09599290944099426, + 0.0877463513469696, + 0.0803228804397583, + 0.0667632784330845, + 0.0672521750831604, + 0.0677217069363594, + 0.06062764830827713, + 0.05060176089763641, + 0.05358793372392654, + 0.0549625644493103, + 0.052779753321409224, + 0.046068096545934675, + 0.060794142736196516, + 0.045549960198402406, + 0.04104518217980862, + 0.046112847526073454, + 0.04252848902463913, + 0.03344858367443085, + 0.03625167763471603, + 0.04116482120513916, + 0.03612018641352654, + 0.03742522090911865, + 0.03000010380625725, + 0.03407002721071243, + 0.03310543386161327, + 0.02845939307689667, + 0.02669600613832474, + 0.029440363923311234, + 0.025257505105137825, + 0.02826717380940914, + 0.024276180317401887, + 0.021678789145350458, + 0.02275293359041214, + 0.024361893134117126, + 0.019806503029465676, + 0.028984218854904174, + 0.025155036890506743, + 0.028825275114774705, + 0.035153553171157835, + 0.04898144502878189, + 0.053181294503211976, + 0.25244187658309936, + 9.008439293670655, + 244.4939577636719, + 1492.590131953125, + 5003.36131859375, + 15302.2068553125, + 42179.784040625, + 40569.28429, + 55602.10701875, + 58168.276421875, + 47172.94552875, + 32400.684385, + 36457.8510815625, + 55178.61985875, + 33309.7381096875, + 11320.94740828125, + 20943.124659375, + 19742.98079, + 7133.2663896875, + 7511.98685734375, + 4198.7234078125, + 5113.87740875, + 3748.421473125, + 2814.479872578125, + 2090.86994609375, + 1224.1438057421874, + 568.31011984375, + 272.7561458203125, + 120.44688937988282, + 92.17080795898437, + 58.42213998718262, + 22.001411871643068, + 13.230551771850585, + 7.299799581985473, + 1.8038615107917786, + 0.6261436622428894, + 0.23487731760025024, + 0.09752666207790375, + 0.05221867031812668, + 0.03414971536874771, + 0.02229098296046257, + 0.014439315105676651, + 0.01196531643152237, + 0.009077809438109399, + 0.008066386908292771, + 0.006000318608433008, + 0.006079038715660572, + 0.0053833009558916095, + 0.004241169492304325, + 0.003964086800217629, + 0.0037191870298981665, + 0.004121905582398176, + 0.0030519997741281987, + 0.002969844557568431, + 0.00373484493046999 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.20516762137413025, + 0.010197397321462631, + 0.012989584356546402, + 0.01799590140581131, + 0.026415985077619553, + 0.028529509902000427, + 0.02881331369280815, + 0.029378943145275116 + ], + "perturbation_rho": [ + 0.03650364279747009, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -5.299225449562073e-07, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1.5022233128547668e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -5.0407834351062775e-06, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + } + }, + "drift": { + "embed.weight": 144.386565398537, + "embed.bias": 134.32612651237073, + "blocks.0.ln.weight": 6.748346473737498, + "blocks.0.w1.weight": 132.91428698293475, + "blocks.0.w1.bias": 119.60864597492228, + "blocks.0.w2.weight": 212.526020150235, + "blocks.1.ln.weight": 4.414642051445624, + "blocks.1.w1.weight": 225.12165033097793, + "blocks.1.w1.bias": 234.43494513588323, + "blocks.1.w2.weight": 178.536762788961, + "blocks.2.ln.weight": 5.970302149919209, + "blocks.2.w1.weight": 271.1166277423572, + "blocks.2.w1.bias": 227.3762025819469, + "blocks.2.w2.weight": 203.14523981621292, + "blocks.3.ln.weight": 5.796867528153885, + "blocks.3.w1.weight": 255.0825523445021, + "blocks.3.w1.bias": 231.33899213301072, + "blocks.3.w2.weight": 158.37683433796386, + "blocks.4.ln.weight": 4.529609889606443, + "blocks.4.w1.weight": 162.41528397286507, + "blocks.4.w1.bias": 142.635739824408, + "blocks.4.w2.weight": 120.99022470237554, + "blocks.5.ln.weight": 4.160579158399913, + "blocks.5.w1.weight": 154.8997138115475, + "blocks.5.w1.bias": 138.47252168248815, + "blocks.5.w2.weight": 128.9164645106335, + "blocks.6.ln.weight": 3.6901613153795623, + "blocks.6.w1.weight": 111.81360738270082, + "blocks.6.w1.bias": 84.19462418565291, + "blocks.6.w2.weight": 97.14752351362607, + "blocks.7.ln.weight": 4.210487097037135, + "blocks.7.w1.weight": 93.35554428980572, + "blocks.7.w1.bias": 43.21054718035769, + "blocks.7.w2.weight": 87.7426729890803, + "out_ln.weight": 0.3258527803812823, + "out_head.weight": 5.969889930683836, + "out_head.bias": 3.3113123218582157 + } + } +} \ No newline at end of file diff --git a/results/cifar_depth_scan_s42/summary.json b/results/cifar_depth_scan_s42/summary.json new file mode 100644 index 0000000..b16273d --- /dev/null +++ b/results/cifar_depth_scan_s42/summary.json @@ -0,0 +1,186 @@ +{ + "d512_L8_s42": { + "bp": { + "test_acc": 0.5893, + "mean_bp_cosine": 0.9648915901780128, + "mean_rho": 0.9918855354189873, + "mean_nudge_01": -0.027046552626416087, + "bp_cosine_per_layer": [ + 0.9652402400970459, + 0.9650944471359253, + 0.9653107523918152, + 0.9652330875396729, + 0.9652847051620483, + 0.9657888412475586, + 0.9645384550094604, + 0.9626421928405762 + ], + "rho_per_layer": [ + 0.988792896270752, + 0.9915838837623596, + 0.9924975037574768, + 0.9927228689193726, + 0.9931389093399048, + 0.9920060038566589, + 0.9927037358283997, + 0.9916384816169739 + ] + }, + "dfa": { + "test_acc": 0.3057, + "mean_bp_cosine": 0.047012841157993535, + "mean_rho": 0.0019356217235326767, + "mean_nudge_01": -4.894682206213474e-07, + "bp_cosine_per_layer": [ + 0.37686973810195923, + 0.0015315066557377577, + -0.0013667643070220947, + 7.698773697484285e-05, + 5.11965190526098e-05, + -0.0007562801474705338, + -0.00026300083845853806, + -4.065445682499558e-05 + ], + "rho_per_layer": [ + 0.015484973788261414, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + }, + "credit_bridge": { + "test_acc": 0.2881, + "mean_bp_cosine": 0.04493603203445673, + "mean_rho": 0.004562955349683762, + "mean_nudge_01": -6.300979293882847e-07, + "bp_cosine_per_layer": [ + 0.20516762137413025, + 0.010197397321462631, + 0.012989584356546402, + 0.01799590140581131, + 0.026415985077619553, + 0.028529509902000427, + 0.02881331369280815, + 0.029378943145275116 + ], + "rho_per_layer": [ + 0.03650364279747009, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + } + }, + "d512_L12_s42": { + "bp": { + "test_acc": 0.594, + "mean_bp_cosine": 0.9404260218143463, + "mean_rho": 0.9899803350369135, + "mean_nudge_01": -0.026733027460674446, + "bp_cosine_per_layer": [ + 0.9423961043357849, + 0.9423063397407532, + 0.9428478479385376, + 0.9422410726547241, + 0.9424552917480469, + 0.9417660236358643, + 0.9408372640609741, + 0.9404677152633667, + 0.9403290748596191, + 0.9396632313728333, + 0.935971736907959, + 0.9338305592536926 + ], + "rho_per_layer": [ + 0.987454891204834, + 0.9897942543029785, + 0.990141749382019, + 0.9901803731918335, + 0.9920680522918701, + 0.9906818866729736, + 0.9903223514556885, + 0.9926531910896301, + 0.9914379119873047, + 0.9897843599319458, + 0.9882909059524536, + 0.9869540929794312 + ] + }, + "dfa": { + "test_acc": 0.309, + "mean_bp_cosine": 0.032277349038243607, + "mean_rho": -0.003907783577839534, + "mean_nudge_01": -3.9018535365660984e-07, + "bp_cosine_per_layer": [ + 0.38828110694885254, + 0.0037502094637602568, + -0.0013616610085591674, + -0.0004177851078566164, + 0.0008564171148464084, + 0.00033698498737066984, + 0.0006134084542281926, + -0.00040099132456816733, + -0.00013616093201562762, + -0.0008071845513768494, + -0.0019259440014138818, + -0.0014602115843445063 + ], + "rho_per_layer": [ + -0.0468934029340744, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + }, + "credit_bridge": { + "test_acc": 0.239, + "mean_bp_cosine": 0.032352436101064086, + "mean_rho": 0.0008616718308379253, + "mean_nudge_01": -3.4909074505170185e-07, + "bp_cosine_per_layer": [ + 0.20759254693984985, + 0.005885659717023373, + 0.014463091269135475, + 0.013757804408669472, + 0.01659775897860527, + 0.0177934467792511, + 0.018012138083577156, + 0.019089948385953903, + 0.019284311681985855, + 0.01838410645723343, + 0.01891487091779709, + 0.018453549593687057 + ], + "rho_per_layer": [ + 0.010340061970055103, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + } + } +} \ No newline at end of file diff --git a/results/confirmatory/T1_cifar_full_metrics_gpu1.csv b/results/confirmatory/T1_cifar_full_metrics_gpu1.csv new file mode 100644 index 0000000..2934ca0 --- /dev/null +++ b/results/confirmatory/T1_cifar_full_metrics_gpu1.csv @@ -0,0 +1,41 @@ +method,seed,acc,naive_StateErr,Gamma_raw,Gamma_filtered,rho,mean_bp_grad_norm +bp,42,0.595703125,1.2188102006912231,1.0,1.0,0.9967928230762482,3.693166225718662e-13 +bp,123,0.58203125,0.3951377868652344,1.0,1.0,0.9970253705978394,3.384779884827338e-13 +bp,456,0.599609375,0.5329511165618896,1.0,1.0,0.9970139116048813,3.510028164931296e-13 +bp,789,0.587890625,0.5530461072921753,1.0,1.0,0.9970511049032211,4.048752029169392e-13 +bp,1024,0.583984375,0.42479196190834045,1.0,1.0,0.996942326426506,3.1443557745600495e-13 +bp,2048,0.599609375,1.1986371278762817,1.0,1.0,0.9970080107450485,4.468056682288297e-13 +bp,3000,0.61328125,0.3282836675643921,1.0,1.0,0.9970394372940063,2.6564703195963886e-13 +bp,4000,0.587890625,0.5284427404403687,1.0,1.0,0.996964618563652,3.3071591323233403e-13 +bp,5000,0.599609375,0.8547693490982056,1.0,1.0,0.9970963299274445,6.753224010818543e-13 +bp,6000,0.625,0.4777200222015381,1.0,1.0,0.9974031299352646,3.588729994056204e-13 +dfa,42,0.3046875,0.40483805537223816,0.1080235467525199,nan,0.0011517246020957828,1.1386262709764883e-15 +dfa,123,0.3203125,2.333367347717285,0.11465638730078354,nan,0.008965837070718408,9.595368991455386e-16 +dfa,456,0.3046875,0.9767144918441772,0.09943736994864594,nan,0.0008550649508833885,1.1573423951446467e-15 +dfa,789,0.296875,0.8594386577606201,0.09887104675726732,nan,-0.0052263434045016766,1.3544077377898581e-15 +dfa,1024,0.31640625,0.5865541696548462,0.10695325827691704,nan,-0.00039922623545862734,1.2429848301023218e-15 +dfa,2048,0.3125,1.8731361627578735,0.10717901979660382,nan,0.0007712631486356258,8.331752373430004e-16 +dfa,3000,0.33203125,2.387418746948242,0.09558150597149506,nan,-0.0022608496947214007,5.989186956841618e-16 +dfa,4000,0.310546875,1.8185988664627075,0.09947461802858015,nan,-0.0008177041891030967,1.1832308083786999e-15 +dfa,5000,0.318359375,2.25960636138916,0.10727746496195323,nan,0.0021863116417080164,1.088633344130269e-15 +dfa,6000,0.2734375,0.6399673819541931,0.09705478792602662,nan,-0.00021292048040777445,5.782290864404175e-16 +state_bridge,42,0.1875,0.5480539798736572,-0.006847438809927553,nan,-0.0033503572922199965,6.753647187263035e-15 +state_bridge,123,0.271484375,0.9387213587760925,0.00029219509451650083,nan,-0.004323488799855113,4.7659078111067574e-15 +state_bridge,456,0.212890625,1.2990467548370361,0.00021752348402515054,nan,0.001790215028449893,6.9080542137086315e-15 +state_bridge,789,0.2265625,0.6292945146560669,-0.005122891270730179,nan,-0.004575830884277821,6.371482087621293e-15 +state_bridge,1024,0.138671875,7.639553070068359,-0.0010206155529886018,nan,0.0013428584206849337,3.4327788698175814e-15 +state_bridge,2048,0.216796875,0.7094012498855591,-0.0007200911632025964,nan,-0.0017147627077065408,2.6454378526256264e-14 +state_bridge,3000,0.072265625,0.2765243649482727,0.003786540313740261,nan,0.006711192894726992,7.873830126760254e-15 +state_bridge,4000,0.23046875,0.7042198777198792,0.0015801019317223108,nan,-0.001743727712891996,1.0400603707230018e-14 +state_bridge,5000,0.21484375,1.012908935546875,0.007500769032048993,nan,0.005288134561851621,1.9910279811604025e-15 +state_bridge,6000,0.19140625,0.5420122146606445,-0.0020646299635700416,nan,-0.007079285569489002,1.3198276672869995e-14 +credit_bridge,42,0.2421875,2.073707103729248,0.060074162160162814,nan,-0.00017933925846591592,8.895705675661841e-16 +credit_bridge,123,0.30859375,0.4683569073677063,0.09847837615234312,nan,0.002981545985676348,1.9165702501404017e-15 +credit_bridge,456,0.28515625,0.5449144840240479,0.0752467044221703,nan,0.006958535872399807,1.7329475580791445e-15 +credit_bridge,789,0.296875,0.8320807218551636,0.07125743849610444,nan,-0.0008974073571152985,1.0435722653786667e-15 +credit_bridge,1024,0.31640625,1.1375874280929565,0.08833102410426363,nan,-0.00041424453957006335,1.4308689298251692e-15 +credit_bridge,2048,0.28515625,0.4803884029388428,0.08503903213568265,nan,0.004536385647952557,1.3573925402413024e-15 +credit_bridge,3000,0.25390625,13.376199722290039,0.052660267348983325,nan,0.004218182526528835,2.137676845175495e-15 +credit_bridge,4000,0.28515625,2.305067300796509,0.07496658433956327,nan,0.0011277806479483843,1.4501345329102488e-15 +credit_bridge,5000,0.287109375,0.3139641284942627,0.0831147322896868,nan,-0.00015175246517173946,1.8978978519801938e-16 +credit_bridge,6000,0.271484375,1.1344530582427979,0.07538191772073333,nan,0.007047428167425096,1.1003135644617374e-15 diff --git a/results/confirmatory/T2_support_sparsity_FIXED.csv b/results/confirmatory/T2_support_sparsity_FIXED.csv new file mode 100644 index 0000000..5fdfa9c --- /dev/null +++ b/results/confirmatory/T2_support_sparsity_FIXED.csv @@ -0,0 +1,961 @@ +method,seed,layer,threshold,support_fraction,mean_norm,median_norm +bp,42,0,1e-08,0.9990234375,6.420379941118881e-05,4.757100032293238e-05 +bp,42,0,1e-07,0.998046875,6.420379941118881e-05,4.757100032293238e-05 +bp,42,0,1e-06,0.9443359375,6.420379941118881e-05,4.757100032293238e-05 +bp,42,0,1e-05,0.78125,6.420379941118881e-05,4.757100032293238e-05 +bp,42,0,0.0001,0.2548828125,6.420379941118881e-05,4.757100032293238e-05 +bp,42,0,0.001,0.0,6.420379941118881e-05,4.757100032293238e-05 +bp,42,1,1e-08,0.9990234375,6.868089258205146e-05,5.125039388076402e-05 +bp,42,1,1e-07,0.998046875,6.868089258205146e-05,5.125039388076402e-05 +bp,42,1,1e-06,0.9482421875,6.868089258205146e-05,5.125039388076402e-05 +bp,42,1,1e-05,0.79296875,6.868089258205146e-05,5.125039388076402e-05 +bp,42,1,0.0001,0.2861328125,6.868089258205146e-05,5.125039388076402e-05 +bp,42,1,0.001,0.0,6.868089258205146e-05,5.125039388076402e-05 +bp,42,2,1e-08,0.9990234375,7.030378037597984e-05,5.254471398075111e-05 +bp,42,2,1e-07,0.998046875,7.030378037597984e-05,5.254471398075111e-05 +bp,42,2,1e-06,0.9501953125,7.030378037597984e-05,5.254471398075111e-05 +bp,42,2,1e-05,0.8017578125,7.030378037597984e-05,5.254471398075111e-05 +bp,42,2,0.0001,0.3056640625,7.030378037597984e-05,5.254471398075111e-05 +bp,42,2,0.001,0.0,7.030378037597984e-05,5.254471398075111e-05 +bp,42,3,1e-08,0.9990234375,6.579310866072774e-05,5.176133709028363e-05 +bp,42,3,1e-07,0.998046875,6.579310866072774e-05,5.176133709028363e-05 +bp,42,3,1e-06,0.9501953125,6.579310866072774e-05,5.176133709028363e-05 +bp,42,3,1e-05,0.7939453125,6.579310866072774e-05,5.176133709028363e-05 +bp,42,3,0.0001,0.2763671875,6.579310866072774e-05,5.176133709028363e-05 +bp,42,3,0.001,0.0,6.579310866072774e-05,5.176133709028363e-05 +bp,123,0,1e-08,0.9990234375,6.826331082265824e-05,5.234080526861362e-05 +bp,123,0,1e-07,0.9921875,6.826331082265824e-05,5.234080526861362e-05 +bp,123,0,1e-06,0.9345703125,6.826331082265824e-05,5.234080526861362e-05 +bp,123,0,1e-05,0.7724609375,6.826331082265824e-05,5.234080526861362e-05 +bp,123,0,0.0001,0.27734375,6.826331082265824e-05,5.234080526861362e-05 +bp,123,0,0.001,0.0,6.826331082265824e-05,5.234080526861362e-05 +bp,123,1,1e-08,0.9990234375,7.233803626149893e-05,5.5852517107268795e-05 +bp,123,1,1e-07,0.9931640625,7.233803626149893e-05,5.5852517107268795e-05 +bp,123,1,1e-06,0.939453125,7.233803626149893e-05,5.5852517107268795e-05 +bp,123,1,1e-05,0.77734375,7.233803626149893e-05,5.5852517107268795e-05 +bp,123,1,0.0001,0.306640625,7.233803626149893e-05,5.5852517107268795e-05 +bp,123,1,0.001,0.0,7.233803626149893e-05,5.5852517107268795e-05 +bp,123,2,1e-08,0.9990234375,7.557235949207097e-05,5.8344197896076366e-05 +bp,123,2,1e-07,0.994140625,7.557235949207097e-05,5.8344197896076366e-05 +bp,123,2,1e-06,0.94140625,7.557235949207097e-05,5.8344197896076366e-05 +bp,123,2,1e-05,0.7900390625,7.557235949207097e-05,5.8344197896076366e-05 +bp,123,2,0.0001,0.3251953125,7.557235949207097e-05,5.8344197896076366e-05 +bp,123,2,0.001,0.0,7.557235949207097e-05,5.8344197896076366e-05 +bp,123,3,1e-08,0.9990234375,7.112986349966377e-05,5.571585279540159e-05 +bp,123,3,1e-07,0.9931640625,7.112986349966377e-05,5.571585279540159e-05 +bp,123,3,1e-06,0.9375,7.112986349966377e-05,5.571585279540159e-05 +bp,123,3,1e-05,0.783203125,7.112986349966377e-05,5.571585279540159e-05 +bp,123,3,0.0001,0.3193359375,7.112986349966377e-05,5.571585279540159e-05 +bp,123,3,0.001,0.0,7.112986349966377e-05,5.571585279540159e-05 +bp,456,0,1e-08,0.9990234375,6.796819070586935e-05,5.103028888697736e-05 +bp,456,0,1e-07,0.9931640625,6.796819070586935e-05,5.103028888697736e-05 +bp,456,0,1e-06,0.94921875,6.796819070586935e-05,5.103028888697736e-05 +bp,456,0,1e-05,0.802734375,6.796819070586935e-05,5.103028888697736e-05 +bp,456,0,0.0001,0.2705078125,6.796819070586935e-05,5.103028888697736e-05 +bp,456,0,0.001,0.0,6.796819070586935e-05,5.103028888697736e-05 +bp,456,1,1e-08,0.9990234375,7.196342630777508e-05,5.5566310038557276e-05 +bp,456,1,1e-07,0.9931640625,7.196342630777508e-05,5.5566310038557276e-05 +bp,456,1,1e-06,0.9501953125,7.196342630777508e-05,5.5566310038557276e-05 +bp,456,1,1e-05,0.80859375,7.196342630777508e-05,5.5566310038557276e-05 +bp,456,1,0.0001,0.294921875,7.196342630777508e-05,5.5566310038557276e-05 +bp,456,1,0.001,0.0,7.196342630777508e-05,5.5566310038557276e-05 +bp,456,2,1e-08,0.9990234375,7.424073555739596e-05,5.7587629271438345e-05 +bp,456,2,1e-07,0.994140625,7.424073555739596e-05,5.7587629271438345e-05 +bp,456,2,1e-06,0.953125,7.424073555739596e-05,5.7587629271438345e-05 +bp,456,2,1e-05,0.8173828125,7.424073555739596e-05,5.7587629271438345e-05 +bp,456,2,0.0001,0.3173828125,7.424073555739596e-05,5.7587629271438345e-05 +bp,456,2,0.001,0.0,7.424073555739596e-05,5.7587629271438345e-05 +bp,456,3,1e-08,0.9990234375,6.964454951230437e-05,5.580891956924461e-05 +bp,456,3,1e-07,0.994140625,6.964454951230437e-05,5.580891956924461e-05 +bp,456,3,1e-06,0.951171875,6.964454951230437e-05,5.580891956924461e-05 +bp,456,3,1e-05,0.8115234375,6.964454951230437e-05,5.580891956924461e-05 +bp,456,3,0.0001,0.302734375,6.964454951230437e-05,5.580891956924461e-05 +bp,456,3,0.001,0.0,6.964454951230437e-05,5.580891956924461e-05 +bp,789,0,1e-08,1.0,6.683701940346509e-05,5.013712871004827e-05 +bp,789,0,1e-07,0.9921875,6.683701940346509e-05,5.013712871004827e-05 +bp,789,0,1e-06,0.9365234375,6.683701940346509e-05,5.013712871004827e-05 +bp,789,0,1e-05,0.7763671875,6.683701940346509e-05,5.013712871004827e-05 +bp,789,0,0.0001,0.2666015625,6.683701940346509e-05,5.013712871004827e-05 +bp,789,0,0.001,0.0,6.683701940346509e-05,5.013712871004827e-05 +bp,789,1,1e-08,1.0,7.033518340904266e-05,5.225545828579925e-05 +bp,789,1,1e-07,0.9921875,7.033518340904266e-05,5.225545828579925e-05 +bp,789,1,1e-06,0.9375,7.033518340904266e-05,5.225545828579925e-05 +bp,789,1,1e-05,0.7841796875,7.033518340904266e-05,5.225545828579925e-05 +bp,789,1,0.0001,0.2890625,7.033518340904266e-05,5.225545828579925e-05 +bp,789,1,0.001,0.0,7.033518340904266e-05,5.225545828579925e-05 +bp,789,2,1e-08,1.0,7.296205149032176e-05,5.62719396839384e-05 +bp,789,2,1e-07,0.9931640625,7.296205149032176e-05,5.62719396839384e-05 +bp,789,2,1e-06,0.939453125,7.296205149032176e-05,5.62719396839384e-05 +bp,789,2,1e-05,0.7939453125,7.296205149032176e-05,5.62719396839384e-05 +bp,789,2,0.0001,0.3095703125,7.296205149032176e-05,5.62719396839384e-05 +bp,789,2,0.001,0.0,7.296205149032176e-05,5.62719396839384e-05 +bp,789,3,1e-08,1.0,6.898639549035579e-05,5.509496986633167e-05 +bp,789,3,1e-07,0.9921875,6.898639549035579e-05,5.509496986633167e-05 +bp,789,3,1e-06,0.9404296875,6.898639549035579e-05,5.509496986633167e-05 +bp,789,3,1e-05,0.7919921875,6.898639549035579e-05,5.509496986633167e-05 +bp,789,3,0.0001,0.2919921875,6.898639549035579e-05,5.509496986633167e-05 +bp,789,3,0.001,0.0,6.898639549035579e-05,5.509496986633167e-05 +bp,1024,0,1e-08,1.0,6.834884698037058e-05,5.0669295887928456e-05 +bp,1024,0,1e-07,0.994140625,6.834884698037058e-05,5.0669295887928456e-05 +bp,1024,0,1e-06,0.9462890625,6.834884698037058e-05,5.0669295887928456e-05 +bp,1024,0,1e-05,0.7783203125,6.834884698037058e-05,5.0669295887928456e-05 +bp,1024,0,0.0001,0.271484375,6.834884698037058e-05,5.0669295887928456e-05 +bp,1024,0,0.001,0.0,6.834884698037058e-05,5.0669295887928456e-05 +bp,1024,1,1e-08,1.0,7.204482244560495e-05,5.331864667823538e-05 +bp,1024,1,1e-07,0.9951171875,7.204482244560495e-05,5.331864667823538e-05 +bp,1024,1,1e-06,0.9501953125,7.204482244560495e-05,5.331864667823538e-05 +bp,1024,1,1e-05,0.7939453125,7.204482244560495e-05,5.331864667823538e-05 +bp,1024,1,0.0001,0.291015625,7.204482244560495e-05,5.331864667823538e-05 +bp,1024,1,0.001,0.0,7.204482244560495e-05,5.331864667823538e-05 +bp,1024,2,1e-08,1.0,7.371444371528924e-05,5.558579505304806e-05 +bp,1024,2,1e-07,0.9951171875,7.371444371528924e-05,5.558579505304806e-05 +bp,1024,2,1e-06,0.953125,7.371444371528924e-05,5.558579505304806e-05 +bp,1024,2,1e-05,0.794921875,7.371444371528924e-05,5.558579505304806e-05 +bp,1024,2,0.0001,0.3115234375,7.371444371528924e-05,5.558579505304806e-05 +bp,1024,2,0.001,0.0,7.371444371528924e-05,5.558579505304806e-05 +bp,1024,3,1e-08,1.0,7.016785821178928e-05,5.4680447647115216e-05 +bp,1024,3,1e-07,0.9951171875,7.016785821178928e-05,5.4680447647115216e-05 +bp,1024,3,1e-06,0.951171875,7.016785821178928e-05,5.4680447647115216e-05 +bp,1024,3,1e-05,0.7880859375,7.016785821178928e-05,5.4680447647115216e-05 +bp,1024,3,0.0001,0.2939453125,7.016785821178928e-05,5.4680447647115216e-05 +bp,1024,3,0.001,0.0,7.016785821178928e-05,5.4680447647115216e-05 +bp,2048,0,1e-08,1.0,6.853526429040357e-05,5.024272468290292e-05 +bp,2048,0,1e-07,0.994140625,6.853526429040357e-05,5.024272468290292e-05 +bp,2048,0,1e-06,0.9541015625,6.853526429040357e-05,5.024272468290292e-05 +bp,2048,0,1e-05,0.7685546875,6.853526429040357e-05,5.024272468290292e-05 +bp,2048,0,0.0001,0.28515625,6.853526429040357e-05,5.024272468290292e-05 +bp,2048,0,0.001,0.0,6.853526429040357e-05,5.024272468290292e-05 +bp,2048,1,1e-08,1.0,7.284673483809456e-05,5.515595694305375e-05 +bp,2048,1,1e-07,0.994140625,7.284673483809456e-05,5.515595694305375e-05 +bp,2048,1,1e-06,0.9599609375,7.284673483809456e-05,5.515595694305375e-05 +bp,2048,1,1e-05,0.7783203125,7.284673483809456e-05,5.515595694305375e-05 +bp,2048,1,0.0001,0.314453125,7.284673483809456e-05,5.515595694305375e-05 +bp,2048,1,0.001,0.0,7.284673483809456e-05,5.515595694305375e-05 +bp,2048,2,1e-08,1.0,7.534313044743612e-05,5.8226603869115934e-05 +bp,2048,2,1e-07,0.9951171875,7.534313044743612e-05,5.8226603869115934e-05 +bp,2048,2,1e-06,0.9599609375,7.534313044743612e-05,5.8226603869115934e-05 +bp,2048,2,1e-05,0.78515625,7.534313044743612e-05,5.8226603869115934e-05 +bp,2048,2,0.0001,0.322265625,7.534313044743612e-05,5.8226603869115934e-05 +bp,2048,2,0.001,0.0,7.534313044743612e-05,5.8226603869115934e-05 +bp,2048,3,1e-08,1.0,7.111730519682169e-05,5.6857017625588924e-05 +bp,2048,3,1e-07,0.994140625,7.111730519682169e-05,5.6857017625588924e-05 +bp,2048,3,1e-06,0.958984375,7.111730519682169e-05,5.6857017625588924e-05 +bp,2048,3,1e-05,0.779296875,7.111730519682169e-05,5.6857017625588924e-05 +bp,2048,3,0.0001,0.306640625,7.111730519682169e-05,5.6857017625588924e-05 +bp,2048,3,0.001,0.0,7.111730519682169e-05,5.6857017625588924e-05 +bp,3000,0,1e-08,1.0,6.646307883784175e-05,5.034794594394043e-05 +bp,3000,0,1e-07,0.990234375,6.646307883784175e-05,5.034794594394043e-05 +bp,3000,0,1e-06,0.9404296875,6.646307883784175e-05,5.034794594394043e-05 +bp,3000,0,1e-05,0.7822265625,6.646307883784175e-05,5.034794594394043e-05 +bp,3000,0,0.0001,0.265625,6.646307883784175e-05,5.034794594394043e-05 +bp,3000,0,0.001,0.0,6.646307883784175e-05,5.034794594394043e-05 +bp,3000,1,1e-08,1.0,7.086140976753086e-05,5.4273528803605586e-05 +bp,3000,1,1e-07,0.990234375,7.086140976753086e-05,5.4273528803605586e-05 +bp,3000,1,1e-06,0.943359375,7.086140976753086e-05,5.4273528803605586e-05 +bp,3000,1,1e-05,0.796875,7.086140976753086e-05,5.4273528803605586e-05 +bp,3000,1,0.0001,0.2958984375,7.086140976753086e-05,5.4273528803605586e-05 +bp,3000,1,0.001,0.0,7.086140976753086e-05,5.4273528803605586e-05 +bp,3000,2,1e-08,1.0,7.262172584887594e-05,5.737805622629821e-05 +bp,3000,2,1e-07,0.9912109375,7.262172584887594e-05,5.737805622629821e-05 +bp,3000,2,1e-06,0.9443359375,7.262172584887594e-05,5.737805622629821e-05 +bp,3000,2,1e-05,0.8056640625,7.262172584887594e-05,5.737805622629821e-05 +bp,3000,2,0.0001,0.3115234375,7.262172584887594e-05,5.737805622629821e-05 +bp,3000,2,0.001,0.0,7.262172584887594e-05,5.737805622629821e-05 +bp,3000,3,1e-08,1.0,6.807150202803314e-05,5.377770503400825e-05 +bp,3000,3,1e-07,0.990234375,6.807150202803314e-05,5.377770503400825e-05 +bp,3000,3,1e-06,0.943359375,6.807150202803314e-05,5.377770503400825e-05 +bp,3000,3,1e-05,0.7998046875,6.807150202803314e-05,5.377770503400825e-05 +bp,3000,3,0.0001,0.29296875,6.807150202803314e-05,5.377770503400825e-05 +bp,3000,3,0.001,0.0,6.807150202803314e-05,5.377770503400825e-05 +bp,4000,0,1e-08,1.0,7.025089144008234e-05,5.309484186000191e-05 +bp,4000,0,1e-07,0.994140625,7.025089144008234e-05,5.309484186000191e-05 +bp,4000,0,1e-06,0.9521484375,7.025089144008234e-05,5.309484186000191e-05 +bp,4000,0,1e-05,0.783203125,7.025089144008234e-05,5.309484186000191e-05 +bp,4000,0,0.0001,0.283203125,7.025089144008234e-05,5.309484186000191e-05 +bp,4000,0,0.001,0.0,7.025089144008234e-05,5.309484186000191e-05 +bp,4000,1,1e-08,1.0,7.402441406156868e-05,5.798995334771462e-05 +bp,4000,1,1e-07,0.994140625,7.402441406156868e-05,5.798995334771462e-05 +bp,4000,1,1e-06,0.9521484375,7.402441406156868e-05,5.798995334771462e-05 +bp,4000,1,1e-05,0.798828125,7.402441406156868e-05,5.798995334771462e-05 +bp,4000,1,0.0001,0.3154296875,7.402441406156868e-05,5.798995334771462e-05 +bp,4000,1,0.001,0.0,7.402441406156868e-05,5.798995334771462e-05 +bp,4000,2,1e-08,1.0,7.629235915374011e-05,6.0592668887693435e-05 +bp,4000,2,1e-07,0.9951171875,7.629235915374011e-05,6.0592668887693435e-05 +bp,4000,2,1e-06,0.953125,7.629235915374011e-05,6.0592668887693435e-05 +bp,4000,2,1e-05,0.7998046875,7.629235915374011e-05,6.0592668887693435e-05 +bp,4000,2,0.0001,0.328125,7.629235915374011e-05,6.0592668887693435e-05 +bp,4000,2,0.001,0.0,7.629235915374011e-05,6.0592668887693435e-05 +bp,4000,3,1e-08,1.0,7.227784226415679e-05,5.925814184593037e-05 +bp,4000,3,1e-07,0.9951171875,7.227784226415679e-05,5.925814184593037e-05 +bp,4000,3,1e-06,0.951171875,7.227784226415679e-05,5.925814184593037e-05 +bp,4000,3,1e-05,0.7958984375,7.227784226415679e-05,5.925814184593037e-05 +bp,4000,3,0.0001,0.3115234375,7.227784226415679e-05,5.925814184593037e-05 +bp,4000,3,0.001,0.0,7.227784226415679e-05,5.925814184593037e-05 +bp,5000,0,1e-08,0.9990234375,6.594879232579842e-05,4.9741967814043164e-05 +bp,5000,0,1e-07,0.994140625,6.594879232579842e-05,4.9741967814043164e-05 +bp,5000,0,1e-06,0.951171875,6.594879232579842e-05,4.9741967814043164e-05 +bp,5000,0,1e-05,0.78125,6.594879232579842e-05,4.9741967814043164e-05 +bp,5000,0,0.0001,0.263671875,6.594879232579842e-05,4.9741967814043164e-05 +bp,5000,0,0.001,0.0,6.594879232579842e-05,4.9741967814043164e-05 +bp,5000,1,1e-08,0.9990234375,7.030676351860166e-05,5.423953552963212e-05 +bp,5000,1,1e-07,0.9951171875,7.030676351860166e-05,5.423953552963212e-05 +bp,5000,1,1e-06,0.951171875,7.030676351860166e-05,5.423953552963212e-05 +bp,5000,1,1e-05,0.7900390625,7.030676351860166e-05,5.423953552963212e-05 +bp,5000,1,0.0001,0.291015625,7.030676351860166e-05,5.423953552963212e-05 +bp,5000,1,0.001,0.0,7.030676351860166e-05,5.423953552963212e-05 +bp,5000,2,1e-08,0.9990234375,7.197874947451055e-05,5.679406604031101e-05 +bp,5000,2,1e-07,0.9951171875,7.197874947451055e-05,5.679406604031101e-05 +bp,5000,2,1e-06,0.95703125,7.197874947451055e-05,5.679406604031101e-05 +bp,5000,2,1e-05,0.7919921875,7.197874947451055e-05,5.679406604031101e-05 +bp,5000,2,0.0001,0.2998046875,7.197874947451055e-05,5.679406604031101e-05 +bp,5000,2,0.001,0.0,7.197874947451055e-05,5.679406604031101e-05 +bp,5000,3,1e-08,0.9990234375,6.68182983645238e-05,5.4613014071946964e-05 +bp,5000,3,1e-07,0.9951171875,6.68182983645238e-05,5.4613014071946964e-05 +bp,5000,3,1e-06,0.95703125,6.68182983645238e-05,5.4613014071946964e-05 +bp,5000,3,1e-05,0.7919921875,6.68182983645238e-05,5.4613014071946964e-05 +bp,5000,3,0.0001,0.275390625,6.68182983645238e-05,5.4613014071946964e-05 +bp,5000,3,0.001,0.0,6.68182983645238e-05,5.4613014071946964e-05 +bp,6000,0,1e-08,1.0,6.760624091839418e-05,5.10387726535555e-05 +bp,6000,0,1e-07,0.9931640625,6.760624091839418e-05,5.10387726535555e-05 +bp,6000,0,1e-06,0.9453125,6.760624091839418e-05,5.10387726535555e-05 +bp,6000,0,1e-05,0.794921875,6.760624091839418e-05,5.10387726535555e-05 +bp,6000,0,0.0001,0.2685546875,6.760624091839418e-05,5.10387726535555e-05 +bp,6000,0,0.001,0.0,6.760624091839418e-05,5.10387726535555e-05 +bp,6000,1,1e-08,1.0,7.153110345825553e-05,5.47873969480861e-05 +bp,6000,1,1e-07,0.9931640625,7.153110345825553e-05,5.47873969480861e-05 +bp,6000,1,1e-06,0.9462890625,7.153110345825553e-05,5.47873969480861e-05 +bp,6000,1,1e-05,0.8076171875,7.153110345825553e-05,5.47873969480861e-05 +bp,6000,1,0.0001,0.2900390625,7.153110345825553e-05,5.47873969480861e-05 +bp,6000,1,0.001,0.0,7.153110345825553e-05,5.47873969480861e-05 +bp,6000,2,1e-08,1.0,7.395615102723241e-05,5.86082496738527e-05 +bp,6000,2,1e-07,0.9931640625,7.395615102723241e-05,5.86082496738527e-05 +bp,6000,2,1e-06,0.9501953125,7.395615102723241e-05,5.86082496738527e-05 +bp,6000,2,1e-05,0.814453125,7.395615102723241e-05,5.86082496738527e-05 +bp,6000,2,0.0001,0.306640625,7.395615102723241e-05,5.86082496738527e-05 +bp,6000,2,0.001,0.0,7.395615102723241e-05,5.86082496738527e-05 +bp,6000,3,1e-08,1.0,6.97624491294846e-05,5.6313398090424016e-05 +bp,6000,3,1e-07,0.994140625,6.97624491294846e-05,5.6313398090424016e-05 +bp,6000,3,1e-06,0.9482421875,6.97624491294846e-05,5.6313398090424016e-05 +bp,6000,3,1e-05,0.80859375,6.97624491294846e-05,5.6313398090424016e-05 +bp,6000,3,0.0001,0.287109375,6.97624491294846e-05,5.6313398090424016e-05 +bp,6000,3,0.001,0.0,6.97624491294846e-05,5.6313398090424016e-05 +dfa,42,0,1e-08,1.0,7.445955674256766e-08,6.033278054928815e-08 +dfa,42,0,1e-07,0.21484375,7.445955674256766e-08,6.033278054928815e-08 +dfa,42,0,1e-06,0.0,7.445955674256766e-08,6.033278054928815e-08 +dfa,42,0,1e-05,0.0,7.445955674256766e-08,6.033278054928815e-08 +dfa,42,0,0.0001,0.0,7.445955674256766e-08,6.033278054928815e-08 +dfa,42,0,0.001,0.0,7.445955674256766e-08,6.033278054928815e-08 +dfa,42,1,1e-08,0.0,6.029913235394702e-10,5.467529207159316e-10 +dfa,42,1,1e-07,0.0,6.029913235394702e-10,5.467529207159316e-10 +dfa,42,1,1e-06,0.0,6.029913235394702e-10,5.467529207159316e-10 +dfa,42,1,1e-05,0.0,6.029913235394702e-10,5.467529207159316e-10 +dfa,42,1,0.0001,0.0,6.029913235394702e-10,5.467529207159316e-10 +dfa,42,1,0.001,0.0,6.029913235394702e-10,5.467529207159316e-10 +dfa,42,2,1e-08,0.0,5.976069639146431e-10,5.441311290432793e-10 +dfa,42,2,1e-07,0.0,5.976069639146431e-10,5.441311290432793e-10 +dfa,42,2,1e-06,0.0,5.976069639146431e-10,5.441311290432793e-10 +dfa,42,2,1e-05,0.0,5.976069639146431e-10,5.441311290432793e-10 +dfa,42,2,0.0001,0.0,5.976069639146431e-10,5.441311290432793e-10 +dfa,42,2,0.001,0.0,5.976069639146431e-10,5.441311290432793e-10 +dfa,42,3,1e-08,0.0,5.973174732609721e-10,5.436861516550096e-10 +dfa,42,3,1e-07,0.0,5.973174732609721e-10,5.436861516550096e-10 +dfa,42,3,1e-06,0.0,5.973174732609721e-10,5.436861516550096e-10 +dfa,42,3,1e-05,0.0,5.973174732609721e-10,5.436861516550096e-10 +dfa,42,3,0.0001,0.0,5.973174732609721e-10,5.436861516550096e-10 +dfa,42,3,0.001,0.0,5.973174732609721e-10,5.436861516550096e-10 +dfa,123,0,1e-08,1.0,8.558982500517232e-08,6.690434872780315e-08 +dfa,123,0,1e-07,0.2802734375,8.558982500517232e-08,6.690434872780315e-08 +dfa,123,0,1e-06,0.0,8.558982500517232e-08,6.690434872780315e-08 +dfa,123,0,1e-05,0.0,8.558982500517232e-08,6.690434872780315e-08 +dfa,123,0,0.0001,0.0,8.558982500517232e-08,6.690434872780315e-08 +dfa,123,0,0.001,0.0,8.558982500517232e-08,6.690434872780315e-08 +dfa,123,1,1e-08,0.0,3.885574917372736e-10,3.6982170104060685e-10 +dfa,123,1,1e-07,0.0,3.885574917372736e-10,3.6982170104060685e-10 +dfa,123,1,1e-06,0.0,3.885574917372736e-10,3.6982170104060685e-10 +dfa,123,1,1e-05,0.0,3.885574917372736e-10,3.6982170104060685e-10 +dfa,123,1,0.0001,0.0,3.885574917372736e-10,3.6982170104060685e-10 +dfa,123,1,0.001,0.0,3.885574917372736e-10,3.6982170104060685e-10 +dfa,123,2,1e-08,0.0,3.82178039215475e-10,3.643452484158871e-10 +dfa,123,2,1e-07,0.0,3.82178039215475e-10,3.643452484158871e-10 +dfa,123,2,1e-06,0.0,3.82178039215475e-10,3.643452484158871e-10 +dfa,123,2,1e-05,0.0,3.82178039215475e-10,3.643452484158871e-10 +dfa,123,2,0.0001,0.0,3.82178039215475e-10,3.643452484158871e-10 +dfa,123,2,0.001,0.0,3.82178039215475e-10,3.643452484158871e-10 +dfa,123,3,1e-08,0.0,3.82106263296933e-10,3.6438793649118395e-10 +dfa,123,3,1e-07,0.0,3.82106263296933e-10,3.6438793649118395e-10 +dfa,123,3,1e-06,0.0,3.82106263296933e-10,3.6438793649118395e-10 +dfa,123,3,1e-05,0.0,3.82106263296933e-10,3.6438793649118395e-10 +dfa,123,3,0.0001,0.0,3.82106263296933e-10,3.6438793649118395e-10 +dfa,123,3,0.001,0.0,3.82106263296933e-10,3.6438793649118395e-10 +dfa,456,0,1e-08,0.9990234375,6.62804069406775e-08,5.096582356145518e-08 +dfa,456,0,1e-07,0.1728515625,6.62804069406775e-08,5.096582356145518e-08 +dfa,456,0,1e-06,0.0,6.62804069406775e-08,5.096582356145518e-08 +dfa,456,0,1e-05,0.0,6.62804069406775e-08,5.096582356145518e-08 +dfa,456,0,0.0001,0.0,6.62804069406775e-08,5.096582356145518e-08 +dfa,456,0,0.001,0.0,6.62804069406775e-08,5.096582356145518e-08 +dfa,456,1,1e-08,0.0,2.723611336463705e-10,2.5308924400668786e-10 +dfa,456,1,1e-07,0.0,2.723611336463705e-10,2.5308924400668786e-10 +dfa,456,1,1e-06,0.0,2.723611336463705e-10,2.5308924400668786e-10 +dfa,456,1,1e-05,0.0,2.723611336463705e-10,2.5308924400668786e-10 +dfa,456,1,0.0001,0.0,2.723611336463705e-10,2.5308924400668786e-10 +dfa,456,1,0.001,0.0,2.723611336463705e-10,2.5308924400668786e-10 +dfa,456,2,1e-08,0.0,2.684660826979268e-10,2.498188322874739e-10 +dfa,456,2,1e-07,0.0,2.684660826979268e-10,2.498188322874739e-10 +dfa,456,2,1e-06,0.0,2.684660826979268e-10,2.498188322874739e-10 +dfa,456,2,1e-05,0.0,2.684660826979268e-10,2.498188322874739e-10 +dfa,456,2,0.0001,0.0,2.684660826979268e-10,2.498188322874739e-10 +dfa,456,2,0.001,0.0,2.684660826979268e-10,2.498188322874739e-10 +dfa,456,3,1e-08,0.0,2.68405991876719e-10,2.499166429359434e-10 +dfa,456,3,1e-07,0.0,2.68405991876719e-10,2.499166429359434e-10 +dfa,456,3,1e-06,0.0,2.68405991876719e-10,2.499166429359434e-10 +dfa,456,3,1e-05,0.0,2.68405991876719e-10,2.499166429359434e-10 +dfa,456,3,0.0001,0.0,2.68405991876719e-10,2.499166429359434e-10 +dfa,456,3,0.001,0.0,2.68405991876719e-10,2.499166429359434e-10 +dfa,789,0,1e-08,0.998046875,7.355507136708184e-08,5.720548301724193e-08 +dfa,789,0,1e-07,0.2080078125,7.355507136708184e-08,5.720548301724193e-08 +dfa,789,0,1e-06,0.0,7.355507136708184e-08,5.720548301724193e-08 +dfa,789,0,1e-05,0.0,7.355507136708184e-08,5.720548301724193e-08 +dfa,789,0,0.0001,0.0,7.355507136708184e-08,5.720548301724193e-08 +dfa,789,0,0.001,0.0,7.355507136708184e-08,5.720548301724193e-08 +dfa,789,1,1e-08,0.0,3.6360320310180327e-10,3.5382324847788027e-10 +dfa,789,1,1e-07,0.0,3.6360320310180327e-10,3.5382324847788027e-10 +dfa,789,1,1e-06,0.0,3.6360320310180327e-10,3.5382324847788027e-10 +dfa,789,1,1e-05,0.0,3.6360320310180327e-10,3.5382324847788027e-10 +dfa,789,1,0.0001,0.0,3.6360320310180327e-10,3.5382324847788027e-10 +dfa,789,1,0.001,0.0,3.6360320310180327e-10,3.5382324847788027e-10 +dfa,789,2,1e-08,0.0,3.605674925299951e-10,3.526874348125375e-10 +dfa,789,2,1e-07,0.0,3.605674925299951e-10,3.526874348125375e-10 +dfa,789,2,1e-06,0.0,3.605674925299951e-10,3.526874348125375e-10 +dfa,789,2,1e-05,0.0,3.605674925299951e-10,3.526874348125375e-10 +dfa,789,2,0.0001,0.0,3.605674925299951e-10,3.526874348125375e-10 +dfa,789,2,0.001,0.0,3.605674925299951e-10,3.526874348125375e-10 +dfa,789,3,1e-08,0.0,3.6057717922588495e-10,3.5249728136399483e-10 +dfa,789,3,1e-07,0.0,3.6057717922588495e-10,3.5249728136399483e-10 +dfa,789,3,1e-06,0.0,3.6057717922588495e-10,3.5249728136399483e-10 +dfa,789,3,1e-05,0.0,3.6057717922588495e-10,3.5249728136399483e-10 +dfa,789,3,0.0001,0.0,3.6057717922588495e-10,3.5249728136399483e-10 +dfa,789,3,0.001,0.0,3.6057717922588495e-10,3.5249728136399483e-10 +dfa,1024,0,1e-08,1.0,7.678321622961448e-08,6.240912142629895e-08 +dfa,1024,0,1e-07,0.2275390625,7.678321622961448e-08,6.240912142629895e-08 +dfa,1024,0,1e-06,0.0,7.678321622961448e-08,6.240912142629895e-08 +dfa,1024,0,1e-05,0.0,7.678321622961448e-08,6.240912142629895e-08 +dfa,1024,0,0.0001,0.0,7.678321622961448e-08,6.240912142629895e-08 +dfa,1024,0,0.001,0.0,7.678321622961448e-08,6.240912142629895e-08 +dfa,1024,1,1e-08,0.0,3.4086847233716355e-10,3.261897418838089e-10 +dfa,1024,1,1e-07,0.0,3.4086847233716355e-10,3.261897418838089e-10 +dfa,1024,1,1e-06,0.0,3.4086847233716355e-10,3.261897418838089e-10 +dfa,1024,1,1e-05,0.0,3.4086847233716355e-10,3.261897418838089e-10 +dfa,1024,1,0.0001,0.0,3.4086847233716355e-10,3.261897418838089e-10 +dfa,1024,1,0.001,0.0,3.4086847233716355e-10,3.261897418838089e-10 +dfa,1024,2,1e-08,0.0,3.385664248956033e-10,3.2339939060044287e-10 +dfa,1024,2,1e-07,0.0,3.385664248956033e-10,3.2339939060044287e-10 +dfa,1024,2,1e-06,0.0,3.385664248956033e-10,3.2339939060044287e-10 +dfa,1024,2,1e-05,0.0,3.385664248956033e-10,3.2339939060044287e-10 +dfa,1024,2,0.0001,0.0,3.385664248956033e-10,3.2339939060044287e-10 +dfa,1024,2,0.001,0.0,3.385664248956033e-10,3.2339939060044287e-10 +dfa,1024,3,1e-08,0.0,3.3844413382944083e-10,3.233243117684026e-10 +dfa,1024,3,1e-07,0.0,3.3844413382944083e-10,3.233243117684026e-10 +dfa,1024,3,1e-06,0.0,3.3844413382944083e-10,3.233243117684026e-10 +dfa,1024,3,1e-05,0.0,3.3844413382944083e-10,3.233243117684026e-10 +dfa,1024,3,0.0001,0.0,3.3844413382944083e-10,3.233243117684026e-10 +dfa,1024,3,0.001,0.0,3.3844413382944083e-10,3.233243117684026e-10 +dfa,2048,0,1e-08,1.0,7.40840917501373e-08,6.056081502947563e-08 +dfa,2048,0,1e-07,0.2119140625,7.40840917501373e-08,6.056081502947563e-08 +dfa,2048,0,1e-06,0.0,7.40840917501373e-08,6.056081502947563e-08 +dfa,2048,0,1e-05,0.0,7.40840917501373e-08,6.056081502947563e-08 +dfa,2048,0,0.0001,0.0,7.40840917501373e-08,6.056081502947563e-08 +dfa,2048,0,0.001,0.0,7.40840917501373e-08,6.056081502947563e-08 +dfa,2048,1,1e-08,0.0,2.6816954212804944e-10,2.616813432609888e-10 +dfa,2048,1,1e-07,0.0,2.6816954212804944e-10,2.616813432609888e-10 +dfa,2048,1,1e-06,0.0,2.6816954212804944e-10,2.616813432609888e-10 +dfa,2048,1,1e-05,0.0,2.6816954212804944e-10,2.616813432609888e-10 +dfa,2048,1,0.0001,0.0,2.6816954212804944e-10,2.616813432609888e-10 +dfa,2048,1,0.001,0.0,2.6816954212804944e-10,2.616813432609888e-10 +dfa,2048,2,1e-08,0.0,2.6471219660706424e-10,2.605666515886895e-10 +dfa,2048,2,1e-07,0.0,2.6471219660706424e-10,2.605666515886895e-10 +dfa,2048,2,1e-06,0.0,2.6471219660706424e-10,2.605666515886895e-10 +dfa,2048,2,1e-05,0.0,2.6471219660706424e-10,2.605666515886895e-10 +dfa,2048,2,0.0001,0.0,2.6471219660706424e-10,2.605666515886895e-10 +dfa,2048,2,0.001,0.0,2.6471219660706424e-10,2.605666515886895e-10 +dfa,2048,3,1e-08,0.0,2.6466975833194795e-10,2.6055227420052063e-10 +dfa,2048,3,1e-07,0.0,2.6466975833194795e-10,2.6055227420052063e-10 +dfa,2048,3,1e-06,0.0,2.6466975833194795e-10,2.6055227420052063e-10 +dfa,2048,3,1e-05,0.0,2.6466975833194795e-10,2.6055227420052063e-10 +dfa,2048,3,0.0001,0.0,2.6466975833194795e-10,2.6055227420052063e-10 +dfa,2048,3,0.001,0.0,2.6466975833194795e-10,2.6055227420052063e-10 +dfa,3000,0,1e-08,1.0,5.859586238443626e-08,4.686578947143971e-08 +dfa,3000,0,1e-07,0.109375,5.859586238443626e-08,4.686578947143971e-08 +dfa,3000,0,1e-06,0.0,5.859586238443626e-08,4.686578947143971e-08 +dfa,3000,0,1e-05,0.0,5.859586238443626e-08,4.686578947143971e-08 +dfa,3000,0,0.0001,0.0,5.859586238443626e-08,4.686578947143971e-08 +dfa,3000,0,0.001,0.0,5.859586238443626e-08,4.686578947143971e-08 +dfa,3000,1,1e-08,0.0,2.5324747854327256e-10,2.367189222418631e-10 +dfa,3000,1,1e-07,0.0,2.5324747854327256e-10,2.367189222418631e-10 +dfa,3000,1,1e-06,0.0,2.5324747854327256e-10,2.367189222418631e-10 +dfa,3000,1,1e-05,0.0,2.5324747854327256e-10,2.367189222418631e-10 +dfa,3000,1,0.0001,0.0,2.5324747854327256e-10,2.367189222418631e-10 +dfa,3000,1,0.001,0.0,2.5324747854327256e-10,2.367189222418631e-10 +dfa,3000,2,1e-08,0.0,2.51835663434008e-10,2.35156727423913e-10 +dfa,3000,2,1e-07,0.0,2.51835663434008e-10,2.35156727423913e-10 +dfa,3000,2,1e-06,0.0,2.51835663434008e-10,2.35156727423913e-10 +dfa,3000,2,1e-05,0.0,2.51835663434008e-10,2.35156727423913e-10 +dfa,3000,2,0.0001,0.0,2.51835663434008e-10,2.35156727423913e-10 +dfa,3000,2,0.001,0.0,2.51835663434008e-10,2.35156727423913e-10 +dfa,3000,3,1e-08,0.0,2.521023945156742e-10,2.359840933774393e-10 +dfa,3000,3,1e-07,0.0,2.521023945156742e-10,2.359840933774393e-10 +dfa,3000,3,1e-06,0.0,2.521023945156742e-10,2.359840933774393e-10 +dfa,3000,3,1e-05,0.0,2.521023945156742e-10,2.359840933774393e-10 +dfa,3000,3,0.0001,0.0,2.521023945156742e-10,2.359840933774393e-10 +dfa,3000,3,0.001,0.0,2.521023945156742e-10,2.359840933774393e-10 +dfa,4000,0,1e-08,1.0,8.277459073724458e-08,6.603810476235594e-08 +dfa,4000,0,1e-07,0.2763671875,8.277459073724458e-08,6.603810476235594e-08 +dfa,4000,0,1e-06,0.0,8.277459073724458e-08,6.603810476235594e-08 +dfa,4000,0,1e-05,0.0,8.277459073724458e-08,6.603810476235594e-08 +dfa,4000,0,0.0001,0.0,8.277459073724458e-08,6.603810476235594e-08 +dfa,4000,0,0.001,0.0,8.277459073724458e-08,6.603810476235594e-08 +dfa,4000,1,1e-08,0.0,2.8688929010201036e-10,2.6567845146097113e-10 +dfa,4000,1,1e-07,0.0,2.8688929010201036e-10,2.6567845146097113e-10 +dfa,4000,1,1e-06,0.0,2.8688929010201036e-10,2.6567845146097113e-10 +dfa,4000,1,1e-05,0.0,2.8688929010201036e-10,2.6567845146097113e-10 +dfa,4000,1,0.0001,0.0,2.8688929010201036e-10,2.6567845146097113e-10 +dfa,4000,1,0.001,0.0,2.8688929010201036e-10,2.6567845146097113e-10 +dfa,4000,2,1e-08,0.0,2.8389277040297145e-10,2.6511040585042167e-10 +dfa,4000,2,1e-07,0.0,2.8389277040297145e-10,2.6511040585042167e-10 +dfa,4000,2,1e-06,0.0,2.8389277040297145e-10,2.6511040585042167e-10 +dfa,4000,2,1e-05,0.0,2.8389277040297145e-10,2.6511040585042167e-10 +dfa,4000,2,0.0001,0.0,2.8389277040297145e-10,2.6511040585042167e-10 +dfa,4000,2,0.001,0.0,2.8389277040297145e-10,2.6511040585042167e-10 +dfa,4000,3,1e-08,0.0,2.839262158715883e-10,2.6529473062808506e-10 +dfa,4000,3,1e-07,0.0,2.839262158715883e-10,2.6529473062808506e-10 +dfa,4000,3,1e-06,0.0,2.839262158715883e-10,2.6529473062808506e-10 +dfa,4000,3,1e-05,0.0,2.839262158715883e-10,2.6529473062808506e-10 +dfa,4000,3,0.0001,0.0,2.839262158715883e-10,2.6529473062808506e-10 +dfa,4000,3,0.001,0.0,2.839262158715883e-10,2.6529473062808506e-10 +dfa,5000,0,1e-08,0.9990234375,7.934817602972544e-08,6.382192196952019e-08 +dfa,5000,0,1e-07,0.2568359375,7.934817602972544e-08,6.382192196952019e-08 +dfa,5000,0,1e-06,0.0,7.934817602972544e-08,6.382192196952019e-08 +dfa,5000,0,1e-05,0.0,7.934817602972544e-08,6.382192196952019e-08 +dfa,5000,0,0.0001,0.0,7.934817602972544e-08,6.382192196952019e-08 +dfa,5000,0,0.001,0.0,7.934817602972544e-08,6.382192196952019e-08 +dfa,5000,1,1e-08,0.0,3.2386976434040093e-10,3.104253798458245e-10 +dfa,5000,1,1e-07,0.0,3.2386976434040093e-10,3.104253798458245e-10 +dfa,5000,1,1e-06,0.0,3.2386976434040093e-10,3.104253798458245e-10 +dfa,5000,1,1e-05,0.0,3.2386976434040093e-10,3.104253798458245e-10 +dfa,5000,1,0.0001,0.0,3.2386976434040093e-10,3.104253798458245e-10 +dfa,5000,1,0.001,0.0,3.2386976434040093e-10,3.104253798458245e-10 +dfa,5000,2,1e-08,0.0,3.1908084507925594e-10,3.0578073406672956e-10 +dfa,5000,2,1e-07,0.0,3.1908084507925594e-10,3.0578073406672956e-10 +dfa,5000,2,1e-06,0.0,3.1908084507925594e-10,3.0578073406672956e-10 +dfa,5000,2,1e-05,0.0,3.1908084507925594e-10,3.0578073406672956e-10 +dfa,5000,2,0.0001,0.0,3.1908084507925594e-10,3.0578073406672956e-10 +dfa,5000,2,0.001,0.0,3.1908084507925594e-10,3.0578073406672956e-10 +dfa,5000,3,1e-08,0.0,3.1896082997029396e-10,3.054817787617736e-10 +dfa,5000,3,1e-07,0.0,3.1896082997029396e-10,3.054817787617736e-10 +dfa,5000,3,1e-06,0.0,3.1896082997029396e-10,3.054817787617736e-10 +dfa,5000,3,1e-05,0.0,3.1896082997029396e-10,3.054817787617736e-10 +dfa,5000,3,0.0001,0.0,3.1896082997029396e-10,3.054817787617736e-10 +dfa,5000,3,0.001,0.0,3.1896082997029396e-10,3.054817787617736e-10 +dfa,6000,0,1e-08,0.994140625,4.818060261868595e-08,3.649725499599299e-08 +dfa,6000,0,1e-07,0.0869140625,4.818060261868595e-08,3.649725499599299e-08 +dfa,6000,0,1e-06,0.0,4.818060261868595e-08,3.649725499599299e-08 +dfa,6000,0,1e-05,0.0,4.818060261868595e-08,3.649725499599299e-08 +dfa,6000,0,0.0001,0.0,4.818060261868595e-08,3.649725499599299e-08 +dfa,6000,0,0.001,0.0,4.818060261868595e-08,3.649725499599299e-08 +dfa,6000,1,1e-08,0.0,2.385994735121244e-10,2.2566398749646055e-10 +dfa,6000,1,1e-07,0.0,2.385994735121244e-10,2.2566398749646055e-10 +dfa,6000,1,1e-06,0.0,2.385994735121244e-10,2.2566398749646055e-10 +dfa,6000,1,1e-05,0.0,2.385994735121244e-10,2.2566398749646055e-10 +dfa,6000,1,0.0001,0.0,2.385994735121244e-10,2.2566398749646055e-10 +dfa,6000,1,0.001,0.0,2.385994735121244e-10,2.2566398749646055e-10 +dfa,6000,2,1e-08,0.0,2.3768884083175124e-10,2.2491537798874361e-10 +dfa,6000,2,1e-07,0.0,2.3768884083175124e-10,2.2491537798874361e-10 +dfa,6000,2,1e-06,0.0,2.3768884083175124e-10,2.2491537798874361e-10 +dfa,6000,2,1e-05,0.0,2.3768884083175124e-10,2.2491537798874361e-10 +dfa,6000,2,0.0001,0.0,2.3768884083175124e-10,2.2491537798874361e-10 +dfa,6000,2,0.001,0.0,2.3768884083175124e-10,2.2491537798874361e-10 +dfa,6000,3,1e-08,0.0,2.379895724935466e-10,2.2488950979226985e-10 +dfa,6000,3,1e-07,0.0,2.379895724935466e-10,2.2488950979226985e-10 +dfa,6000,3,1e-06,0.0,2.379895724935466e-10,2.2488950979226985e-10 +dfa,6000,3,1e-05,0.0,2.379895724935466e-10,2.2488950979226985e-10 +dfa,6000,3,0.0001,0.0,2.379895724935466e-10,2.2488950979226985e-10 +dfa,6000,3,0.001,0.0,2.379895724935466e-10,2.2488950979226985e-10 +state_bridge,42,0,1e-08,0.9951171875,1.5461689599760575e-06,1.046195166054531e-06 +state_bridge,42,0,1e-07,0.94140625,1.5461689599760575e-06,1.046195166054531e-06 +state_bridge,42,0,1e-06,0.5283203125,1.5461689599760575e-06,1.046195166054531e-06 +state_bridge,42,0,1e-05,0.0048828125,1.5461689599760575e-06,1.046195166054531e-06 +state_bridge,42,0,0.0001,0.0,1.5461689599760575e-06,1.046195166054531e-06 +state_bridge,42,0,0.001,0.0,1.5461689599760575e-06,1.046195166054531e-06 +state_bridge,42,1,1e-08,0.0,2.511534313853758e-10,2.357372075323383e-10 +state_bridge,42,1,1e-07,0.0,2.511534313853758e-10,2.357372075323383e-10 +state_bridge,42,1,1e-06,0.0,2.511534313853758e-10,2.357372075323383e-10 +state_bridge,42,1,1e-05,0.0,2.511534313853758e-10,2.357372075323383e-10 +state_bridge,42,1,0.0001,0.0,2.511534313853758e-10,2.357372075323383e-10 +state_bridge,42,1,0.001,0.0,2.511534313853758e-10,2.357372075323383e-10 +state_bridge,42,2,1e-08,0.0,2.4734042591845196e-10,2.313833846745439e-10 +state_bridge,42,2,1e-07,0.0,2.4734042591845196e-10,2.313833846745439e-10 +state_bridge,42,2,1e-06,0.0,2.4734042591845196e-10,2.313833846745439e-10 +state_bridge,42,2,1e-05,0.0,2.4734042591845196e-10,2.313833846745439e-10 +state_bridge,42,2,0.0001,0.0,2.4734042591845196e-10,2.313833846745439e-10 +state_bridge,42,2,0.001,0.0,2.4734042591845196e-10,2.313833846745439e-10 +state_bridge,42,3,1e-08,0.0,2.3524043823996976e-10,2.1822209317345909e-10 +state_bridge,42,3,1e-07,0.0,2.3524043823996976e-10,2.1822209317345909e-10 +state_bridge,42,3,1e-06,0.0,2.3524043823996976e-10,2.1822209317345909e-10 +state_bridge,42,3,1e-05,0.0,2.3524043823996976e-10,2.1822209317345909e-10 +state_bridge,42,3,0.0001,0.0,2.3524043823996976e-10,2.1822209317345909e-10 +state_bridge,42,3,0.001,0.0,2.3524043823996976e-10,2.1822209317345909e-10 +state_bridge,123,0,1e-08,1.0,3.0364531085069757e-06,2.199241635025828e-06 +state_bridge,123,0,1e-07,0.9814453125,3.0364531085069757e-06,2.199241635025828e-06 +state_bridge,123,0,1e-06,0.7802734375,3.0364531085069757e-06,2.199241635025828e-06 +state_bridge,123,0,1e-05,0.0283203125,3.0364531085069757e-06,2.199241635025828e-06 +state_bridge,123,0,0.0001,0.0,3.0364531085069757e-06,2.199241635025828e-06 +state_bridge,123,0,0.001,0.0,3.0364531085069757e-06,2.199241635025828e-06 +state_bridge,123,1,1e-08,0.0,3.445063123663772e-10,3.0412453111416937e-10 +state_bridge,123,1,1e-07,0.0,3.445063123663772e-10,3.0412453111416937e-10 +state_bridge,123,1,1e-06,0.0,3.445063123663772e-10,3.0412453111416937e-10 +state_bridge,123,1,1e-05,0.0,3.445063123663772e-10,3.0412453111416937e-10 +state_bridge,123,1,0.0001,0.0,3.445063123663772e-10,3.0412453111416937e-10 +state_bridge,123,1,0.001,0.0,3.445063123663772e-10,3.0412453111416937e-10 +state_bridge,123,2,1e-08,0.0,3.406872561839691e-10,2.9890334651838657e-10 +state_bridge,123,2,1e-07,0.0,3.406872561839691e-10,2.9890334651838657e-10 +state_bridge,123,2,1e-06,0.0,3.406872561839691e-10,2.9890334651838657e-10 +state_bridge,123,2,1e-05,0.0,3.406872561839691e-10,2.9890334651838657e-10 +state_bridge,123,2,0.0001,0.0,3.406872561839691e-10,2.9890334651838657e-10 +state_bridge,123,2,0.001,0.0,3.406872561839691e-10,2.9890334651838657e-10 +state_bridge,123,3,1e-08,0.0,3.3725344739110596e-10,2.9520974553776114e-10 +state_bridge,123,3,1e-07,0.0,3.3725344739110596e-10,2.9520974553776114e-10 +state_bridge,123,3,1e-06,0.0,3.3725344739110596e-10,2.9520974553776114e-10 +state_bridge,123,3,1e-05,0.0,3.3725344739110596e-10,2.9520974553776114e-10 +state_bridge,123,3,0.0001,0.0,3.3725344739110596e-10,2.9520974553776114e-10 +state_bridge,123,3,0.001,0.0,3.3725344739110596e-10,2.9520974553776114e-10 +state_bridge,456,0,1e-08,0.9921875,3.4133063309127465e-06,1.421034198756388e-06 +state_bridge,456,0,1e-07,0.947265625,3.4133063309127465e-06,1.421034198756388e-06 +state_bridge,456,0,1e-06,0.6044921875,3.4133063309127465e-06,1.421034198756388e-06 +state_bridge,456,0,1e-05,0.044921875,3.4133063309127465e-06,1.421034198756388e-06 +state_bridge,456,0,0.0001,0.001953125,3.4133063309127465e-06,1.421034198756388e-06 +state_bridge,456,0,0.001,0.0,3.4133063309127465e-06,1.421034198756388e-06 +state_bridge,456,1,1e-08,0.0107421875,2.6507986916612936e-09,3.6186914575964124e-10 +state_bridge,456,1,1e-07,0.0048828125,2.6507986916612936e-09,3.6186914575964124e-10 +state_bridge,456,1,1e-06,0.0,2.6507986916612936e-09,3.6186914575964124e-10 +state_bridge,456,1,1e-05,0.0,2.6507986916612936e-09,3.6186914575964124e-10 +state_bridge,456,1,0.0001,0.0,2.6507986916612936e-09,3.6186914575964124e-10 +state_bridge,456,1,0.001,0.0,2.6507986916612936e-09,3.6186914575964124e-10 +state_bridge,456,2,1e-08,0.0,3.456599451112652e-10,3.0120325678062443e-10 +state_bridge,456,2,1e-07,0.0,3.456599451112652e-10,3.0120325678062443e-10 +state_bridge,456,2,1e-06,0.0,3.456599451112652e-10,3.0120325678062443e-10 +state_bridge,456,2,1e-05,0.0,3.456599451112652e-10,3.0120325678062443e-10 +state_bridge,456,2,0.0001,0.0,3.456599451112652e-10,3.0120325678062443e-10 +state_bridge,456,2,0.001,0.0,3.456599451112652e-10,3.0120325678062443e-10 +state_bridge,456,3,1e-08,0.0,3.452579333540484e-10,3.0106017678832586e-10 +state_bridge,456,3,1e-07,0.0,3.452579333540484e-10,3.0106017678832586e-10 +state_bridge,456,3,1e-06,0.0,3.452579333540484e-10,3.0106017678832586e-10 +state_bridge,456,3,1e-05,0.0,3.452579333540484e-10,3.0106017678832586e-10 +state_bridge,456,3,0.0001,0.0,3.452579333540484e-10,3.0106017678832586e-10 +state_bridge,456,3,0.001,0.0,3.452579333540484e-10,3.0106017678832586e-10 +state_bridge,789,0,1e-08,1.0,2.1964008283248404e-06,5.427056066764635e-07 +state_bridge,789,0,1e-07,0.9013671875,2.1964008283248404e-06,5.427056066764635e-07 +state_bridge,789,0,1e-06,0.4013671875,2.1964008283248404e-06,5.427056066764635e-07 +state_bridge,789,0,1e-05,0.0439453125,2.1964008283248404e-06,5.427056066764635e-07 +state_bridge,789,0,0.0001,0.0,2.1964008283248404e-06,5.427056066764635e-07 +state_bridge,789,0,0.001,0.0,2.1964008283248404e-06,5.427056066764635e-07 +state_bridge,789,1,1e-08,0.0,2.503308116352798e-10,1.606154237387969e-10 +state_bridge,789,1,1e-07,0.0,2.503308116352798e-10,1.606154237387969e-10 +state_bridge,789,1,1e-06,0.0,2.503308116352798e-10,1.606154237387969e-10 +state_bridge,789,1,1e-05,0.0,2.503308116352798e-10,1.606154237387969e-10 +state_bridge,789,1,0.0001,0.0,2.503308116352798e-10,1.606154237387969e-10 +state_bridge,789,1,0.001,0.0,2.503308116352798e-10,1.606154237387969e-10 +state_bridge,789,2,1e-08,0.0,7.482816449799756e-11,6.650602984992204e-11 +state_bridge,789,2,1e-07,0.0,7.482816449799756e-11,6.650602984992204e-11 +state_bridge,789,2,1e-06,0.0,7.482816449799756e-11,6.650602984992204e-11 +state_bridge,789,2,1e-05,0.0,7.482816449799756e-11,6.650602984992204e-11 +state_bridge,789,2,0.0001,0.0,7.482816449799756e-11,6.650602984992204e-11 +state_bridge,789,2,0.001,0.0,7.482816449799756e-11,6.650602984992204e-11 +state_bridge,789,3,1e-08,0.0,7.645344080042804e-11,6.691018572535512e-11 +state_bridge,789,3,1e-07,0.0,7.645344080042804e-11,6.691018572535512e-11 +state_bridge,789,3,1e-06,0.0,7.645344080042804e-11,6.691018572535512e-11 +state_bridge,789,3,1e-05,0.0,7.645344080042804e-11,6.691018572535512e-11 +state_bridge,789,3,0.0001,0.0,7.645344080042804e-11,6.691018572535512e-11 +state_bridge,789,3,0.001,0.0,7.645344080042804e-11,6.691018572535512e-11 +state_bridge,1024,0,1e-08,0.99609375,2.087348093482433e-06,5.252314849713002e-07 +state_bridge,1024,0,1e-07,0.8271484375,2.087348093482433e-06,5.252314849713002e-07 +state_bridge,1024,0,1e-06,0.3388671875,2.087348093482433e-06,5.252314849713002e-07 +state_bridge,1024,0,1e-05,0.0400390625,2.087348093482433e-06,5.252314849713002e-07 +state_bridge,1024,0,0.0001,0.001953125,2.087348093482433e-06,5.252314849713002e-07 +state_bridge,1024,0,0.001,0.0,2.087348093482433e-06,5.252314849713002e-07 +state_bridge,1024,1,1e-08,0.0068359375,1.13835030290943e-09,6.494170201598592e-10 +state_bridge,1024,1,1e-07,0.0,1.13835030290943e-09,6.494170201598592e-10 +state_bridge,1024,1,1e-06,0.0,1.13835030290943e-09,6.494170201598592e-10 +state_bridge,1024,1,1e-05,0.0,1.13835030290943e-09,6.494170201598592e-10 +state_bridge,1024,1,0.0001,0.0,1.13835030290943e-09,6.494170201598592e-10 +state_bridge,1024,1,0.001,0.0,1.13835030290943e-09,6.494170201598592e-10 +state_bridge,1024,2,1e-08,0.0,5.4832090257139754e-11,5.040141221046568e-11 +state_bridge,1024,2,1e-07,0.0,5.4832090257139754e-11,5.040141221046568e-11 +state_bridge,1024,2,1e-06,0.0,5.4832090257139754e-11,5.040141221046568e-11 +state_bridge,1024,2,1e-05,0.0,5.4832090257139754e-11,5.040141221046568e-11 +state_bridge,1024,2,0.0001,0.0,5.4832090257139754e-11,5.040141221046568e-11 +state_bridge,1024,2,0.001,0.0,5.4832090257139754e-11,5.040141221046568e-11 +state_bridge,1024,3,1e-08,0.0,5.544187331452122e-11,5.1105165238540806e-11 +state_bridge,1024,3,1e-07,0.0,5.544187331452122e-11,5.1105165238540806e-11 +state_bridge,1024,3,1e-06,0.0,5.544187331452122e-11,5.1105165238540806e-11 +state_bridge,1024,3,1e-05,0.0,5.544187331452122e-11,5.1105165238540806e-11 +state_bridge,1024,3,0.0001,0.0,5.544187331452122e-11,5.1105165238540806e-11 +state_bridge,1024,3,0.001,0.0,5.544187331452122e-11,5.1105165238540806e-11 +state_bridge,2048,0,1e-08,1.0,2.8339600248727947e-06,1.4121683307166677e-06 +state_bridge,2048,0,1e-07,1.0,2.8339600248727947e-06,1.4121683307166677e-06 +state_bridge,2048,0,1e-06,0.6171875,2.8339600248727947e-06,1.4121683307166677e-06 +state_bridge,2048,0,1e-05,0.05078125,2.8339600248727947e-06,1.4121683307166677e-06 +state_bridge,2048,0,0.0001,0.0,2.8339600248727947e-06,1.4121683307166677e-06 +state_bridge,2048,0,0.001,0.0,2.8339600248727947e-06,1.4121683307166677e-06 +state_bridge,2048,1,1e-08,0.0,1.9096885184310963e-10,1.431140206342718e-10 +state_bridge,2048,1,1e-07,0.0,1.9096885184310963e-10,1.431140206342718e-10 +state_bridge,2048,1,1e-06,0.0,1.9096885184310963e-10,1.431140206342718e-10 +state_bridge,2048,1,1e-05,0.0,1.9096885184310963e-10,1.431140206342718e-10 +state_bridge,2048,1,0.0001,0.0,1.9096885184310963e-10,1.431140206342718e-10 +state_bridge,2048,1,0.001,0.0,1.9096885184310963e-10,1.431140206342718e-10 +state_bridge,2048,2,1e-08,0.0,1.7883472480662022e-10,1.3591548719826818e-10 +state_bridge,2048,2,1e-07,0.0,1.7883472480662022e-10,1.3591548719826818e-10 +state_bridge,2048,2,1e-06,0.0,1.7883472480662022e-10,1.3591548719826818e-10 +state_bridge,2048,2,1e-05,0.0,1.7883472480662022e-10,1.3591548719826818e-10 +state_bridge,2048,2,0.0001,0.0,1.7883472480662022e-10,1.3591548719826818e-10 +state_bridge,2048,2,0.001,0.0,1.7883472480662022e-10,1.3591548719826818e-10 +state_bridge,2048,3,1e-08,0.0,1.7761189741172245e-10,1.3533535403453811e-10 +state_bridge,2048,3,1e-07,0.0,1.7761189741172245e-10,1.3533535403453811e-10 +state_bridge,2048,3,1e-06,0.0,1.7761189741172245e-10,1.3533535403453811e-10 +state_bridge,2048,3,1e-05,0.0,1.7761189741172245e-10,1.3533535403453811e-10 +state_bridge,2048,3,0.0001,0.0,1.7761189741172245e-10,1.3533535403453811e-10 +state_bridge,2048,3,0.001,0.0,1.7761189741172245e-10,1.3533535403453811e-10 +state_bridge,3000,0,1e-08,1.0,1.6625788248347817e-06,6.754059995728312e-07 +state_bridge,3000,0,1e-07,0.982421875,1.6625788248347817e-06,6.754059995728312e-07 +state_bridge,3000,0,1e-06,0.3681640625,1.6625788248347817e-06,6.754059995728312e-07 +state_bridge,3000,0,1e-05,0.0224609375,1.6625788248347817e-06,6.754059995728312e-07 +state_bridge,3000,0,0.0001,0.0,1.6625788248347817e-06,6.754059995728312e-07 +state_bridge,3000,0,0.001,0.0,1.6625788248347817e-06,6.754059995728312e-07 +state_bridge,3000,1,1e-08,0.0,2.742292226631804e-10,1.944834987499533e-10 +state_bridge,3000,1,1e-07,0.0,2.742292226631804e-10,1.944834987499533e-10 +state_bridge,3000,1,1e-06,0.0,2.742292226631804e-10,1.944834987499533e-10 +state_bridge,3000,1,1e-05,0.0,2.742292226631804e-10,1.944834987499533e-10 +state_bridge,3000,1,0.0001,0.0,2.742292226631804e-10,1.944834987499533e-10 +state_bridge,3000,1,0.001,0.0,2.742292226631804e-10,1.944834987499533e-10 +state_bridge,3000,2,1e-08,0.0,1.0382110449125292e-10,1.0345420353718993e-10 +state_bridge,3000,2,1e-07,0.0,1.0382110449125292e-10,1.0345420353718993e-10 +state_bridge,3000,2,1e-06,0.0,1.0382110449125292e-10,1.0345420353718993e-10 +state_bridge,3000,2,1e-05,0.0,1.0382110449125292e-10,1.0345420353718993e-10 +state_bridge,3000,2,0.0001,0.0,1.0382110449125292e-10,1.0345420353718993e-10 +state_bridge,3000,2,0.001,0.0,1.0382110449125292e-10,1.0345420353718993e-10 +state_bridge,3000,3,1e-08,0.0,1.0396156158165581e-10,1.0367201541683357e-10 +state_bridge,3000,3,1e-07,0.0,1.0396156158165581e-10,1.0367201541683357e-10 +state_bridge,3000,3,1e-06,0.0,1.0396156158165581e-10,1.0367201541683357e-10 +state_bridge,3000,3,1e-05,0.0,1.0396156158165581e-10,1.0367201541683357e-10 +state_bridge,3000,3,0.0001,0.0,1.0396156158165581e-10,1.0367201541683357e-10 +state_bridge,3000,3,0.001,0.0,1.0396156158165581e-10,1.0367201541683357e-10 +state_bridge,4000,0,1e-08,1.0,3.5008215490961447e-06,1.5757057099108351e-06 +state_bridge,4000,0,1e-07,0.984375,3.5008215490961447e-06,1.5757057099108351e-06 +state_bridge,4000,0,1e-06,0.583984375,3.5008215490961447e-06,1.5757057099108351e-06 +state_bridge,4000,0,1e-05,0.06640625,3.5008215490961447e-06,1.5757057099108351e-06 +state_bridge,4000,0,0.0001,0.0009765625,3.5008215490961447e-06,1.5757057099108351e-06 +state_bridge,4000,0,0.001,0.0,3.5008215490961447e-06,1.5757057099108351e-06 +state_bridge,4000,1,1e-08,0.0,3.210323673563664e-10,2.3108980007346958e-10 +state_bridge,4000,1,1e-07,0.0,3.210323673563664e-10,2.3108980007346958e-10 +state_bridge,4000,1,1e-06,0.0,3.210323673563664e-10,2.3108980007346958e-10 +state_bridge,4000,1,1e-05,0.0,3.210323673563664e-10,2.3108980007346958e-10 +state_bridge,4000,1,0.0001,0.0,3.210323673563664e-10,2.3108980007346958e-10 +state_bridge,4000,1,0.001,0.0,3.210323673563664e-10,2.3108980007346958e-10 +state_bridge,4000,2,1e-08,0.0,1.71735667353623e-10,1.6171709804613243e-10 +state_bridge,4000,2,1e-07,0.0,1.71735667353623e-10,1.6171709804613243e-10 +state_bridge,4000,2,1e-06,0.0,1.71735667353623e-10,1.6171709804613243e-10 +state_bridge,4000,2,1e-05,0.0,1.71735667353623e-10,1.6171709804613243e-10 +state_bridge,4000,2,0.0001,0.0,1.71735667353623e-10,1.6171709804613243e-10 +state_bridge,4000,2,0.001,0.0,1.71735667353623e-10,1.6171709804613243e-10 +state_bridge,4000,3,1e-08,0.0,1.709427044360723e-10,1.6136368630181863e-10 +state_bridge,4000,3,1e-07,0.0,1.709427044360723e-10,1.6136368630181863e-10 +state_bridge,4000,3,1e-06,0.0,1.709427044360723e-10,1.6136368630181863e-10 +state_bridge,4000,3,1e-05,0.0,1.709427044360723e-10,1.6136368630181863e-10 +state_bridge,4000,3,0.0001,0.0,1.709427044360723e-10,1.6136368630181863e-10 +state_bridge,4000,3,0.001,0.0,1.709427044360723e-10,1.6136368630181863e-10 +state_bridge,5000,0,1e-08,1.0,2.6143970899283886e-06,5.47988236121455e-07 +state_bridge,5000,0,1e-07,0.8310546875,2.6143970899283886e-06,5.47988236121455e-07 +state_bridge,5000,0,1e-06,0.3857421875,2.6143970899283886e-06,5.47988236121455e-07 +state_bridge,5000,0,1e-05,0.0458984375,2.6143970899283886e-06,5.47988236121455e-07 +state_bridge,5000,0,0.0001,0.001953125,2.6143970899283886e-06,5.47988236121455e-07 +state_bridge,5000,0,0.001,0.0,2.6143970899283886e-06,5.47988236121455e-07 +state_bridge,5000,1,1e-08,0.05078125,3.4061580223010424e-09,1.969567176018927e-09 +state_bridge,5000,1,1e-07,0.0,3.4061580223010424e-09,1.969567176018927e-09 +state_bridge,5000,1,1e-06,0.0,3.4061580223010424e-09,1.969567176018927e-09 +state_bridge,5000,1,1e-05,0.0,3.4061580223010424e-09,1.969567176018927e-09 +state_bridge,5000,1,0.0001,0.0,3.4061580223010424e-09,1.969567176018927e-09 +state_bridge,5000,1,0.001,0.0,3.4061580223010424e-09,1.969567176018927e-09 +state_bridge,5000,2,1e-08,0.0,2.0902392317001528e-10,1.7718780609410345e-10 +state_bridge,5000,2,1e-07,0.0,2.0902392317001528e-10,1.7718780609410345e-10 +state_bridge,5000,2,1e-06,0.0,2.0902392317001528e-10,1.7718780609410345e-10 +state_bridge,5000,2,1e-05,0.0,2.0902392317001528e-10,1.7718780609410345e-10 +state_bridge,5000,2,0.0001,0.0,2.0902392317001528e-10,1.7718780609410345e-10 +state_bridge,5000,2,0.001,0.0,2.0902392317001528e-10,1.7718780609410345e-10 +state_bridge,5000,3,1e-08,0.0,2.038432478368435e-10,1.7670918894818755e-10 +state_bridge,5000,3,1e-07,0.0,2.038432478368435e-10,1.7670918894818755e-10 +state_bridge,5000,3,1e-06,0.0,2.038432478368435e-10,1.7670918894818755e-10 +state_bridge,5000,3,1e-05,0.0,2.038432478368435e-10,1.7670918894818755e-10 +state_bridge,5000,3,0.0001,0.0,2.038432478368435e-10,1.7670918894818755e-10 +state_bridge,5000,3,0.001,0.0,2.038432478368435e-10,1.7670918894818755e-10 +state_bridge,6000,0,1e-08,1.0,2.269962351419963e-06,1.216433815898199e-06 +state_bridge,6000,0,1e-07,0.9892578125,2.269962351419963e-06,1.216433815898199e-06 +state_bridge,6000,0,1e-06,0.55078125,2.269962351419963e-06,1.216433815898199e-06 +state_bridge,6000,0,1e-05,0.0322265625,2.269962351419963e-06,1.216433815898199e-06 +state_bridge,6000,0,0.0001,0.0,2.269962351419963e-06,1.216433815898199e-06 +state_bridge,6000,0,0.001,0.0,2.269962351419963e-06,1.216433815898199e-06 +state_bridge,6000,1,1e-08,0.001953125,1.0463097055435355e-09,5.961666715847969e-10 +state_bridge,6000,1,1e-07,0.0,1.0463097055435355e-09,5.961666715847969e-10 +state_bridge,6000,1,1e-06,0.0,1.0463097055435355e-09,5.961666715847969e-10 +state_bridge,6000,1,1e-05,0.0,1.0463097055435355e-09,5.961666715847969e-10 +state_bridge,6000,1,0.0001,0.0,1.0463097055435355e-09,5.961666715847969e-10 +state_bridge,6000,1,0.001,0.0,1.0463097055435355e-09,5.961666715847969e-10 +state_bridge,6000,2,1e-08,0.0,2.0832731373321423e-10,1.793355047796652e-10 +state_bridge,6000,2,1e-07,0.0,2.0832731373321423e-10,1.793355047796652e-10 +state_bridge,6000,2,1e-06,0.0,2.0832731373321423e-10,1.793355047796652e-10 +state_bridge,6000,2,1e-05,0.0,2.0832731373321423e-10,1.793355047796652e-10 +state_bridge,6000,2,0.0001,0.0,2.0832731373321423e-10,1.793355047796652e-10 +state_bridge,6000,2,0.001,0.0,2.0832731373321423e-10,1.793355047796652e-10 +state_bridge,6000,3,1e-08,0.0,2.0960241875478403e-10,1.7990194056682896e-10 +state_bridge,6000,3,1e-07,0.0,2.0960241875478403e-10,1.7990194056682896e-10 +state_bridge,6000,3,1e-06,0.0,2.0960241875478403e-10,1.7990194056682896e-10 +state_bridge,6000,3,1e-05,0.0,2.0960241875478403e-10,1.7990194056682896e-10 +state_bridge,6000,3,0.0001,0.0,2.0960241875478403e-10,1.7990194056682896e-10 +state_bridge,6000,3,0.001,0.0,2.0960241875478403e-10,1.7990194056682896e-10 +credit_bridge,42,0,1e-08,0.982421875,1.573595085346824e-07,9.742006312762896e-08 +credit_bridge,42,0,1e-07,0.4921875,1.573595085346824e-07,9.742006312762896e-08 +credit_bridge,42,0,1e-06,0.0048828125,1.573595085346824e-07,9.742006312762896e-08 +credit_bridge,42,0,1e-05,0.0,1.573595085346824e-07,9.742006312762896e-08 +credit_bridge,42,0,0.0001,0.0,1.573595085346824e-07,9.742006312762896e-08 +credit_bridge,42,0,0.001,0.0,1.573595085346824e-07,9.742006312762896e-08 +credit_bridge,42,1,1e-08,0.0,1.8079358843348103e-10,1.3712213309258203e-10 +credit_bridge,42,1,1e-07,0.0,1.8079358843348103e-10,1.3712213309258203e-10 +credit_bridge,42,1,1e-06,0.0,1.8079358843348103e-10,1.3712213309258203e-10 +credit_bridge,42,1,1e-05,0.0,1.8079358843348103e-10,1.3712213309258203e-10 +credit_bridge,42,1,0.0001,0.0,1.8079358843348103e-10,1.3712213309258203e-10 +credit_bridge,42,1,0.001,0.0,1.8079358843348103e-10,1.3712213309258203e-10 +credit_bridge,42,2,1e-08,0.0,1.2228654200363565e-10,1.16817375217515e-10 +credit_bridge,42,2,1e-07,0.0,1.2228654200363565e-10,1.16817375217515e-10 +credit_bridge,42,2,1e-06,0.0,1.2228654200363565e-10,1.16817375217515e-10 +credit_bridge,42,2,1e-05,0.0,1.2228654200363565e-10,1.16817375217515e-10 +credit_bridge,42,2,0.0001,0.0,1.2228654200363565e-10,1.16817375217515e-10 +credit_bridge,42,2,0.001,0.0,1.2228654200363565e-10,1.16817375217515e-10 +credit_bridge,42,3,1e-08,0.0,1.2209952493513754e-10,1.168843077881121e-10 +credit_bridge,42,3,1e-07,0.0,1.2209952493513754e-10,1.168843077881121e-10 +credit_bridge,42,3,1e-06,0.0,1.2209952493513754e-10,1.168843077881121e-10 +credit_bridge,42,3,1e-05,0.0,1.2209952493513754e-10,1.168843077881121e-10 +credit_bridge,42,3,0.0001,0.0,1.2209952493513754e-10,1.168843077881121e-10 +credit_bridge,42,3,0.001,0.0,1.2209952493513754e-10,1.168843077881121e-10 +credit_bridge,123,0,1e-08,1.0,1.822186845856777e-07,1.3197313819546252e-07 +credit_bridge,123,0,1e-07,0.6630859375,1.822186845856777e-07,1.3197313819546252e-07 +credit_bridge,123,0,1e-06,0.0087890625,1.822186845856777e-07,1.3197313819546252e-07 +credit_bridge,123,0,1e-05,0.0,1.822186845856777e-07,1.3197313819546252e-07 +credit_bridge,123,0,0.0001,0.0,1.822186845856777e-07,1.3197313819546252e-07 +credit_bridge,123,0,0.001,0.0,1.822186845856777e-07,1.3197313819546252e-07 +credit_bridge,123,1,1e-08,0.0,5.901329425128665e-10,5.348693710161001e-10 +credit_bridge,123,1,1e-07,0.0,5.901329425128665e-10,5.348693710161001e-10 +credit_bridge,123,1,1e-06,0.0,5.901329425128665e-10,5.348693710161001e-10 +credit_bridge,123,1,1e-05,0.0,5.901329425128665e-10,5.348693710161001e-10 +credit_bridge,123,1,0.0001,0.0,5.901329425128665e-10,5.348693710161001e-10 +credit_bridge,123,1,0.001,0.0,5.901329425128665e-10,5.348693710161001e-10 +credit_bridge,123,2,1e-08,0.0,5.687246784624733e-10,5.182918538793047e-10 +credit_bridge,123,2,1e-07,0.0,5.687246784624733e-10,5.182918538793047e-10 +credit_bridge,123,2,1e-06,0.0,5.687246784624733e-10,5.182918538793047e-10 +credit_bridge,123,2,1e-05,0.0,5.687246784624733e-10,5.182918538793047e-10 +credit_bridge,123,2,0.0001,0.0,5.687246784624733e-10,5.182918538793047e-10 +credit_bridge,123,2,0.001,0.0,5.687246784624733e-10,5.182918538793047e-10 +credit_bridge,123,3,1e-08,0.0,5.659206436803288e-10,5.167046790433005e-10 +credit_bridge,123,3,1e-07,0.0,5.659206436803288e-10,5.167046790433005e-10 +credit_bridge,123,3,1e-06,0.0,5.659206436803288e-10,5.167046790433005e-10 +credit_bridge,123,3,1e-05,0.0,5.659206436803288e-10,5.167046790433005e-10 +credit_bridge,123,3,0.0001,0.0,5.659206436803288e-10,5.167046790433005e-10 +credit_bridge,123,3,0.001,0.0,5.659206436803288e-10,5.167046790433005e-10 +credit_bridge,456,0,1e-08,1.0,1.1763398788389168e-07,8.743072044126166e-08 +credit_bridge,456,0,1e-07,0.43359375,1.1763398788389168e-07,8.743072044126166e-08 +credit_bridge,456,0,1e-06,0.0,1.1763398788389168e-07,8.743072044126166e-08 +credit_bridge,456,0,1e-05,0.0,1.1763398788389168e-07,8.743072044126166e-08 +credit_bridge,456,0,0.0001,0.0,1.1763398788389168e-07,8.743072044126166e-08 +credit_bridge,456,0,0.001,0.0,1.1763398788389168e-07,8.743072044126166e-08 +credit_bridge,456,1,1e-08,0.0,3.321813102363791e-10,3.178909635526139e-10 +credit_bridge,456,1,1e-07,0.0,3.321813102363791e-10,3.178909635526139e-10 +credit_bridge,456,1,1e-06,0.0,3.321813102363791e-10,3.178909635526139e-10 +credit_bridge,456,1,1e-05,0.0,3.321813102363791e-10,3.178909635526139e-10 +credit_bridge,456,1,0.0001,0.0,3.321813102363791e-10,3.178909635526139e-10 +credit_bridge,456,1,0.001,0.0,3.321813102363791e-10,3.178909635526139e-10 +credit_bridge,456,2,1e-08,0.0,3.2246236236765924e-10,3.0897787106631824e-10 +credit_bridge,456,2,1e-07,0.0,3.2246236236765924e-10,3.0897787106631824e-10 +credit_bridge,456,2,1e-06,0.0,3.2246236236765924e-10,3.0897787106631824e-10 +credit_bridge,456,2,1e-05,0.0,3.2246236236765924e-10,3.0897787106631824e-10 +credit_bridge,456,2,0.0001,0.0,3.2246236236765924e-10,3.0897787106631824e-10 +credit_bridge,456,2,0.001,0.0,3.2246236236765924e-10,3.0897787106631824e-10 +credit_bridge,456,3,1e-08,0.0,3.219113864361134e-10,3.0849234278207405e-10 +credit_bridge,456,3,1e-07,0.0,3.219113864361134e-10,3.0849234278207405e-10 +credit_bridge,456,3,1e-06,0.0,3.219113864361134e-10,3.0849234278207405e-10 +credit_bridge,456,3,1e-05,0.0,3.219113864361134e-10,3.0849234278207405e-10 +credit_bridge,456,3,0.0001,0.0,3.219113864361134e-10,3.0849234278207405e-10 +credit_bridge,456,3,0.001,0.0,3.219113864361134e-10,3.0849234278207405e-10 +credit_bridge,789,0,1e-08,0.9970703125,1.2130860227443918e-07,9.41449300739805e-08 +credit_bridge,789,0,1e-07,0.46484375,1.2130860227443918e-07,9.41449300739805e-08 +credit_bridge,789,0,1e-06,0.0,1.2130860227443918e-07,9.41449300739805e-08 +credit_bridge,789,0,1e-05,0.0,1.2130860227443918e-07,9.41449300739805e-08 +credit_bridge,789,0,0.0001,0.0,1.2130860227443918e-07,9.41449300739805e-08 +credit_bridge,789,0,0.001,0.0,1.2130860227443918e-07,9.41449300739805e-08 +credit_bridge,789,1,1e-08,0.0,2.2500852570050967e-10,2.085357719838754e-10 +credit_bridge,789,1,1e-07,0.0,2.2500852570050967e-10,2.085357719838754e-10 +credit_bridge,789,1,1e-06,0.0,2.2500852570050967e-10,2.085357719838754e-10 +credit_bridge,789,1,1e-05,0.0,2.2500852570050967e-10,2.085357719838754e-10 +credit_bridge,789,1,0.0001,0.0,2.2500852570050967e-10,2.085357719838754e-10 +credit_bridge,789,1,0.001,0.0,2.2500852570050967e-10,2.085357719838754e-10 +credit_bridge,789,2,1e-08,0.0,2.1138567285472476e-10,2.072469834635271e-10 +credit_bridge,789,2,1e-07,0.0,2.1138567285472476e-10,2.072469834635271e-10 +credit_bridge,789,2,1e-06,0.0,2.1138567285472476e-10,2.072469834635271e-10 +credit_bridge,789,2,1e-05,0.0,2.1138567285472476e-10,2.072469834635271e-10 +credit_bridge,789,2,0.0001,0.0,2.1138567285472476e-10,2.072469834635271e-10 +credit_bridge,789,2,0.001,0.0,2.1138567285472476e-10,2.072469834635271e-10 +credit_bridge,789,3,1e-08,0.0,2.1107138259424119e-10,2.0760486385551502e-10 +credit_bridge,789,3,1e-07,0.0,2.1107138259424119e-10,2.0760486385551502e-10 +credit_bridge,789,3,1e-06,0.0,2.1107138259424119e-10,2.0760486385551502e-10 +credit_bridge,789,3,1e-05,0.0,2.1107138259424119e-10,2.0760486385551502e-10 +credit_bridge,789,3,0.0001,0.0,2.1107138259424119e-10,2.0760486385551502e-10 +credit_bridge,789,3,0.001,0.0,2.1107138259424119e-10,2.0760486385551502e-10 +credit_bridge,1024,0,1e-08,1.0,1.4595693187402503e-07,1.1624652529462765e-07 +credit_bridge,1024,0,1e-07,0.572265625,1.4595693187402503e-07,1.1624652529462765e-07 +credit_bridge,1024,0,1e-06,0.0009765625,1.4595693187402503e-07,1.1624652529462765e-07 +credit_bridge,1024,0,1e-05,0.0,1.4595693187402503e-07,1.1624652529462765e-07 +credit_bridge,1024,0,0.0001,0.0,1.4595693187402503e-07,1.1624652529462765e-07 +credit_bridge,1024,0,0.001,0.0,1.4595693187402503e-07,1.1624652529462765e-07 +credit_bridge,1024,1,1e-08,0.0,4.4246256658553307e-10,4.2227771279712556e-10 +credit_bridge,1024,1,1e-07,0.0,4.4246256658553307e-10,4.2227771279712556e-10 +credit_bridge,1024,1,1e-06,0.0,4.4246256658553307e-10,4.2227771279712556e-10 +credit_bridge,1024,1,1e-05,0.0,4.4246256658553307e-10,4.2227771279712556e-10 +credit_bridge,1024,1,0.0001,0.0,4.4246256658553307e-10,4.2227771279712556e-10 +credit_bridge,1024,1,0.001,0.0,4.4246256658553307e-10,4.2227771279712556e-10 +credit_bridge,1024,2,1e-08,0.0,4.371256134838575e-10,4.1471998057929227e-10 +credit_bridge,1024,2,1e-07,0.0,4.371256134838575e-10,4.1471998057929227e-10 +credit_bridge,1024,2,1e-06,0.0,4.371256134838575e-10,4.1471998057929227e-10 +credit_bridge,1024,2,1e-05,0.0,4.371256134838575e-10,4.1471998057929227e-10 +credit_bridge,1024,2,0.0001,0.0,4.371256134838575e-10,4.1471998057929227e-10 +credit_bridge,1024,2,0.001,0.0,4.371256134838575e-10,4.1471998057929227e-10 +credit_bridge,1024,3,1e-08,0.0,4.3731454568707306e-10,4.1535089256861113e-10 +credit_bridge,1024,3,1e-07,0.0,4.3731454568707306e-10,4.1535089256861113e-10 +credit_bridge,1024,3,1e-06,0.0,4.3731454568707306e-10,4.1535089256861113e-10 +credit_bridge,1024,3,1e-05,0.0,4.3731454568707306e-10,4.1535089256861113e-10 +credit_bridge,1024,3,0.0001,0.0,4.3731454568707306e-10,4.1535089256861113e-10 +credit_bridge,1024,3,0.001,0.0,4.3731454568707306e-10,4.1535089256861113e-10 +credit_bridge,2048,0,1e-08,1.0,1.074129869493845e-07,9.11462194608248e-08 +credit_bridge,2048,0,1e-07,0.4453125,1.074129869493845e-07,9.11462194608248e-08 +credit_bridge,2048,0,1e-06,0.0,1.074129869493845e-07,9.11462194608248e-08 +credit_bridge,2048,0,1e-05,0.0,1.074129869493845e-07,9.11462194608248e-08 +credit_bridge,2048,0,0.0001,0.0,1.074129869493845e-07,9.11462194608248e-08 +credit_bridge,2048,0,0.001,0.0,1.074129869493845e-07,9.11462194608248e-08 +credit_bridge,2048,1,1e-08,0.0,2.5469237829867097e-10,2.5587329477438914e-10 +credit_bridge,2048,1,1e-07,0.0,2.5469237829867097e-10,2.5587329477438914e-10 +credit_bridge,2048,1,1e-06,0.0,2.5469237829867097e-10,2.5587329477438914e-10 +credit_bridge,2048,1,1e-05,0.0,2.5469237829867097e-10,2.5587329477438914e-10 +credit_bridge,2048,1,0.0001,0.0,2.5469237829867097e-10,2.5587329477438914e-10 +credit_bridge,2048,1,0.001,0.0,2.5469237829867097e-10,2.5587329477438914e-10 +credit_bridge,2048,2,1e-08,0.0,2.5126389857632603e-10,2.5415392013172777e-10 +credit_bridge,2048,2,1e-07,0.0,2.5126389857632603e-10,2.5415392013172777e-10 +credit_bridge,2048,2,1e-06,0.0,2.5126389857632603e-10,2.5415392013172777e-10 +credit_bridge,2048,2,1e-05,0.0,2.5126389857632603e-10,2.5415392013172777e-10 +credit_bridge,2048,2,0.0001,0.0,2.5126389857632603e-10,2.5415392013172777e-10 +credit_bridge,2048,2,0.001,0.0,2.5126389857632603e-10,2.5415392013172777e-10 +credit_bridge,2048,3,1e-08,0.0,2.5130866831979404e-10,2.541315768933572e-10 +credit_bridge,2048,3,1e-07,0.0,2.5130866831979404e-10,2.541315768933572e-10 +credit_bridge,2048,3,1e-06,0.0,2.5130866831979404e-10,2.541315768933572e-10 +credit_bridge,2048,3,1e-05,0.0,2.5130866831979404e-10,2.541315768933572e-10 +credit_bridge,2048,3,0.0001,0.0,2.5130866831979404e-10,2.541315768933572e-10 +credit_bridge,2048,3,0.001,0.0,2.5130866831979404e-10,2.541315768933572e-10 +credit_bridge,3000,0,1e-08,0.9990234375,1.4798638403590303e-07,1.137780429871782e-07 +credit_bridge,3000,0,1e-07,0.556640625,1.4798638403590303e-07,1.137780429871782e-07 +credit_bridge,3000,0,1e-06,0.0009765625,1.4798638403590303e-07,1.137780429871782e-07 +credit_bridge,3000,0,1e-05,0.0,1.4798638403590303e-07,1.137780429871782e-07 +credit_bridge,3000,0,0.0001,0.0,1.4798638403590303e-07,1.137780429871782e-07 +credit_bridge,3000,0,0.001,0.0,1.4798638403590303e-07,1.137780429871782e-07 +credit_bridge,3000,1,1e-08,0.0,1.8992001027395844e-10,1.6869838859179254e-10 +credit_bridge,3000,1,1e-07,0.0,1.8992001027395844e-10,1.6869838859179254e-10 +credit_bridge,3000,1,1e-06,0.0,1.8992001027395844e-10,1.6869838859179254e-10 +credit_bridge,3000,1,1e-05,0.0,1.8992001027395844e-10,1.6869838859179254e-10 +credit_bridge,3000,1,0.0001,0.0,1.8992001027395844e-10,1.6869838859179254e-10 +credit_bridge,3000,1,0.001,0.0,1.8992001027395844e-10,1.6869838859179254e-10 +credit_bridge,3000,2,1e-08,0.0,1.7987969447297303e-10,1.6722193074691916e-10 +credit_bridge,3000,2,1e-07,0.0,1.7987969447297303e-10,1.6722193074691916e-10 +credit_bridge,3000,2,1e-06,0.0,1.7987969447297303e-10,1.6722193074691916e-10 +credit_bridge,3000,2,1e-05,0.0,1.7987969447297303e-10,1.6722193074691916e-10 +credit_bridge,3000,2,0.0001,0.0,1.7987969447297303e-10,1.6722193074691916e-10 +credit_bridge,3000,2,0.001,0.0,1.7987969447297303e-10,1.6722193074691916e-10 +credit_bridge,3000,3,1e-08,0.0,1.8002110913073466e-10,1.6753128051494315e-10 +credit_bridge,3000,3,1e-07,0.0,1.8002110913073466e-10,1.6753128051494315e-10 +credit_bridge,3000,3,1e-06,0.0,1.8002110913073466e-10,1.6753128051494315e-10 +credit_bridge,3000,3,1e-05,0.0,1.8002110913073466e-10,1.6753128051494315e-10 +credit_bridge,3000,3,0.0001,0.0,1.8002110913073466e-10,1.6753128051494315e-10 +credit_bridge,3000,3,0.001,0.0,1.8002110913073466e-10,1.6753128051494315e-10 +credit_bridge,4000,0,1e-08,0.9814453125,1.2629469381408853e-07,9.372890019676561e-08 +credit_bridge,4000,0,1e-07,0.4755859375,1.2629469381408853e-07,9.372890019676561e-08 +credit_bridge,4000,0,1e-06,0.0,1.2629469381408853e-07,9.372890019676561e-08 +credit_bridge,4000,0,1e-05,0.0,1.2629469381408853e-07,9.372890019676561e-08 +credit_bridge,4000,0,0.0001,0.0,1.2629469381408853e-07,9.372890019676561e-08 +credit_bridge,4000,0,0.001,0.0,1.2629469381408853e-07,9.372890019676561e-08 +credit_bridge,4000,1,1e-08,0.0,1.9080659274806067e-10,1.8736633078386689e-10 +credit_bridge,4000,1,1e-07,0.0,1.9080659274806067e-10,1.8736633078386689e-10 +credit_bridge,4000,1,1e-06,0.0,1.9080659274806067e-10,1.8736633078386689e-10 +credit_bridge,4000,1,1e-05,0.0,1.9080659274806067e-10,1.8736633078386689e-10 +credit_bridge,4000,1,0.0001,0.0,1.9080659274806067e-10,1.8736633078386689e-10 +credit_bridge,4000,1,0.001,0.0,1.9080659274806067e-10,1.8736633078386689e-10 +credit_bridge,4000,2,1e-08,0.0,1.887861811322722e-10,1.857383552517078e-10 +credit_bridge,4000,2,1e-07,0.0,1.887861811322722e-10,1.857383552517078e-10 +credit_bridge,4000,2,1e-06,0.0,1.887861811322722e-10,1.857383552517078e-10 +credit_bridge,4000,2,1e-05,0.0,1.887861811322722e-10,1.857383552517078e-10 +credit_bridge,4000,2,0.0001,0.0,1.887861811322722e-10,1.857383552517078e-10 +credit_bridge,4000,2,0.001,0.0,1.887861811322722e-10,1.857383552517078e-10 +credit_bridge,4000,3,1e-08,0.0,1.8857371220093455e-10,1.8558354852871162e-10 +credit_bridge,4000,3,1e-07,0.0,1.8857371220093455e-10,1.8558354852871162e-10 +credit_bridge,4000,3,1e-06,0.0,1.8857371220093455e-10,1.8558354852871162e-10 +credit_bridge,4000,3,1e-05,0.0,1.8857371220093455e-10,1.8558354852871162e-10 +credit_bridge,4000,3,0.0001,0.0,1.8857371220093455e-10,1.8558354852871162e-10 +credit_bridge,4000,3,0.001,0.0,1.8857371220093455e-10,1.8558354852871162e-10 +credit_bridge,5000,0,1e-08,0.9951171875,1.2024895568174543e-07,9.053461980101929e-08 +credit_bridge,5000,0,1e-07,0.455078125,1.2024895568174543e-07,9.053461980101929e-08 +credit_bridge,5000,0,1e-06,0.0009765625,1.2024895568174543e-07,9.053461980101929e-08 +credit_bridge,5000,0,1e-05,0.0,1.2024895568174543e-07,9.053461980101929e-08 +credit_bridge,5000,0,0.0001,0.0,1.2024895568174543e-07,9.053461980101929e-08 +credit_bridge,5000,0,0.001,0.0,1.2024895568174543e-07,9.053461980101929e-08 +credit_bridge,5000,1,1e-08,0.0,1.5791068452841728e-10,1.4876434806243566e-10 +credit_bridge,5000,1,1e-07,0.0,1.5791068452841728e-10,1.4876434806243566e-10 +credit_bridge,5000,1,1e-06,0.0,1.5791068452841728e-10,1.4876434806243566e-10 +credit_bridge,5000,1,1e-05,0.0,1.5791068452841728e-10,1.4876434806243566e-10 +credit_bridge,5000,1,0.0001,0.0,1.5791068452841728e-10,1.4876434806243566e-10 +credit_bridge,5000,1,0.001,0.0,1.5791068452841728e-10,1.4876434806243566e-10 +credit_bridge,5000,2,1e-08,0.0,1.5668744079988528e-10,1.4798093306289672e-10 +credit_bridge,5000,2,1e-07,0.0,1.5668744079988528e-10,1.4798093306289672e-10 +credit_bridge,5000,2,1e-06,0.0,1.5668744079988528e-10,1.4798093306289672e-10 +credit_bridge,5000,2,1e-05,0.0,1.5668744079988528e-10,1.4798093306289672e-10 +credit_bridge,5000,2,0.0001,0.0,1.5668744079988528e-10,1.4798093306289672e-10 +credit_bridge,5000,2,0.001,0.0,1.5668744079988528e-10,1.4798093306289672e-10 +credit_bridge,5000,3,1e-08,0.0,1.5554743604262455e-10,1.4748766097305577e-10 +credit_bridge,5000,3,1e-07,0.0,1.5554743604262455e-10,1.4748766097305577e-10 +credit_bridge,5000,3,1e-06,0.0,1.5554743604262455e-10,1.4748766097305577e-10 +credit_bridge,5000,3,1e-05,0.0,1.5554743604262455e-10,1.4748766097305577e-10 +credit_bridge,5000,3,0.0001,0.0,1.5554743604262455e-10,1.4748766097305577e-10 +credit_bridge,5000,3,0.001,0.0,1.5554743604262455e-10,1.4748766097305577e-10 +credit_bridge,6000,0,1e-08,0.99609375,9.945837575742189e-08,7.272087998444476e-08 +credit_bridge,6000,0,1e-07,0.359375,9.945837575742189e-08,7.272087998444476e-08 +credit_bridge,6000,0,1e-06,0.0,9.945837575742189e-08,7.272087998444476e-08 +credit_bridge,6000,0,1e-05,0.0,9.945837575742189e-08,7.272087998444476e-08 +credit_bridge,6000,0,0.0001,0.0,9.945837575742189e-08,7.272087998444476e-08 +credit_bridge,6000,0,0.001,0.0,9.945837575742189e-08,7.272087998444476e-08 +credit_bridge,6000,1,1e-08,0.0,2.8420565900688644e-10,2.7506663613507953e-10 +credit_bridge,6000,1,1e-07,0.0,2.8420565900688644e-10,2.7506663613507953e-10 +credit_bridge,6000,1,1e-06,0.0,2.8420565900688644e-10,2.7506663613507953e-10 +credit_bridge,6000,1,1e-05,0.0,2.8420565900688644e-10,2.7506663613507953e-10 +credit_bridge,6000,1,0.0001,0.0,2.8420565900688644e-10,2.7506663613507953e-10 +credit_bridge,6000,1,0.001,0.0,2.8420565900688644e-10,2.7506663613507953e-10 +credit_bridge,6000,2,1e-08,0.0,2.7818530812240283e-10,2.701625589907053e-10 +credit_bridge,6000,2,1e-07,0.0,2.7818530812240283e-10,2.701625589907053e-10 +credit_bridge,6000,2,1e-06,0.0,2.7818530812240283e-10,2.701625589907053e-10 +credit_bridge,6000,2,1e-05,0.0,2.7818530812240283e-10,2.701625589907053e-10 +credit_bridge,6000,2,0.0001,0.0,2.7818530812240283e-10,2.701625589907053e-10 +credit_bridge,6000,2,0.001,0.0,2.7818530812240283e-10,2.701625589907053e-10 +credit_bridge,6000,3,1e-08,0.0,2.789828368321423e-10,2.7161273230547067e-10 +credit_bridge,6000,3,1e-07,0.0,2.789828368321423e-10,2.7161273230547067e-10 +credit_bridge,6000,3,1e-06,0.0,2.789828368321423e-10,2.7161273230547067e-10 +credit_bridge,6000,3,1e-05,0.0,2.789828368321423e-10,2.7161273230547067e-10 +credit_bridge,6000,3,0.0001,0.0,2.789828368321423e-10,2.7161273230547067e-10 +credit_bridge,6000,3,0.001,0.0,2.789828368321423e-10,2.7161273230547067e-10 diff --git a/results/confirmatory/T2_support_sparsity_gpu1.csv b/results/confirmatory/T2_support_sparsity_gpu1.csv new file mode 100644 index 0000000..9c30a55 --- /dev/null +++ b/results/confirmatory/T2_support_sparsity_gpu1.csv @@ -0,0 +1,801 @@ +method,seed,layer,threshold,support_fraction,mean_norm,median_norm +bp,42,0,1e-08,0.0,4.731865940743596e-13,4.731865940743596e-13 +bp,42,0,1e-07,0.0,4.731865940743596e-13,4.731865940743596e-13 +bp,42,0,1e-06,0.0,4.731865940743596e-13,4.731865940743596e-13 +bp,42,0,1e-05,0.0,4.731865940743596e-13,4.731865940743596e-13 +bp,42,0,0.0001,0.0,4.731865940743596e-13,4.731865940743596e-13 +bp,42,1,1e-08,0.0,4.724761706008385e-13,4.724761706008385e-13 +bp,42,1,1e-07,0.0,4.724761706008385e-13,4.724761706008385e-13 +bp,42,1,1e-06,0.0,4.724761706008385e-13,4.724761706008385e-13 +bp,42,1,1e-05,0.0,4.724761706008385e-13,4.724761706008385e-13 +bp,42,1,0.0001,0.0,4.724761706008385e-13,4.724761706008385e-13 +bp,42,2,1e-08,0.0,8.05216014850528e-14,8.05216014850528e-14 +bp,42,2,1e-07,0.0,8.05216014850528e-14,8.05216014850528e-14 +bp,42,2,1e-06,0.0,8.05216014850528e-14,8.05216014850528e-14 +bp,42,2,1e-05,0.0,8.05216014850528e-14,8.05216014850528e-14 +bp,42,2,0.0001,0.0,8.05216014850528e-14,8.05216014850528e-14 +bp,42,3,1e-08,0.0,4.5108212412721393e-13,4.5108212412721393e-13 +bp,42,3,1e-07,0.0,4.5108212412721393e-13,4.5108212412721393e-13 +bp,42,3,1e-06,0.0,4.5108212412721393e-13,4.5108212412721393e-13 +bp,42,3,1e-05,0.0,4.5108212412721393e-13,4.5108212412721393e-13 +bp,42,3,0.0001,0.0,4.5108212412721393e-13,4.5108212412721393e-13 +bp,123,0,1e-08,0.0,3.9156500849894804e-13,3.9156500849894804e-13 +bp,123,0,1e-07,0.0,3.9156500849894804e-13,3.9156500849894804e-13 +bp,123,0,1e-06,0.0,3.9156500849894804e-13,3.9156500849894804e-13 +bp,123,0,1e-05,0.0,3.9156500849894804e-13,3.9156500849894804e-13 +bp,123,0,0.0001,0.0,3.9156500849894804e-13,3.9156500849894804e-13 +bp,123,1,1e-08,0.0,3.5110701509816905e-15,3.5110701509816905e-15 +bp,123,1,1e-07,0.0,3.5110701509816905e-15,3.5110701509816905e-15 +bp,123,1,1e-06,0.0,3.5110701509816905e-15,3.5110701509816905e-15 +bp,123,1,1e-05,0.0,3.5110701509816905e-15,3.5110701509816905e-15 +bp,123,1,0.0001,0.0,3.5110701509816905e-15,3.5110701509816905e-15 +bp,123,2,1e-08,0.0,4.893933023587815e-13,4.893933023587815e-13 +bp,123,2,1e-07,0.0,4.893933023587815e-13,4.893933023587815e-13 +bp,123,2,1e-06,0.0,4.893933023587815e-13,4.893933023587815e-13 +bp,123,2,1e-05,0.0,4.893933023587815e-13,4.893933023587815e-13 +bp,123,2,0.0001,0.0,4.893933023587815e-13,4.893933023587815e-13 +bp,123,3,1e-08,0.0,4.69442572922224e-13,4.69442572922224e-13 +bp,123,3,1e-07,0.0,4.69442572922224e-13,4.69442572922224e-13 +bp,123,3,1e-06,0.0,4.69442572922224e-13,4.69442572922224e-13 +bp,123,3,1e-05,0.0,4.69442572922224e-13,4.69442572922224e-13 +bp,123,3,0.0001,0.0,4.69442572922224e-13,4.69442572922224e-13 +bp,456,0,1e-08,0.0,3.285176492819064e-13,3.285176492819064e-13 +bp,456,0,1e-07,0.0,3.285176492819064e-13,3.285176492819064e-13 +bp,456,0,1e-06,0.0,3.285176492819064e-13,3.285176492819064e-13 +bp,456,0,1e-05,0.0,3.285176492819064e-13,3.285176492819064e-13 +bp,456,0,0.0001,0.0,3.285176492819064e-13,3.285176492819064e-13 +bp,456,1,1e-08,0.0,3.928409789306919e-13,3.928409789306919e-13 +bp,456,1,1e-07,0.0,3.928409789306919e-13,3.928409789306919e-13 +bp,456,1,1e-06,0.0,3.928409789306919e-13,3.928409789306919e-13 +bp,456,1,1e-05,0.0,3.928409789306919e-13,3.928409789306919e-13 +bp,456,1,0.0001,0.0,3.928409789306919e-13,3.928409789306919e-13 +bp,456,2,1e-08,0.0,2.4372496208735495e-13,2.4372496208735495e-13 +bp,456,2,1e-07,0.0,2.4372496208735495e-13,2.4372496208735495e-13 +bp,456,2,1e-06,0.0,2.4372496208735495e-13,2.4372496208735495e-13 +bp,456,2,1e-05,0.0,2.4372496208735495e-13,2.4372496208735495e-13 +bp,456,2,0.0001,0.0,2.4372496208735495e-13,2.4372496208735495e-13 +bp,456,3,1e-08,0.0,4.389276756725652e-13,4.389276756725652e-13 +bp,456,3,1e-07,0.0,4.389276756725652e-13,4.389276756725652e-13 +bp,456,3,1e-06,0.0,4.389276756725652e-13,4.389276756725652e-13 +bp,456,3,1e-05,0.0,4.389276756725652e-13,4.389276756725652e-13 +bp,456,3,0.0001,0.0,4.389276756725652e-13,4.389276756725652e-13 +bp,789,0,1e-08,0.0,3.8051492837719303e-13,3.8051492837719303e-13 +bp,789,0,1e-07,0.0,3.8051492837719303e-13,3.8051492837719303e-13 +bp,789,0,1e-06,0.0,3.8051492837719303e-13,3.8051492837719303e-13 +bp,789,0,1e-05,0.0,3.8051492837719303e-13,3.8051492837719303e-13 +bp,789,0,0.0001,0.0,3.8051492837719303e-13,3.8051492837719303e-13 +bp,789,1,1e-08,0.0,3.4288153913375474e-13,3.4288153913375474e-13 +bp,789,1,1e-07,0.0,3.4288153913375474e-13,3.4288153913375474e-13 +bp,789,1,1e-06,0.0,3.4288153913375474e-13,3.4288153913375474e-13 +bp,789,1,1e-05,0.0,3.4288153913375474e-13,3.4288153913375474e-13 +bp,789,1,0.0001,0.0,3.4288153913375474e-13,3.4288153913375474e-13 +bp,789,2,1e-08,0.0,4.883813622610922e-13,4.883813622610922e-13 +bp,789,2,1e-07,0.0,4.883813622610922e-13,4.883813622610922e-13 +bp,789,2,1e-06,0.0,4.883813622610922e-13,4.883813622610922e-13 +bp,789,2,1e-05,0.0,4.883813622610922e-13,4.883813622610922e-13 +bp,789,2,0.0001,0.0,4.883813622610922e-13,4.883813622610922e-13 +bp,789,3,1e-08,0.0,4.0772298189571676e-13,4.0772298189571676e-13 +bp,789,3,1e-07,0.0,4.0772298189571676e-13,4.0772298189571676e-13 +bp,789,3,1e-06,0.0,4.0772298189571676e-13,4.0772298189571676e-13 +bp,789,3,1e-05,0.0,4.0772298189571676e-13,4.0772298189571676e-13 +bp,789,3,0.0001,0.0,4.0772298189571676e-13,4.0772298189571676e-13 +bp,1024,0,1e-08,0.0,2.951636331183227e-13,2.951636331183227e-13 +bp,1024,0,1e-07,0.0,2.951636331183227e-13,2.951636331183227e-13 +bp,1024,0,1e-06,0.0,2.951636331183227e-13,2.951636331183227e-13 +bp,1024,0,1e-05,0.0,2.951636331183227e-13,2.951636331183227e-13 +bp,1024,0,0.0001,0.0,2.951636331183227e-13,2.951636331183227e-13 +bp,1024,1,1e-08,0.0,3.266093992482233e-13,3.266093992482233e-13 +bp,1024,1,1e-07,0.0,3.266093992482233e-13,3.266093992482233e-13 +bp,1024,1,1e-06,0.0,3.266093992482233e-13,3.266093992482233e-13 +bp,1024,1,1e-05,0.0,3.266093992482233e-13,3.266093992482233e-13 +bp,1024,1,0.0001,0.0,3.266093992482233e-13,3.266093992482233e-13 +bp,1024,2,1e-08,0.0,3.021454885333147e-13,3.021454885333147e-13 +bp,1024,2,1e-07,0.0,3.021454885333147e-13,3.021454885333147e-13 +bp,1024,2,1e-06,0.0,3.021454885333147e-13,3.021454885333147e-13 +bp,1024,2,1e-05,0.0,3.021454885333147e-13,3.021454885333147e-13 +bp,1024,2,0.0001,0.0,3.021454885333147e-13,3.021454885333147e-13 +bp,1024,3,1e-08,0.0,3.338237889241591e-13,3.338237889241591e-13 +bp,1024,3,1e-07,0.0,3.338237889241591e-13,3.338237889241591e-13 +bp,1024,3,1e-06,0.0,3.338237889241591e-13,3.338237889241591e-13 +bp,1024,3,1e-05,0.0,3.338237889241591e-13,3.338237889241591e-13 +bp,1024,3,0.0001,0.0,3.338237889241591e-13,3.338237889241591e-13 +bp,2048,0,1e-08,0.0,5.86302599352162e-13,5.86302599352162e-13 +bp,2048,0,1e-07,0.0,5.86302599352162e-13,5.86302599352162e-13 +bp,2048,0,1e-06,0.0,5.86302599352162e-13,5.86302599352162e-13 +bp,2048,0,1e-05,0.0,5.86302599352162e-13,5.86302599352162e-13 +bp,2048,0,0.0001,0.0,5.86302599352162e-13,5.86302599352162e-13 +bp,2048,1,1e-08,0.0,4.492778490818722e-13,4.492778490818722e-13 +bp,2048,1,1e-07,0.0,4.492778490818722e-13,4.492778490818722e-13 +bp,2048,1,1e-06,0.0,4.492778490818722e-13,4.492778490818722e-13 +bp,2048,1,1e-05,0.0,4.492778490818722e-13,4.492778490818722e-13 +bp,2048,1,0.0001,0.0,4.492778490818722e-13,4.492778490818722e-13 +bp,2048,2,1e-08,0.0,5.734980090647823e-13,5.734980090647823e-13 +bp,2048,2,1e-07,0.0,5.734980090647823e-13,5.734980090647823e-13 +bp,2048,2,1e-06,0.0,5.734980090647823e-13,5.734980090647823e-13 +bp,2048,2,1e-05,0.0,5.734980090647823e-13,5.734980090647823e-13 +bp,2048,2,0.0001,0.0,5.734980090647823e-13,5.734980090647823e-13 +bp,2048,3,1e-08,0.0,1.7814421541650222e-13,1.7814421541650222e-13 +bp,2048,3,1e-07,0.0,1.7814421541650222e-13,1.7814421541650222e-13 +bp,2048,3,1e-06,0.0,1.7814421541650222e-13,1.7814421541650222e-13 +bp,2048,3,1e-05,0.0,1.7814421541650222e-13,1.7814421541650222e-13 +bp,2048,3,0.0001,0.0,1.7814421541650222e-13,1.7814421541650222e-13 +bp,3000,0,1e-08,0.0,3.6805094020229967e-13,3.6805094020229967e-13 +bp,3000,0,1e-07,0.0,3.6805094020229967e-13,3.6805094020229967e-13 +bp,3000,0,1e-06,0.0,3.6805094020229967e-13,3.6805094020229967e-13 +bp,3000,0,1e-05,0.0,3.6805094020229967e-13,3.6805094020229967e-13 +bp,3000,0,0.0001,0.0,3.6805094020229967e-13,3.6805094020229967e-13 +bp,3000,1,1e-08,0.0,2.2325122707531758e-13,2.2325122707531758e-13 +bp,3000,1,1e-07,0.0,2.2325122707531758e-13,2.2325122707531758e-13 +bp,3000,1,1e-06,0.0,2.2325122707531758e-13,2.2325122707531758e-13 +bp,3000,1,1e-05,0.0,2.2325122707531758e-13,2.2325122707531758e-13 +bp,3000,1,0.0001,0.0,2.2325122707531758e-13,2.2325122707531758e-13 +bp,3000,2,1e-08,0.0,3.759683807769837e-13,3.759683807769837e-13 +bp,3000,2,1e-07,0.0,3.759683807769837e-13,3.759683807769837e-13 +bp,3000,2,1e-06,0.0,3.759683807769837e-13,3.759683807769837e-13 +bp,3000,2,1e-05,0.0,3.759683807769837e-13,3.759683807769837e-13 +bp,3000,2,0.0001,0.0,3.759683807769837e-13,3.759683807769837e-13 +bp,3000,3,1e-08,0.0,9.53175797839545e-14,9.53175797839545e-14 +bp,3000,3,1e-07,0.0,9.53175797839545e-14,9.53175797839545e-14 +bp,3000,3,1e-06,0.0,9.53175797839545e-14,9.53175797839545e-14 +bp,3000,3,1e-05,0.0,9.53175797839545e-14,9.53175797839545e-14 +bp,3000,3,0.0001,0.0,9.53175797839545e-14,9.53175797839545e-14 +bp,4000,0,1e-08,0.0,3.164588274588709e-13,3.164588274588709e-13 +bp,4000,0,1e-07,0.0,3.164588274588709e-13,3.164588274588709e-13 +bp,4000,0,1e-06,0.0,3.164588274588709e-13,3.164588274588709e-13 +bp,4000,0,1e-05,0.0,3.164588274588709e-13,3.164588274588709e-13 +bp,4000,0,0.0001,0.0,3.164588274588709e-13,3.164588274588709e-13 +bp,4000,1,1e-08,0.0,2.2068578789478238e-13,2.2068578789478238e-13 +bp,4000,1,1e-07,0.0,2.2068578789478238e-13,2.2068578789478238e-13 +bp,4000,1,1e-06,0.0,2.2068578789478238e-13,2.2068578789478238e-13 +bp,4000,1,1e-05,0.0,2.2068578789478238e-13,2.2068578789478238e-13 +bp,4000,1,0.0001,0.0,2.2068578789478238e-13,2.2068578789478238e-13 +bp,4000,2,1e-08,0.0,3.1602102662162124e-13,3.1602102662162124e-13 +bp,4000,2,1e-07,0.0,3.1602102662162124e-13,3.1602102662162124e-13 +bp,4000,2,1e-06,0.0,3.1602102662162124e-13,3.1602102662162124e-13 +bp,4000,2,1e-05,0.0,3.1602102662162124e-13,3.1602102662162124e-13 +bp,4000,2,0.0001,0.0,3.1602102662162124e-13,3.1602102662162124e-13 +bp,4000,3,1e-08,0.0,4.696980109540616e-13,4.696980109540616e-13 +bp,4000,3,1e-07,0.0,4.696980109540616e-13,4.696980109540616e-13 +bp,4000,3,1e-06,0.0,4.696980109540616e-13,4.696980109540616e-13 +bp,4000,3,1e-05,0.0,4.696980109540616e-13,4.696980109540616e-13 +bp,4000,3,0.0001,0.0,4.696980109540616e-13,4.696980109540616e-13 +bp,5000,0,1e-08,0.0,5.047975384052383e-13,5.047975384052383e-13 +bp,5000,0,1e-07,0.0,5.047975384052383e-13,5.047975384052383e-13 +bp,5000,0,1e-06,0.0,5.047975384052383e-13,5.047975384052383e-13 +bp,5000,0,1e-05,0.0,5.047975384052383e-13,5.047975384052383e-13 +bp,5000,0,0.0001,0.0,5.047975384052383e-13,5.047975384052383e-13 +bp,5000,1,1e-08,0.0,6.719673645641522e-13,6.719673645641522e-13 +bp,5000,1,1e-07,0.0,6.719673645641522e-13,6.719673645641522e-13 +bp,5000,1,1e-06,0.0,6.719673645641522e-13,6.719673645641522e-13 +bp,5000,1,1e-05,0.0,6.719673645641522e-13,6.719673645641522e-13 +bp,5000,1,0.0001,0.0,6.719673645641522e-13,6.719673645641522e-13 +bp,5000,2,1e-08,0.0,8.080094210903555e-13,8.080094210903555e-13 +bp,5000,2,1e-07,0.0,8.080094210903555e-13,8.080094210903555e-13 +bp,5000,2,1e-06,0.0,8.080094210903555e-13,8.080094210903555e-13 +bp,5000,2,1e-05,0.0,8.080094210903555e-13,8.080094210903555e-13 +bp,5000,2,0.0001,0.0,8.080094210903555e-13,8.080094210903555e-13 +bp,5000,3,1e-08,0.0,7.165152802676711e-13,7.165152802676711e-13 +bp,5000,3,1e-07,0.0,7.165152802676711e-13,7.165152802676711e-13 +bp,5000,3,1e-06,0.0,7.165152802676711e-13,7.165152802676711e-13 +bp,5000,3,1e-05,0.0,7.165152802676711e-13,7.165152802676711e-13 +bp,5000,3,0.0001,0.0,7.165152802676711e-13,7.165152802676711e-13 +bp,6000,0,1e-08,0.0,2.982623371373949e-13,2.982623371373949e-13 +bp,6000,0,1e-07,0.0,2.982623371373949e-13,2.982623371373949e-13 +bp,6000,0,1e-06,0.0,2.982623371373949e-13,2.982623371373949e-13 +bp,6000,0,1e-05,0.0,2.982623371373949e-13,2.982623371373949e-13 +bp,6000,0,0.0001,0.0,2.982623371373949e-13,2.982623371373949e-13 +bp,6000,1,1e-08,0.0,3.9399871711552625e-13,3.9399871711552625e-13 +bp,6000,1,1e-07,0.0,3.9399871711552625e-13,3.9399871711552625e-13 +bp,6000,1,1e-06,0.0,3.9399871711552625e-13,3.9399871711552625e-13 +bp,6000,1,1e-05,0.0,3.9399871711552625e-13,3.9399871711552625e-13 +bp,6000,1,0.0001,0.0,3.9399871711552625e-13,3.9399871711552625e-13 +bp,6000,2,1e-08,0.0,3.59752836244856e-13,3.59752836244856e-13 +bp,6000,2,1e-07,0.0,3.59752836244856e-13,3.59752836244856e-13 +bp,6000,2,1e-06,0.0,3.59752836244856e-13,3.59752836244856e-13 +bp,6000,2,1e-05,0.0,3.59752836244856e-13,3.59752836244856e-13 +bp,6000,2,0.0001,0.0,3.59752836244856e-13,3.59752836244856e-13 +bp,6000,3,1e-08,0.0,3.8347810712470454e-13,3.8347810712470454e-13 +bp,6000,3,1e-07,0.0,3.8347810712470454e-13,3.8347810712470454e-13 +bp,6000,3,1e-06,0.0,3.8347810712470454e-13,3.8347810712470454e-13 +bp,6000,3,1e-05,0.0,3.8347810712470454e-13,3.8347810712470454e-13 +bp,6000,3,0.0001,0.0,3.8347810712470454e-13,3.8347810712470454e-13 +dfa,42,0,1e-08,0.0,4.532996767119164e-15,4.532996767119164e-15 +dfa,42,0,1e-07,0.0,4.532996767119164e-15,4.532996767119164e-15 +dfa,42,0,1e-06,0.0,4.532996767119164e-15,4.532996767119164e-15 +dfa,42,0,1e-05,0.0,4.532996767119164e-15,4.532996767119164e-15 +dfa,42,0,0.0001,0.0,4.532996767119164e-15,4.532996767119164e-15 +dfa,42,1,1e-08,0.0,8.351995495653005e-18,8.351995495653005e-18 +dfa,42,1,1e-07,0.0,8.351995495653005e-18,8.351995495653005e-18 +dfa,42,1,1e-06,0.0,8.351995495653005e-18,8.351995495653005e-18 +dfa,42,1,1e-05,0.0,8.351995495653005e-18,8.351995495653005e-18 +dfa,42,1,0.0001,0.0,8.351995495653005e-18,8.351995495653005e-18 +dfa,42,2,1e-08,0.0,7.555760536996199e-18,7.555760536996199e-18 +dfa,42,2,1e-07,0.0,7.555760536996199e-18,7.555760536996199e-18 +dfa,42,2,1e-06,0.0,7.555760536996199e-18,7.555760536996199e-18 +dfa,42,2,1e-05,0.0,7.555760536996199e-18,7.555760536996199e-18 +dfa,42,2,0.0001,0.0,7.555760536996199e-18,7.555760536996199e-18 +dfa,42,3,1e-08,0.0,5.600560754139814e-18,5.600560754139814e-18 +dfa,42,3,1e-07,0.0,5.600560754139814e-18,5.600560754139814e-18 +dfa,42,3,1e-06,0.0,5.600560754139814e-18,5.600560754139814e-18 +dfa,42,3,1e-05,0.0,5.600560754139814e-18,5.600560754139814e-18 +dfa,42,3,0.0001,0.0,5.600560754139814e-18,5.600560754139814e-18 +dfa,123,0,1e-08,0.0,3.818720140720978e-15,3.818720140720978e-15 +dfa,123,0,1e-07,0.0,3.818720140720978e-15,3.818720140720978e-15 +dfa,123,0,1e-06,0.0,3.818720140720978e-15,3.818720140720978e-15 +dfa,123,0,1e-05,0.0,3.818720140720978e-15,3.818720140720978e-15 +dfa,123,0,0.0001,0.0,3.818720140720978e-15,3.818720140720978e-15 +dfa,123,1,1e-08,0.0,6.4485875589000965e-18,6.4485875589000965e-18 +dfa,123,1,1e-07,0.0,6.4485875589000965e-18,6.4485875589000965e-18 +dfa,123,1,1e-06,0.0,6.4485875589000965e-18,6.4485875589000965e-18 +dfa,123,1,1e-05,0.0,6.4485875589000965e-18,6.4485875589000965e-18 +dfa,123,1,0.0001,0.0,6.4485875589000965e-18,6.4485875589000965e-18 +dfa,123,2,1e-08,0.0,6.893900241668019e-18,6.893900241668019e-18 +dfa,123,2,1e-07,0.0,6.893900241668019e-18,6.893900241668019e-18 +dfa,123,2,1e-06,0.0,6.893900241668019e-18,6.893900241668019e-18 +dfa,123,2,1e-05,0.0,6.893900241668019e-18,6.893900241668019e-18 +dfa,123,2,0.0001,0.0,6.893900241668019e-18,6.893900241668019e-18 +dfa,123,3,1e-08,0.0,6.084968060608524e-18,6.084968060608524e-18 +dfa,123,3,1e-07,0.0,6.084968060608524e-18,6.084968060608524e-18 +dfa,123,3,1e-06,0.0,6.084968060608524e-18,6.084968060608524e-18 +dfa,123,3,1e-05,0.0,6.084968060608524e-18,6.084968060608524e-18 +dfa,123,3,0.0001,0.0,6.084968060608524e-18,6.084968060608524e-18 +dfa,456,0,1e-08,0.0,4.617333296578433e-15,4.617333296578433e-15 +dfa,456,0,1e-07,0.0,4.617333296578433e-15,4.617333296578433e-15 +dfa,456,0,1e-06,0.0,4.617333296578433e-15,4.617333296578433e-15 +dfa,456,0,1e-05,0.0,4.617333296578433e-15,4.617333296578433e-15 +dfa,456,0,0.0001,0.0,4.617333296578433e-15,4.617333296578433e-15 +dfa,456,1,1e-08,0.0,5.420622914720235e-18,5.420622914720235e-18 +dfa,456,1,1e-07,0.0,5.420622914720235e-18,5.420622914720235e-18 +dfa,456,1,1e-06,0.0,5.420622914720235e-18,5.420622914720235e-18 +dfa,456,1,1e-05,0.0,5.420622914720235e-18,5.420622914720235e-18 +dfa,456,1,0.0001,0.0,5.420622914720235e-18,5.420622914720235e-18 +dfa,456,2,1e-08,0.0,3.4272330301628893e-18,3.4272330301628893e-18 +dfa,456,2,1e-07,0.0,3.4272330301628893e-18,3.4272330301628893e-18 +dfa,456,2,1e-06,0.0,3.4272330301628893e-18,3.4272330301628893e-18 +dfa,456,2,1e-05,0.0,3.4272330301628893e-18,3.4272330301628893e-18 +dfa,456,2,0.0001,0.0,3.4272330301628893e-18,3.4272330301628893e-18 +dfa,456,3,1e-08,0.0,3.1884280552703615e-18,3.1884280552703615e-18 +dfa,456,3,1e-07,0.0,3.1884280552703615e-18,3.1884280552703615e-18 +dfa,456,3,1e-06,0.0,3.1884280552703615e-18,3.1884280552703615e-18 +dfa,456,3,1e-05,0.0,3.1884280552703615e-18,3.1884280552703615e-18 +dfa,456,3,0.0001,0.0,3.1884280552703615e-18,3.1884280552703615e-18 +dfa,789,0,1e-08,0.0,5.3966218192607555e-15,5.3966218192607555e-15 +dfa,789,0,1e-07,0.0,5.3966218192607555e-15,5.3966218192607555e-15 +dfa,789,0,1e-06,0.0,5.3966218192607555e-15,5.3966218192607555e-15 +dfa,789,0,1e-05,0.0,5.3966218192607555e-15,5.3966218192607555e-15 +dfa,789,0,0.0001,0.0,5.3966218192607555e-15,5.3966218192607555e-15 +dfa,789,1,1e-08,0.0,6.891336808949717e-18,6.891336808949717e-18 +dfa,789,1,1e-07,0.0,6.891336808949717e-18,6.891336808949717e-18 +dfa,789,1,1e-06,0.0,6.891336808949717e-18,6.891336808949717e-18 +dfa,789,1,1e-05,0.0,6.891336808949717e-18,6.891336808949717e-18 +dfa,789,1,0.0001,0.0,6.891336808949717e-18,6.891336808949717e-18 +dfa,789,2,1e-08,0.0,5.7309314497133776e-18,5.7309314497133776e-18 +dfa,789,2,1e-07,0.0,5.7309314497133776e-18,5.7309314497133776e-18 +dfa,789,2,1e-06,0.0,5.7309314497133776e-18,5.7309314497133776e-18 +dfa,789,2,1e-05,0.0,5.7309314497133776e-18,5.7309314497133776e-18 +dfa,789,2,0.0001,0.0,5.7309314497133776e-18,5.7309314497133776e-18 +dfa,789,3,1e-08,0.0,8.386863640013953e-18,8.386863640013953e-18 +dfa,789,3,1e-07,0.0,8.386863640013953e-18,8.386863640013953e-18 +dfa,789,3,1e-06,0.0,8.386863640013953e-18,8.386863640013953e-18 +dfa,789,3,1e-05,0.0,8.386863640013953e-18,8.386863640013953e-18 +dfa,789,3,0.0001,0.0,8.386863640013953e-18,8.386863640013953e-18 +dfa,1024,0,1e-08,0.0,4.9555408469228665e-15,4.9555408469228665e-15 +dfa,1024,0,1e-07,0.0,4.9555408469228665e-15,4.9555408469228665e-15 +dfa,1024,0,1e-06,0.0,4.9555408469228665e-15,4.9555408469228665e-15 +dfa,1024,0,1e-05,0.0,4.9555408469228665e-15,4.9555408469228665e-15 +dfa,1024,0,0.0001,0.0,4.9555408469228665e-15,4.9555408469228665e-15 +dfa,1024,1,1e-08,0.0,6.755392983999077e-18,6.755392983999077e-18 +dfa,1024,1,1e-07,0.0,6.755392983999077e-18,6.755392983999077e-18 +dfa,1024,1,1e-06,0.0,6.755392983999077e-18,6.755392983999077e-18 +dfa,1024,1,1e-05,0.0,6.755392983999077e-18,6.755392983999077e-18 +dfa,1024,1,0.0001,0.0,6.755392983999077e-18,6.755392983999077e-18 +dfa,1024,2,1e-08,0.0,3.3610594083392596e-18,3.3610594083392596e-18 +dfa,1024,2,1e-07,0.0,3.3610594083392596e-18,3.3610594083392596e-18 +dfa,1024,2,1e-06,0.0,3.3610594083392596e-18,3.3610594083392596e-18 +dfa,1024,2,1e-05,0.0,3.3610594083392596e-18,3.3610594083392596e-18 +dfa,1024,2,0.0001,0.0,3.3610594083392596e-18,3.3610594083392596e-18 +dfa,1024,3,1e-08,0.0,6.282021094082437e-18,6.282021094082437e-18 +dfa,1024,3,1e-07,0.0,6.282021094082437e-18,6.282021094082437e-18 +dfa,1024,3,1e-06,0.0,6.282021094082437e-18,6.282021094082437e-18 +dfa,1024,3,1e-05,0.0,6.282021094082437e-18,6.282021094082437e-18 +dfa,1024,3,0.0001,0.0,6.282021094082437e-18,6.282021094082437e-18 +dfa,2048,0,1e-08,0.0,3.3245124148983517e-15,3.3245124148983517e-15 +dfa,2048,0,1e-07,0.0,3.3245124148983517e-15,3.3245124148983517e-15 +dfa,2048,0,1e-06,0.0,3.3245124148983517e-15,3.3245124148983517e-15 +dfa,2048,0,1e-05,0.0,3.3245124148983517e-15,3.3245124148983517e-15 +dfa,2048,0,0.0001,0.0,3.3245124148983517e-15,3.3245124148983517e-15 +dfa,2048,1,1e-08,0.0,2.703394366282796e-18,2.703394366282796e-18 +dfa,2048,1,1e-07,0.0,2.703394366282796e-18,2.703394366282796e-18 +dfa,2048,1,1e-06,0.0,2.703394366282796e-18,2.703394366282796e-18 +dfa,2048,1,1e-05,0.0,2.703394366282796e-18,2.703394366282796e-18 +dfa,2048,1,0.0001,0.0,2.703394366282796e-18,2.703394366282796e-18 +dfa,2048,2,1e-08,0.0,2.4058364068418517e-18,2.4058364068418517e-18 +dfa,2048,2,1e-07,0.0,2.4058364068418517e-18,2.4058364068418517e-18 +dfa,2048,2,1e-06,0.0,2.4058364068418517e-18,2.4058364068418517e-18 +dfa,2048,2,1e-05,0.0,2.4058364068418517e-18,2.4058364068418517e-18 +dfa,2048,2,0.0001,0.0,2.4058364068418517e-18,2.4058364068418517e-18 +dfa,2048,3,1e-08,0.0,3.0793037005253753e-18,3.0793037005253753e-18 +dfa,2048,3,1e-07,0.0,3.0793037005253753e-18,3.0793037005253753e-18 +dfa,2048,3,1e-06,0.0,3.0793037005253753e-18,3.0793037005253753e-18 +dfa,2048,3,1e-05,0.0,3.0793037005253753e-18,3.0793037005253753e-18 +dfa,2048,3,0.0001,0.0,3.0793037005253753e-18,3.0793037005253753e-18 +dfa,3000,0,1e-08,0.0,2.3844331101464033e-15,2.3844331101464033e-15 +dfa,3000,0,1e-07,0.0,2.3844331101464033e-15,2.3844331101464033e-15 +dfa,3000,0,1e-06,0.0,2.3844331101464033e-15,2.3844331101464033e-15 +dfa,3000,0,1e-05,0.0,2.3844331101464033e-15,2.3844331101464033e-15 +dfa,3000,0,0.0001,0.0,2.3844331101464033e-15,2.3844331101464033e-15 +dfa,3000,1,1e-08,0.0,3.579943392539673e-18,3.579943392539673e-18 +dfa,3000,1,1e-07,0.0,3.579943392539673e-18,3.579943392539673e-18 +dfa,3000,1,1e-06,0.0,3.579943392539673e-18,3.579943392539673e-18 +dfa,3000,1,1e-05,0.0,3.579943392539673e-18,3.579943392539673e-18 +dfa,3000,1,0.0001,0.0,3.579943392539673e-18,3.579943392539673e-18 +dfa,3000,2,1e-08,0.0,3.374655982862947e-18,3.374655982862947e-18 +dfa,3000,2,1e-07,0.0,3.374655982862947e-18,3.374655982862947e-18 +dfa,3000,2,1e-06,0.0,3.374655982862947e-18,3.374655982862947e-18 +dfa,3000,2,1e-05,0.0,3.374655982862947e-18,3.374655982862947e-18 +dfa,3000,2,0.0001,0.0,3.374655982862947e-18,3.374655982862947e-18 +dfa,3000,3,1e-08,0.0,4.287073214841348e-18,4.287073214841348e-18 +dfa,3000,3,1e-07,0.0,4.287073214841348e-18,4.287073214841348e-18 +dfa,3000,3,1e-06,0.0,4.287073214841348e-18,4.287073214841348e-18 +dfa,3000,3,1e-05,0.0,4.287073214841348e-18,4.287073214841348e-18 +dfa,3000,3,0.0001,0.0,4.287073214841348e-18,4.287073214841348e-18 +dfa,4000,0,1e-08,0.0,4.721260427558273e-15,4.721260427558273e-15 +dfa,4000,0,1e-07,0.0,4.721260427558273e-15,4.721260427558273e-15 +dfa,4000,0,1e-06,0.0,4.721260427558273e-15,4.721260427558273e-15 +dfa,4000,0,1e-05,0.0,4.721260427558273e-15,4.721260427558273e-15 +dfa,4000,0,0.0001,0.0,4.721260427558273e-15,4.721260427558273e-15 +dfa,4000,1,1e-08,0.0,3.345425074376548e-18,3.345425074376548e-18 +dfa,4000,1,1e-07,0.0,3.345425074376548e-18,3.345425074376548e-18 +dfa,4000,1,1e-06,0.0,3.345425074376548e-18,3.345425074376548e-18 +dfa,4000,1,1e-05,0.0,3.345425074376548e-18,3.345425074376548e-18 +dfa,4000,1,0.0001,0.0,3.345425074376548e-18,3.345425074376548e-18 +dfa,4000,2,1e-08,0.0,4.748028710173261e-18,4.748028710173261e-18 +dfa,4000,2,1e-07,0.0,4.748028710173261e-18,4.748028710173261e-18 +dfa,4000,2,1e-06,0.0,4.748028710173261e-18,4.748028710173261e-18 +dfa,4000,2,1e-05,0.0,4.748028710173261e-18,4.748028710173261e-18 +dfa,4000,2,0.0001,0.0,4.748028710173261e-18,4.748028710173261e-18 +dfa,4000,3,1e-08,0.0,3.569352171976544e-18,3.569352171976544e-18 +dfa,4000,3,1e-07,0.0,3.569352171976544e-18,3.569352171976544e-18 +dfa,4000,3,1e-06,0.0,3.569352171976544e-18,3.569352171976544e-18 +dfa,4000,3,1e-05,0.0,3.569352171976544e-18,3.569352171976544e-18 +dfa,4000,3,0.0001,0.0,3.569352171976544e-18,3.569352171976544e-18 +dfa,5000,0,1e-08,0.0,4.341474994448442e-15,4.341474994448442e-15 +dfa,5000,0,1e-07,0.0,4.341474994448442e-15,4.341474994448442e-15 +dfa,5000,0,1e-06,0.0,4.341474994448442e-15,4.341474994448442e-15 +dfa,5000,0,1e-05,0.0,4.341474994448442e-15,4.341474994448442e-15 +dfa,5000,0,0.0001,0.0,4.341474994448442e-15,4.341474994448442e-15 +dfa,5000,1,1e-08,0.0,4.732926046549268e-18,4.732926046549268e-18 +dfa,5000,1,1e-07,0.0,4.732926046549268e-18,4.732926046549268e-18 +dfa,5000,1,1e-06,0.0,4.732926046549268e-18,4.732926046549268e-18 +dfa,5000,1,1e-05,0.0,4.732926046549268e-18,4.732926046549268e-18 +dfa,5000,1,0.0001,0.0,4.732926046549268e-18,4.732926046549268e-18 +dfa,5000,2,1e-08,0.0,5.175341115631417e-18,5.175341115631417e-18 +dfa,5000,2,1e-07,0.0,5.175341115631417e-18,5.175341115631417e-18 +dfa,5000,2,1e-06,0.0,5.175341115631417e-18,5.175341115631417e-18 +dfa,5000,2,1e-05,0.0,5.175341115631417e-18,5.175341115631417e-18 +dfa,5000,2,0.0001,0.0,5.175341115631417e-18,5.175341115631417e-18 +dfa,5000,3,1e-08,0.0,3.1501149104532835e-18,3.1501149104532835e-18 +dfa,5000,3,1e-07,0.0,3.1501149104532835e-18,3.1501149104532835e-18 +dfa,5000,3,1e-06,0.0,3.1501149104532835e-18,3.1501149104532835e-18 +dfa,5000,3,1e-05,0.0,3.1501149104532835e-18,3.1501149104532835e-18 +dfa,5000,3,0.0001,0.0,3.1501149104532835e-18,3.1501149104532835e-18 +dfa,6000,0,1e-08,0.0,2.302985598311982e-15,2.302985598311982e-15 +dfa,6000,0,1e-07,0.0,2.302985598311982e-15,2.302985598311982e-15 +dfa,6000,0,1e-06,0.0,2.302985598311982e-15,2.302985598311982e-15 +dfa,6000,0,1e-05,0.0,2.302985598311982e-15,2.302985598311982e-15 +dfa,6000,0,0.0001,0.0,2.302985598311982e-15,2.302985598311982e-15 +dfa,6000,1,1e-08,0.0,3.9696885632981204e-18,3.9696885632981204e-18 +dfa,6000,1,1e-07,0.0,3.9696885632981204e-18,3.9696885632981204e-18 +dfa,6000,1,1e-06,0.0,3.9696885632981204e-18,3.9696885632981204e-18 +dfa,6000,1,1e-05,0.0,3.9696885632981204e-18,3.9696885632981204e-18 +dfa,6000,1,0.0001,0.0,3.9696885632981204e-18,3.9696885632981204e-18 +dfa,6000,2,1e-08,0.0,3.98756517710631e-18,3.98756517710631e-18 +dfa,6000,2,1e-07,0.0,3.98756517710631e-18,3.98756517710631e-18 +dfa,6000,2,1e-06,0.0,3.98756517710631e-18,3.98756517710631e-18 +dfa,6000,2,1e-05,0.0,3.98756517710631e-18,3.98756517710631e-18 +dfa,6000,2,0.0001,0.0,3.98756517710631e-18,3.98756517710631e-18 +dfa,6000,3,1e-08,0.0,1.9734937092836076e-18,1.9734937092836076e-18 +dfa,6000,3,1e-07,0.0,1.9734937092836076e-18,1.9734937092836076e-18 +dfa,6000,3,1e-06,0.0,1.9734937092836076e-18,1.9734937092836076e-18 +dfa,6000,3,1e-05,0.0,1.9734937092836076e-18,1.9734937092836076e-18 +dfa,6000,3,0.0001,0.0,1.9734937092836076e-18,1.9734937092836076e-18 +state_bridge,42,0,1e-08,0.0,2.6992344720044165e-14,2.6992344720044165e-14 +state_bridge,42,0,1e-07,0.0,2.6992344720044165e-14,2.6992344720044165e-14 +state_bridge,42,0,1e-06,0.0,2.6992344720044165e-14,2.6992344720044165e-14 +state_bridge,42,0,1e-05,0.0,2.6992344720044165e-14,2.6992344720044165e-14 +state_bridge,42,0,0.0001,0.0,2.6992344720044165e-14,2.6992344720044165e-14 +state_bridge,42,1,1e-08,0.0,6.471185719644739e-18,6.471185719644739e-18 +state_bridge,42,1,1e-07,0.0,6.471185719644739e-18,6.471185719644739e-18 +state_bridge,42,1,1e-06,0.0,6.471185719644739e-18,6.471185719644739e-18 +state_bridge,42,1,1e-05,0.0,6.471185719644739e-18,6.471185719644739e-18 +state_bridge,42,1,0.0001,0.0,6.471185719644739e-18,6.471185719644739e-18 +state_bridge,42,2,1e-08,0.0,9.027409145317866e-18,9.027409145317866e-18 +state_bridge,42,2,1e-07,0.0,9.027409145317866e-18,9.027409145317866e-18 +state_bridge,42,2,1e-06,0.0,9.027409145317866e-18,9.027409145317866e-18 +state_bridge,42,2,1e-05,0.0,9.027409145317866e-18,9.027409145317866e-18 +state_bridge,42,2,0.0001,0.0,9.027409145317866e-18,9.027409145317866e-18 +state_bridge,42,3,1e-08,0.0,6.745434143014245e-18,6.745434143014245e-18 +state_bridge,42,3,1e-07,0.0,6.745434143014245e-18,6.745434143014245e-18 +state_bridge,42,3,1e-06,0.0,6.745434143014245e-18,6.745434143014245e-18 +state_bridge,42,3,1e-05,0.0,6.745434143014245e-18,6.745434143014245e-18 +state_bridge,42,3,0.0001,0.0,6.745434143014245e-18,6.745434143014245e-18 +state_bridge,123,0,1e-08,0.0,1.902188496505971e-14,1.902188496505971e-14 +state_bridge,123,0,1e-07,0.0,1.902188496505971e-14,1.902188496505971e-14 +state_bridge,123,0,1e-06,0.0,1.902188496505971e-14,1.902188496505971e-14 +state_bridge,123,0,1e-05,0.0,1.902188496505971e-14,1.902188496505971e-14 +state_bridge,123,0,0.0001,0.0,1.902188496505971e-14,1.902188496505971e-14 +state_bridge,123,1,1e-08,0.0,1.6455236274415388e-17,1.6455236274415388e-17 +state_bridge,123,1,1e-07,0.0,1.6455236274415388e-17,1.6455236274415388e-17 +state_bridge,123,1,1e-06,0.0,1.6455236274415388e-17,1.6455236274415388e-17 +state_bridge,123,1,1e-05,0.0,1.6455236274415388e-17,1.6455236274415388e-17 +state_bridge,123,1,0.0001,0.0,1.6455236274415388e-17,1.6455236274415388e-17 +state_bridge,123,2,1e-08,0.0,1.010095474997185e-17,1.010095474997185e-17 +state_bridge,123,2,1e-07,0.0,1.010095474997185e-17,1.010095474997185e-17 +state_bridge,123,2,1e-06,0.0,1.010095474997185e-17,1.010095474997185e-17 +state_bridge,123,2,1e-05,0.0,1.010095474997185e-17,1.010095474997185e-17 +state_bridge,123,2,0.0001,0.0,1.010095474997185e-17,1.010095474997185e-17 +state_bridge,123,3,1e-08,0.0,1.519008834293391e-17,1.519008834293391e-17 +state_bridge,123,3,1e-07,0.0,1.519008834293391e-17,1.519008834293391e-17 +state_bridge,123,3,1e-06,0.0,1.519008834293391e-17,1.519008834293391e-17 +state_bridge,123,3,1e-05,0.0,1.519008834293391e-17,1.519008834293391e-17 +state_bridge,123,3,0.0001,0.0,1.519008834293391e-17,1.519008834293391e-17 +state_bridge,456,0,1e-08,0.0,2.7614251556511323e-14,2.7614251556511323e-14 +state_bridge,456,0,1e-07,0.0,2.7614251556511323e-14,2.7614251556511323e-14 +state_bridge,456,0,1e-06,0.0,2.7614251556511323e-14,2.7614251556511323e-14 +state_bridge,456,0,1e-05,0.0,2.7614251556511323e-14,2.7614251556511323e-14 +state_bridge,456,0,0.0001,0.0,2.7614251556511323e-14,2.7614251556511323e-14 +state_bridge,456,1,1e-08,0.0,7.874712282209908e-18,7.874712282209908e-18 +state_bridge,456,1,1e-07,0.0,7.874712282209908e-18,7.874712282209908e-18 +state_bridge,456,1,1e-06,0.0,7.874712282209908e-18,7.874712282209908e-18 +state_bridge,456,1,1e-05,0.0,7.874712282209908e-18,7.874712282209908e-18 +state_bridge,456,1,0.0001,0.0,7.874712282209908e-18,7.874712282209908e-18 +state_bridge,456,2,1e-08,0.0,6.6395744633518525e-18,6.6395744633518525e-18 +state_bridge,456,2,1e-07,0.0,6.6395744633518525e-18,6.6395744633518525e-18 +state_bridge,456,2,1e-06,0.0,6.6395744633518525e-18,6.6395744633518525e-18 +state_bridge,456,2,1e-05,0.0,6.6395744633518525e-18,6.6395744633518525e-18 +state_bridge,456,2,0.0001,0.0,6.6395744633518525e-18,6.6395744633518525e-18 +state_bridge,456,3,1e-08,0.0,3.451011577641645e-18,3.451011577641645e-18 +state_bridge,456,3,1e-07,0.0,3.451011577641645e-18,3.451011577641645e-18 +state_bridge,456,3,1e-06,0.0,3.451011577641645e-18,3.451011577641645e-18 +state_bridge,456,3,1e-05,0.0,3.451011577641645e-18,3.451011577641645e-18 +state_bridge,456,3,0.0001,0.0,3.451011577641645e-18,3.451011577641645e-18 +state_bridge,789,0,1e-08,0.0,2.5475205373492148e-14,2.5475205373492148e-14 +state_bridge,789,0,1e-07,0.0,2.5475205373492148e-14,2.5475205373492148e-14 +state_bridge,789,0,1e-06,0.0,2.5475205373492148e-14,2.5475205373492148e-14 +state_bridge,789,0,1e-05,0.0,2.5475205373492148e-14,2.5475205373492148e-14 +state_bridge,789,0,0.0001,0.0,2.5475205373492148e-14,2.5475205373492148e-14 +state_bridge,789,1,1e-08,0.0,2.9189688008523843e-18,2.9189688008523843e-18 +state_bridge,789,1,1e-07,0.0,2.9189688008523843e-18,2.9189688008523843e-18 +state_bridge,789,1,1e-06,0.0,2.9189688008523843e-18,2.9189688008523843e-18 +state_bridge,789,1,1e-05,0.0,2.9189688008523843e-18,2.9189688008523843e-18 +state_bridge,789,1,0.0001,0.0,2.9189688008523843e-18,2.9189688008523843e-18 +state_bridge,789,2,1e-08,0.0,3.5936932022718354e-18,3.5936932022718354e-18 +state_bridge,789,2,1e-07,0.0,3.5936932022718354e-18,3.5936932022718354e-18 +state_bridge,789,2,1e-06,0.0,3.5936932022718354e-18,3.5936932022718354e-18 +state_bridge,789,2,1e-05,0.0,3.5936932022718354e-18,3.5936932022718354e-18 +state_bridge,789,2,0.0001,0.0,3.5936932022718354e-18,3.5936932022718354e-18 +state_bridge,789,3,1e-08,0.0,4.21031498989949e-18,4.21031498989949e-18 +state_bridge,789,3,1e-07,0.0,4.21031498989949e-18,4.21031498989949e-18 +state_bridge,789,3,1e-06,0.0,4.21031498989949e-18,4.21031498989949e-18 +state_bridge,789,3,1e-05,0.0,4.21031498989949e-18,4.21031498989949e-18 +state_bridge,789,3,0.0001,0.0,4.21031498989949e-18,4.21031498989949e-18 +state_bridge,1024,0,1e-08,0.0,1.369330403190247e-14,1.369330403190247e-14 +state_bridge,1024,0,1e-07,0.0,1.369330403190247e-14,1.369330403190247e-14 +state_bridge,1024,0,1e-06,0.0,1.369330403190247e-14,1.369330403190247e-14 +state_bridge,1024,0,1e-05,0.0,1.369330403190247e-14,1.369330403190247e-14 +state_bridge,1024,0,0.0001,0.0,1.369330403190247e-14,1.369330403190247e-14 +state_bridge,1024,1,1e-08,0.0,3.222414755970573e-17,3.222414755970573e-17 +state_bridge,1024,1,1e-07,0.0,3.222414755970573e-17,3.222414755970573e-17 +state_bridge,1024,1,1e-06,0.0,3.222414755970573e-17,3.222414755970573e-17 +state_bridge,1024,1,1e-05,0.0,3.222414755970573e-17,3.222414755970573e-17 +state_bridge,1024,1,0.0001,0.0,3.222414755970573e-17,3.222414755970573e-17 +state_bridge,1024,2,1e-08,0.0,2.9792427637521327e-18,2.9792427637521327e-18 +state_bridge,1024,2,1e-07,0.0,2.9792427637521327e-18,2.9792427637521327e-18 +state_bridge,1024,2,1e-06,0.0,2.9792427637521327e-18,2.9792427637521327e-18 +state_bridge,1024,2,1e-05,0.0,2.9792427637521327e-18,2.9792427637521327e-18 +state_bridge,1024,2,0.0001,0.0,2.9792427637521327e-18,2.9792427637521327e-18 +state_bridge,1024,3,1e-08,0.0,2.6080570443975372e-18,2.6080570443975372e-18 +state_bridge,1024,3,1e-07,0.0,2.6080570443975372e-18,2.6080570443975372e-18 +state_bridge,1024,3,1e-06,0.0,2.6080570443975372e-18,2.6080570443975372e-18 +state_bridge,1024,3,1e-05,0.0,2.6080570443975372e-18,2.6080570443975372e-18 +state_bridge,1024,3,0.0001,0.0,2.6080570443975372e-18,2.6080570443975372e-18 +state_bridge,2048,0,1e-08,0.0,1.0580407128766081e-13,1.0580407128766081e-13 +state_bridge,2048,0,1e-07,0.0,1.0580407128766081e-13,1.0580407128766081e-13 +state_bridge,2048,0,1e-06,0.0,1.0580407128766081e-13,1.0580407128766081e-13 +state_bridge,2048,0,1e-05,0.0,1.0580407128766081e-13,1.0580407128766081e-13 +state_bridge,2048,0,0.0001,0.0,1.0580407128766081e-13,1.0580407128766081e-13 +state_bridge,2048,1,1e-08,0.0,3.589417919275855e-18,3.589417919275855e-18 +state_bridge,2048,1,1e-07,0.0,3.589417919275855e-18,3.589417919275855e-18 +state_bridge,2048,1,1e-06,0.0,3.589417919275855e-18,3.589417919275855e-18 +state_bridge,2048,1,1e-05,0.0,3.589417919275855e-18,3.589417919275855e-18 +state_bridge,2048,1,0.0001,0.0,3.589417919275855e-18,3.589417919275855e-18 +state_bridge,2048,2,1e-08,0.0,5.82013750210324e-18,5.82013750210324e-18 +state_bridge,2048,2,1e-07,0.0,5.82013750210324e-18,5.82013750210324e-18 +state_bridge,2048,2,1e-06,0.0,5.82013750210324e-18,5.82013750210324e-18 +state_bridge,2048,2,1e-05,0.0,5.82013750210324e-18,5.82013750210324e-18 +state_bridge,2048,2,0.0001,0.0,5.82013750210324e-18,5.82013750210324e-18 +state_bridge,2048,3,1e-08,0.0,4.03326194286619e-18,4.03326194286619e-18 +state_bridge,2048,3,1e-07,0.0,4.03326194286619e-18,4.03326194286619e-18 +state_bridge,2048,3,1e-06,0.0,4.03326194286619e-18,4.03326194286619e-18 +state_bridge,2048,3,1e-05,0.0,4.03326194286619e-18,4.03326194286619e-18 +state_bridge,2048,3,0.0001,0.0,4.03326194286619e-18,4.03326194286619e-18 +state_bridge,3000,0,1e-08,0.0,3.148102980556067e-14,3.148102980556067e-14 +state_bridge,3000,0,1e-07,0.0,3.148102980556067e-14,3.148102980556067e-14 +state_bridge,3000,0,1e-06,0.0,3.148102980556067e-14,3.148102980556067e-14 +state_bridge,3000,0,1e-05,0.0,3.148102980556067e-14,3.148102980556067e-14 +state_bridge,3000,0,0.0001,0.0,3.148102980556067e-14,3.148102980556067e-14 +state_bridge,3000,1,1e-08,0.0,6.836890126670252e-18,6.836890126670252e-18 +state_bridge,3000,1,1e-07,0.0,6.836890126670252e-18,6.836890126670252e-18 +state_bridge,3000,1,1e-06,0.0,6.836890126670252e-18,6.836890126670252e-18 +state_bridge,3000,1,1e-05,0.0,6.836890126670252e-18,6.836890126670252e-18 +state_bridge,3000,1,0.0001,0.0,6.836890126670252e-18,6.836890126670252e-18 +state_bridge,3000,2,1e-08,0.0,3.2751385037521515e-18,3.2751385037521515e-18 +state_bridge,3000,2,1e-07,0.0,3.2751385037521515e-18,3.2751385037521515e-18 +state_bridge,3000,2,1e-06,0.0,3.2751385037521515e-18,3.2751385037521515e-18 +state_bridge,3000,2,1e-05,0.0,3.2751385037521515e-18,3.2751385037521515e-18 +state_bridge,3000,2,0.0001,0.0,3.2751385037521515e-18,3.2751385037521515e-18 +state_bridge,3000,3,1e-08,0.0,4.178672849927499e-18,4.178672849927499e-18 +state_bridge,3000,3,1e-07,0.0,4.178672849927499e-18,4.178672849927499e-18 +state_bridge,3000,3,1e-06,0.0,4.178672849927499e-18,4.178672849927499e-18 +state_bridge,3000,3,1e-05,0.0,4.178672849927499e-18,4.178672849927499e-18 +state_bridge,3000,3,0.0001,0.0,4.178672849927499e-18,4.178672849927499e-18 +state_bridge,4000,0,1e-08,0.0,4.157557544764989e-14,4.157557544764989e-14 +state_bridge,4000,0,1e-07,0.0,4.157557544764989e-14,4.157557544764989e-14 +state_bridge,4000,0,1e-06,0.0,4.157557544764989e-14,4.157557544764989e-14 +state_bridge,4000,0,1e-05,0.0,4.157557544764989e-14,4.157557544764989e-14 +state_bridge,4000,0,0.0001,0.0,4.157557544764989e-14,4.157557544764989e-14 +state_bridge,4000,1,1e-08,0.0,1.2419642922992718e-17,1.2419642922992718e-17 +state_bridge,4000,1,1e-07,0.0,1.2419642922992718e-17,1.2419642922992718e-17 +state_bridge,4000,1,1e-06,0.0,1.2419642922992718e-17,1.2419642922992718e-17 +state_bridge,4000,1,1e-05,0.0,1.2419642922992718e-17,1.2419642922992718e-17 +state_bridge,4000,1,0.0001,0.0,1.2419642922992718e-17,1.2419642922992718e-17 +state_bridge,4000,2,1e-08,0.0,7.897693841168469e-18,7.897693841168469e-18 +state_bridge,4000,2,1e-07,0.0,7.897693841168469e-18,7.897693841168469e-18 +state_bridge,4000,2,1e-06,0.0,7.897693841168469e-18,7.897693841168469e-18 +state_bridge,4000,2,1e-05,0.0,7.897693841168469e-18,7.897693841168469e-18 +state_bridge,4000,2,0.0001,0.0,7.897693841168469e-18,7.897693841168469e-18 +state_bridge,4000,3,1e-08,0.0,6.5220445060172556e-18,6.5220445060172556e-18 +state_bridge,4000,3,1e-07,0.0,6.5220445060172556e-18,6.5220445060172556e-18 +state_bridge,4000,3,1e-06,0.0,6.5220445060172556e-18,6.5220445060172556e-18 +state_bridge,4000,3,1e-05,0.0,6.5220445060172556e-18,6.5220445060172556e-18 +state_bridge,4000,3,0.0001,0.0,6.5220445060172556e-18,6.5220445060172556e-18 +state_bridge,5000,0,1e-08,0.0,7.853930044298893e-15,7.853930044298893e-15 +state_bridge,5000,0,1e-07,0.0,7.853930044298893e-15,7.853930044298893e-15 +state_bridge,5000,0,1e-06,0.0,7.853930044298893e-15,7.853930044298893e-15 +state_bridge,5000,0,1e-05,0.0,7.853930044298893e-15,7.853930044298893e-15 +state_bridge,5000,0,0.0001,0.0,7.853930044298893e-15,7.853930044298893e-15 +state_bridge,5000,1,1e-08,0.0,9.066262811306217e-17,9.066262811306217e-17 +state_bridge,5000,1,1e-07,0.0,9.066262811306217e-17,9.066262811306217e-17 +state_bridge,5000,1,1e-06,0.0,9.066262811306217e-17,9.066262811306217e-17 +state_bridge,5000,1,1e-05,0.0,9.066262811306217e-17,9.066262811306217e-17 +state_bridge,5000,1,0.0001,0.0,9.066262811306217e-17,9.066262811306217e-17 +state_bridge,5000,2,1e-08,0.0,1.1614074058303863e-17,1.1614074058303863e-17 +state_bridge,5000,2,1e-07,0.0,1.1614074058303863e-17,1.1614074058303863e-17 +state_bridge,5000,2,1e-06,0.0,1.1614074058303863e-17,1.1614074058303863e-17 +state_bridge,5000,2,1e-05,0.0,1.1614074058303863e-17,1.1614074058303863e-17 +state_bridge,5000,2,0.0001,0.0,1.1614074058303863e-17,1.1614074058303863e-17 +state_bridge,5000,3,1e-08,0.0,7.905178171350849e-18,7.905178171350849e-18 +state_bridge,5000,3,1e-07,0.0,7.905178171350849e-18,7.905178171350849e-18 +state_bridge,5000,3,1e-06,0.0,7.905178171350849e-18,7.905178171350849e-18 +state_bridge,5000,3,1e-05,0.0,7.905178171350849e-18,7.905178171350849e-18 +state_bridge,5000,3,0.0001,0.0,7.905178171350849e-18,7.905178171350849e-18 +state_bridge,6000,0,1e-08,0.0,5.2776244474899564e-14,5.2776244474899564e-14 +state_bridge,6000,0,1e-07,0.0,5.2776244474899564e-14,5.2776244474899564e-14 +state_bridge,6000,0,1e-06,0.0,5.2776244474899564e-14,5.2776244474899564e-14 +state_bridge,6000,0,1e-05,0.0,5.2776244474899564e-14,5.2776244474899564e-14 +state_bridge,6000,0,0.0001,0.0,5.2776244474899564e-14,5.2776244474899564e-14 +state_bridge,6000,1,1e-08,0.0,3.3115853223121567e-18,3.3115853223121567e-18 +state_bridge,6000,1,1e-07,0.0,3.3115853223121567e-18,3.3115853223121567e-18 +state_bridge,6000,1,1e-06,0.0,3.3115853223121567e-18,3.3115853223121567e-18 +state_bridge,6000,1,1e-05,0.0,3.3115853223121567e-18,3.3115853223121567e-18 +state_bridge,6000,1,0.0001,0.0,3.3115853223121567e-18,3.3115853223121567e-18 +state_bridge,6000,2,1e-08,0.0,6.5850864220417595e-18,6.5850864220417595e-18 +state_bridge,6000,2,1e-07,0.0,6.5850864220417595e-18,6.5850864220417595e-18 +state_bridge,6000,2,1e-06,0.0,6.5850864220417595e-18,6.5850864220417595e-18 +state_bridge,6000,2,1e-05,0.0,6.5850864220417595e-18,6.5850864220417595e-18 +state_bridge,6000,2,0.0001,0.0,6.5850864220417595e-18,6.5850864220417595e-18 +state_bridge,6000,3,1e-08,0.0,6.965544836063074e-18,6.965544836063074e-18 +state_bridge,6000,3,1e-07,0.0,6.965544836063074e-18,6.965544836063074e-18 +state_bridge,6000,3,1e-06,0.0,6.965544836063074e-18,6.965544836063074e-18 +state_bridge,6000,3,1e-05,0.0,6.965544836063074e-18,6.965544836063074e-18 +state_bridge,6000,3,0.0001,0.0,6.965544836063074e-18,6.965544836063074e-18 +credit_bridge,42,0,1e-08,0.0,3.5371820591631725e-15,3.5371820591631725e-15 +credit_bridge,42,0,1e-07,0.0,3.5371820591631725e-15,3.5371820591631725e-15 +credit_bridge,42,0,1e-06,0.0,3.5371820591631725e-15,3.5371820591631725e-15 +credit_bridge,42,0,1e-05,0.0,3.5371820591631725e-15,3.5371820591631725e-15 +credit_bridge,42,0,0.0001,0.0,3.5371820591631725e-15,3.5371820591631725e-15 +credit_bridge,42,1,1e-08,0.0,1.2021043610957502e-17,1.2021043610957502e-17 +credit_bridge,42,1,1e-07,0.0,1.2021043610957502e-17,1.2021043610957502e-17 +credit_bridge,42,1,1e-06,0.0,1.2021043610957502e-17,1.2021043610957502e-17 +credit_bridge,42,1,1e-05,0.0,1.2021043610957502e-17,1.2021043610957502e-17 +credit_bridge,42,1,0.0001,0.0,1.2021043610957502e-17,1.2021043610957502e-17 +credit_bridge,42,2,1e-08,0.0,4.787851252813095e-18,4.787851252813095e-18 +credit_bridge,42,2,1e-07,0.0,4.787851252813095e-18,4.787851252813095e-18 +credit_bridge,42,2,1e-06,0.0,4.787851252813095e-18,4.787851252813095e-18 +credit_bridge,42,2,1e-05,0.0,4.787851252813095e-18,4.787851252813095e-18 +credit_bridge,42,2,0.0001,0.0,4.787851252813095e-18,4.787851252813095e-18 +credit_bridge,42,3,1e-08,0.0,4.291316237793439e-18,4.291316237793439e-18 +credit_bridge,42,3,1e-07,0.0,4.291316237793439e-18,4.291316237793439e-18 +credit_bridge,42,3,1e-06,0.0,4.291316237793439e-18,4.291316237793439e-18 +credit_bridge,42,3,1e-05,0.0,4.291316237793439e-18,4.291316237793439e-18 +credit_bridge,42,3,0.0001,0.0,4.291316237793439e-18,4.291316237793439e-18 +credit_bridge,123,0,1e-08,0.0,7.599696493312304e-15,7.599696493312304e-15 +credit_bridge,123,0,1e-07,0.0,7.599696493312304e-15,7.599696493312304e-15 +credit_bridge,123,0,1e-06,0.0,7.599696493312304e-15,7.599696493312304e-15 +credit_bridge,123,0,1e-05,0.0,7.599696493312304e-15,7.599696493312304e-15 +credit_bridge,123,0,0.0001,0.0,7.599696493312304e-15,7.599696493312304e-15 +credit_bridge,123,1,1e-08,0.0,2.7300932335551393e-17,2.7300932335551393e-17 +credit_bridge,123,1,1e-07,0.0,2.7300932335551393e-17,2.7300932335551393e-17 +credit_bridge,123,1,1e-06,0.0,2.7300932335551393e-17,2.7300932335551393e-17 +credit_bridge,123,1,1e-05,0.0,2.7300932335551393e-17,2.7300932335551393e-17 +credit_bridge,123,1,0.0001,0.0,2.7300932335551393e-17,2.7300932335551393e-17 +credit_bridge,123,2,1e-08,0.0,2.7487155506855456e-17,2.7487155506855456e-17 +credit_bridge,123,2,1e-07,0.0,2.7487155506855456e-17,2.7487155506855456e-17 +credit_bridge,123,2,1e-06,0.0,2.7487155506855456e-17,2.7487155506855456e-17 +credit_bridge,123,2,1e-05,0.0,2.7487155506855456e-17,2.7487155506855456e-17 +credit_bridge,123,2,0.0001,0.0,2.7487155506855456e-17,2.7487155506855456e-17 +credit_bridge,123,3,1e-08,0.0,1.1796419406896277e-17,1.1796419406896277e-17 +credit_bridge,123,3,1e-07,0.0,1.1796419406896277e-17,1.1796419406896277e-17 +credit_bridge,123,3,1e-06,0.0,1.1796419406896277e-17,1.1796419406896277e-17 +credit_bridge,123,3,1e-05,0.0,1.1796419406896277e-17,1.1796419406896277e-17 +credit_bridge,123,3,0.0001,0.0,1.1796419406896277e-17,1.1796419406896277e-17 +credit_bridge,456,0,1e-08,0.0,6.9011674799529955e-15,6.9011674799529955e-15 +credit_bridge,456,0,1e-07,0.0,6.9011674799529955e-15,6.9011674799529955e-15 +credit_bridge,456,0,1e-06,0.0,6.9011674799529955e-15,6.9011674799529955e-15 +credit_bridge,456,0,1e-05,0.0,6.9011674799529955e-15,6.9011674799529955e-15 +credit_bridge,456,0,0.0001,0.0,6.9011674799529955e-15,6.9011674799529955e-15 +credit_bridge,456,1,1e-08,0.0,1.5494967264386254e-17,1.5494967264386254e-17 +credit_bridge,456,1,1e-07,0.0,1.5494967264386254e-17,1.5494967264386254e-17 +credit_bridge,456,1,1e-06,0.0,1.5494967264386254e-17,1.5494967264386254e-17 +credit_bridge,456,1,1e-05,0.0,1.5494967264386254e-17,1.5494967264386254e-17 +credit_bridge,456,1,0.0001,0.0,1.5494967264386254e-17,1.5494967264386254e-17 +credit_bridge,456,2,1e-08,0.0,5.662822225256374e-18,5.662822225256374e-18 +credit_bridge,456,2,1e-07,0.0,5.662822225256374e-18,5.662822225256374e-18 +credit_bridge,456,2,1e-06,0.0,5.662822225256374e-18,5.662822225256374e-18 +credit_bridge,456,2,1e-05,0.0,5.662822225256374e-18,5.662822225256374e-18 +credit_bridge,456,2,0.0001,0.0,5.662822225256374e-18,5.662822225256374e-18 +credit_bridge,456,3,1e-08,0.0,9.464962873940041e-18,9.464962873940041e-18 +credit_bridge,456,3,1e-07,0.0,9.464962873940041e-18,9.464962873940041e-18 +credit_bridge,456,3,1e-06,0.0,9.464962873940041e-18,9.464962873940041e-18 +credit_bridge,456,3,1e-05,0.0,9.464962873940041e-18,9.464962873940041e-18 +credit_bridge,456,3,0.0001,0.0,9.464962873940041e-18,9.464962873940041e-18 +credit_bridge,789,0,1e-08,0.0,4.1465803365817525e-15,4.1465803365817525e-15 +credit_bridge,789,0,1e-07,0.0,4.1465803365817525e-15,4.1465803365817525e-15 +credit_bridge,789,0,1e-06,0.0,4.1465803365817525e-15,4.1465803365817525e-15 +credit_bridge,789,0,1e-05,0.0,4.1465803365817525e-15,4.1465803365817525e-15 +credit_bridge,789,0,0.0001,0.0,4.1465803365817525e-15,4.1465803365817525e-15 +credit_bridge,789,1,1e-08,0.0,8.336049107804208e-18,8.336049107804208e-18 +credit_bridge,789,1,1e-07,0.0,8.336049107804208e-18,8.336049107804208e-18 +credit_bridge,789,1,1e-06,0.0,8.336049107804208e-18,8.336049107804208e-18 +credit_bridge,789,1,1e-05,0.0,8.336049107804208e-18,8.336049107804208e-18 +credit_bridge,789,1,0.0001,0.0,8.336049107804208e-18,8.336049107804208e-18 +credit_bridge,789,2,1e-08,0.0,7.228085345042505e-18,7.228085345042505e-18 +credit_bridge,789,2,1e-07,0.0,7.228085345042505e-18,7.228085345042505e-18 +credit_bridge,789,2,1e-06,0.0,7.228085345042505e-18,7.228085345042505e-18 +credit_bridge,789,2,1e-05,0.0,7.228085345042505e-18,7.228085345042505e-18 +credit_bridge,789,2,0.0001,0.0,7.228085345042505e-18,7.228085345042505e-18 +credit_bridge,789,3,1e-08,0.0,1.214459048006781e-17,1.214459048006781e-17 +credit_bridge,789,3,1e-07,0.0,1.214459048006781e-17,1.214459048006781e-17 +credit_bridge,789,3,1e-06,0.0,1.214459048006781e-17,1.214459048006781e-17 +credit_bridge,789,3,1e-05,0.0,1.214459048006781e-17,1.214459048006781e-17 +credit_bridge,789,3,0.0001,0.0,1.214459048006781e-17,1.214459048006781e-17 +credit_bridge,1024,0,1e-08,0.0,5.6746116798025124e-15,5.6746116798025124e-15 +credit_bridge,1024,0,1e-07,0.0,5.6746116798025124e-15,5.6746116798025124e-15 +credit_bridge,1024,0,1e-06,0.0,5.6746116798025124e-15,5.6746116798025124e-15 +credit_bridge,1024,0,1e-05,0.0,5.6746116798025124e-15,5.6746116798025124e-15 +credit_bridge,1024,0,0.0001,0.0,5.6746116798025124e-15,5.6746116798025124e-15 +credit_bridge,1024,1,1e-08,0.0,2.0532265584262677e-17,2.0532265584262677e-17 +credit_bridge,1024,1,1e-07,0.0,2.0532265584262677e-17,2.0532265584262677e-17 +credit_bridge,1024,1,1e-06,0.0,2.0532265584262677e-17,2.0532265584262677e-17 +credit_bridge,1024,1,1e-05,0.0,2.0532265584262677e-17,2.0532265584262677e-17 +credit_bridge,1024,1,0.0001,0.0,2.0532265584262677e-17,2.0532265584262677e-17 +credit_bridge,1024,2,1e-08,0.0,1.4865846777702923e-17,1.4865846777702923e-17 +credit_bridge,1024,2,1e-07,0.0,1.4865846777702923e-17,1.4865846777702923e-17 +credit_bridge,1024,2,1e-06,0.0,1.4865846777702923e-17,1.4865846777702923e-17 +credit_bridge,1024,2,1e-05,0.0,1.4865846777702923e-17,1.4865846777702923e-17 +credit_bridge,1024,2,0.0001,0.0,1.4865846777702923e-17,1.4865846777702923e-17 +credit_bridge,1024,3,1e-08,0.0,1.3465927136198791e-17,1.3465927136198791e-17 +credit_bridge,1024,3,1e-07,0.0,1.3465927136198791e-17,1.3465927136198791e-17 +credit_bridge,1024,3,1e-06,0.0,1.3465927136198791e-17,1.3465927136198791e-17 +credit_bridge,1024,3,1e-05,0.0,1.3465927136198791e-17,1.3465927136198791e-17 +credit_bridge,1024,3,0.0001,0.0,1.3465927136198791e-17,1.3465927136198791e-17 +credit_bridge,2048,0,1e-08,0.0,5.402996165705318e-15,5.402996165705318e-15 +credit_bridge,2048,0,1e-07,0.0,5.402996165705318e-15,5.402996165705318e-15 +credit_bridge,2048,0,1e-06,0.0,5.402996165705318e-15,5.402996165705318e-15 +credit_bridge,2048,0,1e-05,0.0,5.402996165705318e-15,5.402996165705318e-15 +credit_bridge,2048,0,0.0001,0.0,5.402996165705318e-15,5.402996165705318e-15 +credit_bridge,2048,1,1e-08,0.0,9.586679192354769e-18,9.586679192354769e-18 +credit_bridge,2048,1,1e-07,0.0,9.586679192354769e-18,9.586679192354769e-18 +credit_bridge,2048,1,1e-06,0.0,9.586679192354769e-18,9.586679192354769e-18 +credit_bridge,2048,1,1e-05,0.0,9.586679192354769e-18,9.586679192354769e-18 +credit_bridge,2048,1,0.0001,0.0,9.586679192354769e-18,9.586679192354769e-18 +credit_bridge,2048,2,1e-08,0.0,7.414172031545497e-18,7.414172031545497e-18 +credit_bridge,2048,2,1e-07,0.0,7.414172031545497e-18,7.414172031545497e-18 +credit_bridge,2048,2,1e-06,0.0,7.414172031545497e-18,7.414172031545497e-18 +credit_bridge,2048,2,1e-05,0.0,7.414172031545497e-18,7.414172031545497e-18 +credit_bridge,2048,2,0.0001,0.0,7.414172031545497e-18,7.414172031545497e-18 +credit_bridge,2048,3,1e-08,0.0,9.573144035991564e-18,9.573144035991564e-18 +credit_bridge,2048,3,1e-07,0.0,9.573144035991564e-18,9.573144035991564e-18 +credit_bridge,2048,3,1e-06,0.0,9.573144035991564e-18,9.573144035991564e-18 +credit_bridge,2048,3,1e-05,0.0,9.573144035991564e-18,9.573144035991564e-18 +credit_bridge,2048,3,0.0001,0.0,9.573144035991564e-18,9.573144035991564e-18 +credit_bridge,3000,0,1e-08,0.0,8.525080835220574e-15,8.525080835220574e-15 +credit_bridge,3000,0,1e-07,0.0,8.525080835220574e-15,8.525080835220574e-15 +credit_bridge,3000,0,1e-06,0.0,8.525080835220574e-15,8.525080835220574e-15 +credit_bridge,3000,0,1e-05,0.0,8.525080835220574e-15,8.525080835220574e-15 +credit_bridge,3000,0,0.0001,0.0,8.525080835220574e-15,8.525080835220574e-15 +credit_bridge,3000,1,1e-08,0.0,1.0697184881138847e-17,1.0697184881138847e-17 +credit_bridge,3000,1,1e-07,0.0,1.0697184881138847e-17,1.0697184881138847e-17 +credit_bridge,3000,1,1e-06,0.0,1.0697184881138847e-17,1.0697184881138847e-17 +credit_bridge,3000,1,1e-05,0.0,1.0697184881138847e-17,1.0697184881138847e-17 +credit_bridge,3000,1,0.0001,0.0,1.0697184881138847e-17,1.0697184881138847e-17 +credit_bridge,3000,2,1e-08,0.0,6.892823666100781e-18,6.892823666100781e-18 +credit_bridge,3000,2,1e-07,0.0,6.892823666100781e-18,6.892823666100781e-18 +credit_bridge,3000,2,1e-06,0.0,6.892823666100781e-18,6.892823666100781e-18 +credit_bridge,3000,2,1e-05,0.0,6.892823666100781e-18,6.892823666100781e-18 +credit_bridge,3000,2,0.0001,0.0,6.892823666100781e-18,6.892823666100781e-18 +credit_bridge,3000,3,1e-08,0.0,8.036536934166107e-18,8.036536934166107e-18 +credit_bridge,3000,3,1e-07,0.0,8.036536934166107e-18,8.036536934166107e-18 +credit_bridge,3000,3,1e-06,0.0,8.036536934166107e-18,8.036536934166107e-18 +credit_bridge,3000,3,1e-05,0.0,8.036536934166107e-18,8.036536934166107e-18 +credit_bridge,3000,3,0.0001,0.0,8.036536934166107e-18,8.036536934166107e-18 +credit_bridge,4000,0,1e-08,0.0,5.779050842198968e-15,5.779050842198968e-15 +credit_bridge,4000,0,1e-07,0.0,5.779050842198968e-15,5.779050842198968e-15 +credit_bridge,4000,0,1e-06,0.0,5.779050842198968e-15,5.779050842198968e-15 +credit_bridge,4000,0,1e-05,0.0,5.779050842198968e-15,5.779050842198968e-15 +credit_bridge,4000,0,0.0001,0.0,5.779050842198968e-15,5.779050842198968e-15 +credit_bridge,4000,1,1e-08,0.0,8.463552381784356e-18,8.463552381784356e-18 +credit_bridge,4000,1,1e-07,0.0,8.463552381784356e-18,8.463552381784356e-18 +credit_bridge,4000,1,1e-06,0.0,8.463552381784356e-18,8.463552381784356e-18 +credit_bridge,4000,1,1e-05,0.0,8.463552381784356e-18,8.463552381784356e-18 +credit_bridge,4000,1,0.0001,0.0,8.463552381784356e-18,8.463552381784356e-18 +credit_bridge,4000,2,1e-08,0.0,7.17157815585717e-18,7.17157815585717e-18 +credit_bridge,4000,2,1e-07,0.0,7.17157815585717e-18,7.17157815585717e-18 +credit_bridge,4000,2,1e-06,0.0,7.17157815585717e-18,7.17157815585717e-18 +credit_bridge,4000,2,1e-05,0.0,7.17157815585717e-18,7.17157815585717e-18 +credit_bridge,4000,2,0.0001,0.0,7.17157815585717e-18,7.17157815585717e-18 +credit_bridge,4000,3,1e-08,0.0,5.8521589043860866e-18,5.8521589043860866e-18 +credit_bridge,4000,3,1e-07,0.0,5.8521589043860866e-18,5.8521589043860866e-18 +credit_bridge,4000,3,1e-06,0.0,5.8521589043860866e-18,5.8521589043860866e-18 +credit_bridge,4000,3,1e-05,0.0,5.8521589043860866e-18,5.8521589043860866e-18 +credit_bridge,4000,3,0.0001,0.0,5.8521589043860866e-18,5.8521589043860866e-18 +credit_bridge,5000,0,1e-08,0.0,7.448512335413962e-16,7.448512335413962e-16 +credit_bridge,5000,0,1e-07,0.0,7.448512335413962e-16,7.448512335413962e-16 +credit_bridge,5000,0,1e-06,0.0,7.448512335413962e-16,7.448512335413962e-16 +credit_bridge,5000,0,1e-05,0.0,7.448512335413962e-16,7.448512335413962e-16 +credit_bridge,5000,0,0.0001,0.0,7.448512335413962e-16,7.448512335413962e-16 +credit_bridge,5000,1,1e-08,0.0,4.8524974856356455e-18,4.8524974856356455e-18 +credit_bridge,5000,1,1e-07,0.0,4.8524974856356455e-18,4.8524974856356455e-18 +credit_bridge,5000,1,1e-06,0.0,4.8524974856356455e-18,4.8524974856356455e-18 +credit_bridge,5000,1,1e-05,0.0,4.8524974856356455e-18,4.8524974856356455e-18 +credit_bridge,5000,1,0.0001,0.0,4.8524974856356455e-18,4.8524974856356455e-18 +credit_bridge,5000,2,1e-08,0.0,4.791040447664793e-18,4.791040447664793e-18 +credit_bridge,5000,2,1e-07,0.0,4.791040447664793e-18,4.791040447664793e-18 +credit_bridge,5000,2,1e-06,0.0,4.791040447664793e-18,4.791040447664793e-18 +credit_bridge,5000,2,1e-05,0.0,4.791040447664793e-18,4.791040447664793e-18 +credit_bridge,5000,2,0.0001,0.0,4.791040447664793e-18,4.791040447664793e-18 +credit_bridge,5000,3,1e-08,0.0,4.664369317380873e-18,4.664369317380873e-18 +credit_bridge,5000,3,1e-07,0.0,4.664369317380873e-18,4.664369317380873e-18 +credit_bridge,5000,3,1e-06,0.0,4.664369317380873e-18,4.664369317380873e-18 +credit_bridge,5000,3,1e-05,0.0,4.664369317380873e-18,4.664369317380873e-18 +credit_bridge,5000,3,0.0001,0.0,4.664369317380873e-18,4.664369317380873e-18 +credit_bridge,6000,0,1e-08,0.0,4.370516366078003e-15,4.370516366078003e-15 +credit_bridge,6000,0,1e-07,0.0,4.370516366078003e-15,4.370516366078003e-15 +credit_bridge,6000,0,1e-06,0.0,4.370516366078003e-15,4.370516366078003e-15 +credit_bridge,6000,0,1e-05,0.0,4.370516366078003e-15,4.370516366078003e-15 +credit_bridge,6000,0,0.0001,0.0,4.370516366078003e-15,4.370516366078003e-15 +credit_bridge,6000,1,1e-08,0.0,1.1715800730035634e-17,1.1715800730035634e-17 +credit_bridge,6000,1,1e-07,0.0,1.1715800730035634e-17,1.1715800730035634e-17 +credit_bridge,6000,1,1e-06,0.0,1.1715800730035634e-17,1.1715800730035634e-17 +credit_bridge,6000,1,1e-05,0.0,1.1715800730035634e-17,1.1715800730035634e-17 +credit_bridge,6000,1,0.0001,0.0,1.1715800730035634e-17,1.1715800730035634e-17 +credit_bridge,6000,2,1e-08,0.0,9.63377306616925e-18,9.63377306616925e-18 +credit_bridge,6000,2,1e-07,0.0,9.63377306616925e-18,9.63377306616925e-18 +credit_bridge,6000,2,1e-06,0.0,9.63377306616925e-18,9.63377306616925e-18 +credit_bridge,6000,2,1e-05,0.0,9.63377306616925e-18,9.63377306616925e-18 +credit_bridge,6000,2,0.0001,0.0,9.63377306616925e-18,9.63377306616925e-18 +credit_bridge,6000,3,1e-08,0.0,9.388317972742102e-18,9.388317972742102e-18 +credit_bridge,6000,3,1e-07,0.0,9.388317972742102e-18,9.388317972742102e-18 +credit_bridge,6000,3,1e-06,0.0,9.388317972742102e-18,9.388317972742102e-18 +credit_bridge,6000,3,1e-05,0.0,9.388317972742102e-18,9.388317972742102e-18 +credit_bridge,6000,3,0.0001,0.0,9.388317972742102e-18,9.388317972742102e-18 diff --git a/results/confirmatory/T4_active_gamma_gpu1.csv b/results/confirmatory/T4_active_gamma_gpu1.csv new file mode 100644 index 0000000..4046b56 --- /dev/null +++ b/results/confirmatory/T4_active_gamma_gpu1.csv @@ -0,0 +1,101 @@ +method,seed,threshold,Gamma_active,Gamma_energy_weighted,mean_n_active,pct_active +bp,42,1e-08,nan,0.008410674568274684,0.0,0.0 +bp,123,1e-08,nan,0.00784901991651998,0.0,0.0 +bp,456,1e-08,nan,0.006583035346366685,0.0,0.0 +bp,789,1e-08,nan,0.008538903233346464,0.0,0.0 +bp,1024,1e-08,nan,0.00507547548717944,0.0,0.0 +bp,2048,1e-08,nan,0.011599486253741421,0.0,0.0 +bp,3000,1e-08,nan,0.0042974231253519605,0.0,0.0 +bp,4000,1e-08,nan,0.006007383163063016,0.0,0.0 +bp,5000,1e-08,nan,0.02396848893996247,0.0,0.0 +bp,6000,1e-08,nan,0.006664523954968009,0.0,0.0 +dfa,42,1e-08,nan,1.154343437255555e-07,0.0,0.0 +dfa,123,1e-08,nan,8.510892557758953e-08,0.0,0.0 +dfa,456,1e-08,nan,1.0844539793350438e-07,0.0,0.0 +dfa,789,1e-08,nan,1.4972250258491785e-07,0.0,0.0 +dfa,1024,1e-08,nan,1.3450313392413304e-07,0.0,0.0 +dfa,2048,1e-08,nan,6.095239875868572e-08,0.0,0.0 +dfa,3000,1e-08,nan,2.7933511957871546e-08,0.0,0.0 +dfa,4000,1e-08,nan,1.1400320738241886e-07,0.0,0.0 +dfa,5000,1e-08,nan,1.0320791846662267e-07,0.0,0.0 +dfa,6000,1e-08,nan,2.6408062272672387e-08,0.0,0.0 +bp,42,1e-07,nan,0.008410674568274684,0.0,0.0 +bp,123,1e-07,nan,0.00784901991651998,0.0,0.0 +bp,456,1e-07,nan,0.006583035346366685,0.0,0.0 +bp,789,1e-07,nan,0.008538903233346464,0.0,0.0 +bp,1024,1e-07,nan,0.00507547548717944,0.0,0.0 +bp,2048,1e-07,nan,0.011599486253741421,0.0,0.0 +bp,3000,1e-07,nan,0.0042974231253519605,0.0,0.0 +bp,4000,1e-07,nan,0.006007383163063016,0.0,0.0 +bp,5000,1e-07,nan,0.02396848893996247,0.0,0.0 +bp,6000,1e-07,nan,0.006664523954968009,0.0,0.0 +dfa,42,1e-07,nan,1.154343437255555e-07,0.0,0.0 +dfa,123,1e-07,nan,8.510892557758953e-08,0.0,0.0 +dfa,456,1e-07,nan,1.0844539793350438e-07,0.0,0.0 +dfa,789,1e-07,nan,1.4972250258491785e-07,0.0,0.0 +dfa,1024,1e-07,nan,1.3450313392413304e-07,0.0,0.0 +dfa,2048,1e-07,nan,6.095239875868572e-08,0.0,0.0 +dfa,3000,1e-07,nan,2.7933511957871546e-08,0.0,0.0 +dfa,4000,1e-07,nan,1.1400320738241886e-07,0.0,0.0 +dfa,5000,1e-07,nan,1.0320791846662267e-07,0.0,0.0 +dfa,6000,1e-07,nan,2.6408062272672387e-08,0.0,0.0 +bp,42,1e-06,nan,0.008410674568274684,0.0,0.0 +bp,123,1e-06,nan,0.00784901991651998,0.0,0.0 +bp,456,1e-06,nan,0.006583035346366685,0.0,0.0 +bp,789,1e-06,nan,0.008538903233346464,0.0,0.0 +bp,1024,1e-06,nan,0.00507547548717944,0.0,0.0 +bp,2048,1e-06,nan,0.011599486253741421,0.0,0.0 +bp,3000,1e-06,nan,0.0042974231253519605,0.0,0.0 +bp,4000,1e-06,nan,0.006007383163063016,0.0,0.0 +bp,5000,1e-06,nan,0.02396848893996247,0.0,0.0 +bp,6000,1e-06,nan,0.006664523954968009,0.0,0.0 +dfa,42,1e-06,nan,1.154343437255555e-07,0.0,0.0 +dfa,123,1e-06,nan,8.510892557758953e-08,0.0,0.0 +dfa,456,1e-06,nan,1.0844539793350438e-07,0.0,0.0 +dfa,789,1e-06,nan,1.4972250258491785e-07,0.0,0.0 +dfa,1024,1e-06,nan,1.3450313392413304e-07,0.0,0.0 +dfa,2048,1e-06,nan,6.095239875868572e-08,0.0,0.0 +dfa,3000,1e-06,nan,2.7933511957871546e-08,0.0,0.0 +dfa,4000,1e-06,nan,1.1400320738241886e-07,0.0,0.0 +dfa,5000,1e-06,nan,1.0320791846662267e-07,0.0,0.0 +dfa,6000,1e-06,nan,2.6408062272672387e-08,0.0,0.0 +bp,42,1e-05,nan,0.008410674568274684,0.0,0.0 +bp,123,1e-05,nan,0.00784901991651998,0.0,0.0 +bp,456,1e-05,nan,0.006583035346366685,0.0,0.0 +bp,789,1e-05,nan,0.008538903233346464,0.0,0.0 +bp,1024,1e-05,nan,0.00507547548717944,0.0,0.0 +bp,2048,1e-05,nan,0.011599486253741421,0.0,0.0 +bp,3000,1e-05,nan,0.0042974231253519605,0.0,0.0 +bp,4000,1e-05,nan,0.006007383163063016,0.0,0.0 +bp,5000,1e-05,nan,0.02396848893996247,0.0,0.0 +bp,6000,1e-05,nan,0.006664523954968009,0.0,0.0 +dfa,42,1e-05,nan,1.154343437255555e-07,0.0,0.0 +dfa,123,1e-05,nan,8.510892557758953e-08,0.0,0.0 +dfa,456,1e-05,nan,1.0844539793350438e-07,0.0,0.0 +dfa,789,1e-05,nan,1.4972250258491785e-07,0.0,0.0 +dfa,1024,1e-05,nan,1.3450313392413304e-07,0.0,0.0 +dfa,2048,1e-05,nan,6.095239875868572e-08,0.0,0.0 +dfa,3000,1e-05,nan,2.7933511957871546e-08,0.0,0.0 +dfa,4000,1e-05,nan,1.1400320738241886e-07,0.0,0.0 +dfa,5000,1e-05,nan,1.0320791846662267e-07,0.0,0.0 +dfa,6000,1e-05,nan,2.6408062272672387e-08,0.0,0.0 +bp,42,0.0001,nan,0.008410674568274684,0.0,0.0 +bp,123,0.0001,nan,0.00784901991651998,0.0,0.0 +bp,456,0.0001,nan,0.006583035346366685,0.0,0.0 +bp,789,0.0001,nan,0.008538903233346464,0.0,0.0 +bp,1024,0.0001,nan,0.00507547548717944,0.0,0.0 +bp,2048,0.0001,nan,0.011599486253741421,0.0,0.0 +bp,3000,0.0001,nan,0.0042974231253519605,0.0,0.0 +bp,4000,0.0001,nan,0.006007383163063016,0.0,0.0 +bp,5000,0.0001,nan,0.02396848893996247,0.0,0.0 +bp,6000,0.0001,nan,0.006664523954968009,0.0,0.0 +dfa,42,0.0001,nan,1.154343437255555e-07,0.0,0.0 +dfa,123,0.0001,nan,8.510892557758953e-08,0.0,0.0 +dfa,456,0.0001,nan,1.0844539793350438e-07,0.0,0.0 +dfa,789,0.0001,nan,1.4972250258491785e-07,0.0,0.0 +dfa,1024,0.0001,nan,1.3450313392413304e-07,0.0,0.0 +dfa,2048,0.0001,nan,6.095239875868572e-08,0.0,0.0 +dfa,3000,0.0001,nan,2.7933511957871546e-08,0.0,0.0 +dfa,4000,0.0001,nan,1.1400320738241886e-07,0.0,0.0 +dfa,5000,0.0001,nan,1.0320791846662267e-07,0.0,0.0 +dfa,6000,0.0001,nan,2.6408062272672387e-08,0.0,0.0 diff --git a/results/confirmatory/element_grad_concentration_gpu1.csv b/results/confirmatory/element_grad_concentration_gpu1.csv new file mode 100644 index 0000000..d9e5f64 --- /dev/null +++ b/results/confirmatory/element_grad_concentration_gpu1.csv @@ -0,0 +1,49 @@ +method,seed,layer,mean_norm,mean_r_inf,mean_pr,topk1_mean,topk5_mean,mean_eff_dim +bp,42,0,0.00013205190771259367,0.19995930790901184,0.320745050907135,0.07267192006111145,0.27676719427108765,0.6284974813461304 +bp,42,1,0.00014113880752120167,0.19624419510364532,0.3271224796772003,0.07037509977817535,0.27253925800323486,0.6316149234771729 +bp,42,2,0.00014439549704547971,0.1940011978149414,0.3327023983001709,0.06852715462446213,0.2683585584163666,0.635016679763794 +bp,42,3,0.0001360554015263915,0.19137907028198242,0.34159576892852783,0.06657430529594421,0.2615853250026703,0.6404645442962646 +bp,123,0,0.0001410204276908189,0.20094770193099976,0.3183582127094269,0.07336939871311188,0.27868813276290894,0.626787543296814 +bp,123,1,0.0001497487974120304,0.1956033706665039,0.3267548978328705,0.069853775203228,0.27310454845428467,0.6306979060173035 +bp,123,2,0.00015584431821480393,0.1955823302268982,0.329276442527771,0.06937956809997559,0.2705806493759155,0.6324625015258789 +bp,123,3,0.00014744212967343628,0.19288593530654907,0.3365374803543091,0.0673883780837059,0.2647479176521301,0.6369346380233765 +bp,456,0,0.00013993130414746702,0.2073223739862442,0.30707576870918274,0.07792861014604568,0.2867095470428467,0.6226484775543213 +bp,456,1,0.00014768482651561499,0.1996297836303711,0.3194756805896759,0.07266608625650406,0.2778666615486145,0.6277467012405396 +bp,456,2,0.00015311191964428872,0.19662046432495117,0.3266047239303589,0.07031284272670746,0.2727530002593994,0.6317288279533386 +bp,456,3,0.00014388732961378992,0.19098828732967377,0.3372885584831238,0.06676372140645981,0.2657164931297302,0.6366862058639526 +dfa,42,0,1.4626327526912064e-07,0.2192157804965973,0.2556527256965637,0.0891900509595871,0.34188225865364075,0.5702722072601318 +dfa,42,1,1.190095022529647e-09,0.6395785808563232,0.018672918900847435,0.6006988286972046,0.9294781684875488,0.11252760142087936 +dfa,42,2,1.1846384984082192e-09,0.6420882940292358,0.018416907638311386,0.6043064594268799,0.9321770071983337,0.10781284421682358 +dfa,42,3,1.1840007863028745e-09,0.6420532464981079,0.018423013389110565,0.6042190790176392,0.9319357872009277,0.10818937420845032 +dfa,123,0,1.7059814183539856e-07,0.22954490780830383,0.25190770626068115,0.09639231860637665,0.344560831785202,0.5766515731811523 +dfa,123,1,7.704760163207425e-10,0.5346307158470154,0.035571008920669556,0.42611783742904663,0.7804778814315796,0.22384336590766907 +dfa,123,2,7.577615201981303e-10,0.5401381254196167,0.03358124569058418,0.4356116056442261,0.7963865995407104,0.2042352557182312 +dfa,123,3,7.576308469481319e-10,0.5403565168380737,0.03355948626995087,0.43586090207099915,0.7965404987335205,0.20404565334320068 +dfa,456,0,1.321748470672901e-07,0.1959579437971115,0.3197200298309326,0.07280920445919037,0.2877272665500641,0.6280426383018494 +dfa,456,1,5.463409724626445e-10,0.5662611722946167,0.028242507949471474,0.4978998899459839,0.8235111236572266,0.18554803729057312 +dfa,456,2,5.38817768180877e-10,0.5703938007354736,0.02750721015036106,0.5034178495407104,0.8328064680099487,0.1696137636899948 +dfa,456,3,5.386884271985082e-10,0.5700349807739258,0.02755354717373848,0.5032708048820496,0.8326113820075989,0.16910555958747864 +state_bridge,42,0,3.023951649083756e-06,0.18504567444324493,0.32861703634262085,0.06476573646068573,0.2713982164859772,0.6255342960357666 +state_bridge,42,1,4.968894184997907e-10,0.2943871319293976,0.12534531950950623,0.1579325646162033,0.5166130065917969,0.40138113498687744 +state_bridge,42,2,4.896933969433803e-10,0.29881954193115234,0.12269431352615356,0.161039799451828,0.5214621424674988,0.39810389280319214 +state_bridge,42,3,4.669763464804078e-10,0.3080902695655823,0.11231986433267593,0.17093375325202942,0.5439932346343994,0.372189462184906 +state_bridge,123,0,6.046858743502526e-06,0.1817636489868164,0.3603183925151825,0.06420911848545074,0.26240652799606323,0.6442065238952637 +state_bridge,123,1,6.8831090827004e-10,0.27536946535110474,0.17245665192604065,0.1349649429321289,0.43179115653038025,0.5045968294143677 +state_bridge,123,2,6.79806044789899e-10,0.27179133892059326,0.1734859049320221,0.1320682168006897,0.4311187267303467,0.5061776638031006 +state_bridge,123,3,6.728649859510938e-10,0.2743262052536011,0.16675016283988953,0.13534706830978394,0.44226858019828796,0.4961113929748535 +state_bridge,456,0,7.66168705013115e-06,0.2138153612613678,0.25556856393814087,0.08795160055160522,0.3388819098472595,0.5581467151641846 +state_bridge,456,1,5.046121742680043e-09,0.3826007843017578,0.14723747968673706,0.222370445728302,0.46178531646728516,0.5120208263397217 +state_bridge,456,2,6.946614394820472e-10,0.509243905544281,0.04666562378406525,0.3711031675338745,0.7174608111381531,0.28527751564979553 +state_bridge,456,3,6.938281060797635e-10,0.5089173316955566,0.04689159244298935,0.3710116147994995,0.7176994681358337,0.28476428985595703 +credit_bridge,42,0,3.2832352303557855e-07,0.1986602246761322,0.2922472357749939,0.07348651438951492,0.30311092734336853,0.591210126876831 +credit_bridge,42,1,3.779444812668231e-10,0.3539695143699646,0.1457032859325409,0.20796863734722137,0.47020894289016724,0.49256768822669983 +credit_bridge,42,2,2.4595092629198234e-10,0.4228324890136719,0.07622009515762329,0.27860307693481445,0.5916883945465088,0.3799220323562622 +credit_bridge,42,3,2.455395331502075e-10,0.4239165782928467,0.07530638575553894,0.27949607372283936,0.5938265323638916,0.376716673374176 +credit_bridge,123,0,3.767189014070027e-07,0.20776748657226562,0.2798425555229187,0.07951992750167847,0.3096029758453369,0.5842440128326416 +credit_bridge,123,1,1.1916050368654396e-09,0.35956278443336487,0.12112382054328918,0.20661751925945282,0.5058196783065796,0.4451233148574829 +credit_bridge,123,2,1.147270944912293e-09,0.3667011559009552,0.10823968052864075,0.2142077386379242,0.527270495891571,0.4174838662147522 +credit_bridge,123,3,1.1412368827734554e-09,0.3674423396587372,0.10674013197422028,0.21544697880744934,0.5311102867126465,0.41357749700546265 +credit_bridge,456,0,2.3464230025638244e-07,0.20265212655067444,0.29567617177963257,0.07575372606515884,0.3008849024772644,0.5979419350624084 +credit_bridge,456,1,6.680229702737961e-10,0.4358518719673157,0.08221361041069031,0.2807537019252777,0.5842965841293335,0.37426555156707764 +credit_bridge,456,2,6.499010218874446e-10,0.4448775351047516,0.07321283966302872,0.2947343587875366,0.6133072376251221,0.3301146328449249 +credit_bridge,456,3,6.488426462780694e-10,0.4451141953468323,0.07312416285276413,0.2950716018676758,0.6131926774978638,0.33010828495025635 diff --git a/results/deeper_L_multiseed_scan.log b/results/deeper_L_multiseed_scan.log new file mode 100644 index 0000000..560f5af --- /dev/null +++ b/results/deeper_L_multiseed_scan.log @@ -0,0 +1,1090 @@ +=== DEEPER L MULTI-SEED SCAN: FA+DFA at d=512 === +Start: Sun Apr 26 09:06:47 AM CDT 2026 + +--- L=6, seeds 0-9 --- + L=6 seed=0 (Sun Apr 26 09:06:47 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 0 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0754, train=0.2320, test=0.2527 + [DFA] Epoch 10: loss=2.0139, train=0.2619, test=0.2897 + [DFA] Epoch 20: loss=2.0040, train=0.2690, test=0.2954 + [DFA] Epoch 30: loss=1.9986, train=0.2736, test=0.2876 + [DFA] Epoch 40: loss=1.9954, train=0.2758, test=0.3052 + [DFA] Epoch 50: loss=1.9963, train=0.2792, test=0.2894 + [DFA] Epoch 60: loss=1.9962, train=0.2786, test=0.3100 + [DFA] Epoch 70: loss=1.9948, train=0.2789, test=0.3016 + [DFA] Epoch 80: loss=1.9907, train=0.2809, test=0.3006 + [DFA] Epoch 90: loss=1.9898, train=0.2826, test=0.3051 + [DFA] Epoch 100: loss=1.9902, train=0.2837, test=0.3053 + Final test acc: 0.3053 + +--- FA --- + [FA] Epoch 1: loss=2.0268, train=0.2612, test=0.3205 + [FA] Epoch 10: loss=1.8316, train=0.3422, test=0.3736 + [FA] Epoch 20: loss=1.7763, train=0.3640, test=0.3927 + [FA] Epoch 30: loss=1.7367, train=0.3770, test=0.4106 + [FA] Epoch 40: loss=1.7089, train=0.3868, test=0.4180 + [FA] Epoch 50: loss=1.6936, train=0.3950, test=0.4171 + [FA] Epoch 60: loss=1.6784, train=0.4007, test=0.4270 + [FA] Epoch 70: loss=1.6704, train=0.4039, test=0.4255 + [FA] Epoch 80: loss=1.6650, train=0.4050, test=0.4330 + [FA] Epoch 90: loss=1.6637, train=0.4082, test=0.4337 + [FA] Epoch 100: loss=1.6589, train=0.4098, test=0.4340 + Final test acc: 0.4340 + +All results saved to results/fa_dfa_d512_L6_seed0/results_cifar10.json + L=6 seed=1 (Sun Apr 26 09:23:02 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 1 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0749, train=0.2331, test=0.2476 + [DFA] Epoch 10: loss=2.0192, train=0.2571, test=0.2900 + [DFA] Epoch 20: loss=2.0100, train=0.2664, test=0.2811 + [DFA] Epoch 30: loss=2.0046, train=0.2714, test=0.2892 + [DFA] Epoch 40: loss=2.0057, train=0.2721, test=0.2870 + [DFA] Epoch 50: loss=2.0049, train=0.2737, test=0.3065 + [DFA] Epoch 60: loss=2.0012, train=0.2747, test=0.2887 + [DFA] Epoch 70: loss=2.0005, train=0.2751, test=0.2941 + [DFA] Epoch 80: loss=2.0006, train=0.2763, test=0.2989 + [DFA] Epoch 90: loss=1.9995, train=0.2769, test=0.3003 + [DFA] Epoch 100: loss=2.0021, train=0.2756, test=0.2969 + Final test acc: 0.2969 + +--- FA --- + [FA] Epoch 1: loss=2.0533, train=0.2428, test=0.2926 + [FA] Epoch 10: loss=1.8535, train=0.3363, test=0.3756 + [FA] Epoch 20: loss=1.8062, train=0.3571, test=0.3875 + [FA] Epoch 30: loss=1.7723, train=0.3662, test=0.3939 + [FA] Epoch 40: loss=1.7430, train=0.3759, test=0.3990 + [FA] Epoch 50: loss=1.7342, train=0.3794, test=0.4118 + [FA] Epoch 60: loss=1.7145, train=0.3860, test=0.4059 + [FA] Epoch 70: loss=1.7081, train=0.3908, test=0.4132 + [FA] Epoch 80: loss=1.7039, train=0.3921, test=0.4148 + [FA] Epoch 90: loss=1.6982, train=0.3950, test=0.4153 + [FA] Epoch 100: loss=1.7012, train=0.3941, test=0.4144 + Final test acc: 0.4144 + +All results saved to results/fa_dfa_d512_L6_seed1/results_cifar10.json + L=6 seed=2 (Sun Apr 26 09:38:43 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 2 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0705, train=0.2380, test=0.2537 + [DFA] Epoch 10: loss=2.0288, train=0.2563, test=0.2663 + [DFA] Epoch 20: loss=2.0188, train=0.2614, test=0.2833 + [DFA] Epoch 30: loss=2.0179, train=0.2628, test=0.2877 + [DFA] Epoch 40: loss=2.0204, train=0.2651, test=0.3036 + [DFA] Epoch 50: loss=2.0163, train=0.2661, test=0.2882 + [DFA] Epoch 60: loss=2.0160, train=0.2661, test=0.2978 + [DFA] Epoch 70: loss=2.0176, train=0.2666, test=0.2931 + [DFA] Epoch 80: loss=2.0166, train=0.2675, test=0.2959 + [DFA] Epoch 90: loss=2.0153, train=0.2665, test=0.2963 + [DFA] Epoch 100: loss=2.0165, train=0.2695, test=0.2950 + Final test acc: 0.2950 + +--- FA --- + [FA] Epoch 1: loss=2.0383, train=0.2502, test=0.3027 + [FA] Epoch 10: loss=1.8441, train=0.3396, test=0.3702 + [FA] Epoch 20: loss=1.8158, train=0.3501, test=0.3714 + [FA] Epoch 30: loss=1.7969, train=0.3584, test=0.3776 + [FA] Epoch 40: loss=1.7879, train=0.3628, test=0.3924 + [FA] Epoch 50: loss=1.7698, train=0.3673, test=0.3828 + [FA] Epoch 60: loss=1.7611, train=0.3710, test=0.3979 + [FA] Epoch 70: loss=1.7502, train=0.3763, test=0.3982 + [FA] Epoch 80: loss=1.7518, train=0.3746, test=0.4012 + [FA] Epoch 90: loss=1.7454, train=0.3783, test=0.4024 + [FA] Epoch 100: loss=1.7443, train=0.3785, test=0.4016 + Final test acc: 0.4016 + +All results saved to results/fa_dfa_d512_L6_seed2/results_cifar10.json + L=6 seed=3 (Sun Apr 26 09:54:20 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 3 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0551, train=0.2424, test=0.2839 + [DFA] Epoch 10: loss=2.0036, train=0.2661, test=0.2742 + [DFA] Epoch 20: loss=1.9931, train=0.2699, test=0.2904 + [DFA] Epoch 30: loss=1.9856, train=0.2757, test=0.2969 + [DFA] Epoch 40: loss=1.9860, train=0.2784, test=0.2938 + [DFA] Epoch 50: loss=1.9833, train=0.2789, test=0.3045 + [DFA] Epoch 60: loss=1.9813, train=0.2807, test=0.2941 + [DFA] Epoch 70: loss=1.9833, train=0.2824, test=0.3029 + [DFA] Epoch 80: loss=1.9830, train=0.2828, test=0.3035 + [DFA] Epoch 90: loss=1.9786, train=0.2843, test=0.3041 + [DFA] Epoch 100: loss=1.9818, train=0.2838, test=0.3046 + Final test acc: 0.3046 + +--- FA --- + [FA] Epoch 1: loss=2.0187, train=0.2604, test=0.3158 + [FA] Epoch 10: loss=1.8322, train=0.3433, test=0.3646 + [FA] Epoch 20: loss=1.8053, train=0.3555, test=0.3793 + [FA] Epoch 30: loss=1.7969, train=0.3584, test=0.3885 + [FA] Epoch 40: loss=1.7757, train=0.3651, test=0.3996 + [FA] Epoch 50: loss=1.7556, train=0.3750, test=0.4063 + [FA] Epoch 60: loss=1.7459, train=0.3774, test=0.4058 + [FA] Epoch 70: loss=1.7338, train=0.3837, test=0.4081 + [FA] Epoch 80: loss=1.7303, train=0.3837, test=0.4096 + [FA] Epoch 90: loss=1.7250, train=0.3865, test=0.4112 + [FA] Epoch 100: loss=1.7252, train=0.3872, test=0.4118 + Final test acc: 0.4118 + +All results saved to results/fa_dfa_d512_L6_seed3/results_cifar10.json + L=6 seed=4 (Sun Apr 26 10:09:44 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 4 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0741, train=0.2323, test=0.2469 + [DFA] Epoch 10: loss=2.0382, train=0.2467, test=0.2707 + [DFA] Epoch 20: loss=2.0274, train=0.2540, test=0.2671 + [DFA] Epoch 30: loss=2.0237, train=0.2569, test=0.2758 + [DFA] Epoch 40: loss=2.0224, train=0.2618, test=0.2838 + [DFA] Epoch 50: loss=2.0164, train=0.2652, test=0.2812 + [DFA] Epoch 60: loss=2.0164, train=0.2629, test=0.2797 + [DFA] Epoch 70: loss=2.0141, train=0.2656, test=0.2787 + [DFA] Epoch 80: loss=2.0132, train=0.2666, test=0.2837 + [DFA] Epoch 90: loss=2.0100, train=0.2675, test=0.2809 + [DFA] Epoch 100: loss=2.0116, train=0.2658, test=0.2837 + Final test acc: 0.2837 + +--- FA --- + [FA] Epoch 1: loss=2.0380, train=0.2477, test=0.2942 + [FA] Epoch 10: loss=1.8578, train=0.3313, test=0.3670 + [FA] Epoch 20: loss=1.8016, train=0.3536, test=0.3779 + [FA] Epoch 30: loss=1.7595, train=0.3687, test=0.3971 + [FA] Epoch 40: loss=1.7326, train=0.3806, test=0.4089 + [FA] Epoch 50: loss=1.7184, train=0.3869, test=0.4079 + [FA] Epoch 60: loss=1.7024, train=0.3918, test=0.4186 + [FA] Epoch 70: loss=1.6926, train=0.3963, test=0.4170 + [FA] Epoch 80: loss=1.6852, train=0.3995, test=0.4206 + [FA] Epoch 90: loss=1.6837, train=0.4019, test=0.4186 + [FA] Epoch 100: loss=1.6809, train=0.4006, test=0.4195 + Final test acc: 0.4195 + +All results saved to results/fa_dfa_d512_L6_seed4/results_cifar10.json + L=6 seed=5 (Sun Apr 26 10:24:33 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 5 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0603, train=0.2425, test=0.2458 + [DFA] Epoch 10: loss=2.0115, train=0.2650, test=0.3025 + [DFA] Epoch 20: loss=1.9990, train=0.2713, test=0.2873 + [DFA] Epoch 30: loss=1.9938, train=0.2750, test=0.2974 + [DFA] Epoch 40: loss=1.9885, train=0.2802, test=0.2975 + [DFA] Epoch 50: loss=1.9872, train=0.2804, test=0.2910 + [DFA] Epoch 60: loss=1.9857, train=0.2820, test=0.3037 + [DFA] Epoch 70: loss=1.9872, train=0.2816, test=0.3060 + [DFA] Epoch 80: loss=1.9859, train=0.2824, test=0.3100 + [DFA] Epoch 90: loss=1.9870, train=0.2825, test=0.3028 + [DFA] Epoch 100: loss=1.9847, train=0.2843, test=0.3022 + Final test acc: 0.3022 + +--- FA --- + [FA] Epoch 1: loss=2.0246, train=0.2562, test=0.2956 + [FA] Epoch 10: loss=1.8641, train=0.3305, test=0.3594 + [FA] Epoch 20: loss=1.8319, train=0.3441, test=0.3755 + [FA] Epoch 30: loss=1.7993, train=0.3558, test=0.3790 + [FA] Epoch 40: loss=1.7832, train=0.3645, test=0.3943 + [FA] Epoch 50: loss=1.7677, train=0.3718, test=0.3982 + [FA] Epoch 60: loss=1.7570, train=0.3721, test=0.4016 + [FA] Epoch 70: loss=1.7503, train=0.3798, test=0.4044 + [FA] Epoch 80: loss=1.7434, train=0.3807, test=0.4059 + [FA] Epoch 90: loss=1.7394, train=0.3816, test=0.4084 + [FA] Epoch 100: loss=1.7398, train=0.3813, test=0.4058 + Final test acc: 0.4058 + +All results saved to results/fa_dfa_d512_L6_seed5/results_cifar10.json + L=6 seed=6 (Sun Apr 26 10:40:00 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 6 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0581, train=0.2431, test=0.2564 + [DFA] Epoch 10: loss=2.0129, train=0.2628, test=0.2827 + [DFA] Epoch 20: loss=2.0026, train=0.2685, test=0.2773 + [DFA] Epoch 30: loss=2.0049, train=0.2688, test=0.2826 + [DFA] Epoch 40: loss=1.9997, train=0.2737, test=0.2871 + [DFA] Epoch 50: loss=1.9980, train=0.2745, test=0.2988 + [DFA] Epoch 60: loss=1.9955, train=0.2780, test=0.3071 + [DFA] Epoch 70: loss=1.9951, train=0.2780, test=0.2975 + [DFA] Epoch 80: loss=1.9925, train=0.2789, test=0.3030 + [DFA] Epoch 90: loss=1.9924, train=0.2799, test=0.2977 + [DFA] Epoch 100: loss=1.9936, train=0.2779, test=0.2994 + Final test acc: 0.2994 + +--- FA --- + [FA] Epoch 1: loss=2.0281, train=0.2600, test=0.3013 + [FA] Epoch 10: loss=1.8386, train=0.3413, test=0.3632 + [FA] Epoch 20: loss=1.8134, train=0.3512, test=0.3692 + [FA] Epoch 30: loss=1.8012, train=0.3546, test=0.3809 + [FA] Epoch 40: loss=1.7733, train=0.3677, test=0.3989 + [FA] Epoch 50: loss=1.7604, train=0.3721, test=0.3971 + [FA] Epoch 60: loss=1.7482, train=0.3771, test=0.4060 + [FA] Epoch 70: loss=1.7369, train=0.3823, test=0.4024 + [FA] Epoch 80: loss=1.7315, train=0.3841, test=0.4131 + [FA] Epoch 90: loss=1.7255, train=0.3841, test=0.4105 + [FA] Epoch 100: loss=1.7224, train=0.3860, test=0.4117 + Final test acc: 0.4117 + +All results saved to results/fa_dfa_d512_L6_seed6/results_cifar10.json + L=6 seed=7 (Sun Apr 26 10:55:28 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 7 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0645, train=0.2374, test=0.2747 + [DFA] Epoch 10: loss=2.0061, train=0.2647, test=0.2898 + [DFA] Epoch 20: loss=1.9941, train=0.2695, test=0.2934 + [DFA] Epoch 30: loss=1.9881, train=0.2746, test=0.2942 + [DFA] Epoch 40: loss=1.9842, train=0.2784, test=0.2966 + [DFA] Epoch 50: loss=1.9830, train=0.2793, test=0.2902 + [DFA] Epoch 60: loss=1.9781, train=0.2808, test=0.3070 + [DFA] Epoch 70: loss=1.9795, train=0.2827, test=0.3080 + [DFA] Epoch 80: loss=1.9781, train=0.2831, test=0.3008 + [DFA] Epoch 90: loss=1.9748, train=0.2839, test=0.3084 + [DFA] Epoch 100: loss=1.9758, train=0.2823, test=0.3065 + Final test acc: 0.3065 + +--- FA --- + [FA] Epoch 1: loss=2.0354, train=0.2520, test=0.2994 + [FA] Epoch 10: loss=1.8603, train=0.3285, test=0.3638 + [FA] Epoch 20: loss=1.7985, train=0.3575, test=0.3897 + [FA] Epoch 30: loss=1.7541, train=0.3725, test=0.3938 + [FA] Epoch 40: loss=1.7245, train=0.3821, test=0.4058 + [FA] Epoch 50: loss=1.7039, train=0.3870, test=0.4140 + [FA] Epoch 60: loss=1.6908, train=0.3948, test=0.4167 + [FA] Epoch 70: loss=1.6804, train=0.3976, test=0.4199 + [FA] Epoch 80: loss=1.6716, train=0.3999, test=0.4257 + [FA] Epoch 90: loss=1.6675, train=0.4033, test=0.4253 + [FA] Epoch 100: loss=1.6672, train=0.4031, test=0.4253 + Final test acc: 0.4253 + +All results saved to results/fa_dfa_d512_L6_seed7/results_cifar10.json + L=6 seed=8 (Sun Apr 26 11:09:51 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 8 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0808, train=0.2286, test=0.2500 + [DFA] Epoch 10: loss=2.0191, train=0.2514, test=0.2806 + [DFA] Epoch 20: loss=2.0052, train=0.2625, test=0.2895 + [DFA] Epoch 30: loss=1.9980, train=0.2691, test=0.2892 + [DFA] Epoch 40: loss=1.9981, train=0.2688, test=0.2929 + [DFA] Epoch 50: loss=1.9960, train=0.2724, test=0.3026 + [DFA] Epoch 60: loss=1.9889, train=0.2736, test=0.2928 + [DFA] Epoch 70: loss=1.9906, train=0.2766, test=0.2874 + [DFA] Epoch 80: loss=1.9888, train=0.2756, test=0.2903 + [DFA] Epoch 90: loss=1.9869, train=0.2772, test=0.2956 + [DFA] Epoch 100: loss=1.9873, train=0.2772, test=0.2937 + Final test acc: 0.2937 + +--- FA --- + [FA] Epoch 1: loss=2.0414, train=0.2477, test=0.2817 + [FA] Epoch 10: loss=1.8438, train=0.3378, test=0.3627 + [FA] Epoch 20: loss=1.8157, train=0.3483, test=0.3739 + [FA] Epoch 30: loss=1.7973, train=0.3567, test=0.3844 + [FA] Epoch 40: loss=1.7774, train=0.3641, test=0.3987 + [FA] Epoch 50: loss=1.7612, train=0.3712, test=0.4044 + [FA] Epoch 60: loss=1.7405, train=0.3777, test=0.3962 + [FA] Epoch 70: loss=1.7277, train=0.3838, test=0.4041 + [FA] Epoch 80: loss=1.7220, train=0.3866, test=0.4081 + [FA] Epoch 90: loss=1.7148, train=0.3886, test=0.4068 + [FA] Epoch 100: loss=1.7179, train=0.3903, test=0.4080 + Final test acc: 0.4080 + +All results saved to results/fa_dfa_d512_L6_seed8/results_cifar10.json + L=6 seed=9 (Sun Apr 26 11:24:34 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 9 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0732, train=0.2346, test=0.2428 + [DFA] Epoch 10: loss=2.0163, train=0.2613, test=0.3009 + [DFA] Epoch 20: loss=2.0058, train=0.2651, test=0.2964 + [DFA] Epoch 30: loss=2.0001, train=0.2700, test=0.3069 + [DFA] Epoch 40: loss=1.9955, train=0.2739, test=0.3043 + [DFA] Epoch 50: loss=1.9937, train=0.2752, test=0.2967 + [DFA] Epoch 60: loss=1.9934, train=0.2783, test=0.3100 + [DFA] Epoch 70: loss=1.9902, train=0.2783, test=0.3044 + [DFA] Epoch 80: loss=1.9883, train=0.2813, test=0.3051 + [DFA] Epoch 90: loss=1.9886, train=0.2779, test=0.3041 + [DFA] Epoch 100: loss=1.9877, train=0.2784, test=0.3041 + Final test acc: 0.3041 + +--- FA --- + [FA] Epoch 1: loss=2.0333, train=0.2513, test=0.2784 + [FA] Epoch 10: loss=1.8637, train=0.3296, test=0.3631 + [FA] Epoch 20: loss=1.8369, train=0.3416, test=0.3696 + [FA] Epoch 30: loss=1.8113, train=0.3514, test=0.3800 + [FA] Epoch 40: loss=1.7897, train=0.3624, test=0.3793 + [FA] Epoch 50: loss=1.7690, train=0.3689, test=0.3924 + [FA] Epoch 60: loss=1.7552, train=0.3755, test=0.3959 + [FA] Epoch 70: loss=1.7418, train=0.3792, test=0.4016 + [FA] Epoch 80: loss=1.7311, train=0.3842, test=0.4000 + [FA] Epoch 90: loss=1.7330, train=0.3840, test=0.4016 + [FA] Epoch 100: loss=1.7305, train=0.3839, test=0.4025 + Final test acc: 0.4025 + +All results saved to results/fa_dfa_d512_L6_seed9/results_cifar10.json + +--- L=8, seeds 0-9 --- + L=8 seed=0 (Sun Apr 26 11:40:06 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 0 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0686, train=0.2354, test=0.2555 + [DFA] Epoch 10: loss=2.0237, train=0.2579, test=0.2828 + [DFA] Epoch 20: loss=2.0088, train=0.2678, test=0.3013 + [DFA] Epoch 30: loss=2.0052, train=0.2715, test=0.2935 + [DFA] Epoch 40: loss=2.0015, train=0.2727, test=0.3020 + [DFA] Epoch 50: loss=1.9974, train=0.2770, test=0.2890 + [DFA] Epoch 60: loss=1.9978, train=0.2760, test=0.3057 + [DFA] Epoch 70: loss=1.9949, train=0.2789, test=0.3065 + [DFA] Epoch 80: loss=1.9941, train=0.2785, test=0.3049 + [DFA] Epoch 90: loss=1.9958, train=0.2788, test=0.3062 + [DFA] Epoch 100: loss=1.9940, train=0.2811, test=0.3055 + Final test acc: 0.3055 + +--- FA --- + [FA] Epoch 1: loss=2.0311, train=0.2512, test=0.2945 + [FA] Epoch 10: loss=1.8528, train=0.3327, test=0.3602 + [FA] Epoch 20: loss=1.8045, train=0.3541, test=0.3917 + [FA] Epoch 30: loss=1.7622, train=0.3712, test=0.3840 + [FA] Epoch 40: loss=1.7380, train=0.3761, test=0.4008 + [FA] Epoch 50: loss=1.7170, train=0.3861, test=0.4089 + [FA] Epoch 60: loss=1.7056, train=0.3913, test=0.4115 + [FA] Epoch 70: loss=1.6973, train=0.3930, test=0.4188 + [FA] Epoch 80: loss=1.6902, train=0.3956, test=0.4204 + [FA] Epoch 90: loss=1.6888, train=0.3940, test=0.4194 + [FA] Epoch 100: loss=1.6833, train=0.4002, test=0.4191 + Final test acc: 0.4191 + +All results saved to results/fa_dfa_d512_L8_seed0/results_cifar10.json + L=8 seed=1 (Sun Apr 26 11:59:07 AM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 1 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0824, train=0.2277, test=0.2423 + [DFA] Epoch 10: loss=2.0254, train=0.2568, test=0.2660 + [DFA] Epoch 20: loss=2.0168, train=0.2619, test=0.2608 + [DFA] Epoch 30: loss=2.0087, train=0.2684, test=0.2952 + [DFA] Epoch 40: loss=2.0085, train=0.2700, test=0.2925 + [DFA] Epoch 50: loss=2.0048, train=0.2728, test=0.2958 + [DFA] Epoch 60: loss=2.0034, train=0.2745, test=0.2994 + [DFA] Epoch 70: loss=2.0001, train=0.2772, test=0.2911 + [DFA] Epoch 80: loss=2.0000, train=0.2778, test=0.2978 + [DFA] Epoch 90: loss=1.9999, train=0.2775, test=0.2999 + [DFA] Epoch 100: loss=1.9988, train=0.2788, test=0.2958 + Final test acc: 0.2958 + +--- FA --- + [FA] Epoch 1: loss=2.0216, train=0.2573, test=0.3016 + [FA] Epoch 10: loss=1.8318, train=0.3420, test=0.3786 + [FA] Epoch 20: loss=1.7819, train=0.3618, test=0.3769 + [FA] Epoch 30: loss=1.7449, train=0.3765, test=0.4017 + [FA] Epoch 40: loss=1.7395, train=0.3785, test=0.4020 + [FA] Epoch 50: loss=1.7304, train=0.3799, test=0.4057 + [FA] Epoch 60: loss=1.7268, train=0.3817, test=0.4132 + [FA] Epoch 70: loss=1.7219, train=0.3845, test=0.4144 + [FA] Epoch 80: loss=1.7163, train=0.3888, test=0.4084 + [FA] Epoch 90: loss=1.7173, train=0.3860, test=0.4123 + [FA] Epoch 100: loss=1.7119, train=0.3907, test=0.4123 + Final test acc: 0.4123 + +All results saved to results/fa_dfa_d512_L8_seed1/results_cifar10.json + L=8 seed=2 (Sun Apr 26 12:17:53 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 2 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0644, train=0.2387, test=0.2603 + [DFA] Epoch 10: loss=2.0294, train=0.2538, test=0.2880 + [DFA] Epoch 20: loss=2.0222, train=0.2605, test=0.2880 + [DFA] Epoch 30: loss=2.0184, train=0.2638, test=0.2846 + [DFA] Epoch 40: loss=2.0148, train=0.2668, test=0.2988 + [DFA] Epoch 50: loss=2.0132, train=0.2699, test=0.2841 + [DFA] Epoch 60: loss=2.0110, train=0.2689, test=0.3031 + [DFA] Epoch 70: loss=2.0113, train=0.2706, test=0.2926 + [DFA] Epoch 80: loss=2.0091, train=0.2741, test=0.2949 + [DFA] Epoch 90: loss=2.0082, train=0.2725, test=0.2975 + [DFA] Epoch 100: loss=2.0093, train=0.2748, test=0.2966 + Final test acc: 0.2966 + +--- FA --- + [FA] Epoch 1: loss=2.0312, train=0.2537, test=0.2876 + [FA] Epoch 10: loss=1.8375, train=0.3379, test=0.3697 + [FA] Epoch 20: loss=1.7817, train=0.3609, test=0.3774 + [FA] Epoch 30: loss=1.7570, train=0.3717, test=0.3951 + [FA] Epoch 40: loss=1.7423, train=0.3774, test=0.4004 + [FA] Epoch 50: loss=1.7287, train=0.3809, test=0.4028 + [FA] Epoch 60: loss=1.7158, train=0.3882, test=0.4084 + [FA] Epoch 70: loss=1.7110, train=0.3907, test=0.4107 + [FA] Epoch 80: loss=1.7002, train=0.3932, test=0.4125 + [FA] Epoch 90: loss=1.7015, train=0.3927, test=0.4146 + [FA] Epoch 100: loss=1.6987, train=0.3936, test=0.4120 + Final test acc: 0.4120 + +All results saved to results/fa_dfa_d512_L8_seed2/results_cifar10.json + L=8 seed=3 (Sun Apr 26 12:35:38 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 3 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0677, train=0.2326, test=0.2578 + [DFA] Epoch 10: loss=2.0196, train=0.2591, test=0.2638 + [DFA] Epoch 20: loss=2.0081, train=0.2646, test=0.2804 + [DFA] Epoch 30: loss=2.0014, train=0.2724, test=0.2952 + [DFA] Epoch 40: loss=1.9997, train=0.2738, test=0.2932 + [DFA] Epoch 50: loss=1.9985, train=0.2748, test=0.2846 + [DFA] Epoch 60: loss=1.9980, train=0.2771, test=0.2920 + [DFA] Epoch 70: loss=1.9972, train=0.2768, test=0.2881 + [DFA] Epoch 80: loss=1.9974, train=0.2761, test=0.2973 + [DFA] Epoch 90: loss=1.9947, train=0.2787, test=0.2944 + [DFA] Epoch 100: loss=1.9938, train=0.2781, test=0.2967 + Final test acc: 0.2967 + +--- FA --- + [FA] Epoch 1: loss=2.0319, train=0.2529, test=0.3107 + [FA] Epoch 10: loss=1.8432, train=0.3372, test=0.3697 + [FA] Epoch 20: loss=1.7929, train=0.3574, test=0.3836 + [FA] Epoch 30: loss=1.7488, train=0.3731, test=0.4040 + [FA] Epoch 40: loss=1.7228, train=0.3815, test=0.4100 + [FA] Epoch 50: loss=1.7003, train=0.3931, test=0.4150 + [FA] Epoch 60: loss=1.6882, train=0.3974, test=0.4169 + [FA] Epoch 70: loss=1.6802, train=0.3990, test=0.4237 + [FA] Epoch 80: loss=1.6684, train=0.4039, test=0.4219 + [FA] Epoch 90: loss=1.6652, train=0.4063, test=0.4260 + [FA] Epoch 100: loss=1.6635, train=0.4050, test=0.4251 + Final test acc: 0.4251 + +All results saved to results/fa_dfa_d512_L8_seed3/results_cifar10.json + L=8 seed=4 (Sun Apr 26 12:53:26 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 4 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0559, train=0.2432, test=0.2550 + [DFA] Epoch 10: loss=2.0292, train=0.2497, test=0.2611 + [DFA] Epoch 20: loss=2.0249, train=0.2563, test=0.2550 + [DFA] Epoch 30: loss=2.0178, train=0.2609, test=0.2765 + [DFA] Epoch 40: loss=2.0140, train=0.2601, test=0.2829 + [DFA] Epoch 50: loss=2.0119, train=0.2643, test=0.2796 + [DFA] Epoch 60: loss=2.0100, train=0.2676, test=0.2797 + [DFA] Epoch 70: loss=2.0083, train=0.2681, test=0.2820 + [DFA] Epoch 80: loss=2.0068, train=0.2686, test=0.2882 + [DFA] Epoch 90: loss=2.0060, train=0.2688, test=0.2853 + [DFA] Epoch 100: loss=2.0040, train=0.2703, test=0.2861 + Final test acc: 0.2861 + +--- FA --- + [FA] Epoch 1: loss=2.0499, train=0.2421, test=0.2980 + [FA] Epoch 10: loss=1.8468, train=0.3371, test=0.3615 + [FA] Epoch 20: loss=1.7747, train=0.3605, test=0.3749 + [FA] Epoch 30: loss=1.7448, train=0.3753, test=0.3958 + [FA] Epoch 40: loss=1.7325, train=0.3785, test=0.4076 + [FA] Epoch 50: loss=1.7202, train=0.3839, test=0.4118 + [FA] Epoch 60: loss=1.7132, train=0.3875, test=0.4104 + [FA] Epoch 70: loss=1.7066, train=0.3921, test=0.4088 + [FA] Epoch 80: loss=1.6998, train=0.3929, test=0.4152 + [FA] Epoch 90: loss=1.6938, train=0.3929, test=0.4127 + [FA] Epoch 100: loss=1.6935, train=0.3962, test=0.4143 + Final test acc: 0.4143 + +All results saved to results/fa_dfa_d512_L8_seed4/results_cifar10.json + L=8 seed=5 (Sun Apr 26 01:11:06 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 5 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0787, train=0.2307, test=0.2557 + [DFA] Epoch 10: loss=2.0261, train=0.2540, test=0.2646 + [DFA] Epoch 20: loss=2.0107, train=0.2651, test=0.2900 + [DFA] Epoch 30: loss=2.0057, train=0.2666, test=0.2929 + [DFA] Epoch 40: loss=2.0034, train=0.2703, test=0.2944 + [DFA] Epoch 50: loss=2.0026, train=0.2728, test=0.2811 + [DFA] Epoch 60: loss=2.0009, train=0.2756, test=0.2901 + [DFA] Epoch 70: loss=1.9981, train=0.2758, test=0.2947 + [DFA] Epoch 80: loss=1.9976, train=0.2775, test=0.2940 + [DFA] Epoch 90: loss=1.9956, train=0.2759, test=0.2940 + [DFA] Epoch 100: loss=1.9953, train=0.2778, test=0.2938 + Final test acc: 0.2938 + +--- FA --- + [FA] Epoch 1: loss=2.0382, train=0.2496, test=0.3045 + [FA] Epoch 10: loss=1.8518, train=0.3334, test=0.3668 + [FA] Epoch 20: loss=1.8099, train=0.3510, test=0.3839 + [FA] Epoch 30: loss=1.7989, train=0.3517, test=0.3876 + [FA] Epoch 40: loss=1.7806, train=0.3635, test=0.3979 + [FA] Epoch 50: loss=1.7765, train=0.3634, test=0.3922 + [FA] Epoch 60: loss=1.7637, train=0.3703, test=0.4000 + [FA] Epoch 70: loss=1.7528, train=0.3747, test=0.4000 + [FA] Epoch 80: loss=1.7456, train=0.3787, test=0.4028 + [FA] Epoch 90: loss=1.7389, train=0.3791, test=0.4051 + [FA] Epoch 100: loss=1.7390, train=0.3801, test=0.4025 + Final test acc: 0.4025 + +All results saved to results/fa_dfa_d512_L8_seed5/results_cifar10.json + L=8 seed=6 (Sun Apr 26 01:28:32 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 6 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0488, train=0.2474, test=0.2851 + [DFA] Epoch 10: loss=2.0149, train=0.2607, test=0.2869 + [DFA] Epoch 20: loss=2.0076, train=0.2645, test=0.2908 + [DFA] Epoch 30: loss=2.0015, train=0.2714, test=0.3020 + [DFA] Epoch 40: loss=1.9977, train=0.2738, test=0.3020 + [DFA] Epoch 50: loss=1.9944, train=0.2761, test=0.2966 + [DFA] Epoch 60: loss=1.9945, train=0.2742, test=0.2961 + [DFA] Epoch 70: loss=1.9933, train=0.2770, test=0.2994 + [DFA] Epoch 80: loss=1.9909, train=0.2786, test=0.2939 + [DFA] Epoch 90: loss=1.9894, train=0.2790, test=0.2982 + [DFA] Epoch 100: loss=1.9911, train=0.2796, test=0.2960 + Final test acc: 0.2960 + +--- FA --- + [FA] Epoch 1: loss=2.0267, train=0.2552, test=0.3093 + [FA] Epoch 10: loss=1.8456, train=0.3364, test=0.3586 + [FA] Epoch 20: loss=1.7877, train=0.3586, test=0.3884 + [FA] Epoch 30: loss=1.7469, train=0.3726, test=0.4001 + [FA] Epoch 40: loss=1.7398, train=0.3766, test=0.3949 + [FA] Epoch 50: loss=1.7227, train=0.3817, test=0.3969 + [FA] Epoch 60: loss=1.7106, train=0.3860, test=0.4102 + [FA] Epoch 70: loss=1.7000, train=0.3936, test=0.4046 + [FA] Epoch 80: loss=1.6933, train=0.3922, test=0.4133 + [FA] Epoch 90: loss=1.6878, train=0.3969, test=0.4100 + [FA] Epoch 100: loss=1.6847, train=0.3987, test=0.4109 + Final test acc: 0.4109 + +All results saved to results/fa_dfa_d512_L8_seed6/results_cifar10.json + L=8 seed=7 (Sun Apr 26 01:46:09 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 7 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0667, train=0.2334, test=0.2395 + [DFA] Epoch 10: loss=2.0155, train=0.2563, test=0.2736 + [DFA] Epoch 20: loss=1.9987, train=0.2661, test=0.2881 + [DFA] Epoch 30: loss=1.9906, train=0.2696, test=0.3007 + [DFA] Epoch 40: loss=1.9870, train=0.2762, test=0.2973 + [DFA] Epoch 50: loss=1.9854, train=0.2763, test=0.3014 + [DFA] Epoch 60: loss=1.9830, train=0.2781, test=0.3044 + [DFA] Epoch 70: loss=1.9812, train=0.2818, test=0.2954 + [DFA] Epoch 80: loss=1.9772, train=0.2831, test=0.2935 + [DFA] Epoch 90: loss=1.9765, train=0.2830, test=0.3067 + [DFA] Epoch 100: loss=1.9773, train=0.2828, test=0.3055 + Final test acc: 0.3055 + +--- FA --- + [FA] Epoch 1: loss=2.0300, train=0.2506, test=0.2982 + [FA] Epoch 10: loss=1.8507, train=0.3370, test=0.3721 + [FA] Epoch 20: loss=1.8040, train=0.3518, test=0.3871 + [FA] Epoch 30: loss=1.7669, train=0.3650, test=0.3946 + [FA] Epoch 40: loss=1.7425, train=0.3760, test=0.4054 + [FA] Epoch 50: loss=1.7255, train=0.3821, test=0.4021 + [FA] Epoch 60: loss=1.7092, train=0.3899, test=0.4059 + [FA] Epoch 70: loss=1.7013, train=0.3949, test=0.4107 + [FA] Epoch 80: loss=1.6932, train=0.3963, test=0.4197 + [FA] Epoch 90: loss=1.6906, train=0.3980, test=0.4200 + [FA] Epoch 100: loss=1.6880, train=0.3960, test=0.4200 + Final test acc: 0.4200 + +All results saved to results/fa_dfa_d512_L8_seed7/results_cifar10.json + L=8 seed=8 (Sun Apr 26 02:03:33 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 8 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0683, train=0.2363, test=0.2602 + [DFA] Epoch 10: loss=2.0129, train=0.2585, test=0.2885 + [DFA] Epoch 20: loss=2.0016, train=0.2636, test=0.2819 + [DFA] Epoch 30: loss=1.9983, train=0.2685, test=0.2764 + [DFA] Epoch 40: loss=1.9929, train=0.2713, test=0.2871 + [DFA] Epoch 50: loss=1.9924, train=0.2726, test=0.2923 + [DFA] Epoch 60: loss=1.9907, train=0.2727, test=0.2905 + [DFA] Epoch 70: loss=1.9884, train=0.2755, test=0.2822 + [DFA] Epoch 80: loss=1.9884, train=0.2747, test=0.2945 + [DFA] Epoch 90: loss=1.9868, train=0.2770, test=0.2929 + [DFA] Epoch 100: loss=1.9849, train=0.2757, test=0.2943 + Final test acc: 0.2943 + +--- FA --- + [FA] Epoch 1: loss=2.0412, train=0.2497, test=0.3050 + [FA] Epoch 10: loss=1.8491, train=0.3389, test=0.3644 + [FA] Epoch 20: loss=1.8135, train=0.3491, test=0.3701 + [FA] Epoch 30: loss=1.7963, train=0.3579, test=0.3830 + [FA] Epoch 40: loss=1.7769, train=0.3649, test=0.3879 + [FA] Epoch 50: loss=1.7618, train=0.3683, test=0.3914 + [FA] Epoch 60: loss=1.7529, train=0.3718, test=0.4003 + [FA] Epoch 70: loss=1.7454, train=0.3789, test=0.4012 + [FA] Epoch 80: loss=1.7402, train=0.3802, test=0.4025 + [FA] Epoch 90: loss=1.7360, train=0.3820, test=0.4004 + [FA] Epoch 100: loss=1.7297, train=0.3853, test=0.4026 + Final test acc: 0.4026 + +All results saved to results/fa_dfa_d512_L8_seed8/results_cifar10.json + L=8 seed=9 (Sun Apr 26 02:21:11 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 9 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0749, train=0.2330, test=0.2539 + [DFA] Epoch 10: loss=2.0183, train=0.2586, test=0.2576 + [DFA] Epoch 20: loss=2.0107, train=0.2614, test=0.2834 + [DFA] Epoch 30: loss=2.0014, train=0.2669, test=0.2849 + [DFA] Epoch 40: loss=1.9982, train=0.2717, test=0.2993 + [DFA] Epoch 50: loss=1.9968, train=0.2730, test=0.2959 + [DFA] Epoch 60: loss=1.9945, train=0.2756, test=0.3016 + [DFA] Epoch 70: loss=1.9922, train=0.2742, test=0.2938 + [DFA] Epoch 80: loss=1.9907, train=0.2774, test=0.2988 + [DFA] Epoch 90: loss=1.9877, train=0.2779, test=0.2969 + [DFA] Epoch 100: loss=1.9897, train=0.2781, test=0.2977 + Final test acc: 0.2977 + +--- FA --- + [FA] Epoch 1: loss=2.0547, train=0.2347, test=0.2763 + [FA] Epoch 10: loss=1.8719, train=0.3216, test=0.3324 + [FA] Epoch 20: loss=1.8399, train=0.3385, test=0.3637 + [FA] Epoch 30: loss=1.8047, train=0.3538, test=0.3782 + [FA] Epoch 40: loss=1.7922, train=0.3605, test=0.3830 + [FA] Epoch 50: loss=1.7799, train=0.3645, test=0.3859 + [FA] Epoch 60: loss=1.7698, train=0.3668, test=0.3950 + [FA] Epoch 70: loss=1.7573, train=0.3723, test=0.3963 + [FA] Epoch 80: loss=1.7546, train=0.3759, test=0.3950 + [FA] Epoch 90: loss=1.7476, train=0.3774, test=0.3995 + [FA] Epoch 100: loss=1.7496, train=0.3771, test=0.3992 + Final test acc: 0.3992 + +All results saved to results/fa_dfa_d512_L8_seed9/results_cifar10.json + +--- L=12, seeds 0-9 --- + L=12 seed=0 (Sun Apr 26 02:38:56 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 0 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0728, train=0.2332, test=0.2507 + [DFA] Epoch 10: loss=2.0139, train=0.2623, test=0.2941 + [DFA] Epoch 20: loss=2.0039, train=0.2680, test=0.2924 + [DFA] Epoch 30: loss=1.9980, train=0.2730, test=0.2981 + [DFA] Epoch 40: loss=1.9953, train=0.2747, test=0.2960 + [DFA] Epoch 50: loss=1.9903, train=0.2772, test=0.3028 + [DFA] Epoch 60: loss=1.9883, train=0.2762, test=0.3004 + [DFA] Epoch 70: loss=1.9859, train=0.2802, test=0.3035 + [DFA] Epoch 80: loss=1.9843, train=0.2801, test=0.3071 + [DFA] Epoch 90: loss=1.9821, train=0.2834, test=0.3080 + [DFA] Epoch 100: loss=1.9833, train=0.2835, test=0.3086 + Final test acc: 0.3086 + +--- FA --- + [FA] Epoch 1: loss=2.0294, train=0.2526, test=0.2924 + [FA] Epoch 10: loss=1.8579, train=0.3310, test=0.3606 + [FA] Epoch 20: loss=1.8031, train=0.3533, test=0.3745 + [FA] Epoch 30: loss=1.7613, train=0.3668, test=0.3978 + [FA] Epoch 40: loss=1.7239, train=0.3809, test=0.4064 + [FA] Epoch 50: loss=1.7011, train=0.3911, test=0.4125 + [FA] Epoch 60: loss=1.6889, train=0.3943, test=0.4140 + [FA] Epoch 70: loss=1.6731, train=0.4016, test=0.4220 + [FA] Epoch 80: loss=1.6635, train=0.4057, test=0.4215 + [FA] Epoch 90: loss=1.6579, train=0.4072, test=0.4260 + [FA] Epoch 100: loss=1.6615, train=0.4068, test=0.4239 + Final test acc: 0.4239 + +All results saved to results/fa_dfa_d512_L12_seed0/results_cifar10.json + L=12 seed=1 (Sun Apr 26 03:01:25 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 1 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0878, train=0.2247, test=0.2444 + [DFA] Epoch 10: loss=2.0278, train=0.2491, test=0.2609 + [DFA] Epoch 20: loss=2.0169, train=0.2600, test=0.2676 + [DFA] Epoch 30: loss=2.0113, train=0.2670, test=0.2971 + [DFA] Epoch 40: loss=2.0088, train=0.2675, test=0.2833 + [DFA] Epoch 50: loss=2.0063, train=0.2727, test=0.2874 + [DFA] Epoch 60: loss=2.0052, train=0.2728, test=0.2901 + [DFA] Epoch 70: loss=2.0068, train=0.2697, test=0.3010 + [DFA] Epoch 80: loss=2.0047, train=0.2723, test=0.2944 + [DFA] Epoch 90: loss=2.0015, train=0.2755, test=0.2930 + [DFA] Epoch 100: loss=2.0039, train=0.2744, test=0.2932 + Final test acc: 0.2932 + +--- FA --- + [FA] Epoch 1: loss=2.0398, train=0.2476, test=0.2816 + [FA] Epoch 10: loss=1.8783, train=0.3196, test=0.3372 + [FA] Epoch 20: loss=1.8384, train=0.3395, test=0.3542 + [FA] Epoch 30: loss=1.7912, train=0.3583, test=0.3790 + [FA] Epoch 40: loss=1.7586, train=0.3700, test=0.3879 + [FA] Epoch 50: loss=1.7364, train=0.3772, test=0.3986 + [FA] Epoch 60: loss=1.7279, train=0.3819, test=0.4016 + [FA] Epoch 70: loss=1.7195, train=0.3841, test=0.4041 + [FA] Epoch 80: loss=1.7064, train=0.3904, test=0.4059 + [FA] Epoch 90: loss=1.7049, train=0.3901, test=0.4052 + [FA] Epoch 100: loss=1.7029, train=0.3911, test=0.4067 + Final test acc: 0.4067 + +All results saved to results/fa_dfa_d512_L12_seed1/results_cifar10.json + L=12 seed=2 (Sun Apr 26 03:23:30 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 2 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0675, train=0.2390, test=0.2486 + [DFA] Epoch 10: loss=2.0351, train=0.2548, test=0.2903 + [DFA] Epoch 20: loss=2.0279, train=0.2578, test=0.2742 + [DFA] Epoch 30: loss=2.0245, train=0.2578, test=0.2912 + [DFA] Epoch 40: loss=2.0192, train=0.2651, test=0.2862 + [DFA] Epoch 50: loss=2.0191, train=0.2628, test=0.3027 + [DFA] Epoch 60: loss=2.0165, train=0.2668, test=0.2878 + [DFA] Epoch 70: loss=2.0158, train=0.2669, test=0.2917 + [DFA] Epoch 80: loss=2.0166, train=0.2666, test=0.2954 + [DFA] Epoch 90: loss=2.0130, train=0.2668, test=0.2920 + [DFA] Epoch 100: loss=2.0154, train=0.2701, test=0.2933 + Final test acc: 0.2933 + +--- FA --- + [FA] Epoch 1: loss=2.0564, train=0.2412, test=0.2906 + [FA] Epoch 10: loss=1.8592, train=0.3337, test=0.3441 + [FA] Epoch 20: loss=1.8280, train=0.3438, test=0.3753 + [FA] Epoch 30: loss=1.7987, train=0.3555, test=0.3820 + [FA] Epoch 40: loss=1.7781, train=0.3631, test=0.3904 + [FA] Epoch 50: loss=1.7620, train=0.3721, test=0.3962 + [FA] Epoch 60: loss=1.7464, train=0.3761, test=0.3949 + [FA] Epoch 70: loss=1.7377, train=0.3800, test=0.3976 + [FA] Epoch 80: loss=1.7297, train=0.3856, test=0.4018 + [FA] Epoch 90: loss=1.7231, train=0.3884, test=0.4026 + [FA] Epoch 100: loss=1.7269, train=0.3860, test=0.4025 + Final test acc: 0.4025 + +All results saved to results/fa_dfa_d512_L12_seed2/results_cifar10.json + L=12 seed=3 (Sun Apr 26 03:45:24 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 3 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0759, train=0.2279, test=0.2245 + [DFA] Epoch 10: loss=2.0204, train=0.2579, test=0.2911 + [DFA] Epoch 20: loss=2.0140, train=0.2648, test=0.2796 + [DFA] Epoch 30: loss=2.0068, train=0.2669, test=0.2936 + [DFA] Epoch 40: loss=2.0032, train=0.2733, test=0.3002 + [DFA] Epoch 50: loss=1.9991, train=0.2762, test=0.2838 + [DFA] Epoch 60: loss=1.9988, train=0.2749, test=0.2917 + [DFA] Epoch 70: loss=1.9974, train=0.2762, test=0.2949 + [DFA] Epoch 80: loss=1.9956, train=0.2778, test=0.2953 + [DFA] Epoch 90: loss=1.9954, train=0.2779, test=0.2958 + [DFA] Epoch 100: loss=1.9942, train=0.2803, test=0.2970 + Final test acc: 0.2970 + +--- FA --- + [FA] Epoch 1: loss=2.0397, train=0.2449, test=0.2636 + [FA] Epoch 10: loss=1.8607, train=0.3291, test=0.3598 + [FA] Epoch 20: loss=1.8178, train=0.3486, test=0.3644 + [FA] Epoch 30: loss=1.7954, train=0.3548, test=0.3829 + [FA] Epoch 40: loss=1.7790, train=0.3633, test=0.3896 + [FA] Epoch 50: loss=1.7589, train=0.3718, test=0.3956 + [FA] Epoch 60: loss=1.7487, train=0.3748, test=0.4010 + [FA] Epoch 70: loss=1.7414, train=0.3780, test=0.4059 + [FA] Epoch 80: loss=1.7351, train=0.3810, test=0.4074 + [FA] Epoch 90: loss=1.7321, train=0.3820, test=0.4087 + [FA] Epoch 100: loss=1.7255, train=0.3854, test=0.4088 + Final test acc: 0.4088 + +All results saved to results/fa_dfa_d512_L12_seed3/results_cifar10.json + L=12 seed=4 (Sun Apr 26 04:07:27 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 4 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0759, train=0.2298, test=0.2600 + [DFA] Epoch 10: loss=2.0279, train=0.2509, test=0.2747 + [DFA] Epoch 20: loss=2.0182, train=0.2590, test=0.2708 + [DFA] Epoch 30: loss=2.0105, train=0.2640, test=0.2875 + [DFA] Epoch 40: loss=2.0070, train=0.2650, test=0.2936 + [DFA] Epoch 50: loss=2.0055, train=0.2682, test=0.2845 + [DFA] Epoch 60: loss=2.0037, train=0.2692, test=0.2887 + [DFA] Epoch 70: loss=1.9991, train=0.2715, test=0.2898 + [DFA] Epoch 80: loss=1.9990, train=0.2729, test=0.2896 + [DFA] Epoch 90: loss=1.9996, train=0.2717, test=0.2834 + [DFA] Epoch 100: loss=1.9997, train=0.2726, test=0.2878 + Final test acc: 0.2878 + +--- FA --- + [FA] Epoch 1: loss=2.0479, train=0.2395, test=0.2937 + [FA] Epoch 10: loss=1.8582, train=0.3302, test=0.3564 + [FA] Epoch 20: loss=1.7941, train=0.3549, test=0.3788 + [FA] Epoch 30: loss=1.7729, train=0.3650, test=0.3920 + [FA] Epoch 40: loss=1.7521, train=0.3713, test=0.3971 + [FA] Epoch 50: loss=1.7363, train=0.3786, test=0.4115 + [FA] Epoch 60: loss=1.7227, train=0.3825, test=0.4055 + [FA] Epoch 70: loss=1.7223, train=0.3859, test=0.4100 + [FA] Epoch 80: loss=1.7159, train=0.3864, test=0.4126 + [FA] Epoch 90: loss=1.7119, train=0.3879, test=0.4082 + [FA] Epoch 100: loss=1.7080, train=0.3921, test=0.4108 + Final test acc: 0.4108 + +All results saved to results/fa_dfa_d512_L12_seed4/results_cifar10.json + L=12 seed=5 (Sun Apr 26 04:29:29 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 5 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0685, train=0.2380, test=0.2445 + [DFA] Epoch 10: loss=2.0152, train=0.2646, test=0.2909 + [DFA] Epoch 20: loss=2.0023, train=0.2669, test=0.2992 + [DFA] Epoch 30: loss=1.9997, train=0.2714, test=0.3025 + [DFA] Epoch 40: loss=1.9960, train=0.2753, test=0.2802 + [DFA] Epoch 50: loss=1.9937, train=0.2769, test=0.3031 + [DFA] Epoch 60: loss=1.9927, train=0.2804, test=0.2956 + [DFA] Epoch 70: loss=1.9892, train=0.2814, test=0.3068 + [DFA] Epoch 80: loss=1.9892, train=0.2804, test=0.3036 + [DFA] Epoch 90: loss=1.9884, train=0.2794, test=0.3009 + [DFA] Epoch 100: loss=1.9884, train=0.2791, test=0.3018 + Final test acc: 0.3018 + +--- FA --- + [FA] Epoch 1: loss=2.0708, train=0.2292, test=0.2587 + [FA] Epoch 10: loss=1.8931, train=0.3117, test=0.3454 + [FA] Epoch 20: loss=1.8683, train=0.3264, test=0.3644 + [FA] Epoch 30: loss=1.8452, train=0.3390, test=0.3686 + [FA] Epoch 40: loss=1.8322, train=0.3485, test=0.3781 + [FA] Epoch 50: loss=1.8143, train=0.3550, test=0.3893 + [FA] Epoch 60: loss=1.7966, train=0.3639, test=0.3904 + [FA] Epoch 70: loss=1.7844, train=0.3687, test=0.3933 + [FA] Epoch 80: loss=1.7761, train=0.3709, test=0.4026 + [FA] Epoch 90: loss=1.7732, train=0.3684, test=0.4049 + [FA] Epoch 100: loss=1.7754, train=0.3729, test=0.4040 + Final test acc: 0.4040 + +All results saved to results/fa_dfa_d512_L12_seed5/results_cifar10.json + L=12 seed=6 (Sun Apr 26 04:51:18 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 6 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0822, train=0.2309, test=0.2459 + [DFA] Epoch 10: loss=2.0275, train=0.2537, test=0.2714 + [DFA] Epoch 20: loss=2.0172, train=0.2625, test=0.2808 + [DFA] Epoch 30: loss=2.0116, train=0.2650, test=0.2992 + [DFA] Epoch 40: loss=2.0076, train=0.2679, test=0.2906 + [DFA] Epoch 50: loss=2.0060, train=0.2704, test=0.2939 + [DFA] Epoch 60: loss=2.0017, train=0.2720, test=0.2816 + [DFA] Epoch 70: loss=2.0022, train=0.2703, test=0.2892 + [DFA] Epoch 80: loss=2.0001, train=0.2731, test=0.2902 + [DFA] Epoch 90: loss=1.9980, train=0.2719, test=0.2896 + [DFA] Epoch 100: loss=2.0006, train=0.2720, test=0.2896 + Final test acc: 0.2896 + +--- FA --- + [FA] Epoch 1: loss=2.0523, train=0.2384, test=0.2743 + [FA] Epoch 10: loss=1.8689, train=0.3242, test=0.3518 + [FA] Epoch 20: loss=1.8466, train=0.3401, test=0.3779 + [FA] Epoch 30: loss=1.8186, train=0.3509, test=0.3752 + [FA] Epoch 40: loss=1.7917, train=0.3605, test=0.3924 + [FA] Epoch 50: loss=1.7723, train=0.3687, test=0.3963 + [FA] Epoch 60: loss=1.7517, train=0.3748, test=0.3974 + [FA] Epoch 70: loss=1.7404, train=0.3806, test=0.4095 + [FA] Epoch 80: loss=1.7335, train=0.3829, test=0.4065 + [FA] Epoch 90: loss=1.7319, train=0.3838, test=0.4086 + [FA] Epoch 100: loss=1.7297, train=0.3847, test=0.4076 + Final test acc: 0.4076 + +All results saved to results/fa_dfa_d512_L12_seed6/results_cifar10.json + L=12 seed=7 (Sun Apr 26 05:13:31 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 7 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0718, train=0.2398, test=0.2673 + [DFA] Epoch 10: loss=2.0065, train=0.2642, test=0.2629 + [DFA] Epoch 20: loss=1.9931, train=0.2714, test=0.2990 + [DFA] Epoch 30: loss=1.9825, train=0.2769, test=0.2977 + [DFA] Epoch 40: loss=1.9781, train=0.2807, test=0.3066 + [DFA] Epoch 50: loss=1.9756, train=0.2815, test=0.3029 + [DFA] Epoch 60: loss=1.9724, train=0.2822, test=0.3115 + [DFA] Epoch 70: loss=1.9685, train=0.2868, test=0.3067 + [DFA] Epoch 80: loss=1.9683, train=0.2867, test=0.3055 + [DFA] Epoch 90: loss=1.9683, train=0.2883, test=0.3089 + [DFA] Epoch 100: loss=1.9669, train=0.2875, test=0.3108 + Final test acc: 0.3108 + +--- FA --- + [FA] Epoch 1: loss=2.0308, train=0.2547, test=0.3120 + [FA] Epoch 10: loss=1.8409, train=0.3401, test=0.3443 + [FA] Epoch 20: loss=1.8222, train=0.3459, test=0.3623 + [FA] Epoch 30: loss=1.8168, train=0.3476, test=0.3545 + [FA] Epoch 40: loss=1.7845, train=0.3584, test=0.3813 + [FA] Epoch 50: loss=1.7634, train=0.3685, test=0.3910 + [FA] Epoch 60: loss=1.7523, train=0.3735, test=0.3971 + [FA] Epoch 70: loss=1.7398, train=0.3776, test=0.4015 + [FA] Epoch 80: loss=1.7339, train=0.3800, test=0.4033 + [FA] Epoch 90: loss=1.7289, train=0.3836, test=0.4055 + [FA] Epoch 100: loss=1.7276, train=0.3838, test=0.4062 + Final test acc: 0.4062 + +All results saved to results/fa_dfa_d512_L12_seed7/results_cifar10.json + L=12 seed=8 (Sun Apr 26 05:35:42 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 8 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0622, train=0.2372, test=0.2412 + [DFA] Epoch 10: loss=2.0108, train=0.2579, test=0.2859 + [DFA] Epoch 20: loss=2.0011, train=0.2675, test=0.2666 + [DFA] Epoch 30: loss=1.9932, train=0.2711, test=0.2923 + [DFA] Epoch 40: loss=1.9927, train=0.2730, test=0.2980 + [DFA] Epoch 50: loss=1.9886, train=0.2743, test=0.2935 + [DFA] Epoch 60: loss=1.9865, train=0.2771, test=0.2991 + [DFA] Epoch 70: loss=1.9855, train=0.2761, test=0.2946 + [DFA] Epoch 80: loss=1.9845, train=0.2775, test=0.2992 + [DFA] Epoch 90: loss=1.9831, train=0.2794, test=0.2946 + [DFA] Epoch 100: loss=1.9856, train=0.2764, test=0.2946 + Final test acc: 0.2946 + +--- FA --- + [FA] Epoch 1: loss=2.0407, train=0.2475, test=0.2791 + [FA] Epoch 10: loss=1.8617, train=0.3286, test=0.3655 + [FA] Epoch 20: loss=1.8300, train=0.3445, test=0.3803 + [FA] Epoch 30: loss=1.7865, train=0.3626, test=0.3942 + [FA] Epoch 40: loss=1.7690, train=0.3698, test=0.3907 + [FA] Epoch 50: loss=1.7526, train=0.3796, test=0.4045 + [FA] Epoch 60: loss=1.7478, train=0.3781, test=0.4042 + [FA] Epoch 70: loss=1.7436, train=0.3751, test=0.4063 + [FA] Epoch 80: loss=1.7419, train=0.3793, test=0.4095 + [FA] Epoch 90: loss=1.7385, train=0.3805, test=0.4117 + [FA] Epoch 100: loss=1.7350, train=0.3843, test=0.4122 + Final test acc: 0.4122 + +All results saved to results/fa_dfa_d512_L12_seed8/results_cifar10.json + L=12 seed=9 (Sun Apr 26 05:57:53 PM CDT 2026) +Using device: cuda:0 + +============================================================ +Seed 9 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0865, train=0.2293, test=0.2701 + [DFA] Epoch 10: loss=2.0162, train=0.2616, test=0.2901 + [DFA] Epoch 20: loss=2.0014, train=0.2697, test=0.3049 + [DFA] Epoch 30: loss=1.9969, train=0.2713, test=0.3018 + [DFA] Epoch 40: loss=1.9921, train=0.2745, test=0.3004 + [DFA] Epoch 50: loss=1.9895, train=0.2789, test=0.2976 + [DFA] Epoch 60: loss=1.9873, train=0.2771, test=0.2891 + [DFA] Epoch 70: loss=1.9857, train=0.2802, test=0.3008 + [DFA] Epoch 80: loss=1.9837, train=0.2816, test=0.3024 + [DFA] Epoch 90: loss=1.9836, train=0.2842, test=0.3063 + [DFA] Epoch 100: loss=1.9829, train=0.2846, test=0.3043 + Final test acc: 0.3043 + +--- FA --- + [FA] Epoch 1: loss=2.0459, train=0.2430, test=0.2729 + [FA] Epoch 10: loss=1.8585, train=0.3313, test=0.3661 + [FA] Epoch 20: loss=1.8133, train=0.3467, test=0.3773 + [FA] Epoch 30: loss=1.7948, train=0.3585, test=0.3820 + [FA] Epoch 40: loss=1.7644, train=0.3673, test=0.3939 + [FA] Epoch 50: loss=1.7323, train=0.3796, test=0.4043 + [FA] Epoch 60: loss=1.7190, train=0.3844, test=0.3986 + [FA] Epoch 70: loss=1.7100, train=0.3879, test=0.4096 + [FA] Epoch 80: loss=1.7034, train=0.3903, test=0.4076 + [FA] Epoch 90: loss=1.6981, train=0.3927, test=0.4125 + [FA] Epoch 100: loss=1.6980, train=0.3923, test=0.4115 + Final test acc: 0.4115 + +All results saved to results/fa_dfa_d512_L12_seed9/results_cifar10.json + +=== DEEPER L SCAN DONE (Sun Apr 26 06:20:00 PM CDT 2026) === diff --git a/results/dfa_canonical_freshB.log b/results/dfa_canonical_freshB.log new file mode 100644 index 0000000..3e9551e --- /dev/null +++ b/results/dfa_canonical_freshB.log @@ -0,0 +1,13 @@ +Training DFA canonical λ=0.01, seed=42 + [DFA pen] ep 10 + [DFA pen] ep 20 + [DFA pen] ep 30 +Saved checkpoint: results/dfa_canonical_freshB/dfa_canonical_lam0.01_s42.pt +Training-Bs: acc=0.3672, deep cos=+0.1660 + per-layer cos: ['+0.3259', '+0.1658', '+0.1618', '+0.1703'] + ||g_l||: ['1.34e-05', '1.32e-05', '1.31e-05', '1.31e-05', '1.32e-05'] + ||h_l||: ['1.21e+04', '1.21e+04', '1.21e+04', '1.22e+04', '1.21e+04'] + +Fresh-B null calibration (20 draws)... +Fresh-Bs deep cos: -0.0048 ± 0.0182 (ddof=1) +Saved: results/dfa_canonical_freshB/freshB_null_canonical_s42.json diff --git a/results/dfa_canonical_freshB/freshB_null_canonical_s42.json b/results/dfa_canonical_freshB/freshB_null_canonical_s42.json new file mode 100644 index 0000000..8f20467 --- /dev/null +++ b/results/dfa_canonical_freshB/freshB_null_canonical_s42.json @@ -0,0 +1,56 @@ +{ + "description": "Canonical DFA \u03bb=0.01 s=42 + fresh-B null (N=20)", + "training_Bs_deep_cos": 0.1659978379805883, + "training_Bs_per_layer_cos": [ + 0.3258553445339203, + 0.1658061444759369, + 0.1618424952030182, + 0.17034487426280975 + ], + "training_Bs_acc": 0.3671875, + "training_Bs_g_norms": [ + 1.335966408078093e-05, + 1.3213058991823345e-05, + 1.31442438942031e-05, + 1.3120022231305484e-05, + 1.3151197890692856e-05 + ], + "training_Bs_h_norms": [ + 12069.3095703125, + 12144.8427734375, + 12143.939453125, + 12156.6904296875, + 12147.8271484375 + ], + "fresh_Bs_n_draws": 20, + "fresh_Bs_deep_cos_per_draw": [ + -0.009986335256447395, + -0.025985106825828552, + -0.0050429514376446605, + 0.01727348566055298, + 0.006780429219361395, + -0.0012651278326908748, + 0.016534411969284218, + -0.028123627106348675, + 0.0018596930118898551, + 0.011628065335874757, + -0.00797742527599136, + -0.013325384507576624, + -0.00039871477444345754, + -0.0407400643453002, + -0.028840728104114532, + 0.009858534671366215, + -0.02509508344034354, + 0.008517433578769365, + 0.02818053464094798, + -0.010525024806459745 + ], + "fresh_Bs_deep_mean": -0.004833649281257142, + "fresh_Bs_deep_std_ddof1": 0.01823727849606041, + "fresh_Bs_per_layer_mean": [ + 0.0092626029625535, + -0.004385327867930755, + -0.0051876686746254565, + -0.004927951301215217 + ] +} \ No newline at end of file diff --git a/results/dfa_canonical_lam1e-2_30ep/results_cifar10.json b/results/dfa_canonical_lam1e-2_30ep/results_cifar10.json new file mode 100644 index 0000000..01a7a9f --- /dev/null +++ b/results/dfa_canonical_lam1e-2_30ep/results_cifar10.json @@ -0,0 +1,549 @@ +{ + "42": { + "dfa": { + "log": { + "train_loss": [ + 1.9962164908218383, + 1.9369539144134522, + 1.9308127733612062, + 1.9288829196548463, + 1.924676773147583, + 1.918132286529541, + 1.918223798522949, + 1.9147104105377197, + 1.9164991827011109, + 1.9150708497619628, + 1.9118981461334228, + 1.9094872266387939, + 1.905809390487671, + 1.9049867826080322, + 1.90767120262146, + 1.9046393532562256, + 1.9038504275894166, + 1.9006466190338134, + 1.8996596237182617, + 1.8986669551086426, + 1.8997121560668946, + 1.8965645993423461, + 1.8971398455047608, + 1.8969778009414673, + 1.89667788482666, + 1.8934650146484375, + 1.8900965643310548, + 1.8924740059661864, + 1.892325519180298, + 1.8923273934555054 + ], + "train_acc": [ + 0.2802, + 0.30808, + 0.31262, + 0.3156, + 0.31668, + 0.31968, + 0.3211, + 0.32238, + 0.3231, + 0.32382, + 0.32378, + 0.32668, + 0.32826, + 0.32862, + 0.32902, + 0.32944, + 0.32948, + 0.33388, + 0.33008, + 0.33162, + 0.33228, + 0.33294, + 0.33364, + 0.33536, + 0.33534, + 0.3341, + 0.33584, + 0.33624, + 0.33534, + 0.34052 + ], + "test_acc": [ + 0.3313, + 0.3463, + 0.3422, + 0.3411, + 0.3597, + 0.3549, + 0.3499, + 0.3438, + 0.3423, + 0.3476, + 0.3497, + 0.3524, + 0.3595, + 0.3521, + 0.354, + 0.3537, + 0.3588, + 0.3613, + 0.356, + 0.359, + 0.3599, + 0.3572, + 0.3615, + 0.3592, + 0.3592, + 0.3609, + 0.3578, + 0.36, + 0.3611, + 0.3607 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.33146190643310547, + 0.16347576677799225, + 0.1610197126865387, + 0.17380905151367188 + ], + "perturbation_rho": [ + 0.12955714762210846, + 0.045910485088825226, + 0.08855772018432617, + 0.06986565887928009 + ], + "nudging": { + "0.001": [ + -1.3143871910870075e-05, + -5.465932190418243e-06, + -5.55114820599556e-06, + -5.612848326563835e-06 + ], + "0.003": [ + -3.937864676117897e-05, + -1.6393139958381653e-05, + -1.6577658243477345e-05, + -1.6813864931464195e-05 + ], + "0.01": [ + -0.00013115769252181053, + -5.455967038869858e-05, + -5.524198058992624e-05, + -5.596294067800045e-05 + ] + }, + "hidden_norms_per_layer": [ + 12120.9111328125, + 12188.2958984375, + 12193.77734375, + 12198.8359375, + 12219.8369140625 + ], + "bp_grad_norms_per_layer": [ + 1.3196319741837215e-05, + 1.3040654266660567e-05, + 1.2841821444453672e-05, + 1.2863742995250504e-05, + 1.2522319593699649e-05 + ] + }, + "drift": { + "embed.weight": 92.65036012342134, + "embed.bias": 95.50366326873346, + "blocks.0.ln.weight": 0.34198617935180664, + "blocks.0.w1.weight": 3.6285842919394478, + "blocks.0.w1.bias": 6.327346232452673, + "blocks.0.w2.weight": 18.245981750960237, + "blocks.1.ln.weight": 0.3590666353702545, + "blocks.1.w1.weight": 3.60860615088841, + "blocks.1.w1.bias": 6.19502489141982, + "blocks.1.w2.weight": 17.96136875105609, + "blocks.2.ln.weight": 0.36136317253112793, + "blocks.2.w1.weight": 3.702767807151941, + "blocks.2.w1.bias": 6.508610347801663, + "blocks.2.w2.weight": 19.259072912976688, + "blocks.3.ln.weight": 0.35671475529670715, + "blocks.3.w1.weight": 3.7164720093334025, + "blocks.3.w1.bias": 6.203418611522943, + "blocks.3.w2.weight": 19.77945180777123, + "out_ln.weight": 0.16879618167877197, + "out_head.weight": 2.418863784769041, + "out_head.bias": 1.1721698518470152 + } + } + }, + "123": { + "dfa": { + "log": { + "train_loss": [ + 1.9917970180892943, + 1.9455738663482667, + 1.9412584506225585, + 1.9381972328948975, + 1.935788204345703, + 1.9355586415863038, + 1.9291299639892578, + 1.9304945249938965, + 1.9279169077301026, + 1.9247258889389038, + 1.9270652098083496, + 1.9239173442077637, + 1.920924050216675, + 1.9179519243621825, + 1.9187614895629883, + 1.9149749173736572, + 1.9101889783477783, + 1.9113776821517945, + 1.9123343227767944, + 1.9115107091522217, + 1.9105930194091796, + 1.9092110122680663, + 1.9085102457046508, + 1.9054700579071044, + 1.906116495628357, + 1.9055400652313232, + 1.9055342751312256, + 1.9067684815216064, + 1.9050640679168702, + 1.9041575216674804 + ], + "train_acc": [ + 0.2828, + 0.3048, + 0.30986, + 0.31168, + 0.31358, + 0.31522, + 0.31574, + 0.317, + 0.31914, + 0.31836, + 0.31874, + 0.31798, + 0.32148, + 0.32276, + 0.32502, + 0.3259, + 0.32756, + 0.32626, + 0.32706, + 0.32784, + 0.329, + 0.32942, + 0.32888, + 0.33042, + 0.33034, + 0.33086, + 0.33476, + 0.33214, + 0.33166, + 0.33136 + ], + "test_acc": [ + 0.3309, + 0.3491, + 0.3382, + 0.3519, + 0.3375, + 0.3487, + 0.3436, + 0.3431, + 0.3632, + 0.341, + 0.3632, + 0.3623, + 0.3531, + 0.3536, + 0.3476, + 0.3485, + 0.3662, + 0.3539, + 0.3453, + 0.36, + 0.3532, + 0.3566, + 0.3562, + 0.3639, + 0.3622, + 0.3623, + 0.3579, + 0.3541, + 0.3576, + 0.3582 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3322567343711853, + 0.10321325808763504, + 0.15636520087718964, + 0.19004486501216888 + ], + "perturbation_rho": [ + 0.18363387882709503, + 0.04898637533187866, + 0.09784461557865143, + 0.09405896812677383 + ], + "nudging": { + "0.001": [ + -1.0297924745827913e-05, + -3.0525843612849712e-06, + -4.650210030376911e-06, + -5.671870894730091e-06 + ], + "0.003": [ + -3.089715028181672e-05, + -9.163166396319866e-06, + -1.3922981452196836e-05, + -1.7057405784726143e-05 + ], + "0.01": [ + -0.00010294892126694322, + -3.057112917304039e-05, + -4.6447094064205885e-05, + -5.68098621442914e-05 + ] + }, + "hidden_norms_per_layer": [ + 13127.3251953125, + 13128.8193359375, + 13141.9501953125, + 13135.3408203125, + 13141.1806640625 + ], + "bp_grad_norms_per_layer": [ + 1.0922197361651342e-05, + 1.074585088645108e-05, + 1.0719732017605565e-05, + 1.0678052603907418e-05, + 1.0736169315350708e-05 + ] + }, + "drift": { + "embed.weight": 95.06253847427116, + "embed.bias": 69.56343057263858, + "blocks.0.ln.weight": 0.35518038272857666, + "blocks.0.w1.weight": 3.5318213424051828, + "blocks.0.w1.bias": 6.6251757142063346, + "blocks.0.w2.weight": 18.1649292755703, + "blocks.1.ln.weight": 0.37566548585891724, + "blocks.1.w1.weight": 3.577683688515039, + "blocks.1.w1.bias": 6.4976786510039295, + "blocks.1.w2.weight": 18.132601820579644, + "blocks.2.ln.weight": 0.39002206921577454, + "blocks.2.w1.weight": 3.7319215256746268, + "blocks.2.w1.bias": 6.266003010226504, + "blocks.2.w2.weight": 18.870330386369503, + "blocks.3.ln.weight": 0.35860922932624817, + "blocks.3.w1.weight": 3.790655898639472, + "blocks.3.w1.bias": 5.892665738859735, + "blocks.3.w2.weight": 20.602751226104075, + "out_ln.weight": 0.15972787141799927, + "out_head.weight": 2.3651003853179144, + "out_head.bias": 1.3627504013501806 + } + } + }, + "456": { + "dfa": { + "log": { + "train_loss": [ + 1.9882178707504272, + 1.9317677951049805, + 1.9248256610870362, + 1.9217043152618407, + 1.917682172279358, + 1.919907767944336, + 1.9130486701202392, + 1.9160204236221314, + 1.9124437686920166, + 1.910402643661499, + 1.9057467068099976, + 1.9108504774475097, + 1.9094166152572631, + 1.9078613684844972, + 1.9042421661376954, + 1.9058136753082275, + 1.9045625204467773, + 1.9027692486953736, + 1.901805549621582, + 1.9018799402236939, + 1.8972413793945313, + 1.8987792961883545, + 1.897886729812622, + 1.894330054550171, + 1.8959275032806397, + 1.8961896368408202, + 1.8971351692962646, + 1.8951918316650391, + 1.89493817653656, + 1.8952873357391358 + ], + "train_acc": [ + 0.2782, + 0.30628, + 0.31294, + 0.31586, + 0.31784, + 0.31944, + 0.32352, + 0.32056, + 0.32366, + 0.32092, + 0.32656, + 0.3254, + 0.3272, + 0.3234, + 0.32672, + 0.32684, + 0.33252, + 0.3313, + 0.32936, + 0.33102, + 0.3319, + 0.33272, + 0.33364, + 0.3357, + 0.334, + 0.3336, + 0.33476, + 0.33474, + 0.3348, + 0.33498 + ], + "test_acc": [ + 0.3368, + 0.3538, + 0.3441, + 0.3634, + 0.343, + 0.3574, + 0.341, + 0.3403, + 0.3594, + 0.3606, + 0.3628, + 0.3674, + 0.3684, + 0.3558, + 0.3637, + 0.3632, + 0.3649, + 0.3565, + 0.3631, + 0.3629, + 0.3546, + 0.3629, + 0.3594, + 0.3629, + 0.3619, + 0.3609, + 0.3623, + 0.3609, + 0.3607, + 0.3614 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.35106080770492554, + 0.12957611680030823, + 0.12942053377628326, + 0.15940426290035248 + ], + "perturbation_rho": [ + 0.17636069655418396, + 0.08117785304784775, + 0.0472814217209816, + 0.11043912172317505 + ], + "nudging": { + "0.001": [ + -1.4475401258096099e-05, + -4.396220901980996e-06, + -4.46141348220408e-06, + -5.974114174023271e-06 + ], + "0.003": [ + -4.3450010707601905e-05, + -1.3241806300356984e-05, + -1.3367069186642766e-05, + -1.7999671399593353e-05 + ], + "0.01": [ + -0.00014482333790510893, + -4.394981078803539e-05, + -4.4448592234402895e-05, + -5.99866034463048e-05 + ] + }, + "hidden_norms_per_layer": [ + 12229.544921875, + 12266.8916015625, + 12257.5791015625, + 12255.2705078125, + 12254.3017578125 + ], + "bp_grad_norms_per_layer": [ + 1.334045191470068e-05, + 1.2721701750706416e-05, + 1.251421963388566e-05, + 1.2780437828041613e-05, + 1.2897891792817973e-05 + ] + }, + "drift": { + "embed.weight": 96.08641084786761, + "embed.bias": 127.15202633956196, + "blocks.0.ln.weight": 0.3495213985443115, + "blocks.0.w1.weight": 3.6819779928624996, + "blocks.0.w1.bias": 6.228241220813173, + "blocks.0.w2.weight": 17.84445507605505, + "blocks.1.ln.weight": 0.34699368476867676, + "blocks.1.w1.weight": 3.6269651247865355, + "blocks.1.w1.bias": 6.23888543559435, + "blocks.1.w2.weight": 17.036835876989706, + "blocks.2.ln.weight": 0.3590497076511383, + "blocks.2.w1.weight": 3.638377800312274, + "blocks.2.w1.bias": 6.075326782548754, + "blocks.2.w2.weight": 17.82232398341993, + "blocks.3.ln.weight": 0.35772791504859924, + "blocks.3.w1.weight": 3.76772753341028, + "blocks.3.w1.bias": 6.390494916053956, + "blocks.3.w2.weight": 18.92297820750716, + "out_ln.weight": 0.18465575575828552, + "out_head.weight": 2.515055641320841, + "out_head.bias": 1.320315434071626 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42, + 123, + 456 + ], + "gpu": 0, + "output_dir": "results/dfa_canonical_lam1e-2_30ep", + "methods": [ + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/dfa_canonical_lam1e-4_30ep/results_cifar10.json b/results/dfa_canonical_lam1e-4_30ep/results_cifar10.json new file mode 100644 index 0000000..c5480c9 --- /dev/null +++ b/results/dfa_canonical_lam1e-4_30ep/results_cifar10.json @@ -0,0 +1,549 @@ +{ + "42": { + "dfa": { + "log": { + "train_loss": [ + 2.0261129596710203, + 1.965970752182007, + 1.9461470681762696, + 1.931545509109497, + 1.9184623413085937, + 1.9065282035064697, + 1.902437851715088, + 1.895544966506958, + 1.8950473132705687, + 1.889725124206543, + 1.8855420764541626, + 1.880997481918335, + 1.8747885485839844, + 1.8749551737976073, + 1.873095685119629, + 1.8711490287017822, + 1.8692577294540405, + 1.865205725440979, + 1.8637552904891967, + 1.8656678380966187, + 1.8631304251480103, + 1.8602397272491455, + 1.8614968471908568, + 1.860624254989624, + 1.8599734017944336, + 1.8587864357757569, + 1.854469165649414, + 1.856863537902832, + 1.8563300177001953, + 1.8545278675079346 + ], + "train_acc": [ + 0.26118, + 0.28972, + 0.30092, + 0.3046, + 0.30976, + 0.31652, + 0.31542, + 0.31824, + 0.3199, + 0.32334, + 0.32476, + 0.32794, + 0.32848, + 0.32864, + 0.32798, + 0.33074, + 0.33078, + 0.33602, + 0.33204, + 0.33176, + 0.33496, + 0.33462, + 0.33306, + 0.33528, + 0.33536, + 0.33594, + 0.33782, + 0.33676, + 0.33434, + 0.33972 + ], + "test_acc": [ + 0.3121, + 0.3285, + 0.3222, + 0.32, + 0.3344, + 0.3365, + 0.3411, + 0.3402, + 0.3386, + 0.3497, + 0.3454, + 0.3599, + 0.3558, + 0.3517, + 0.3509, + 0.3522, + 0.3602, + 0.3593, + 0.3563, + 0.3609, + 0.3561, + 0.3571, + 0.3611, + 0.3599, + 0.3629, + 0.3627, + 0.3615, + 0.3611, + 0.3613, + 0.3617 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4050517678260803, + -0.013029102236032486, + 0.03315805643796921, + -0.013960793614387512 + ], + "perturbation_rho": [ + 0.12510338425636292, + -0.006976948119699955, + -0.015925724059343338, + 0.011312087066471577 + ], + "nudging": { + "0.001": [ + -7.806112989783287e-06, + -6.705522537231445e-08, + -3.022141754627228e-07, + 8.172355592250824e-08 + ], + "0.003": [ + -2.3321015760302544e-05, + -2.1257437765598297e-07, + -9.727664291858673e-07, + 2.891756594181061e-07 + ], + "0.01": [ + -7.774354889988899e-05, + -6.752088665962219e-07, + -3.1027011573314667e-06, + 1.0223593562841415e-06 + ] + }, + "hidden_norms_per_layer": [ + 10956.861328125, + 18143.607421875, + 21060.630859375, + 23016.607421875, + 24491.1171875 + ], + "bp_grad_norms_per_layer": [ + 7.272880793607328e-06, + 4.709177119366359e-06, + 4.678456662077224e-06, + 4.567728865367826e-06, + 4.537882432487095e-06 + ] + }, + "drift": { + "embed.weight": 89.9981502906406, + "embed.bias": 98.48191085272376, + "blocks.0.ln.weight": 0.9167992472648621, + "blocks.0.w1.weight": 10.6815522190785, + "blocks.0.w1.bias": 7.828161751177281, + "blocks.0.w2.weight": 38.808210617134726, + "blocks.1.ln.weight": 0.9728876352310181, + "blocks.1.w1.weight": 10.963974441809082, + "blocks.1.w1.bias": 5.055703734088147, + "blocks.1.w2.weight": 35.990717171803034, + "blocks.2.ln.weight": 0.9287830591201782, + "blocks.2.w1.weight": 11.93235751064561, + "blocks.2.w1.bias": 5.599607529376271, + "blocks.2.w2.weight": 43.70271229681688, + "blocks.3.ln.weight": 0.9019887447357178, + "blocks.3.w1.weight": 11.73703214757272, + "blocks.3.w1.bias": 4.954978948196952, + "blocks.3.w2.weight": 39.60266222485616, + "out_ln.weight": 0.1381552666425705, + "out_head.weight": 1.6594692518127092, + "out_head.bias": 1.1554215734743463 + } + } + }, + "123": { + "dfa": { + "log": { + "train_loss": [ + 2.0199886853790283, + 1.9583829278564453, + 1.9399597728729248, + 1.9226381231689453, + 1.9109827480697632, + 1.9015012389755248, + 1.8941318827056886, + 1.890287815246582, + 1.8868233013153075, + 1.8811580016708374, + 1.8821455502319335, + 1.879702535018921, + 1.8747499548721314, + 1.8705888650894165, + 1.8737954347991943, + 1.8678274332427978, + 1.861484291419983, + 1.8633367358398438, + 1.864215413131714, + 1.8632674326324463, + 1.862329735069275, + 1.863224948348999, + 1.8597282915878295, + 1.8569441051864624, + 1.8570497719955443, + 1.8558143846893311, + 1.8551305682373047, + 1.8570148430633544, + 1.8583727548217774, + 1.8555032357025147 + ], + "train_acc": [ + 0.26116, + 0.29306, + 0.30176, + 0.30766, + 0.31666, + 0.32172, + 0.32304, + 0.32316, + 0.32528, + 0.32762, + 0.32708, + 0.32632, + 0.32938, + 0.33256, + 0.33252, + 0.3339, + 0.33636, + 0.33564, + 0.3344, + 0.33576, + 0.33646, + 0.33592, + 0.33694, + 0.33802, + 0.33924, + 0.33946, + 0.34026, + 0.33802, + 0.33666, + 0.34056 + ], + "test_acc": [ + 0.3089, + 0.333, + 0.3314, + 0.3446, + 0.3445, + 0.3441, + 0.3434, + 0.3491, + 0.3456, + 0.3411, + 0.3524, + 0.3535, + 0.3493, + 0.3523, + 0.3599, + 0.3569, + 0.3643, + 0.3577, + 0.3539, + 0.3635, + 0.3616, + 0.3633, + 0.3622, + 0.3652, + 0.3634, + 0.3637, + 0.3622, + 0.3614, + 0.3636, + 0.3637 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4339396357536316, + -0.10015994310379028, + -0.017887549474835396, + 0.040999654680490494 + ], + "perturbation_rho": [ + 0.19203181564807892, + -0.038277432322502136, + 0.011904019862413406, + 0.005113246850669384 + ], + "nudging": { + "0.001": [ + -1.0719290003180504e-05, + 1.0670628398656845e-06, + 8.614733815193176e-08, + -5.248002707958221e-07 + ], + "0.003": [ + -3.2095471397042274e-05, + 3.2514799386262894e-06, + 3.771856427192688e-07, + -1.496635377407074e-06 + ], + "0.01": [ + -0.0001069442369043827, + 1.088087446987629e-05, + 1.3296958059072495e-06, + -4.966510459780693e-06 + ] + }, + "hidden_norms_per_layer": [ + 11421.578125, + 15917.556640625, + 17952.0625, + 20818.056640625, + 22884.724609375 + ], + "bp_grad_norms_per_layer": [ + 8.24415656097699e-06, + 5.0456683311495e-06, + 5.334758498065639e-06, + 5.458482974063372e-06, + 4.856112354900688e-06 + ] + }, + "drift": { + "embed.weight": 86.77573804339026, + "embed.bias": 84.55079592528128, + "blocks.0.ln.weight": 0.873725414276123, + "blocks.0.w1.weight": 10.119984774778466, + "blocks.0.w1.bias": 8.290345155770092, + "blocks.0.w2.weight": 38.8465868516302, + "blocks.1.ln.weight": 0.8992828726768494, + "blocks.1.w1.weight": 10.725943451191046, + "blocks.1.w1.bias": 6.0767567772252775, + "blocks.1.w2.weight": 34.06827682802752, + "blocks.2.ln.weight": 0.8814435601234436, + "blocks.2.w1.weight": 11.093024893301187, + "blocks.2.w1.bias": 5.85466310572377, + "blocks.2.w2.weight": 39.17455488648176, + "blocks.3.ln.weight": 0.864281952381134, + "blocks.3.w1.weight": 11.522907264038254, + "blocks.3.w1.bias": 5.830217292197888, + "blocks.3.w2.weight": 44.7400774921075, + "out_ln.weight": 0.14324577152729034, + "out_head.weight": 1.7398795739866528, + "out_head.bias": 1.603565887046315 + } + } + }, + "456": { + "dfa": { + "log": { + "train_loss": [ + 2.0270494400787356, + 1.9626524370956422, + 1.9387351146697998, + 1.9183588446426392, + 1.9022310787582397, + 1.8986060205841064, + 1.889561926574707, + 1.8879889819335938, + 1.879786368637085, + 1.8794735382461547, + 1.8745473431777955, + 1.8756215816497803, + 1.871411202316284, + 1.871703953819275, + 1.8679741104507446, + 1.8662110556793212, + 1.8646783707427979, + 1.8631719284820556, + 1.8607554779052735, + 1.8609626446151732, + 1.8584174155426025, + 1.856995953140259, + 1.8584875451660157, + 1.8541203423309327, + 1.8528442667388916, + 1.8555702542114259, + 1.854158247909546, + 1.8552892169570923, + 1.8528213509750366, + 1.853795170211792 + ], + "train_acc": [ + 0.25994, + 0.28998, + 0.30092, + 0.30864, + 0.31382, + 0.31866, + 0.32452, + 0.32284, + 0.32676, + 0.32548, + 0.32872, + 0.32832, + 0.33044, + 0.32716, + 0.32984, + 0.33082, + 0.33492, + 0.33234, + 0.33334, + 0.3352, + 0.33426, + 0.33602, + 0.33428, + 0.33574, + 0.33652, + 0.33572, + 0.33734, + 0.33416, + 0.33524, + 0.33676 + ], + "test_acc": [ + 0.303, + 0.3213, + 0.3218, + 0.3366, + 0.3324, + 0.3414, + 0.3426, + 0.3355, + 0.3523, + 0.357, + 0.3577, + 0.3603, + 0.3571, + 0.3588, + 0.3587, + 0.3621, + 0.3612, + 0.3582, + 0.3596, + 0.3601, + 0.3617, + 0.3598, + 0.3607, + 0.3598, + 0.3627, + 0.3609, + 0.3619, + 0.3611, + 0.3612, + 0.3614 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.42865899205207825, + -0.05478518456220627, + 0.038068704307079315, + -0.056306466460227966 + ], + "perturbation_rho": [ + 0.20215260982513428, + 0.011766819283366203, + 0.013697815127670765, + -0.005670403130352497 + ], + "nudging": { + "0.001": [ + -9.712064638733864e-06, + 4.707835614681244e-07, + -3.8545113056898117e-07, + 4.920875653624535e-07 + ], + "0.003": [ + -2.92585464194417e-05, + 1.3945391401648521e-06, + -1.1923257261514664e-06, + 1.539476215839386e-06 + ], + "0.01": [ + -9.755697101354599e-05, + 4.76837158203125e-06, + -4.0211016312241554e-06, + 5.003763362765312e-06 + ] + }, + "hidden_norms_per_layer": [ + 10800.751953125, + 18185.798828125, + 21568.359375, + 23534.529296875, + 25767.765625 + ], + "bp_grad_norms_per_layer": [ + 8.111597708193585e-06, + 4.7823082240938675e-06, + 4.949825324729318e-06, + 4.701300895249005e-06, + 4.799476755579235e-06 + ] + }, + "drift": { + "embed.weight": 91.29796969081434, + "embed.bias": 132.64457736863756, + "blocks.0.ln.weight": 0.9450518488883972, + "blocks.0.w1.weight": 11.023232822335661, + "blocks.0.w1.bias": 7.565836772828061, + "blocks.0.w2.weight": 40.72087672870546, + "blocks.1.ln.weight": 0.9085477590560913, + "blocks.1.w1.weight": 10.945316270784486, + "blocks.1.w1.bias": 4.626647858456354, + "blocks.1.w2.weight": 34.33902143396201, + "blocks.2.ln.weight": 0.900463879108429, + "blocks.2.w1.weight": 11.644326056575537, + "blocks.2.w1.bias": 5.303598149511605, + "blocks.2.w2.weight": 40.633521007369026, + "blocks.3.ln.weight": 0.898414671421051, + "blocks.3.w1.weight": 11.992557831950368, + "blocks.3.w1.bias": 4.96772779247091, + "blocks.3.w2.weight": 42.20788924018908, + "out_ln.weight": 0.14031164348125458, + "out_head.weight": 1.830198193189751, + "out_head.bias": 1.3683500872345247 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42, + 123, + 456 + ], + "gpu": 0, + "output_dir": "results/dfa_canonical_lam1e-4_30ep", + "methods": [ + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0001, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/dfa_canonical_penalty_sweep.log b/results/dfa_canonical_penalty_sweep.log new file mode 100644 index 0000000..533cddb --- /dev/null +++ b/results/dfa_canonical_penalty_sweep.log @@ -0,0 +1,77 @@ +=== DFA canonical penalty sweep === +Start: Wed Apr 29 02:04:53 PM CDT 2026 +--- λ=1e-4 --- +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0261, train=0.2612, test=0.3121 + [DFA] Epoch 10: loss=1.8897, train=0.3233, test=0.3497 + [DFA] Epoch 20: loss=1.8657, train=0.3318, test=0.3609 + [DFA] Epoch 30: loss=1.8545, train=0.3397, test=0.3617 + Final test acc: 0.3617 + +============================================================ +Seed 123 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0200, train=0.2612, test=0.3089 + [DFA] Epoch 10: loss=1.8812, train=0.3276, test=0.3411 + [DFA] Epoch 20: loss=1.8633, train=0.3358, test=0.3635 + [DFA] Epoch 30: loss=1.8555, train=0.3406, test=0.3637 + Final test acc: 0.3637 + +============================================================ +Seed 456 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=2.0270, train=0.2599, test=0.3030 + [DFA] Epoch 10: loss=1.8795, train=0.3255, test=0.3570 + [DFA] Epoch 20: loss=1.8610, train=0.3352, test=0.3601 + [DFA] Epoch 30: loss=1.8538, train=0.3368, test=0.3614 + Final test acc: 0.3614 + +All results saved to results/dfa_canonical_lam1e-4_30ep/results_cifar10.json +--- λ=1e-2 --- +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=1.9962, train=0.2802, test=0.3313 + [DFA] Epoch 10: loss=1.9151, train=0.3238, test=0.3476 + [DFA] Epoch 20: loss=1.8987, train=0.3316, test=0.3590 + [DFA] Epoch 30: loss=1.8923, train=0.3405, test=0.3607 + Final test acc: 0.3607 + +============================================================ +Seed 123 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=1.9918, train=0.2828, test=0.3309 + [DFA] Epoch 10: loss=1.9247, train=0.3184, test=0.3410 + [DFA] Epoch 20: loss=1.9115, train=0.3278, test=0.3600 + [DFA] Epoch 30: loss=1.9042, train=0.3314, test=0.3582 + Final test acc: 0.3582 + +============================================================ +Seed 456 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=1.9882, train=0.2782, test=0.3368 + [DFA] Epoch 10: loss=1.9104, train=0.3209, test=0.3606 + [DFA] Epoch 20: loss=1.9019, train=0.3310, test=0.3629 + [DFA] Epoch 30: loss=1.8953, train=0.3350, test=0.3614 + Final test acc: 0.3614 + +All results saved to results/dfa_canonical_lam1e-2_30ep/results_cifar10.json +=== PENALTY SWEEP DONE (Wed Apr 29 02:16:23 PM CDT 2026) === diff --git a/results/dfa_canonical_penalty_trajectory.json b/results/dfa_canonical_penalty_trajectory.json new file mode 100644 index 0000000..7e0a0b0 --- /dev/null +++ b/results/dfa_canonical_penalty_trajectory.json @@ -0,0 +1,1700 @@ +{ + "lam_0.0": { + "42": [ + { + "epoch": 0, + "h_L": 8.712287902832031, + "g_L": 0.007692961022257805, + "acc": 0.1875 + }, + { + "epoch": 1, + "h_L": 25517.626953125, + "g_L": 3.015350330315414e-06, + "acc": 0.3046875 + }, + { + "epoch": 2, + "h_L": 187723.15625, + "g_L": 4.921329264107044e-07, + "acc": 0.2734375 + }, + { + "epoch": 3, + "h_L": 638804.3125, + "g_L": 1.72370846485137e-07, + "acc": 0.3359375 + }, + { + "epoch": 4, + "h_L": 1530757.25, + "g_L": 8.140671781120545e-08, + "acc": 0.3203125 + }, + { + "epoch": 5, + "h_L": 2929533.25, + "g_L": 4.8859149615054775e-08, + "acc": 0.28125 + }, + { + "epoch": 6, + "h_L": 4820091.0, + "g_L": 3.349508759242781e-08, + "acc": 0.296875 + }, + { + "epoch": 7, + "h_L": 7294731.5, + "g_L": 2.5191106090005633e-08, + "acc": 0.28125 + }, + { + "epoch": 8, + "h_L": 10272320.0, + "g_L": 2.0386393018156923e-08, + "acc": 0.3125 + }, + { + "epoch": 9, + "h_L": 13648756.0, + "g_L": 1.696361628944487e-08, + "acc": 0.3359375 + }, + { + "epoch": 10, + "h_L": 17385214.0, + "g_L": 1.4690270333517219e-08, + "acc": 0.296875 + }, + { + "epoch": 11, + "h_L": 21316766.0, + "g_L": 1.3290279987643316e-08, + "acc": 0.3203125 + }, + { + "epoch": 12, + "h_L": 25327862.0, + "g_L": 1.2404703042534493e-08, + "acc": 0.3515625 + }, + { + "epoch": 13, + "h_L": 29378768.0, + "g_L": 1.1357126794564465e-08, + "acc": 0.3125 + }, + { + "epoch": 14, + "h_L": 33453014.0, + "g_L": 1.1003758793037832e-08, + "acc": 0.3125 + }, + { + "epoch": 15, + "h_L": 37359424.0, + "g_L": 1.0427936736334686e-08, + "acc": 0.28125 + }, + { + "epoch": 16, + "h_L": 41125660.0, + "g_L": 1.009045380584439e-08, + "acc": 0.3125 + }, + { + "epoch": 17, + "h_L": 44608188.0, + "g_L": 9.842747061838963e-09, + "acc": 0.34375 + }, + { + "epoch": 18, + "h_L": 47778936.0, + "g_L": 9.599874672971964e-09, + "acc": 0.328125 + }, + { + "epoch": 19, + "h_L": 50641172.0, + "g_L": 9.438979375886447e-09, + "acc": 0.3203125 + }, + { + "epoch": 20, + "h_L": 53166848.0, + "g_L": 9.18363252111476e-09, + "acc": 0.3203125 + }, + { + "epoch": 21, + "h_L": 55307292.0, + "g_L": 9.047339766254936e-09, + "acc": 0.328125 + }, + { + "epoch": 22, + "h_L": 57118320.0, + "g_L": 9.087989916167771e-09, + "acc": 0.3515625 + }, + { + "epoch": 23, + "h_L": 58568284.0, + "g_L": 8.887828251147312e-09, + "acc": 0.328125 + }, + { + "epoch": 24, + "h_L": 59706620.0, + "g_L": 8.837604426048529e-09, + "acc": 0.3671875 + }, + { + "epoch": 25, + "h_L": 60537984.0, + "g_L": 8.748822111215304e-09, + "acc": 0.3515625 + }, + { + "epoch": 26, + "h_L": 61129664.0, + "g_L": 8.773011650475837e-09, + "acc": 0.3359375 + }, + { + "epoch": 27, + "h_L": 61528648.0, + "g_L": 8.687391250816745e-09, + "acc": 0.3203125 + }, + { + "epoch": 28, + "h_L": 61746964.0, + "g_L": 8.71883010233887e-09, + "acc": 0.34375 + }, + { + "epoch": 29, + "h_L": 61837164.0, + "g_L": 8.695896447363793e-09, + "acc": 0.3359375 + }, + { + "epoch": 30, + "h_L": 61864056.0, + "g_L": 8.705518084184405e-09, + "acc": 0.3359375 + } + ], + "123": [ + { + "epoch": 0, + "h_L": 8.727029800415039, + "g_L": 0.007806388195604086, + "acc": 0.125 + }, + { + "epoch": 1, + "h_L": 28512.310546875, + "g_L": 2.7645430691336514e-06, + "acc": 0.3125 + }, + { + "epoch": 2, + "h_L": 242307.015625, + "g_L": 4.435606797414948e-07, + "acc": 0.28125 + }, + { + "epoch": 3, + "h_L": 778565.125, + "g_L": 1.5542912024102407e-07, + "acc": 0.3515625 + }, + { + "epoch": 4, + "h_L": 1817878.125, + "g_L": 7.429830617411426e-08, + "acc": 0.328125 + }, + { + "epoch": 5, + "h_L": 3405286.75, + "g_L": 4.3793082937781946e-08, + "acc": 0.34375 + }, + { + "epoch": 6, + "h_L": 5529127.0, + "g_L": 2.9323603101261142e-08, + "acc": 0.2890625 + }, + { + "epoch": 7, + "h_L": 8235227.5, + "g_L": 2.169775648042105e-08, + "acc": 0.3125 + }, + { + "epoch": 8, + "h_L": 11420799.0, + "g_L": 1.6955192805312436e-08, + "acc": 0.328125 + }, + { + "epoch": 9, + "h_L": 14979192.0, + "g_L": 1.3999311043733087e-08, + "acc": 0.3359375 + }, + { + "epoch": 10, + "h_L": 18824920.0, + "g_L": 1.1846083225464099e-08, + "acc": 0.359375 + }, + { + "epoch": 11, + "h_L": 22902218.0, + "g_L": 1.026967311190674e-08, + "acc": 0.34375 + }, + { + "epoch": 12, + "h_L": 27016386.0, + "g_L": 9.538137391018608e-09, + "acc": 0.3515625 + }, + { + "epoch": 13, + "h_L": 31142226.0, + "g_L": 8.575429255586187e-09, + "acc": 0.3359375 + }, + { + "epoch": 14, + "h_L": 35200724.0, + "g_L": 7.853660832779497e-09, + "acc": 0.3359375 + }, + { + "epoch": 15, + "h_L": 39174616.0, + "g_L": 7.4487194190453465e-09, + "acc": 0.3203125 + }, + { + "epoch": 16, + "h_L": 42896120.0, + "g_L": 6.9939956048870044e-09, + "acc": 0.328125 + }, + { + "epoch": 17, + "h_L": 46370948.0, + "g_L": 6.490188830809984e-09, + "acc": 0.328125 + }, + { + "epoch": 18, + "h_L": 49550152.0, + "g_L": 6.39121644496754e-09, + "acc": 0.3515625 + }, + { + "epoch": 19, + "h_L": 52373968.0, + "g_L": 6.192652168834911e-09, + "acc": 0.3203125 + }, + { + "epoch": 20, + "h_L": 54860348.0, + "g_L": 5.9536344743094105e-09, + "acc": 0.3359375 + }, + { + "epoch": 21, + "h_L": 57018952.0, + "g_L": 5.7695772603949536e-09, + "acc": 0.34375 + }, + { + "epoch": 22, + "h_L": 58809320.0, + "g_L": 5.8747517961421636e-09, + "acc": 0.3359375 + }, + { + "epoch": 23, + "h_L": 60258896.0, + "g_L": 5.576731521017564e-09, + "acc": 0.3359375 + }, + { + "epoch": 24, + "h_L": 61394224.0, + "g_L": 5.6349089838647615e-09, + "acc": 0.34375 + }, + { + "epoch": 25, + "h_L": 62249124.0, + "g_L": 5.502207578444995e-09, + "acc": 0.3515625 + }, + { + "epoch": 26, + "h_L": 62824264.0, + "g_L": 5.472856834387585e-09, + "acc": 0.3125 + }, + { + "epoch": 27, + "h_L": 63214608.0, + "g_L": 5.4884821132361594e-09, + "acc": 0.328125 + }, + { + "epoch": 28, + "h_L": 63431440.0, + "g_L": 5.445803363812729e-09, + "acc": 0.3203125 + }, + { + "epoch": 29, + "h_L": 63531652.0, + "g_L": 5.426181726164714e-09, + "acc": 0.34375 + }, + { + "epoch": 30, + "h_L": 63556504.0, + "g_L": 5.43510747519349e-09, + "acc": 0.328125 + } + ], + "456": [ + { + "epoch": 0, + "h_L": 8.894441604614258, + "g_L": 0.007735385559499264, + "acc": 0.0859375 + }, + { + "epoch": 1, + "h_L": 62562.77734375, + "g_L": 1.3566098004957894e-06, + "acc": 0.2578125 + }, + { + "epoch": 2, + "h_L": 450057.34375, + "g_L": 2.3346490252151852e-07, + "acc": 0.3359375 + }, + { + "epoch": 3, + "h_L": 1439747.0, + "g_L": 8.182778543641689e-08, + "acc": 0.3125 + }, + { + "epoch": 4, + "h_L": 3178386.0, + "g_L": 4.1966078612176716e-08, + "acc": 0.3203125 + }, + { + "epoch": 5, + "h_L": 5781704.5, + "g_L": 2.5947548110138996e-08, + "acc": 0.3046875 + }, + { + "epoch": 6, + "h_L": 9215938.0, + "g_L": 1.8552263725268858e-08, + "acc": 0.3046875 + }, + { + "epoch": 7, + "h_L": 13491701.0, + "g_L": 1.392057846771877e-08, + "acc": 0.28125 + }, + { + "epoch": 8, + "h_L": 18509538.0, + "g_L": 1.1343586514556137e-08, + "acc": 0.3125 + }, + { + "epoch": 9, + "h_L": 24168566.0, + "g_L": 9.524081967526854e-09, + "acc": 0.2890625 + }, + { + "epoch": 10, + "h_L": 30181044.0, + "g_L": 8.360129477580358e-09, + "acc": 0.296875 + }, + { + "epoch": 11, + "h_L": 36407860.0, + "g_L": 7.424783898812848e-09, + "acc": 0.265625 + }, + { + "epoch": 12, + "h_L": 42878992.0, + "g_L": 6.818685172049754e-09, + "acc": 0.296875 + }, + { + "epoch": 13, + "h_L": 49422496.0, + "g_L": 6.295156840252503e-09, + "acc": 0.328125 + }, + { + "epoch": 14, + "h_L": 55832960.0, + "g_L": 5.912176526123858e-09, + "acc": 0.3125 + }, + { + "epoch": 15, + "h_L": 62015928.0, + "g_L": 5.570892191997245e-09, + "acc": 0.296875 + }, + { + "epoch": 16, + "h_L": 67939856.0, + "g_L": 5.281161730152917e-09, + "acc": 0.34375 + }, + { + "epoch": 17, + "h_L": 73442712.0, + "g_L": 5.147563708618463e-09, + "acc": 0.3125 + }, + { + "epoch": 18, + "h_L": 78496368.0, + "g_L": 4.936989927983859e-09, + "acc": 0.328125 + }, + { + "epoch": 19, + "h_L": 82992408.0, + "g_L": 4.855085666832792e-09, + "acc": 0.328125 + }, + { + "epoch": 20, + "h_L": 86961680.0, + "g_L": 4.7778438982959415e-09, + "acc": 0.3125 + }, + { + "epoch": 21, + "h_L": 90389344.0, + "g_L": 4.6255612673462565e-09, + "acc": 0.2734375 + }, + { + "epoch": 22, + "h_L": 93246512.0, + "g_L": 4.607939363410196e-09, + "acc": 0.265625 + }, + { + "epoch": 23, + "h_L": 95522544.0, + "g_L": 4.5615355936945434e-09, + "acc": 0.3046875 + }, + { + "epoch": 24, + "h_L": 97324656.0, + "g_L": 4.491897076519535e-09, + "acc": 0.2890625 + }, + { + "epoch": 25, + "h_L": 98654984.0, + "g_L": 4.464624669964223e-09, + "acc": 0.3046875 + }, + { + "epoch": 26, + "h_L": 99586368.0, + "g_L": 4.4403134502601915e-09, + "acc": 0.296875 + }, + { + "epoch": 27, + "h_L": 100193928.0, + "g_L": 4.401520481422949e-09, + "acc": 0.2890625 + }, + { + "epoch": 28, + "h_L": 100529568.0, + "g_L": 4.431190525622242e-09, + "acc": 0.3125 + }, + { + "epoch": 29, + "h_L": 100676312.0, + "g_L": 4.422026744776986e-09, + "acc": 0.3125 + }, + { + "epoch": 30, + "h_L": 100718184.0, + "g_L": 4.412690213229098e-09, + "acc": 0.3125 + } + ] + }, + "lam_0.0001": { + "42": [ + { + "epoch": 0, + "h_L": 8.712287902832031, + "g_L": 0.007692961022257805, + "acc": 0.1875 + }, + { + "epoch": 1, + "h_L": 5304.19677734375, + "g_L": 1.3745666365139186e-05, + "acc": 0.359375 + }, + { + "epoch": 2, + "h_L": 8347.4375, + "g_L": 8.957185855251737e-06, + "acc": 0.375 + }, + { + "epoch": 3, + "h_L": 9963.34765625, + "g_L": 7.723083399469033e-06, + "acc": 0.390625 + }, + { + "epoch": 4, + "h_L": 11214.49609375, + "g_L": 7.199604169727536e-06, + "acc": 0.3828125 + }, + { + "epoch": 5, + "h_L": 12479.6572265625, + "g_L": 6.587237294297665e-06, + "acc": 0.3828125 + }, + { + "epoch": 6, + "h_L": 14410.3369140625, + "g_L": 5.815574695589021e-06, + "acc": 0.390625 + }, + { + "epoch": 7, + "h_L": 14976.51953125, + "g_L": 5.894468358746963e-06, + "acc": 0.421875 + }, + { + "epoch": 8, + "h_L": 16621.982421875, + "g_L": 5.4373017519537825e-06, + "acc": 0.40625 + }, + { + "epoch": 9, + "h_L": 17072.162109375, + "g_L": 5.349741968529997e-06, + "acc": 0.390625 + }, + { + "epoch": 10, + "h_L": 18436.125, + "g_L": 5.2785831030632835e-06, + "acc": 0.40625 + }, + { + "epoch": 11, + "h_L": 19100.84375, + "g_L": 4.93000470669358e-06, + "acc": 0.40625 + }, + { + "epoch": 12, + "h_L": 20026.234375, + "g_L": 4.96132270200178e-06, + "acc": 0.3984375 + }, + { + "epoch": 13, + "h_L": 20926.4296875, + "g_L": 4.77847743241e-06, + "acc": 0.4375 + }, + { + "epoch": 14, + "h_L": 21417.533203125, + "g_L": 4.665030701289652e-06, + "acc": 0.421875 + }, + { + "epoch": 15, + "h_L": 21616.3828125, + "g_L": 4.687757609644905e-06, + "acc": 0.4140625 + }, + { + "epoch": 16, + "h_L": 22411.86328125, + "g_L": 4.594817255565431e-06, + "acc": 0.4140625 + }, + { + "epoch": 17, + "h_L": 23077.751953125, + "g_L": 4.6028981159906834e-06, + "acc": 0.4296875 + }, + { + "epoch": 18, + "h_L": 23492.974609375, + "g_L": 4.451253516890574e-06, + "acc": 0.4375 + }, + { + "epoch": 19, + "h_L": 23953.103515625, + "g_L": 4.620688741852064e-06, + "acc": 0.3984375 + }, + { + "epoch": 20, + "h_L": 24102.9609375, + "g_L": 4.5326728468353394e-06, + "acc": 0.421875 + }, + { + "epoch": 21, + "h_L": 24251.92578125, + "g_L": 4.4520375013235025e-06, + "acc": 0.40625 + }, + { + "epoch": 22, + "h_L": 24588.142578125, + "g_L": 4.374121544969967e-06, + "acc": 0.390625 + }, + { + "epoch": 23, + "h_L": 24537.626953125, + "g_L": 4.499482201936189e-06, + "acc": 0.4140625 + }, + { + "epoch": 24, + "h_L": 24779.64453125, + "g_L": 4.444983005669201e-06, + "acc": 0.4140625 + }, + { + "epoch": 25, + "h_L": 24894.173828125, + "g_L": 4.422732672537677e-06, + "acc": 0.4140625 + }, + { + "epoch": 26, + "h_L": 24921.201171875, + "g_L": 4.38425468018977e-06, + "acc": 0.421875 + }, + { + "epoch": 27, + "h_L": 25045.3125, + "g_L": 4.367500878288411e-06, + "acc": 0.4296875 + }, + { + "epoch": 28, + "h_L": 25072.015625, + "g_L": 4.3748268581111915e-06, + "acc": 0.421875 + }, + { + "epoch": 29, + "h_L": 25075.091796875, + "g_L": 4.3758886931755114e-06, + "acc": 0.4296875 + }, + { + "epoch": 30, + "h_L": 25079.751953125, + "g_L": 4.373700448923046e-06, + "acc": 0.4296875 + } + ], + "123": [ + { + "epoch": 0, + "h_L": 8.727029800415039, + "g_L": 0.007806388195604086, + "acc": 0.125 + }, + { + "epoch": 1, + "h_L": 4016.624267578125, + "g_L": 1.7260634194826707e-05, + "acc": 0.3828125 + }, + { + "epoch": 2, + "h_L": 6011.0166015625, + "g_L": 1.3166837561584543e-05, + "acc": 0.359375 + }, + { + "epoch": 3, + "h_L": 7996.4658203125, + "g_L": 1.0084489076689351e-05, + "acc": 0.40625 + }, + { + "epoch": 4, + "h_L": 10071.7587890625, + "g_L": 9.058319847099483e-06, + "acc": 0.3359375 + }, + { + "epoch": 5, + "h_L": 11450.2314453125, + "g_L": 7.843047569622286e-06, + "acc": 0.390625 + }, + { + "epoch": 6, + "h_L": 12963.515625, + "g_L": 7.70912356529152e-06, + "acc": 0.3828125 + }, + { + "epoch": 7, + "h_L": 13889.9296875, + "g_L": 7.074252607708331e-06, + "acc": 0.3984375 + }, + { + "epoch": 8, + "h_L": 14898.4521484375, + "g_L": 6.701112397422548e-06, + "acc": 0.3671875 + }, + { + "epoch": 9, + "h_L": 15605.6416015625, + "g_L": 6.628116352658253e-06, + "acc": 0.3359375 + }, + { + "epoch": 10, + "h_L": 16354.34765625, + "g_L": 6.123417733761016e-06, + "acc": 0.4140625 + }, + { + "epoch": 11, + "h_L": 17406.775390625, + "g_L": 6.1299856497498695e-06, + "acc": 0.3515625 + }, + { + "epoch": 12, + "h_L": 18088.765625, + "g_L": 5.712134225177579e-06, + "acc": 0.421875 + }, + { + "epoch": 13, + "h_L": 19012.17578125, + "g_L": 5.742204848502297e-06, + "acc": 0.3984375 + }, + { + "epoch": 14, + "h_L": 19094.021484375, + "g_L": 5.576457624556497e-06, + "acc": 0.3828125 + }, + { + "epoch": 15, + "h_L": 19893.8984375, + "g_L": 5.415755822468782e-06, + "acc": 0.3828125 + }, + { + "epoch": 16, + "h_L": 20340.494140625, + "g_L": 5.4991201068332884e-06, + "acc": 0.3671875 + }, + { + "epoch": 17, + "h_L": 20969.142578125, + "g_L": 5.276073807181092e-06, + "acc": 0.390625 + }, + { + "epoch": 18, + "h_L": 21435.447265625, + "g_L": 5.061881438450655e-06, + "acc": 0.3984375 + }, + { + "epoch": 19, + "h_L": 21808.82421875, + "g_L": 5.190079264139058e-06, + "acc": 0.34375 + }, + { + "epoch": 20, + "h_L": 21931.640625, + "g_L": 5.1184742915211245e-06, + "acc": 0.421875 + }, + { + "epoch": 21, + "h_L": 22451.287109375, + "g_L": 5.059521299699554e-06, + "acc": 0.3984375 + }, + { + "epoch": 22, + "h_L": 22345.939453125, + "g_L": 5.103088369651232e-06, + "acc": 0.390625 + }, + { + "epoch": 23, + "h_L": 22520.41796875, + "g_L": 4.985096893506125e-06, + "acc": 0.3984375 + }, + { + "epoch": 24, + "h_L": 22641.974609375, + "g_L": 5.011982921132585e-06, + "acc": 0.3828125 + }, + { + "epoch": 25, + "h_L": 22696.12109375, + "g_L": 5.002185844205087e-06, + "acc": 0.390625 + }, + { + "epoch": 26, + "h_L": 22765.455078125, + "g_L": 5.096676432003733e-06, + "acc": 0.3828125 + }, + { + "epoch": 27, + "h_L": 22801.35546875, + "g_L": 5.082401457912056e-06, + "acc": 0.3828125 + }, + { + "epoch": 28, + "h_L": 22840.58984375, + "g_L": 5.019065156375291e-06, + "acc": 0.40625 + }, + { + "epoch": 29, + "h_L": 22821.912109375, + "g_L": 5.026035069022328e-06, + "acc": 0.40625 + }, + { + "epoch": 30, + "h_L": 22816.4609375, + "g_L": 5.030014563089935e-06, + "acc": 0.40625 + } + ], + "456": [ + { + "epoch": 0, + "h_L": 8.894441604614258, + "g_L": 0.007735385559499264, + "acc": 0.0859375 + }, + { + "epoch": 1, + "h_L": 5110.58203125, + "g_L": 1.5124841411306988e-05, + "acc": 0.3125 + }, + { + "epoch": 2, + "h_L": 7120.255859375, + "g_L": 1.0910134733421728e-05, + "acc": 0.3515625 + }, + { + "epoch": 3, + "h_L": 8524.048828125, + "g_L": 9.681118172011338e-06, + "acc": 0.3671875 + }, + { + "epoch": 4, + "h_L": 10678.4375, + "g_L": 8.237396286858711e-06, + "acc": 0.3828125 + }, + { + "epoch": 5, + "h_L": 12649.2197265625, + "g_L": 7.375441782642156e-06, + "acc": 0.359375 + }, + { + "epoch": 6, + "h_L": 14385.1181640625, + "g_L": 6.8287376961961854e-06, + "acc": 0.3828125 + }, + { + "epoch": 7, + "h_L": 15401.474609375, + "g_L": 6.515695986308856e-06, + "acc": 0.375 + }, + { + "epoch": 8, + "h_L": 16394.466796875, + "g_L": 6.375977591233095e-06, + "acc": 0.3515625 + }, + { + "epoch": 9, + "h_L": 17472.876953125, + "g_L": 5.9727485677285586e-06, + "acc": 0.3515625 + }, + { + "epoch": 10, + "h_L": 18387.716796875, + "g_L": 5.8594741858541965e-06, + "acc": 0.3828125 + }, + { + "epoch": 11, + "h_L": 19510.287109375, + "g_L": 5.543481620406965e-06, + "acc": 0.34375 + }, + { + "epoch": 12, + "h_L": 20385.5390625, + "g_L": 5.301766577758826e-06, + "acc": 0.3828125 + }, + { + "epoch": 13, + "h_L": 21074.40625, + "g_L": 5.097903795103775e-06, + "acc": 0.3828125 + }, + { + "epoch": 14, + "h_L": 21849.759765625, + "g_L": 5.058767783339135e-06, + "acc": 0.3828125 + }, + { + "epoch": 15, + "h_L": 22503.189453125, + "g_L": 5.003597379982239e-06, + "acc": 0.375 + }, + { + "epoch": 16, + "h_L": 22886.828125, + "g_L": 5.006335868529277e-06, + "acc": 0.34375 + }, + { + "epoch": 17, + "h_L": 23453.025390625, + "g_L": 4.8392594180768356e-06, + "acc": 0.375 + }, + { + "epoch": 18, + "h_L": 23727.587890625, + "g_L": 4.791942046722397e-06, + "acc": 0.3515625 + }, + { + "epoch": 19, + "h_L": 24562.845703125, + "g_L": 4.76715558761498e-06, + "acc": 0.3515625 + }, + { + "epoch": 20, + "h_L": 24665.26953125, + "g_L": 4.814321073354222e-06, + "acc": 0.4140625 + }, + { + "epoch": 21, + "h_L": 24827.166015625, + "g_L": 4.5910783228464425e-06, + "acc": 0.375 + }, + { + "epoch": 22, + "h_L": 25102.697265625, + "g_L": 4.780752078659134e-06, + "acc": 0.390625 + }, + { + "epoch": 23, + "h_L": 25473.859375, + "g_L": 4.675451236835215e-06, + "acc": 0.3671875 + }, + { + "epoch": 24, + "h_L": 25564.466796875, + "g_L": 4.625650035450235e-06, + "acc": 0.3828125 + }, + { + "epoch": 25, + "h_L": 25727.142578125, + "g_L": 4.7758098844497e-06, + "acc": 0.3671875 + }, + { + "epoch": 26, + "h_L": 25853.39453125, + "g_L": 4.7036078285600524e-06, + "acc": 0.3671875 + }, + { + "epoch": 27, + "h_L": 25756.21875, + "g_L": 4.671791430155281e-06, + "acc": 0.375 + }, + { + "epoch": 28, + "h_L": 25913.666015625, + "g_L": 4.683739916799823e-06, + "acc": 0.3671875 + }, + { + "epoch": 29, + "h_L": 25931.091796875, + "g_L": 4.690837158705108e-06, + "acc": 0.375 + }, + { + "epoch": 30, + "h_L": 25938.986328125, + "g_L": 4.685749900090741e-06, + "acc": 0.3671875 + } + ] + }, + "lam_0.01": { + "42": [ + { + "epoch": 0, + "h_L": 8.712287902832031, + "g_L": 0.007692961022257805, + "acc": 0.1875 + }, + { + "epoch": 1, + "h_L": 781.689208984375, + "g_L": 8.415478805545717e-05, + "acc": 0.359375 + }, + { + "epoch": 2, + "h_L": 1539.8074951171875, + "g_L": 4.868719042860903e-05, + "acc": 0.328125 + }, + { + "epoch": 3, + "h_L": 2314.643798828125, + "g_L": 3.541138721629977e-05, + "acc": 0.3828125 + }, + { + "epoch": 4, + "h_L": 3041.840576171875, + "g_L": 2.95412046398269e-05, + "acc": 0.390625 + }, + { + "epoch": 5, + "h_L": 3805.263671875, + "g_L": 2.4733428290346637e-05, + "acc": 0.3515625 + }, + { + "epoch": 6, + "h_L": 4531.37060546875, + "g_L": 2.1849658878636546e-05, + "acc": 0.3828125 + }, + { + "epoch": 7, + "h_L": 5269.0361328125, + "g_L": 2.025548747042194e-05, + "acc": 0.3984375 + }, + { + "epoch": 8, + "h_L": 5989.7841796875, + "g_L": 1.8758984879241325e-05, + "acc": 0.375 + }, + { + "epoch": 9, + "h_L": 6682.50439453125, + "g_L": 1.7715005014906637e-05, + "acc": 0.3984375 + }, + { + "epoch": 10, + "h_L": 7327.41845703125, + "g_L": 1.6974596292129718e-05, + "acc": 0.4140625 + }, + { + "epoch": 11, + "h_L": 7892.38623046875, + "g_L": 1.5582731066388078e-05, + "acc": 0.3828125 + }, + { + "epoch": 12, + "h_L": 8436.2568359375, + "g_L": 1.5689396605012007e-05, + "acc": 0.4140625 + }, + { + "epoch": 13, + "h_L": 8911.0517578125, + "g_L": 1.5322731997002847e-05, + "acc": 0.3671875 + }, + { + "epoch": 14, + "h_L": 9403.470703125, + "g_L": 1.4264693163568154e-05, + "acc": 0.40625 + }, + { + "epoch": 15, + "h_L": 9869.5830078125, + "g_L": 1.4241470125853084e-05, + "acc": 0.3828125 + }, + { + "epoch": 16, + "h_L": 10266.16015625, + "g_L": 1.4325265510706231e-05, + "acc": 0.375 + }, + { + "epoch": 17, + "h_L": 10605.20703125, + "g_L": 1.3871001101506408e-05, + "acc": 0.3828125 + }, + { + "epoch": 18, + "h_L": 10923.232421875, + "g_L": 1.3506460163625889e-05, + "acc": 0.3671875 + }, + { + "epoch": 19, + "h_L": 11199.2412109375, + "g_L": 1.3500241948349867e-05, + "acc": 0.375 + }, + { + "epoch": 20, + "h_L": 11431.51953125, + "g_L": 1.3691166714124847e-05, + "acc": 0.3671875 + }, + { + "epoch": 21, + "h_L": 11597.671875, + "g_L": 1.3415501598501578e-05, + "acc": 0.390625 + }, + { + "epoch": 22, + "h_L": 11771.76171875, + "g_L": 1.3021815902902745e-05, + "acc": 0.3984375 + }, + { + "epoch": 23, + "h_L": 11863.4931640625, + "g_L": 1.3140968803782016e-05, + "acc": 0.3828125 + }, + { + "epoch": 24, + "h_L": 11969.8408203125, + "g_L": 1.3101844160701148e-05, + "acc": 0.4140625 + }, + { + "epoch": 25, + "h_L": 12025.537109375, + "g_L": 1.3040696103416849e-05, + "acc": 0.3828125 + }, + { + "epoch": 26, + "h_L": 12073.8076171875, + "g_L": 1.2962437722308096e-05, + "acc": 0.375 + }, + { + "epoch": 27, + "h_L": 12116.3662109375, + "g_L": 1.3158919500710908e-05, + "acc": 0.390625 + }, + { + "epoch": 28, + "h_L": 12139.900390625, + "g_L": 1.3164692063583061e-05, + "acc": 0.375 + }, + { + "epoch": 29, + "h_L": 12146.0966796875, + "g_L": 1.3183536793803796e-05, + "acc": 0.375 + }, + { + "epoch": 30, + "h_L": 12147.8271484375, + "g_L": 1.3151197890692856e-05, + "acc": 0.3671875 + } + ], + "123": [ + { + "epoch": 0, + "h_L": 8.727029800415039, + "g_L": 0.007806388195604086, + "acc": 0.125 + }, + { + "epoch": 1, + "h_L": 804.5269775390625, + "g_L": 7.68803438404575e-05, + "acc": 0.3828125 + }, + { + "epoch": 2, + "h_L": 1581.7164306640625, + "g_L": 4.342455213190988e-05, + "acc": 0.359375 + }, + { + "epoch": 3, + "h_L": 2421.16015625, + "g_L": 3.13532909785863e-05, + "acc": 0.40625 + }, + { + "epoch": 4, + "h_L": 3297.1318359375, + "g_L": 2.4924784156610258e-05, + "acc": 0.375 + }, + { + "epoch": 5, + "h_L": 4140.81787109375, + "g_L": 2.2291569621302187e-05, + "acc": 0.359375 + }, + { + "epoch": 6, + "h_L": 4962.48828125, + "g_L": 1.878242073871661e-05, + "acc": 0.359375 + }, + { + "epoch": 7, + "h_L": 5745.4970703125, + "g_L": 1.714128848107066e-05, + "acc": 0.40625 + }, + { + "epoch": 8, + "h_L": 6502.54833984375, + "g_L": 1.6141369997058064e-05, + "acc": 0.3671875 + }, + { + "epoch": 9, + "h_L": 7201.73095703125, + "g_L": 1.5111980246729217e-05, + "acc": 0.3828125 + }, + { + "epoch": 10, + "h_L": 7894.11962890625, + "g_L": 1.4007100617163815e-05, + "acc": 0.4375 + }, + { + "epoch": 11, + "h_L": 8513.216796875, + "g_L": 1.3769726137979887e-05, + "acc": 0.3984375 + }, + { + "epoch": 12, + "h_L": 9157.7392578125, + "g_L": 1.3569000657298602e-05, + "acc": 0.390625 + }, + { + "epoch": 13, + "h_L": 9707.62890625, + "g_L": 1.2571725164889358e-05, + "acc": 0.4140625 + }, + { + "epoch": 14, + "h_L": 10252.697265625, + "g_L": 1.2447404515114613e-05, + "acc": 0.390625 + }, + { + "epoch": 15, + "h_L": 10741.009765625, + "g_L": 1.2337825864960905e-05, + "acc": 0.3671875 + }, + { + "epoch": 16, + "h_L": 11135.705078125, + "g_L": 1.2025854630337562e-05, + "acc": 0.390625 + }, + { + "epoch": 17, + "h_L": 11506.6748046875, + "g_L": 1.1528948562045116e-05, + "acc": 0.4140625 + }, + { + "epoch": 18, + "h_L": 11867.5556640625, + "g_L": 1.1563630323507823e-05, + "acc": 0.375 + }, + { + "epoch": 19, + "h_L": 12145.7763671875, + "g_L": 1.1255759091000073e-05, + "acc": 0.3828125 + }, + { + "epoch": 20, + "h_L": 12389.25, + "g_L": 1.1145174539706204e-05, + "acc": 0.3984375 + }, + { + "epoch": 21, + "h_L": 12601.6962890625, + "g_L": 1.1093687135144137e-05, + "acc": 0.3984375 + }, + { + "epoch": 22, + "h_L": 12786.6484375, + "g_L": 1.1049281056330074e-05, + "acc": 0.3984375 + }, + { + "epoch": 23, + "h_L": 12927.1630859375, + "g_L": 1.081726441043429e-05, + "acc": 0.390625 + }, + { + "epoch": 24, + "h_L": 13034.91796875, + "g_L": 1.0955274774460122e-05, + "acc": 0.3984375 + }, + { + "epoch": 25, + "h_L": 13112.890625, + "g_L": 1.0876665328396484e-05, + "acc": 0.3984375 + }, + { + "epoch": 26, + "h_L": 13168.7705078125, + "g_L": 1.0894200386246666e-05, + "acc": 0.3671875 + }, + { + "epoch": 27, + "h_L": 13206.673828125, + "g_L": 1.08816493593622e-05, + "acc": 0.390625 + }, + { + "epoch": 28, + "h_L": 13228.2421875, + "g_L": 1.0845806173165329e-05, + "acc": 0.3828125 + }, + { + "epoch": 29, + "h_L": 13234.9462890625, + "g_L": 1.0821668183780275e-05, + "acc": 0.3984375 + }, + { + "epoch": 30, + "h_L": 13236.921875, + "g_L": 1.0833139640453737e-05, + "acc": 0.3984375 + } + ], + "456": [ + { + "epoch": 0, + "h_L": 8.894441604614258, + "g_L": 0.007735385559499264, + "acc": 0.0859375 + }, + { + "epoch": 1, + "h_L": 829.6934204101562, + "g_L": 7.929334242362529e-05, + "acc": 0.359375 + }, + { + "epoch": 2, + "h_L": 1575.5511474609375, + "g_L": 4.435138907865621e-05, + "acc": 0.390625 + }, + { + "epoch": 3, + "h_L": 2381.2763671875, + "g_L": 3.261367237428203e-05, + "acc": 0.3828125 + }, + { + "epoch": 4, + "h_L": 3160.59326171875, + "g_L": 2.7582153052208014e-05, + "acc": 0.3828125 + }, + { + "epoch": 5, + "h_L": 3938.484375, + "g_L": 2.2988910131971352e-05, + "acc": 0.3515625 + }, + { + "epoch": 6, + "h_L": 4690.099609375, + "g_L": 2.184785989811644e-05, + "acc": 0.359375 + }, + { + "epoch": 7, + "h_L": 5416.181640625, + "g_L": 1.9117769625154324e-05, + "acc": 0.3671875 + }, + { + "epoch": 8, + "h_L": 6141.73193359375, + "g_L": 1.844516009441577e-05, + "acc": 0.359375 + }, + { + "epoch": 9, + "h_L": 6827.73291015625, + "g_L": 1.6444697394035757e-05, + "acc": 0.3515625 + }, + { + "epoch": 10, + "h_L": 7443.5869140625, + "g_L": 1.6328842320945114e-05, + "acc": 0.359375 + }, + { + "epoch": 11, + "h_L": 8031.5986328125, + "g_L": 1.5774490748299286e-05, + "acc": 0.3359375 + }, + { + "epoch": 12, + "h_L": 8571.142578125, + "g_L": 1.5156500012381002e-05, + "acc": 0.3671875 + }, + { + "epoch": 13, + "h_L": 9071.01953125, + "g_L": 1.4580495189875364e-05, + "acc": 0.359375 + }, + { + "epoch": 14, + "h_L": 9517.59765625, + "g_L": 1.453970526199555e-05, + "acc": 0.3515625 + }, + { + "epoch": 15, + "h_L": 9979.744140625, + "g_L": 1.3590201888291631e-05, + "acc": 0.390625 + }, + { + "epoch": 16, + "h_L": 10357.6572265625, + "g_L": 1.351606897515012e-05, + "acc": 0.3359375 + }, + { + "epoch": 17, + "h_L": 10739.0205078125, + "g_L": 1.3668774045072496e-05, + "acc": 0.3671875 + }, + { + "epoch": 18, + "h_L": 11051.26171875, + "g_L": 1.28570209199097e-05, + "acc": 0.359375 + }, + { + "epoch": 19, + "h_L": 11345.6669921875, + "g_L": 1.3053796465101186e-05, + "acc": 0.375 + }, + { + "epoch": 20, + "h_L": 11574.2275390625, + "g_L": 1.289151896344265e-05, + "acc": 0.359375 + }, + { + "epoch": 21, + "h_L": 11759.0185546875, + "g_L": 1.2874368621851318e-05, + "acc": 0.375 + }, + { + "epoch": 22, + "h_L": 11920.4658203125, + "g_L": 1.2835512279707473e-05, + "acc": 0.3828125 + }, + { + "epoch": 23, + "h_L": 12071.0576171875, + "g_L": 1.2617413631232921e-05, + "acc": 0.3984375 + }, + { + "epoch": 24, + "h_L": 12176.2275390625, + "g_L": 1.2873709238192532e-05, + "acc": 0.359375 + }, + { + "epoch": 25, + "h_L": 12251.54296875, + "g_L": 1.2865211829193868e-05, + "acc": 0.375 + }, + { + "epoch": 26, + "h_L": 12298.298828125, + "g_L": 1.2873412742919754e-05, + "acc": 0.359375 + }, + { + "epoch": 27, + "h_L": 12329.041015625, + "g_L": 1.268069081561407e-05, + "acc": 0.3671875 + }, + { + "epoch": 28, + "h_L": 12353.5947265625, + "g_L": 1.2505057384259999e-05, + "acc": 0.375 + }, + { + "epoch": 29, + "h_L": 12361.15234375, + "g_L": 1.255954248335911e-05, + "acc": 0.3828125 + }, + { + "epoch": 30, + "h_L": 12363.9013671875, + "g_L": 1.2592853636306245e-05, + "acc": 0.375 + } + ] + } +} \ No newline at end of file diff --git a/results/dfa_canonical_penalty_trajectory.log b/results/dfa_canonical_penalty_trajectory.log new file mode 100644 index 0000000..9ba812a --- /dev/null +++ b/results/dfa_canonical_penalty_trajectory.log @@ -0,0 +1,47 @@ + +=== λ=0.0, seed=42 === + [lam=0.0] s=42 ep 10: ||h_L||=1.739e+07 ||g_L||=1.469e-08 acc=0.2969 + [lam=0.0] s=42 ep 20: ||h_L||=5.317e+07 ||g_L||=9.184e-09 acc=0.3203 + [lam=0.0] s=42 ep 30: ||h_L||=6.186e+07 ||g_L||=8.706e-09 acc=0.3359 + +=== λ=0.0, seed=123 === + [lam=0.0] s=123 ep 10: ||h_L||=1.882e+07 ||g_L||=1.185e-08 acc=0.3594 + [lam=0.0] s=123 ep 20: ||h_L||=5.486e+07 ||g_L||=5.954e-09 acc=0.3359 + [lam=0.0] s=123 ep 30: ||h_L||=6.356e+07 ||g_L||=5.435e-09 acc=0.3281 + +=== λ=0.0, seed=456 === + [lam=0.0] s=456 ep 10: ||h_L||=3.018e+07 ||g_L||=8.360e-09 acc=0.2969 + [lam=0.0] s=456 ep 20: ||h_L||=8.696e+07 ||g_L||=4.778e-09 acc=0.3125 + [lam=0.0] s=456 ep 30: ||h_L||=1.007e+08 ||g_L||=4.413e-09 acc=0.3125 + +=== λ=0.0001, seed=42 === + [lam=0.0001] s=42 ep 10: ||h_L||=1.844e+04 ||g_L||=5.279e-06 acc=0.4062 + [lam=0.0001] s=42 ep 20: ||h_L||=2.410e+04 ||g_L||=4.533e-06 acc=0.4219 + [lam=0.0001] s=42 ep 30: ||h_L||=2.508e+04 ||g_L||=4.374e-06 acc=0.4297 + +=== λ=0.0001, seed=123 === + [lam=0.0001] s=123 ep 10: ||h_L||=1.635e+04 ||g_L||=6.123e-06 acc=0.4141 + [lam=0.0001] s=123 ep 20: ||h_L||=2.193e+04 ||g_L||=5.118e-06 acc=0.4219 + [lam=0.0001] s=123 ep 30: ||h_L||=2.282e+04 ||g_L||=5.030e-06 acc=0.4062 + +=== λ=0.0001, seed=456 === + [lam=0.0001] s=456 ep 10: ||h_L||=1.839e+04 ||g_L||=5.859e-06 acc=0.3828 + [lam=0.0001] s=456 ep 20: ||h_L||=2.467e+04 ||g_L||=4.814e-06 acc=0.4141 + [lam=0.0001] s=456 ep 30: ||h_L||=2.594e+04 ||g_L||=4.686e-06 acc=0.3672 + +=== λ=0.01, seed=42 === + [lam=0.01] s=42 ep 10: ||h_L||=7.327e+03 ||g_L||=1.697e-05 acc=0.4141 + [lam=0.01] s=42 ep 20: ||h_L||=1.143e+04 ||g_L||=1.369e-05 acc=0.3672 + [lam=0.01] s=42 ep 30: ||h_L||=1.215e+04 ||g_L||=1.315e-05 acc=0.3672 + +=== λ=0.01, seed=123 === + [lam=0.01] s=123 ep 10: ||h_L||=7.894e+03 ||g_L||=1.401e-05 acc=0.4375 + [lam=0.01] s=123 ep 20: ||h_L||=1.239e+04 ||g_L||=1.115e-05 acc=0.3984 + [lam=0.01] s=123 ep 30: ||h_L||=1.324e+04 ||g_L||=1.083e-05 acc=0.3984 + +=== λ=0.01, seed=456 === + [lam=0.01] s=456 ep 10: ||h_L||=7.444e+03 ||g_L||=1.633e-05 acc=0.3594 + [lam=0.01] s=456 ep 20: ||h_L||=1.157e+04 ||g_L||=1.289e-05 acc=0.3594 + [lam=0.01] s=456 ep 30: ||h_L||=1.236e+04 ||g_L||=1.259e-05 acc=0.3750 + +Saved: results/dfa_canonical_penalty_trajectory.json diff --git a/results/dfa_direction_quality_run.log b/results/dfa_direction_quality_run.log new file mode 100644 index 0000000..0b40ae2 --- /dev/null +++ b/results/dfa_direction_quality_run.log @@ -0,0 +1,3 @@ +DFA direction-quality direct test: seed=42, lam=0.01 + +=== Vanilla DFA (lam=0) === diff --git a/results/dfa_pen_short_lam1e-1.log b/results/dfa_pen_short_lam1e-1.log new file mode 100644 index 0000000..2da564b --- /dev/null +++ b/results/dfa_pen_short_lam1e-1.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=42, lam=0.1 + ep 0: ||h_L||=8.893e+00 ||g_2||=9.934e-04 acc=0.1152 + ep 1: ||h_L||=7.313e+02 ||g_2||=1.234e-05 eval_acc=0.3330 test_acc=0.3271 + ep 10: ||h_L||=6.932e+03 ||g_2||=2.318e-06 eval_acc=0.3467 test_acc=0.3430 + ep 20: ||h_L||=1.083e+04 ||g_2||=1.721e-06 eval_acc=0.3564 test_acc=0.3531 + ep 30: ||h_L||=1.157e+04 ||g_2||=1.634e-06 eval_acc=0.3594 test_acc=0.3486 + +FINAL test acc: 0.3486 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.1_s42.json +Saved results/dfa_pen_short/dfa_pen_lam0.1_s42.pt diff --git a/results/dfa_pen_short_lam1e-4.log b/results/dfa_pen_short_lam1e-4.log new file mode 100644 index 0000000..fbf8806 --- /dev/null +++ b/results/dfa_pen_short_lam1e-4.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=42, lam=0.0001 + ep 0: ||h_L||=8.893e+00 ||g_2||=9.934e-04 acc=0.1152 + ep 1: ||h_L||=3.544e+03 ||g_2||=2.682e-06 eval_acc=0.3154 test_acc=0.3127 + ep 10: ||h_L||=1.654e+04 ||g_2||=7.706e-07 eval_acc=0.3496 test_acc=0.3479 + ep 20: ||h_L||=2.248e+04 ||g_2||=6.429e-07 eval_acc=0.3633 test_acc=0.3616 + ep 30: ||h_L||=2.365e+04 ||g_2||=6.276e-07 eval_acc=0.3643 test_acc=0.3593 + +FINAL test acc: 0.3593 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.0001_s42.json +Saved results/dfa_pen_short/dfa_pen_lam0.0001_s42.pt diff --git a/results/dfa_pen_short_lam1e-4_s123.log b/results/dfa_pen_short_lam1e-4_s123.log new file mode 100644 index 0000000..54bda12 --- /dev/null +++ b/results/dfa_pen_short_lam1e-4_s123.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=123, lam=0.0001 + ep 0: ||h_L||=8.791e+00 ||g_2||=9.848e-04 acc=0.0957 + ep 1: ||h_L||=2.827e+03 ||g_2||=3.043e-06 eval_acc=0.3262 test_acc=0.3037 + ep 10: ||h_L||=1.476e+04 ||g_2||=9.239e-07 eval_acc=0.3379 test_acc=0.3408 + ep 20: ||h_L||=1.954e+04 ||g_2||=7.765e-07 eval_acc=0.3604 test_acc=0.3606 + ep 30: ||h_L||=2.057e+04 ||g_2||=7.580e-07 eval_acc=0.3682 test_acc=0.3622 + +FINAL test acc: 0.3622 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.0001_s123.json +Saved results/dfa_pen_short/dfa_pen_lam0.0001_s123.pt diff --git a/results/dfa_pen_short_lam1e-4_s456.log b/results/dfa_pen_short_lam1e-4_s456.log new file mode 100644 index 0000000..e46f4ad --- /dev/null +++ b/results/dfa_pen_short_lam1e-4_s456.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=456, lam=0.0001 + ep 0: ||h_L||=8.890e+00 ||g_2||=9.971e-04 acc=0.0928 + ep 1: ||h_L||=3.954e+03 ||g_2||=2.489e-06 eval_acc=0.2988 test_acc=0.3043 + ep 10: ||h_L||=1.636e+04 ||g_2||=8.429e-07 eval_acc=0.3506 test_acc=0.3490 + ep 20: ||h_L||=2.166e+04 ||g_2||=7.285e-07 eval_acc=0.3721 test_acc=0.3601 + ep 30: ||h_L||=2.285e+04 ||g_2||=7.001e-07 eval_acc=0.3711 test_acc=0.3597 + +FINAL test acc: 0.3597 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.0001_s456.json +Saved results/dfa_pen_short/dfa_pen_lam0.0001_s456.pt diff --git a/results/dfa_pen_short_run.log b/results/dfa_pen_short_run.log new file mode 100644 index 0000000..a996ab8 --- /dev/null +++ b/results/dfa_pen_short_run.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=42, lam=0.01 + ep 0: ||h_L||=8.893e+00 ||g_2||=9.934e-04 acc=0.1152 + ep 1: ||h_L||=7.888e+02 ||g_2||=1.141e-05 eval_acc=0.3359 test_acc=0.3353 + ep 10: ||h_L||=7.251e+03 ||g_2||=2.304e-06 eval_acc=0.3662 test_acc=0.3517 + ep 20: ||h_L||=1.137e+04 ||g_2||=1.814e-06 eval_acc=0.3730 test_acc=0.3649 + ep 30: ||h_L||=1.216e+04 ||g_2||=1.757e-06 eval_acc=0.3750 test_acc=0.3593 + +FINAL test acc: 0.3593 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.01_s42.json +Saved results/dfa_pen_short/dfa_pen_lam0.01_s42.pt diff --git a/results/dfa_pen_short_s123.log b/results/dfa_pen_short_s123.log new file mode 100644 index 0000000..36edc85 --- /dev/null +++ b/results/dfa_pen_short_s123.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=123, lam=0.01 + ep 0: ||h_L||=8.791e+00 ||g_2||=9.848e-04 acc=0.0957 + ep 1: ||h_L||=8.047e+02 ||g_2||=1.064e-05 eval_acc=0.3320 test_acc=0.3279 + ep 10: ||h_L||=7.988e+03 ||g_2||=1.857e-06 eval_acc=0.3584 test_acc=0.3448 + ep 20: ||h_L||=1.251e+04 ||g_2||=1.450e-06 eval_acc=0.3633 test_acc=0.3597 + ep 30: ||h_L||=1.337e+04 ||g_2||=1.414e-06 eval_acc=0.3672 test_acc=0.3610 + +FINAL test acc: 0.3610 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.01_s123.json +Saved results/dfa_pen_short/dfa_pen_lam0.01_s123.pt diff --git a/results/dfa_pen_short_s456.log b/results/dfa_pen_short_s456.log new file mode 100644 index 0000000..e918e2a --- /dev/null +++ b/results/dfa_pen_short_s456.log @@ -0,0 +1,15 @@ +DFA + residual-branch penalty test: seed=456, lam=0.01 + ep 0: ||h_L||=8.890e+00 ||g_2||=9.971e-04 acc=0.0928 + ep 1: ||h_L||=8.559e+02 ||g_2||=1.043e-05 eval_acc=0.3379 test_acc=0.3428 + ep 10: ||h_L||=7.817e+03 ||g_2||=2.220e-06 eval_acc=0.3594 test_acc=0.3539 + ep 20: ||h_L||=1.233e+04 ||g_2||=1.772e-06 eval_acc=0.3691 test_acc=0.3592 + ep 30: ||h_L||=1.320e+04 ||g_2||=1.691e-06 eval_acc=0.3691 test_acc=0.3604 + +FINAL test acc: 0.3604 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_pen_short/dfa_pen_lam0.01_s456.json +Saved results/dfa_pen_short/dfa_pen_lam0.01_s456.pt diff --git a/results/dfa_residual_penalty/dfa_pen_lam0.001_s42.json b/results/dfa_residual_penalty/dfa_pen_lam0.001_s42.json new file mode 100644 index 0000000..ab34189 --- /dev/null +++ b/results/dfa_residual_penalty/dfa_pen_lam0.001_s42.json @@ -0,0 +1,85 @@ +{ + "config": { + "seed": 42, + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "lam": 0.001, + "output_dir": "results/dfa_residual_penalty" + }, + "final_test_acc": 0.3721, + "log": [ + { + "epoch": 0, + "h_L_norm": 8.893179893493652, + "g_2_norm": 0.0009934091940522194, + "acc_eval": 0.115234375 + }, + { + "epoch": 1, + "h_L_norm": 1232.41015625, + "g_2_norm": 7.278651537490077e-06, + "acc_eval": 0.3232421875 + }, + { + "epoch": 10, + "h_L_norm": 8450.7138671875, + "g_2_norm": 1.682184233686712e-06, + "acc_eval": 0.34765625 + }, + { + "epoch": 20, + "h_L_norm": 15709.046875, + "g_2_norm": 1.124352024817199e-06, + "acc_eval": 0.380859375 + }, + { + "epoch": 30, + "h_L_norm": 22514.3671875, + "g_2_norm": 9.156933629128616e-07, + "acc_eval": 0.3798828125 + }, + { + "epoch": 40, + "h_L_norm": 28256.328125, + "g_2_norm": 8.128682793540065e-07, + "acc_eval": 0.390625 + }, + { + "epoch": 50, + "h_L_norm": 32716.849609375, + "g_2_norm": 7.677509756831569e-07, + "acc_eval": 0.380859375 + }, + { + "epoch": 60, + "h_L_norm": 35976.05078125, + "g_2_norm": 7.403396580230037e-07, + "acc_eval": 0.3798828125 + }, + { + "epoch": 70, + "h_L_norm": 38103.2109375, + "g_2_norm": 7.278070484062482e-07, + "acc_eval": 0.388671875 + }, + { + "epoch": 80, + "h_L_norm": 39303.2109375, + "g_2_norm": 7.065188469823624e-07, + "acc_eval": 0.3857421875 + }, + { + "epoch": 90, + "h_L_norm": 39756.09375, + "g_2_norm": 7.082798560986703e-07, + "acc_eval": 0.3818359375 + }, + { + "epoch": 100, + "h_L_norm": 39833.37890625, + "g_2_norm": 7.09268647369754e-07, + "acc_eval": 0.3818359375 + } + ] +} \ No newline at end of file diff --git a/results/dfa_residual_penalty/dfa_pen_lam0.01_s123.json b/results/dfa_residual_penalty/dfa_pen_lam0.01_s123.json new file mode 100644 index 0000000..4a3e013 --- /dev/null +++ b/results/dfa_residual_penalty/dfa_pen_lam0.01_s123.json @@ -0,0 +1,85 @@ +{ + "config": { + "seed": 123, + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "lam": 0.01, + "output_dir": "results/dfa_residual_penalty" + }, + "final_test_acc": 0.3623, + "log": [ + { + "epoch": 0, + "h_L_norm": 8.790542602539062, + "g_2_norm": 0.0009848480112850666, + "acc_eval": 0.095703125 + }, + { + "epoch": 1, + "h_L_norm": 804.6716918945312, + "g_2_norm": 1.0638542335072998e-05, + "acc_eval": 0.33203125 + }, + { + "epoch": 10, + "h_L_norm": 8562.5556640625, + "g_2_norm": 1.780398406481254e-06, + "acc_eval": 0.35546875 + }, + { + "epoch": 20, + "h_L_norm": 16654.19140625, + "g_2_norm": 1.2289126516407123e-06, + "acc_eval": 0.369140625 + }, + { + "epoch": 30, + "h_L_norm": 23707.400390625, + "g_2_norm": 1.0487134431969025e-06, + "acc_eval": 0.3525390625 + }, + { + "epoch": 40, + "h_L_norm": 29600.91796875, + "g_2_norm": 9.340964197690482e-07, + "acc_eval": 0.3583984375 + }, + { + "epoch": 50, + "h_L_norm": 34168.984375, + "g_2_norm": 8.874068839759275e-07, + "acc_eval": 0.3486328125 + }, + { + "epoch": 60, + "h_L_norm": 37448.43359375, + "g_2_norm": 8.381613838537305e-07, + "acc_eval": 0.34765625 + }, + { + "epoch": 70, + "h_L_norm": 39587.50390625, + "g_2_norm": 8.235564905589854e-07, + "acc_eval": 0.3623046875 + }, + { + "epoch": 80, + "h_L_norm": 40736.8203125, + "g_2_norm": 8.101840194285614e-07, + "acc_eval": 0.3662109375 + }, + { + "epoch": 90, + "h_L_norm": 41192.90234375, + "g_2_norm": 8.102718993541203e-07, + "acc_eval": 0.361328125 + }, + { + "epoch": 100, + "h_L_norm": 41262.97265625, + "g_2_norm": 8.093736596492818e-07, + "acc_eval": 0.3642578125 + } + ] +} \ No newline at end of file diff --git a/results/dfa_residual_penalty/dfa_pen_lam0.01_s42.json b/results/dfa_residual_penalty/dfa_pen_lam0.01_s42.json new file mode 100644 index 0000000..25a1040 --- /dev/null +++ b/results/dfa_residual_penalty/dfa_pen_lam0.01_s42.json @@ -0,0 +1,85 @@ +{ + "config": { + "seed": 42, + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "lam": 0.01, + "output_dir": "results/dfa_residual_penalty" + }, + "final_test_acc": 0.3625, + "log": [ + { + "epoch": 0, + "h_L_norm": 8.893179893493652, + "g_2_norm": 0.0009934091940522194, + "acc_eval": 0.115234375 + }, + { + "epoch": 1, + "h_L_norm": 788.7547607421875, + "g_2_norm": 1.1413892934797332e-05, + "acc_eval": 0.3359375 + }, + { + "epoch": 10, + "h_L_norm": 7782.26904296875, + "g_2_norm": 2.211311766586732e-06, + "acc_eval": 0.36328125 + }, + { + "epoch": 20, + "h_L_norm": 15153.8720703125, + "g_2_norm": 1.525812194813625e-06, + "acc_eval": 0.375 + }, + { + "epoch": 30, + "h_L_norm": 21562.537109375, + "g_2_norm": 1.2776303037753678e-06, + "acc_eval": 0.3564453125 + }, + { + "epoch": 40, + "h_L_norm": 26854.45703125, + "g_2_norm": 1.154939354819362e-06, + "acc_eval": 0.3720703125 + }, + { + "epoch": 50, + "h_L_norm": 31004.7734375, + "g_2_norm": 1.0770245353342034e-06, + "acc_eval": 0.3681640625 + }, + { + "epoch": 60, + "h_L_norm": 34082.734375, + "g_2_norm": 1.0429424719404778e-06, + "acc_eval": 0.3623046875 + }, + { + "epoch": 70, + "h_L_norm": 36057.671875, + "g_2_norm": 1.0143049848920782e-06, + "acc_eval": 0.3740234375 + }, + { + "epoch": 80, + "h_L_norm": 37152.69921875, + "g_2_norm": 9.944840257958276e-07, + "acc_eval": 0.37109375 + }, + { + "epoch": 90, + "h_L_norm": 37571.5859375, + "g_2_norm": 9.8765985967475e-07, + "acc_eval": 0.3681640625 + }, + { + "epoch": 100, + "h_L_norm": 37639.328125, + "g_2_norm": 9.872784403341939e-07, + "acc_eval": 0.3720703125 + } + ] +} \ No newline at end of file diff --git a/results/dfa_residual_penalty/dfa_pen_lam0.01_s456.json b/results/dfa_residual_penalty/dfa_pen_lam0.01_s456.json new file mode 100644 index 0000000..f4fe212 --- /dev/null +++ b/results/dfa_residual_penalty/dfa_pen_lam0.01_s456.json @@ -0,0 +1,85 @@ +{ + "config": { + "seed": 456, + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "lam": 0.01, + "output_dir": "results/dfa_residual_penalty" + }, + "final_test_acc": 0.3635, + "log": [ + { + "epoch": 0, + "h_L_norm": 8.889528274536133, + "g_2_norm": 0.0009970925748348236, + "acc_eval": 0.0927734375 + }, + { + "epoch": 1, + "h_L_norm": 855.8524780273438, + "g_2_norm": 1.0432391718495637e-05, + "acc_eval": 0.337890625 + }, + { + "epoch": 10, + "h_L_norm": 8393.11328125, + "g_2_norm": 2.126787421730114e-06, + "acc_eval": 0.3564453125 + }, + { + "epoch": 20, + "h_L_norm": 16381.1162109375, + "g_2_norm": 1.4970787560741883e-06, + "acc_eval": 0.3603515625 + }, + { + "epoch": 30, + "h_L_norm": 23492.884765625, + "g_2_norm": 1.2246630376466783e-06, + "acc_eval": 0.3662109375 + }, + { + "epoch": 40, + "h_L_norm": 29340.23046875, + "g_2_norm": 1.0880221452680416e-06, + "acc_eval": 0.3427734375 + }, + { + "epoch": 50, + "h_L_norm": 33961.85546875, + "g_2_norm": 1.0040256483989651e-06, + "acc_eval": 0.3447265625 + }, + { + "epoch": 60, + "h_L_norm": 37291.0, + "g_2_norm": 9.557429621054325e-07, + "acc_eval": 0.3701171875 + }, + { + "epoch": 70, + "h_L_norm": 39383.98828125, + "g_2_norm": 9.201546617987333e-07, + "acc_eval": 0.3759765625 + }, + { + "epoch": 80, + "h_L_norm": 40525.0625, + "g_2_norm": 9.115954071603483e-07, + "acc_eval": 0.369140625 + }, + { + "epoch": 90, + "h_L_norm": 40957.48046875, + "g_2_norm": 8.987436217466893e-07, + "acc_eval": 0.3681640625 + }, + { + "epoch": 100, + "h_L_norm": 41024.0859375, + "g_2_norm": 9.000136174108775e-07, + "acc_eval": 0.369140625 + } + ] +} \ No newline at end of file diff --git a/results/dfa_residual_penalty/run_lam1e-1_s42.log b/results/dfa_residual_penalty/run_lam1e-1_s42.log new file mode 100644 index 0000000..c9cf336 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-1_s42.log @@ -0,0 +1,7 @@ +DFA + residual-branch penalty test: seed=42, lam=0.1 + ep 0: ||h_L||=8.893e+00 ||g_2||=9.934e-04 acc=0.1152 + ep 1: ||h_L||=7.313e+02 ||g_2||=1.234e-05 eval_acc=0.3330 test_acc=0.3271 + ep 10: ||h_L||=7.442e+03 ||g_2||=2.212e-06 eval_acc=0.3467 test_acc=0.3403 + ep 20: ||h_L||=1.436e+04 ||g_2||=1.377e-06 eval_acc=0.3457 test_acc=0.3452 + ep 30: ||h_L||=2.044e+04 ||g_2||=1.075e-06 eval_acc=0.3457 test_acc=0.3440 + ep 40: ||h_L||=2.549e+04 ||g_2||=9.277e-07 eval_acc=0.3584 test_acc=0.3450 diff --git a/results/dfa_residual_penalty/run_lam1e-2_s123.log b/results/dfa_residual_penalty/run_lam1e-2_s123.log new file mode 100644 index 0000000..dda8095 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-2_s123.log @@ -0,0 +1,21 @@ +DFA + residual-branch penalty test: seed=123, lam=0.01 + ep 0: ||h_L||=8.791e+00 ||g_2||=9.848e-04 acc=0.0957 + ep 1: ||h_L||=8.047e+02 ||g_2||=1.064e-05 eval_acc=0.3320 test_acc=0.3279 + ep 10: ||h_L||=8.563e+03 ||g_2||=1.780e-06 eval_acc=0.3555 test_acc=0.3425 + ep 20: ||h_L||=1.665e+04 ||g_2||=1.229e-06 eval_acc=0.3691 test_acc=0.3600 + ep 30: ||h_L||=2.371e+04 ||g_2||=1.049e-06 eval_acc=0.3525 test_acc=0.3479 + ep 40: ||h_L||=2.960e+04 ||g_2||=9.341e-07 eval_acc=0.3584 test_acc=0.3509 + ep 50: ||h_L||=3.417e+04 ||g_2||=8.874e-07 eval_acc=0.3486 test_acc=0.3436 + ep 60: ||h_L||=3.745e+04 ||g_2||=8.382e-07 eval_acc=0.3477 test_acc=0.3521 + ep 70: ||h_L||=3.959e+04 ||g_2||=8.236e-07 eval_acc=0.3623 test_acc=0.3573 + ep 80: ||h_L||=4.074e+04 ||g_2||=8.102e-07 eval_acc=0.3662 test_acc=0.3579 + ep 90: ||h_L||=4.119e+04 ||g_2||=8.103e-07 eval_acc=0.3613 test_acc=0.3595 + ep 100: ||h_L||=4.126e+04 ||g_2||=8.094e-07 eval_acc=0.3643 test_acc=0.3623 + +FINAL test acc: 0.3623 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_residual_penalty/dfa_pen_lam0.01_s123.json diff --git a/results/dfa_residual_penalty/run_lam1e-2_s42.log b/results/dfa_residual_penalty/run_lam1e-2_s42.log new file mode 100644 index 0000000..28de526 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-2_s42.log @@ -0,0 +1,21 @@ +DFA + residual-branch penalty test: seed=42, lam=0.01 + ep 0: ||h_L||=8.893e+00 ||g_2||=9.934e-04 acc=0.1152 + ep 1: ||h_L||=7.888e+02 ||g_2||=1.141e-05 eval_acc=0.3359 test_acc=0.3353 + ep 10: ||h_L||=7.782e+03 ||g_2||=2.211e-06 eval_acc=0.3633 test_acc=0.3482 + ep 20: ||h_L||=1.515e+04 ||g_2||=1.526e-06 eval_acc=0.3750 test_acc=0.3571 + ep 30: ||h_L||=2.156e+04 ||g_2||=1.278e-06 eval_acc=0.3564 test_acc=0.3549 + ep 40: ||h_L||=2.685e+04 ||g_2||=1.155e-06 eval_acc=0.3721 test_acc=0.3550 + ep 50: ||h_L||=3.100e+04 ||g_2||=1.077e-06 eval_acc=0.3682 test_acc=0.3545 + ep 60: ||h_L||=3.408e+04 ||g_2||=1.043e-06 eval_acc=0.3623 test_acc=0.3579 + ep 70: ||h_L||=3.606e+04 ||g_2||=1.014e-06 eval_acc=0.3740 test_acc=0.3652 + ep 80: ||h_L||=3.715e+04 ||g_2||=9.945e-07 eval_acc=0.3711 test_acc=0.3606 + ep 90: ||h_L||=3.757e+04 ||g_2||=9.877e-07 eval_acc=0.3682 test_acc=0.3609 + ep 100: ||h_L||=3.764e+04 ||g_2||=9.873e-07 eval_acc=0.3721 test_acc=0.3625 + +FINAL test acc: 0.3625 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_residual_penalty/dfa_pen_lam0.01_s42.json diff --git a/results/dfa_residual_penalty/run_lam1e-2_s456.log b/results/dfa_residual_penalty/run_lam1e-2_s456.log new file mode 100644 index 0000000..2287cd0 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-2_s456.log @@ -0,0 +1,21 @@ +DFA + residual-branch penalty test: seed=456, lam=0.01 + ep 0: ||h_L||=8.890e+00 ||g_2||=9.971e-04 acc=0.0928 + ep 1: ||h_L||=8.559e+02 ||g_2||=1.043e-05 eval_acc=0.3379 test_acc=0.3428 + ep 10: ||h_L||=8.393e+03 ||g_2||=2.127e-06 eval_acc=0.3564 test_acc=0.3525 + ep 20: ||h_L||=1.638e+04 ||g_2||=1.497e-06 eval_acc=0.3604 test_acc=0.3563 + ep 30: ||h_L||=2.349e+04 ||g_2||=1.225e-06 eval_acc=0.3662 test_acc=0.3606 + ep 40: ||h_L||=2.934e+04 ||g_2||=1.088e-06 eval_acc=0.3428 test_acc=0.3427 + ep 50: ||h_L||=3.396e+04 ||g_2||=1.004e-06 eval_acc=0.3447 test_acc=0.3538 + ep 60: ||h_L||=3.729e+04 ||g_2||=9.557e-07 eval_acc=0.3701 test_acc=0.3654 + ep 70: ||h_L||=3.938e+04 ||g_2||=9.202e-07 eval_acc=0.3760 test_acc=0.3655 + ep 80: ||h_L||=4.053e+04 ||g_2||=9.116e-07 eval_acc=0.3691 test_acc=0.3615 + ep 90: ||h_L||=4.096e+04 ||g_2||=8.987e-07 eval_acc=0.3682 test_acc=0.3639 + ep 100: ||h_L||=4.102e+04 ||g_2||=9.000e-07 eval_acc=0.3691 test_acc=0.3635 + +FINAL test acc: 0.3635 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_residual_penalty/dfa_pen_lam0.01_s456.json diff --git a/results/dfa_residual_penalty/run_lam1e-3_s123.log b/results/dfa_residual_penalty/run_lam1e-3_s123.log new file mode 100644 index 0000000..45f9097 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-3_s123.log @@ -0,0 +1,7 @@ +DFA + residual-branch penalty test: seed=123, lam=0.001 + ep 0: ||h_L||=8.791e+00 ||g_2||=9.848e-04 acc=0.0957 + ep 1: ||h_L||=1.165e+03 ||g_2||=7.637e-06 eval_acc=0.3242 test_acc=0.3179 + ep 10: ||h_L||=8.474e+03 ||g_2||=1.661e-06 eval_acc=0.3652 test_acc=0.3519 + ep 20: ||h_L||=1.658e+04 ||g_2||=1.026e-06 eval_acc=0.3662 test_acc=0.3632 + ep 30: ||h_L||=2.394e+04 ||g_2||=8.435e-07 eval_acc=0.3564 test_acc=0.3537 + ep 40: ||h_L||=3.023e+04 ||g_2||=7.463e-07 eval_acc=0.3652 test_acc=0.3590 diff --git a/results/dfa_residual_penalty/run_lam1e-3_s42.log b/results/dfa_residual_penalty/run_lam1e-3_s42.log new file mode 100644 index 0000000..cd081a7 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-3_s42.log @@ -0,0 +1,21 @@ +DFA + residual-branch penalty test: seed=42, lam=0.001 + ep 0: ||h_L||=8.893e+00 ||g_2||=9.934e-04 acc=0.1152 + ep 1: ||h_L||=1.232e+03 ||g_2||=7.279e-06 eval_acc=0.3232 test_acc=0.3225 + ep 10: ||h_L||=8.451e+03 ||g_2||=1.682e-06 eval_acc=0.3477 test_acc=0.3521 + ep 20: ||h_L||=1.571e+04 ||g_2||=1.124e-06 eval_acc=0.3809 test_acc=0.3648 + ep 30: ||h_L||=2.251e+04 ||g_2||=9.157e-07 eval_acc=0.3799 test_acc=0.3637 + ep 40: ||h_L||=2.826e+04 ||g_2||=8.129e-07 eval_acc=0.3906 test_acc=0.3630 + ep 50: ||h_L||=3.272e+04 ||g_2||=7.678e-07 eval_acc=0.3809 test_acc=0.3654 + ep 60: ||h_L||=3.598e+04 ||g_2||=7.403e-07 eval_acc=0.3799 test_acc=0.3669 + ep 70: ||h_L||=3.810e+04 ||g_2||=7.278e-07 eval_acc=0.3887 test_acc=0.3732 + ep 80: ||h_L||=3.930e+04 ||g_2||=7.065e-07 eval_acc=0.3857 test_acc=0.3711 + ep 90: ||h_L||=3.976e+04 ||g_2||=7.083e-07 eval_acc=0.3818 test_acc=0.3719 + ep 100: ||h_L||=3.983e+04 ||g_2||=7.093e-07 eval_acc=0.3818 test_acc=0.3721 + +FINAL test acc: 0.3721 +Compare to: + DFA-vanilla (3-seed mean): 0.308 + DFA-shallow (3-seed mean): 0.349 + DFA-frozen (3-seed mean): 0.349 + BP-trainable (3-seed mean): 0.609 +Saved results/dfa_residual_penalty/dfa_pen_lam0.001_s42.json diff --git a/results/dfa_residual_penalty/run_lam1e-3_s456.log b/results/dfa_residual_penalty/run_lam1e-3_s456.log new file mode 100644 index 0000000..2719354 --- /dev/null +++ b/results/dfa_residual_penalty/run_lam1e-3_s456.log @@ -0,0 +1,7 @@ +DFA + residual-branch penalty test: seed=456, lam=0.001 + ep 0: ||h_L||=8.890e+00 ||g_2||=9.971e-04 acc=0.0928 + ep 1: ||h_L||=1.332e+03 ||g_2||=6.768e-06 eval_acc=0.3350 test_acc=0.3299 + ep 10: ||h_L||=8.773e+03 ||g_2||=1.743e-06 eval_acc=0.3691 test_acc=0.3606 + ep 20: ||h_L||=1.678e+04 ||g_2||=1.177e-06 eval_acc=0.3760 test_acc=0.3639 + ep 30: ||h_L||=2.409e+04 ||g_2||=9.326e-07 eval_acc=0.3750 test_acc=0.3647 + ep 40: ||h_L||=3.023e+04 ||g_2||=8.219e-07 eval_acc=0.3662 test_acc=0.3579 diff --git a/results/ep_baseline/ep_s2048.json b/results/ep_baseline/ep_s2048.json new file mode 100644 index 0000000..4cb0cbd --- /dev/null +++ b/results/ep_baseline/ep_s2048.json @@ -0,0 +1,23 @@ +{ + "method": "ep", + "seed": 2048, + "acc": 0.2792, + "Gamma": 0.008133413677569479, + "rho": 0.028946227626875043, + "naive_StateErr": 0.8209338188171387, + "gammas_per_layer": [ + 0.0, + 0.000846301787532866, + -0.0009015983669087291, + 0.03258895128965378 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + -0.01539901178330183, + 0.131183922290802 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +} \ No newline at end of file diff --git a/results/exploit_linesearch/linesearch_L4_d256_s42.json b/results/exploit_linesearch/linesearch_L4_d256_s42.json new file mode 100644 index 0000000..a25a480 --- /dev/null +++ b/results/exploit_linesearch/linesearch_L4_d256_s42.json @@ -0,0 +1,112 @@ +{ + "oracle_bp_last1_raw_eta1e-05": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913531064987183, + "delta_loss_same": 0.0, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta3e-05": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913531064987183, + "delta_loss_same": 0.0, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.0001": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913530468940735, + "delta_loss_same": -5.960464477539063e-08, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.0003": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913528680801392, + "delta_loss_same": -2.384185791015625e-07, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.001": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913521528244019, + "delta_loss_same": -9.5367431640625e-07, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913519144058228, + "delta_loss_same": -1.1920928955078125e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913492321968079, + "delta_loss_same": -3.874301910400391e-06, + "delta_loss_held": 1.1920928955078125e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913403511047363, + "delta_loss_same": -1.2755393981933594e-05, + "delta_loss_held": 3.5762786865234375e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913147211074829, + "delta_loss_same": -3.838539123535156e-05, + "delta_loss_held": 1.430511474609375e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.001": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912248373031616, + "delta_loss_same": -0.00012826919555664062, + "delta_loss_held": 4.76837158203125e-06, + "delta_acc_same": 0.0 + } +} \ No newline at end of file diff --git a/results/exploit_linesearch_full/linesearch_L4_d256_s42.json b/results/exploit_linesearch_full/linesearch_L4_d256_s42.json new file mode 100644 index 0000000..9a719d8 --- /dev/null +++ b/results/exploit_linesearch_full/linesearch_L4_d256_s42.json @@ -0,0 +1,1850 @@ +{ + "dfa_last1_raw_eta1e-05": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913527488708496, + "delta_loss_same": -3.5762786865234375e-07, + "delta_loss_held": 2.384185791015625e-07, + "delta_acc_same": 0.0 + }, + "dfa_last1_raw_eta3e-05": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913520336151123, + "delta_loss_same": -1.0728836059570312e-06, + "delta_loss_held": 1.0132789611816406e-06, + "delta_acc_same": 0.0 + }, + "dfa_last1_raw_eta0.0001": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913494110107422, + "delta_loss_same": -3.6954879760742188e-06, + "delta_loss_held": 3.3974647521972656e-06, + "delta_acc_same": 0.0 + }, + "dfa_last1_raw_eta0.0003": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913422584533691, + "delta_loss_same": -1.0848045349121094e-05, + "delta_loss_held": 1.0371208190917969e-05, + "delta_acc_same": 0.0 + }, + "dfa_last1_raw_eta0.001": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913171052932739, + "delta_loss_same": -3.600120544433594e-05, + "delta_loss_held": 3.4809112548828125e-05, + "delta_acc_same": 0.0 + }, + "dfa_last1_raw_eta0.003": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912467122077942, + "delta_loss_same": -0.00010639429092407227, + "delta_loss_held": 0.00010526180267333984, + "delta_acc_same": 0.0 + }, + "dfa_last1_raw_eta0.01": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910203337669373, + "delta_loss_same": -0.00033277273178100586, + "delta_loss_held": 0.0003624558448791504, + "delta_acc_same": -0.0078125 + }, + "scalar_cb_last1_raw_eta1e-05": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913531064987183, + "delta_loss_same": 0.0, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_raw_eta3e-05": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913529872894287, + "delta_loss_same": -1.1920928955078125e-07, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_raw_eta0.0001": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913524508476257, + "delta_loss_same": -6.556510925292969e-07, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_raw_eta0.0003": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913510203361511, + "delta_loss_same": -2.086162567138672e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_raw_eta0.001": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913459539413452, + "delta_loss_same": -7.152557373046875e-06, + "delta_loss_held": 2.384185791015625e-07, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_raw_eta0.003": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913317680358887, + "delta_loss_same": -2.1338462829589844e-05, + "delta_loss_held": 8.344650268554688e-07, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_raw_eta0.01": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912819385528564, + "delta_loss_same": -7.11679458618164e-05, + "delta_loss_held": 2.6226043701171875e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913519144058228, + "delta_loss_same": -1.1920928955078125e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913492321968079, + "delta_loss_same": -3.874301910400391e-06, + "delta_loss_held": 1.1920928955078125e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913403511047363, + "delta_loss_same": -1.2755393981933594e-05, + "delta_loss_held": 3.5762786865234375e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913147211074829, + "delta_loss_same": -3.838539123535156e-05, + "delta_loss_held": 1.430511474609375e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.001": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912248373031616, + "delta_loss_same": -0.00012826919555664062, + "delta_loss_held": 4.76837158203125e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.003": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7909681797027588, + "delta_loss_same": -0.00038492679595947266, + "delta_loss_held": 1.4126300811767578e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_raw_eta0.01": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7900704145431519, + "delta_loss_same": -0.0012826919555664062, + "delta_loss_held": 4.7266483306884766e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta1e-05": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913531064987183, + "delta_loss_same": 0.0, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta3e-05": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913531064987183, + "delta_loss_same": 0.0, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.0001": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913530468940735, + "delta_loss_same": -5.960464477539063e-08, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.0003": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913528680801392, + "delta_loss_same": -2.384185791015625e-07, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.001": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913521528244019, + "delta_loss_same": -9.5367431640625e-07, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.003": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913498878479004, + "delta_loss_same": -3.2186508178710938e-06, + "delta_loss_held": 5.960464477539063e-08, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_raw_eta0.01": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913422584533691, + "delta_loss_same": -1.0848045349121094e-05, + "delta_loss_held": 5.364418029785156e-07, + "delta_acc_same": 0.0 + }, + "dfa_last1_norm_eta1e-05": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913490533828735, + "delta_loss_same": -4.0531158447265625e-06, + "delta_loss_held": 1.3709068298339844e-06, + "delta_acc_same": 0.0 + }, + "dfa_last1_norm_eta3e-05": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913411855697632, + "delta_loss_same": -1.1920928955078125e-05, + "delta_loss_held": 3.933906555175781e-06, + "delta_acc_same": 0.0 + }, + "dfa_last1_norm_eta0.0001": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791313111782074, + "delta_loss_same": -3.999471664428711e-05, + "delta_loss_held": 1.3470649719238281e-05, + "delta_acc_same": 0.0 + }, + "dfa_last1_norm_eta0.0003": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912337779998779, + "delta_loss_same": -0.00011932849884033203, + "delta_loss_held": 4.106760025024414e-05, + "delta_acc_same": 0.0 + }, + "dfa_last1_norm_eta0.001": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7909631133079529, + "delta_loss_same": -0.00038999319076538086, + "delta_loss_held": 0.00014281272888183594, + "delta_acc_same": -0.0078125 + }, + "dfa_last1_norm_eta0.003": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7902504205703735, + "delta_loss_same": -0.0011026859283447266, + "delta_loss_held": 0.0004792213439941406, + "delta_acc_same": -0.0078125 + }, + "dfa_last1_norm_eta0.01": { + "method": "dfa", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7884711623191833, + "delta_loss_same": -0.002881944179534912, + "delta_loss_held": 0.0021938085556030273, + "delta_acc_same": -0.0078125 + }, + "scalar_cb_last1_norm_eta1e-05": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912606000900269, + "delta_loss_same": -9.250640869140625e-05, + "delta_loss_held": 1.329183578491211e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_norm_eta3e-05": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910759449005127, + "delta_loss_same": -0.0002771615982055664, + "delta_loss_held": 4.011392593383789e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_norm_eta0.0001": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7904340028762817, + "delta_loss_same": -0.0009191036224365234, + "delta_loss_held": 0.00013649463653564453, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_norm_eta0.0003": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7886358499526978, + "delta_loss_same": -0.002717256546020508, + "delta_loss_held": 0.00043272972106933594, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_norm_eta0.001": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7827593088150024, + "delta_loss_same": -0.00859379768371582, + "delta_loss_held": 0.001717686653137207, + "delta_acc_same": 0.0 + }, + "scalar_cb_last1_norm_eta0.003": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7694397568702698, + "delta_loss_same": -0.021913349628448486, + "delta_loss_held": 0.007596492767333984, + "delta_acc_same": 0.0078125 + }, + "scalar_cb_last1_norm_eta0.01": { + "method": "scalar_cb", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7611995935440063, + "delta_loss_same": -0.030153512954711914, + "delta_loss_held": 0.05731534957885742, + "delta_acc_same": -0.0234375 + }, + "vec_eT_M4_last1_norm_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910163402557373, + "delta_loss_same": -0.00033676624298095703, + "delta_loss_held": 2.3186206817626953e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_norm_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7903435230255127, + "delta_loss_same": -0.0010095834732055664, + "delta_loss_held": 6.99758529663086e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_norm_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7879958152770996, + "delta_loss_same": -0.0033572912216186523, + "delta_loss_held": 0.00023698806762695312, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_norm_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7813490629196167, + "delta_loss_same": -0.010004043579101562, + "delta_loss_held": 0.0007431507110595703, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last1_norm_eta0.001": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7587857246398926, + "delta_loss_same": -0.032567381858825684, + "delta_loss_held": 0.002847909927368164, + "delta_acc_same": 0.015625 + }, + "vec_eT_M4_last1_norm_eta0.003": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7000553011894226, + "delta_loss_same": -0.09129780530929565, + "delta_loss_held": 0.0116502046585083, + "delta_acc_same": 0.03125 + }, + "vec_eT_M4_last1_norm_eta0.01": { + "method": "vec_eT_M4", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.5529239773750305, + "delta_loss_same": -0.23842912912368774, + "delta_loss_held": 0.0728445053100586, + "delta_acc_same": 0.078125 + }, + "oracle_bp_last1_norm_eta1e-05": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7911322116851807, + "delta_loss_same": -0.00022089481353759766, + "delta_loss_held": 2.2411346435546875e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_norm_eta3e-05": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7906907796859741, + "delta_loss_same": -0.0006623268127441406, + "delta_loss_held": 6.73532485961914e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_norm_eta0.0001": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.78914874792099, + "delta_loss_same": -0.0022043585777282715, + "delta_loss_held": 0.00022560358047485352, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_norm_eta0.0003": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7847684025764465, + "delta_loss_same": -0.0065847039222717285, + "delta_loss_held": 0.0006849765777587891, + "delta_acc_same": 0.0 + }, + "oracle_bp_last1_norm_eta0.001": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.769731879234314, + "delta_loss_same": -0.021621227264404297, + "delta_loss_held": 0.002378702163696289, + "delta_acc_same": 0.0078125 + }, + "oracle_bp_last1_norm_eta0.003": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7291945815086365, + "delta_loss_same": -0.06215852499008179, + "delta_loss_held": 0.007954299449920654, + "delta_acc_same": 0.0078125 + }, + "oracle_bp_last1_norm_eta0.01": { + "method": "oracle_bp", + "update_range": "last1", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.6127457618713379, + "delta_loss_same": -0.17860734462738037, + "delta_loss_held": 0.03617274761199951, + "delta_acc_same": 0.0703125 + }, + "dfa_last2_raw_eta1e-05": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791350245475769, + "delta_loss_same": -2.86102294921875e-06, + "delta_loss_held": -3.5762786865234375e-07, + "delta_acc_same": 0.0 + }, + "dfa_last2_raw_eta3e-05": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913442850112915, + "delta_loss_same": -8.821487426757812e-06, + "delta_loss_held": -8.940696716308594e-07, + "delta_acc_same": 0.0 + }, + "dfa_last2_raw_eta0.0001": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913237810134888, + "delta_loss_same": -2.9325485229492188e-05, + "delta_loss_held": -2.8014183044433594e-06, + "delta_acc_same": 0.0 + }, + "dfa_last2_raw_eta0.0003": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791265070438385, + "delta_loss_same": -8.803606033325195e-05, + "delta_loss_held": -8.285045623779297e-06, + "delta_acc_same": 0.0 + }, + "dfa_last2_raw_eta0.001": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910601496696472, + "delta_loss_same": -0.0002929568290710449, + "delta_loss_held": -2.7179718017578125e-05, + "delta_acc_same": -0.0078125 + }, + "dfa_last2_raw_eta0.003": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7904785871505737, + "delta_loss_same": -0.0008745193481445312, + "delta_loss_held": -7.939338684082031e-05, + "delta_acc_same": -0.0078125 + }, + "dfa_last2_raw_eta0.01": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7884876728057861, + "delta_loss_same": -0.002865433692932129, + "delta_loss_held": -0.00024127960205078125, + "delta_acc_same": -0.0078125 + }, + "scalar_cb_last2_raw_eta1e-05": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913503646850586, + "delta_loss_same": -2.7418136596679688e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_raw_eta3e-05": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913447618484497, + "delta_loss_same": -8.344650268554688e-06, + "delta_loss_held": 5.960464477539063e-08, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_raw_eta0.0001": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913253307342529, + "delta_loss_same": -2.777576446533203e-05, + "delta_loss_held": 4.172325134277344e-07, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_raw_eta0.0003": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912696003913879, + "delta_loss_same": -8.350610733032227e-05, + "delta_loss_held": 1.1920928955078125e-06, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_raw_eta0.001": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910747528076172, + "delta_loss_same": -0.0002783536911010742, + "delta_loss_held": 3.993511199951172e-06, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_raw_eta0.003": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7905182242393494, + "delta_loss_same": -0.0008348822593688965, + "delta_loss_held": 1.1920928955078125e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_raw_eta0.01": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7885727882385254, + "delta_loss_same": -0.002780318260192871, + "delta_loss_held": 4.106760025024414e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913484573364258, + "delta_loss_same": -4.649162292480469e-06, + "delta_loss_held": 1.1920928955078125e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913389205932617, + "delta_loss_same": -1.4185905456542969e-05, + "delta_loss_held": 2.384185791015625e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913057804107666, + "delta_loss_same": -4.7326087951660156e-05, + "delta_loss_held": 1.1324882507324219e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912108302116394, + "delta_loss_same": -0.00014227628707885742, + "delta_loss_held": 3.337860107421875e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta0.001": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7908790707588196, + "delta_loss_same": -0.00047403573989868164, + "delta_loss_held": 1.1324882507324219e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta0.003": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7899314165115356, + "delta_loss_same": -0.0014216899871826172, + "delta_loss_held": 3.445148468017578e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_raw_eta0.01": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7866207361221313, + "delta_loss_same": -0.004732370376586914, + "delta_loss_held": 0.00011670589447021484, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta1e-05": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913504242897034, + "delta_loss_same": -2.682209014892578e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta3e-05": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913450598716736, + "delta_loss_same": -8.046627044677734e-06, + "delta_loss_held": 5.960464477539063e-08, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta0.0001": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913261651992798, + "delta_loss_same": -2.6941299438476562e-05, + "delta_loss_held": 2.980232238769531e-07, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta0.0003": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912721037864685, + "delta_loss_same": -8.100271224975586e-05, + "delta_loss_held": 1.1324882507324219e-06, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta0.001": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791082501411438, + "delta_loss_same": -0.00027060508728027344, + "delta_loss_held": 3.814697265625e-06, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta0.003": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7905414700508118, + "delta_loss_same": -0.0008116364479064941, + "delta_loss_held": 1.1682510375976562e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_raw_eta0.01": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7886502146720886, + "delta_loss_same": -0.0027028918266296387, + "delta_loss_held": 4.017353057861328e-05, + "delta_acc_same": 0.0 + }, + "dfa_last2_norm_eta1e-05": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791345477104187, + "delta_loss_same": -7.62939453125e-06, + "delta_loss_held": -2.1457672119140625e-06, + "delta_acc_same": 0.0 + }, + "dfa_last2_norm_eta3e-05": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913300395011902, + "delta_loss_same": -2.3066997528076172e-05, + "delta_loss_held": -6.377696990966797e-06, + "delta_acc_same": 0.0 + }, + "dfa_last2_norm_eta0.0001": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791276216506958, + "delta_loss_same": -7.68899917602539e-05, + "delta_loss_held": -2.09808349609375e-05, + "delta_acc_same": 0.0 + }, + "dfa_last2_norm_eta0.0003": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791123628616333, + "delta_loss_same": -0.0002294778823852539, + "delta_loss_held": -6.175041198730469e-05, + "delta_acc_same": -0.0078125 + }, + "dfa_last2_norm_eta0.001": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7906030416488647, + "delta_loss_same": -0.0007500648498535156, + "delta_loss_held": -0.00019317865371704102, + "delta_acc_same": -0.0078125 + }, + "dfa_last2_norm_eta0.003": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.78923100233078, + "delta_loss_same": -0.0021221041679382324, + "delta_loss_held": -0.00047093629837036133, + "delta_acc_same": -0.0078125 + }, + "dfa_last2_norm_eta0.01": { + "method": "dfa", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7858060598373413, + "delta_loss_same": -0.005547046661376953, + "delta_loss_held": -0.00029981136322021484, + "delta_acc_same": -0.015625 + }, + "scalar_cb_last2_norm_eta1e-05": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912271022796631, + "delta_loss_same": -0.00012600421905517578, + "delta_loss_held": 2.0742416381835938e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_norm_eta3e-05": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7909758687019348, + "delta_loss_same": -0.00037723779678344727, + "delta_loss_held": 6.282329559326172e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_norm_eta0.0001": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7901065349578857, + "delta_loss_same": -0.0012465715408325195, + "delta_loss_held": 0.0002161264419555664, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_norm_eta0.0003": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7877075672149658, + "delta_loss_same": -0.0036455392837524414, + "delta_loss_held": 0.0007035136222839355, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_norm_eta0.001": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7802847623825073, + "delta_loss_same": -0.011068344116210938, + "delta_loss_held": 0.0029941797256469727, + "delta_acc_same": 0.0 + }, + "scalar_cb_last2_norm_eta0.003": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7671945095062256, + "delta_loss_same": -0.024158596992492676, + "delta_loss_held": 0.014712095260620117, + "delta_acc_same": -0.015625 + }, + "scalar_cb_last2_norm_eta0.01": { + "method": "scalar_cb", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.8153536319732666, + "delta_loss_same": 0.02400052547454834, + "delta_loss_held": 0.12053942680358887, + "delta_acc_same": -0.0234375 + }, + "vec_eT_M4_last2_norm_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7907758355140686, + "delta_loss_same": -0.0005772709846496582, + "delta_loss_held": 3.4749507904052734e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_norm_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7896230816841125, + "delta_loss_same": -0.0017300248146057129, + "delta_loss_held": 0.00010508298873901367, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_norm_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7856085300445557, + "delta_loss_same": -0.005744576454162598, + "delta_loss_held": 0.0003609657287597656, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_last2_norm_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7743081450462341, + "delta_loss_same": -0.01704496145248413, + "delta_loss_held": 0.0011725425720214844, + "delta_acc_same": 0.0078125 + }, + "vec_eT_M4_last2_norm_eta0.001": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7366842031478882, + "delta_loss_same": -0.05466890335083008, + "delta_loss_held": 0.004941463470458984, + "delta_acc_same": 0.0234375 + }, + "vec_eT_M4_last2_norm_eta0.003": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.6443334221839905, + "delta_loss_same": -0.14701968431472778, + "delta_loss_held": 0.023414790630340576, + "delta_acc_same": 0.0546875 + }, + "vec_eT_M4_last2_norm_eta0.01": { + "method": "vec_eT_M4", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.45750147104263306, + "delta_loss_same": -0.3338516354560852, + "delta_loss_held": 0.17275190353393555, + "delta_acc_same": 0.1171875 + }, + "oracle_bp_last2_norm_eta1e-05": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7909836769104004, + "delta_loss_same": -0.0003694295883178711, + "delta_loss_held": 3.635883331298828e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_norm_eta3e-05": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7902452945709229, + "delta_loss_same": -0.0011078119277954102, + "delta_loss_held": 0.00010913610458374023, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_norm_eta0.0001": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7876681685447693, + "delta_loss_same": -0.0036849379539489746, + "delta_loss_held": 0.00036537647247314453, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_norm_eta0.0003": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7803657054901123, + "delta_loss_same": -0.010987401008605957, + "delta_loss_held": 0.0011096596717834473, + "delta_acc_same": 0.0 + }, + "oracle_bp_last2_norm_eta0.001": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7555018663406372, + "delta_loss_same": -0.035851240158081055, + "delta_loss_held": 0.0038559436798095703, + "delta_acc_same": 0.0078125 + }, + "oracle_bp_last2_norm_eta0.003": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.6901124715805054, + "delta_loss_same": -0.10124063491821289, + "delta_loss_held": 0.012904942035675049, + "delta_acc_same": 0.0234375 + }, + "oracle_bp_last2_norm_eta0.01": { + "method": "oracle_bp", + "update_range": "last2", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.5176879167556763, + "delta_loss_same": -0.273665189743042, + "delta_loss_held": 0.058579206466674805, + "delta_acc_same": 0.109375 + }, + "dfa_all_raw_eta1e-05": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913514375686646, + "delta_loss_same": -1.6689300537109375e-06, + "delta_loss_held": -1.0132789611816406e-06, + "delta_acc_same": 0.0 + }, + "dfa_all_raw_eta3e-05": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913480997085571, + "delta_loss_same": -5.0067901611328125e-06, + "delta_loss_held": -3.0994415283203125e-06, + "delta_acc_same": 0.0 + }, + "dfa_all_raw_eta0.0001": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913365364074707, + "delta_loss_same": -1.6570091247558594e-05, + "delta_loss_held": -1.0132789611816406e-05, + "delta_acc_same": 0.0 + }, + "dfa_all_raw_eta0.0003": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913035154342651, + "delta_loss_same": -4.9591064453125e-05, + "delta_loss_held": -3.0517578125e-05, + "delta_acc_same": 0.0 + }, + "dfa_all_raw_eta0.001": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7911888360977173, + "delta_loss_same": -0.00016427040100097656, + "delta_loss_held": -0.00010085105895996094, + "delta_acc_same": 0.0 + }, + "dfa_all_raw_eta0.003": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7908685803413391, + "delta_loss_same": -0.0004845261573791504, + "delta_loss_held": -0.00029754638671875, + "delta_acc_same": -0.0078125 + }, + "dfa_all_raw_eta0.01": { + "method": "dfa", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7898344993591309, + "delta_loss_same": -0.0015186071395874023, + "delta_loss_held": -0.0009320974349975586, + "delta_acc_same": -0.0078125 + }, + "scalar_cb_all_raw_eta1e-05": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913503646850586, + "delta_loss_same": -2.7418136596679688e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_raw_eta3e-05": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913447022438049, + "delta_loss_same": -8.404254913330078e-06, + "delta_loss_held": 5.960464477539063e-08, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_raw_eta0.0001": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.791325032711029, + "delta_loss_same": -2.8073787689208984e-05, + "delta_loss_held": 3.5762786865234375e-07, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_raw_eta0.0003": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912687063217163, + "delta_loss_same": -8.440017700195312e-05, + "delta_loss_held": 1.1920928955078125e-06, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_raw_eta0.001": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910715937614441, + "delta_loss_same": -0.0002815127372741699, + "delta_loss_held": 4.0531158447265625e-06, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_raw_eta0.003": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7905087471008301, + "delta_loss_same": -0.0008443593978881836, + "delta_loss_held": 1.2278556823730469e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_raw_eta0.01": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7885413765907288, + "delta_loss_same": -0.002811729907989502, + "delta_loss_held": 4.2557716369628906e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913480401039124, + "delta_loss_same": -5.066394805908203e-06, + "delta_loss_held": 5.960464477539063e-08, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913376092910767, + "delta_loss_same": -1.5497207641601562e-05, + "delta_loss_held": 2.980232238769531e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913011312484741, + "delta_loss_same": -5.1975250244140625e-05, + "delta_loss_held": 8.344650268554688e-07, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7911967635154724, + "delta_loss_same": -0.0001563429832458496, + "delta_loss_held": 2.7418136596679688e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta0.001": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7908321022987366, + "delta_loss_same": -0.0005210041999816895, + "delta_loss_held": 9.000301361083984e-06, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta0.003": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7897908687591553, + "delta_loss_same": -0.0015622377395629883, + "delta_loss_held": 2.7120113372802734e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_raw_eta0.01": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7861536741256714, + "delta_loss_same": -0.005199432373046875, + "delta_loss_held": 9.28640365600586e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta1e-05": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913504242897034, + "delta_loss_same": -2.682209014892578e-06, + "delta_loss_held": 0.0, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta3e-05": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913450598716736, + "delta_loss_same": -8.046627044677734e-06, + "delta_loss_held": 5.960464477539063e-08, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta0.0001": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913261651992798, + "delta_loss_same": -2.6941299438476562e-05, + "delta_loss_held": 2.980232238769531e-07, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta0.0003": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912718057632446, + "delta_loss_same": -8.130073547363281e-05, + "delta_loss_held": 1.1324882507324219e-06, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta0.001": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7910813689231873, + "delta_loss_same": -0.00027173757553100586, + "delta_loss_held": 3.874301910400391e-06, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta0.003": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7905375957489014, + "delta_loss_same": -0.0008155107498168945, + "delta_loss_held": 1.1801719665527344e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_raw_eta0.01": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "raw", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7886372804641724, + "delta_loss_same": -0.0027158260345458984, + "delta_loss_held": 4.0531158447265625e-05, + "delta_acc_same": 0.0 + }, + "dfa_all_norm_eta1e-05": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913448810577393, + "delta_loss_same": -8.225440979003906e-06, + "delta_loss_held": -1.5497207641601562e-06, + "delta_acc_same": 0.0 + }, + "dfa_all_norm_eta3e-05": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7913283109664917, + "delta_loss_same": -2.47955322265625e-05, + "delta_loss_held": -4.589557647705078e-06, + "delta_acc_same": 0.0 + }, + "dfa_all_norm_eta0.0001": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7912708520889282, + "delta_loss_same": -8.225440979003906e-05, + "delta_loss_held": -1.4662742614746094e-05, + "delta_acc_same": 0.0 + }, + "dfa_all_norm_eta0.0003": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7911094427108765, + "delta_loss_same": -0.00024366378784179688, + "delta_loss_held": -4.124641418457031e-05, + "delta_acc_same": -0.0078125 + }, + "dfa_all_norm_eta0.001": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7905774712562561, + "delta_loss_same": -0.0007756352424621582, + "delta_loss_held": -0.00010246038436889648, + "delta_acc_same": -0.0078125 + }, + "dfa_all_norm_eta0.003": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7893450856208801, + "delta_loss_same": -0.0020080208778381348, + "delta_loss_held": -6.556510925292969e-06, + "delta_acc_same": -0.015625 + }, + "dfa_all_norm_eta0.01": { + "method": "dfa", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7885127067565918, + "delta_loss_same": -0.002840399742126465, + "delta_loss_held": 0.0035433173179626465, + "delta_acc_same": -0.0234375 + }, + "scalar_cb_all_norm_eta1e-05": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.79117751121521, + "delta_loss_same": -0.00017559528350830078, + "delta_loss_held": 2.3484230041503906e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_norm_eta3e-05": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7908279895782471, + "delta_loss_same": -0.0005251169204711914, + "delta_loss_held": 7.164478302001953e-05, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_norm_eta0.0001": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7896244525909424, + "delta_loss_same": -0.001728653907775879, + "delta_loss_held": 0.0002532005310058594, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_norm_eta0.0003": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7863528728485107, + "delta_loss_same": -0.0050002336502075195, + "delta_loss_held": 0.0008819103240966797, + "delta_acc_same": 0.0 + }, + "scalar_cb_all_norm_eta0.001": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7768233418464661, + "delta_loss_same": -0.014529764652252197, + "delta_loss_held": 0.00439530611038208, + "delta_acc_same": -0.0078125 + }, + "scalar_cb_all_norm_eta0.003": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7660057544708252, + "delta_loss_same": -0.025347352027893066, + "delta_loss_held": 0.026503384113311768, + "delta_acc_same": -0.015625 + }, + "scalar_cb_all_norm_eta0.01": { + "method": "scalar_cb", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.9399646520614624, + "delta_loss_same": 0.14861154556274414, + "delta_loss_held": 0.2661614418029785, + "delta_acc_same": -0.078125 + }, + "vec_eT_M4_all_norm_eta1e-05": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7906086444854736, + "delta_loss_same": -0.0007444620132446289, + "delta_loss_held": -5.054473876953125e-05, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_norm_eta3e-05": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7891266942024231, + "delta_loss_same": -0.002226412296295166, + "delta_loss_held": -0.0001468062400817871, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_norm_eta0.0001": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.784011721611023, + "delta_loss_same": -0.0073413848876953125, + "delta_loss_held": -0.0004343390464782715, + "delta_acc_same": 0.0 + }, + "vec_eT_M4_all_norm_eta0.0003": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7700058817863464, + "delta_loss_same": -0.021347224712371826, + "delta_loss_held": -0.0008407831192016602, + "delta_acc_same": 0.0078125 + }, + "vec_eT_M4_all_norm_eta0.001": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.727683424949646, + "delta_loss_same": -0.06366968154907227, + "delta_loss_held": 0.0022974610328674316, + "delta_acc_same": 0.015625 + }, + "vec_eT_M4_all_norm_eta0.003": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.6565364599227905, + "delta_loss_same": -0.13481664657592773, + "delta_loss_held": 0.04539656639099121, + "delta_acc_same": 0.0234375 + }, + "vec_eT_M4_all_norm_eta0.01": { + "method": "vec_eT_M4", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.8973477482795715, + "delta_loss_same": 0.10599464178085327, + "delta_loss_held": 0.5848973989486694, + "delta_acc_same": -0.09375 + }, + "oracle_bp_all_norm_eta1e-05": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 1e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7907174825668335, + "delta_loss_same": -0.0006356239318847656, + "delta_loss_held": 4.70280647277832e-05, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_norm_eta3e-05": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 3e-05, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7894477248191833, + "delta_loss_same": -0.0019053816795349121, + "delta_loss_held": 0.00014150142669677734, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_norm_eta0.0001": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7850220203399658, + "delta_loss_same": -0.006331086158752441, + "delta_loss_held": 0.0004749298095703125, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_norm_eta0.0003": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.0003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7725323438644409, + "delta_loss_same": -0.018820762634277344, + "delta_loss_held": 0.0014526844024658203, + "delta_acc_same": 0.0 + }, + "oracle_bp_all_norm_eta0.001": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.001, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.7305884957313538, + "delta_loss_same": -0.0607646107673645, + "delta_loss_held": 0.0051686763763427734, + "delta_acc_same": 0.015625 + }, + "oracle_bp_all_norm_eta0.003": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.003, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.6248641014099121, + "delta_loss_same": -0.16648900508880615, + "delta_loss_held": 0.01829373836517334, + "delta_acc_same": 0.0546875 + }, + "oracle_bp_all_norm_eta0.01": { + "method": "oracle_bp", + "update_range": "all", + "norm_mode": "norm", + "eta": 0.01, + "loss_before_same": 0.7913531064987183, + "loss_after_same": 0.3855624794960022, + "delta_loss_same": -0.40579062700271606, + "delta_loss_held": 0.09351706504821777, + "delta_acc_same": 0.1484375 + } +} \ No newline at end of file diff --git a/results/fa_canonical_lam1e-2_30ep/results_cifar10.json b/results/fa_canonical_lam1e-2_30ep/results_cifar10.json new file mode 100644 index 0000000..d9a9f65 --- /dev/null +++ b/results/fa_canonical_lam1e-2_30ep/results_cifar10.json @@ -0,0 +1,549 @@ +{ + "42": { + "fa": { + "log": { + "train_loss": [ + 2.001119369430542, + 1.9333542645263673, + 1.9240801361083983, + 1.9216663201141357, + 1.918965964050293, + 1.9119908702850341, + 1.9097738315582276, + 1.9049057181167603, + 1.9038385245513916, + 1.901488224105835, + 1.8975307934951782, + 1.8936708712768555, + 1.8894188814544677, + 1.8864306787872314, + 1.8895101571655273, + 1.8835669344329835, + 1.8832266155624389, + 1.8791197660064698, + 1.8797098063659667, + 1.8761708308410645, + 1.875095842552185, + 1.8748220810317993, + 1.8743982402801513, + 1.8738871404266357, + 1.8735411545562743, + 1.8693548073577881, + 1.8659294427871704, + 1.8685178174591064, + 1.8670922566986083, + 1.8683236782455444 + ], + "train_acc": [ + 0.27484, + 0.30662, + 0.31156, + 0.3128, + 0.31684, + 0.3173, + 0.32102, + 0.32226, + 0.3248, + 0.32594, + 0.32582, + 0.33134, + 0.33202, + 0.33344, + 0.33274, + 0.33626, + 0.33556, + 0.33774, + 0.33918, + 0.33762, + 0.34082, + 0.34052, + 0.34092, + 0.34432, + 0.34294, + 0.3436, + 0.34578, + 0.34654, + 0.34636, + 0.3472 + ], + "test_acc": [ + 0.3237, + 0.3505, + 0.3372, + 0.3327, + 0.3511, + 0.3455, + 0.3449, + 0.344, + 0.3413, + 0.3462, + 0.35, + 0.3511, + 0.3604, + 0.3569, + 0.3565, + 0.3584, + 0.3634, + 0.3651, + 0.3684, + 0.362, + 0.3674, + 0.3586, + 0.3704, + 0.3688, + 0.3729, + 0.3715, + 0.3702, + 0.3713, + 0.3715, + 0.3713 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.154661625623703, + 0.148232564330101, + 0.11714619398117065, + 0.9808143377304077 + ], + "perturbation_rho": [ + 0.2043638527393341, + 0.03451352193951607, + 0.20099492371082306, + 0.6849091649055481 + ], + "nudging": { + "0.001": [ + -7.456343155354261e-06, + -7.0015667006373405e-06, + -6.1238533817231655e-06, + -4.935957258567214e-05 + ], + "0.003": [ + -2.2464897483587265e-05, + -2.095731906592846e-05, + -1.8515565898269415e-05, + -0.00014814879978075624 + ], + "0.01": [ + -7.48702441342175e-05, + -6.984942592680454e-05, + -6.168842082843184e-05, + -0.0004938761703670025 + ] + }, + "hidden_norms_per_layer": [ + 12005.7001953125, + 12007.416015625, + 12011.4248046875, + 12003.9306640625, + 12006.5830078125 + ], + "bp_grad_norms_per_layer": [ + 1.7161242794827558e-05, + 1.712461198621895e-05, + 1.7262802430195734e-05, + 1.6996016711345874e-05, + 1.602559132152237e-05 + ] + }, + "drift": { + "embed.weight": 78.51231332812849, + "embed.bias": 102.12148052673881, + "blocks.0.ln.weight": 0.2991768419742584, + "blocks.0.w1.weight": 3.288291856838975, + "blocks.0.w1.bias": 5.396373593768907, + "blocks.0.w2.weight": 18.07176198506393, + "blocks.1.ln.weight": 0.30484291911125183, + "blocks.1.w1.weight": 3.363888651672944, + "blocks.1.w1.bias": 5.6524749125654825, + "blocks.1.w2.weight": 19.430774882635927, + "blocks.2.ln.weight": 0.3102824091911316, + "blocks.2.w1.weight": 3.4139876185805202, + "blocks.2.w1.bias": 5.452178486528747, + "blocks.2.w2.weight": 20.125989565290535, + "blocks.3.ln.weight": 0.3048917055130005, + "blocks.3.w1.weight": 3.480676314799551, + "blocks.3.w1.bias": 5.215887111238424, + "blocks.3.w2.weight": 18.601435796851646, + "out_ln.weight": 0.20746967196464539, + "out_head.weight": 2.830159264066497, + "out_head.bias": 1.3353853268796754 + } + } + }, + "123": { + "fa": { + "log": { + "train_loss": [ + 1.9927266687774658, + 1.9300689645767213, + 1.92596540309906, + 1.9193654559326172, + 1.9174729382324218, + 1.914334167137146, + 1.9108343372344971, + 1.9098404777526856, + 1.9070983071517944, + 1.9046820580291748, + 1.9035546282958984, + 1.902319673461914, + 1.9007709796524048, + 1.8978776998901368, + 1.896000676651001, + 1.8922497060394288, + 1.889219735031128, + 1.8912379706573486, + 1.8899934759902954, + 1.886697685585022, + 1.8858332043457031, + 1.8851475219726563, + 1.8850083080673217, + 1.8836419734191894, + 1.8818570189666748, + 1.880578341293335, + 1.8828362002563477, + 1.8791149730682373, + 1.881042135925293, + 1.8783651885986328 + ], + "train_acc": [ + 0.28066, + 0.30852, + 0.31142, + 0.3131, + 0.31726, + 0.31894, + 0.31884, + 0.3222, + 0.32346, + 0.325, + 0.32962, + 0.32534, + 0.32718, + 0.32974, + 0.33498, + 0.33296, + 0.33498, + 0.33642, + 0.33698, + 0.33676, + 0.3368, + 0.33892, + 0.33858, + 0.34048, + 0.34248, + 0.34264, + 0.34458, + 0.34442, + 0.34196, + 0.3428 + ], + "test_acc": [ + 0.3339, + 0.344, + 0.3447, + 0.3537, + 0.3523, + 0.3448, + 0.3569, + 0.3548, + 0.3564, + 0.3513, + 0.3558, + 0.3555, + 0.3578, + 0.3565, + 0.3511, + 0.3617, + 0.3621, + 0.3603, + 0.3619, + 0.36, + 0.3663, + 0.3679, + 0.3665, + 0.3645, + 0.363, + 0.3632, + 0.3656, + 0.3666, + 0.3666, + 0.366 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.10381253063678741, + 0.11509518325328827, + 0.17561045289039612, + 0.9849518537521362 + ], + "perturbation_rho": [ + -0.013579179532825947, + 0.098294198513031, + 0.1665695607662201, + 0.7168847322463989 + ], + "nudging": { + "0.001": [ + -3.704102709889412e-06, + -5.607143975794315e-06, + -8.841510862112045e-06, + -5.108967889100313e-05 + ], + "0.003": [ + -1.0923598892986774e-05, + -1.6769510693848133e-05, + -2.6412191800773144e-05, + -0.00015316426288336515 + ], + "0.01": [ + -3.6393641494214535e-05, + -5.586724728345871e-05, + -8.803850505501032e-05, + -0.0005103998119011521 + ] + }, + "hidden_norms_per_layer": [ + 12513.1455078125, + 12514.5771484375, + 12517.3583984375, + 12520.568359375, + 12517.57421875 + ], + "bp_grad_norms_per_layer": [ + 1.9153141693095677e-05, + 1.9135366528644226e-05, + 1.8911112420028076e-05, + 1.892356522148475e-05, + 1.7506923541077413e-05 + ] + }, + "drift": { + "embed.weight": 89.53228672658916, + "embed.bias": 152.8584432062178, + "blocks.0.ln.weight": 0.2654326856136322, + "blocks.0.w1.weight": 3.3634291127986065, + "blocks.0.w1.bias": 5.280393391584056, + "blocks.0.w2.weight": 19.28885452796699, + "blocks.1.ln.weight": 0.2610284984111786, + "blocks.1.w1.weight": 3.3605846097214807, + "blocks.1.w1.bias": 4.889820303164699, + "blocks.1.w2.weight": 20.281310673104024, + "blocks.2.ln.weight": 0.2743469476699829, + "blocks.2.w1.weight": 3.391098035259505, + "blocks.2.w1.bias": 4.733926864945133, + "blocks.2.w2.weight": 20.84238400209855, + "blocks.3.ln.weight": 0.28759220242500305, + "blocks.3.w1.weight": 3.4831818014183473, + "blocks.3.w1.bias": 4.539792496168549, + "blocks.3.w2.weight": 17.922103982945213, + "out_ln.weight": 0.23056229948997498, + "out_head.weight": 2.947940047368198, + "out_head.bias": 0.999532168893943 + } + } + }, + "456": { + "fa": { + "log": { + "train_loss": [ + 2.007471420669556, + 1.9475741510772706, + 1.935076278114319, + 1.9286792455673218, + 1.9233443587493897, + 1.921987562637329, + 1.9133965182113648, + 1.9098651378631593, + 1.9032709611511232, + 1.9005253164291382, + 1.8951593602752685, + 1.8959063681793213, + 1.8941862697982788, + 1.8903014281845092, + 1.887538351173401, + 1.8868630823516845, + 1.8855092962646485, + 1.882849036026001, + 1.88272844581604, + 1.880844307899475, + 1.8779692416000366, + 1.8777563387298584, + 1.8754584911346435, + 1.8720009698104858, + 1.8718394606018067, + 1.871922555580139, + 1.8742619204330444, + 1.871095755996704, + 1.8686067379379272, + 1.8697797116470336 + ], + "train_acc": [ + 0.27346, + 0.30166, + 0.30968, + 0.31384, + 0.3171, + 0.31864, + 0.32234, + 0.32546, + 0.32768, + 0.32608, + 0.33286, + 0.33212, + 0.33646, + 0.33228, + 0.33466, + 0.33496, + 0.33834, + 0.34088, + 0.33898, + 0.34018, + 0.3417, + 0.34182, + 0.3446, + 0.34544, + 0.34776, + 0.34688, + 0.3461, + 0.34764, + 0.3487, + 0.34986 + ], + "test_acc": [ + 0.3312, + 0.3461, + 0.3375, + 0.3554, + 0.3417, + 0.349, + 0.3492, + 0.3315, + 0.3524, + 0.3561, + 0.3452, + 0.3612, + 0.3675, + 0.361, + 0.3588, + 0.3671, + 0.3652, + 0.3621, + 0.3608, + 0.3682, + 0.3607, + 0.3563, + 0.3698, + 0.3701, + 0.3677, + 0.373, + 0.3704, + 0.3674, + 0.37, + 0.3695 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.1374516785144806, + 0.16781684756278992, + 0.13626089692115784, + 0.9774131774902344 + ], + "perturbation_rho": [ + 0.0486995093524456, + 0.06349372863769531, + 0.007340744137763977, + 0.6342363357543945 + ], + "nudging": { + "0.001": [ + -5.1066745072603226e-06, + -7.127760909497738e-06, + -6.226240657269955e-06, + -4.646868910640478e-05 + ], + "0.003": [ + -1.5374505892395973e-05, + -2.130062784999609e-05, + -1.874461304396391e-05, + -0.0001394655555486679 + ], + "0.01": [ + -5.139666609466076e-05, + -7.112661842256784e-05, + -6.259605288505554e-05, + -0.0004648104077205062 + ] + }, + "hidden_norms_per_layer": [ + 12142.6181640625, + 12149.4814453125, + 12152.4228515625, + 12154.3623046875, + 12153.6318359375 + ], + "bp_grad_norms_per_layer": [ + 1.7370659406878985e-05, + 1.7375436073052697e-05, + 1.7465752534917556e-05, + 1.755404082359746e-05, + 1.6847530787345022e-05 + ] + }, + "drift": { + "embed.weight": 81.50708429789378, + "embed.bias": 90.80998898870095, + "blocks.0.ln.weight": 0.30019262433052063, + "blocks.0.w1.weight": 3.2393405099782573, + "blocks.0.w1.bias": 5.11706466812565, + "blocks.0.w2.weight": 17.26999421209171, + "blocks.1.ln.weight": 0.29391026496887207, + "blocks.1.w1.weight": 3.2524768916503883, + "blocks.1.w1.bias": 5.375142102957966, + "blocks.1.w2.weight": 17.822565033735142, + "blocks.2.ln.weight": 0.29711613059043884, + "blocks.2.w1.weight": 3.347203060867532, + "blocks.2.w1.bias": 5.458224100319586, + "blocks.2.w2.weight": 19.038612136675116, + "blocks.3.ln.weight": 0.3008574843406677, + "blocks.3.w1.weight": 3.407494069111075, + "blocks.3.w1.bias": 5.482950458082574, + "blocks.3.w2.weight": 17.98442064571867, + "out_ln.weight": 0.21060113608837128, + "out_head.weight": 2.7473203281973158, + "out_head.bias": 0.9871044007414218 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42, + 123, + 456 + ], + "gpu": 0, + "output_dir": "results/fa_canonical_lam1e-2_30ep", + "methods": [ + "fa" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/fa_canonical_lam1e-4_30ep/results_cifar10.json b/results/fa_canonical_lam1e-4_30ep/results_cifar10.json new file mode 100644 index 0000000..d04a393 --- /dev/null +++ b/results/fa_canonical_lam1e-4_30ep/results_cifar10.json @@ -0,0 +1,549 @@ +{ + "42": { + "fa": { + "log": { + "train_loss": [ + 2.0345889838027955, + 1.9560137537384032, + 1.9360403113555908, + 1.9143632999420166, + 1.8943112557601929, + 1.883546539993286, + 1.87789137008667, + 1.8733353225708007, + 1.8758181957626343, + 1.8700244534301758, + 1.8686021829605102, + 1.8640803202056884, + 1.8597132386779784, + 1.8604257183837891, + 1.860362275390625, + 1.8570359252166748, + 1.8561881994247436, + 1.8504637549209595, + 1.8508178236389161, + 1.8495385042572021, + 1.8523688412475585, + 1.8491829050445556, + 1.849259608154297, + 1.8475904892730712, + 1.846731012802124, + 1.8426731698989869, + 1.8409621490097046, + 1.8425804473876952, + 1.8410273541259765, + 1.8429513037109375 + ], + "train_acc": [ + 0.25574, + 0.29268, + 0.30346, + 0.31094, + 0.31784, + 0.3242, + 0.32714, + 0.3321, + 0.33104, + 0.3346, + 0.33454, + 0.33844, + 0.33788, + 0.33896, + 0.3398, + 0.34038, + 0.3428, + 0.34448, + 0.34504, + 0.34356, + 0.34638, + 0.34678, + 0.3455, + 0.34862, + 0.34636, + 0.35102, + 0.34858, + 0.35316, + 0.3505, + 0.3521 + ], + "test_acc": [ + 0.2909, + 0.3244, + 0.3269, + 0.3335, + 0.3455, + 0.3577, + 0.3581, + 0.3473, + 0.359, + 0.3635, + 0.3513, + 0.3583, + 0.3735, + 0.3642, + 0.3646, + 0.364, + 0.3653, + 0.3734, + 0.3717, + 0.3682, + 0.3792, + 0.3722, + 0.3728, + 0.3747, + 0.3749, + 0.3751, + 0.3748, + 0.375, + 0.3766, + 0.3759 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03903631120920181, + 0.014399020932614803, + -0.033061157912015915, + 0.8762983083724976 + ], + "perturbation_rho": [ + 0.04046167433261871, + 0.029874827712774277, + 0.018399983644485474, + 0.5844764113426208 + ], + "nudging": { + "0.001": [ + -3.4736585803329945e-06, + -1.6225967556238174e-06, + 8.612405508756638e-07, + -4.002035711891949e-05 + ], + "0.003": [ + -1.0443473001942039e-05, + -4.940724465996027e-06, + 2.589426003396511e-06, + -0.00012009820784442127 + ], + "0.01": [ + -3.477800055406988e-05, + -1.6514735762029886e-05, + 8.722592610865831e-06, + -0.00040041320607997477 + ] + }, + "hidden_norms_per_layer": [ + 9302.052734375, + 9300.826171875, + 9304.12890625, + 9388.5966796875, + 9324.71484375 + ], + "bp_grad_norms_per_layer": [ + 1.8842416466213763e-05, + 1.7771730199456215e-05, + 1.7083899365388788e-05, + 1.6848869563546032e-05, + 1.1624123544606846e-05 + ] + }, + "drift": { + "embed.weight": 59.712949390275256, + "embed.bias": 109.7242290933353, + "blocks.0.ln.weight": 0.4963775873184204, + "blocks.0.w1.weight": 6.181720741000805, + "blocks.0.w1.bias": 4.020397499075911, + "blocks.0.w2.weight": 27.582674728139626, + "blocks.1.ln.weight": 0.5040290951728821, + "blocks.1.w1.weight": 6.5836738314372525, + "blocks.1.w1.bias": 3.6793793299266104, + "blocks.1.w2.weight": 30.666596548839138, + "blocks.2.ln.weight": 0.5469347834587097, + "blocks.2.w1.weight": 6.732229120538098, + "blocks.2.w1.bias": 3.7361472645162905, + "blocks.2.w2.weight": 32.57792259935943, + "blocks.3.ln.weight": 0.5613139867782593, + "blocks.3.w1.weight": 6.581817915516039, + "blocks.3.w1.bias": 3.910112736502136, + "blocks.3.w2.weight": 30.460380132293686, + "out_ln.weight": 0.13369733095169067, + "out_head.weight": 2.149734268892375, + "out_head.bias": 1.8324297050244958 + } + } + }, + "123": { + "fa": { + "log": { + "train_loss": [ + 2.02592181602478, + 1.9371592224121095, + 1.8974695124053955, + 1.8743731897735596, + 1.86856899684906, + 1.866699522743225, + 1.8631246627807616, + 1.8699150874328614, + 1.8676455249404906, + 1.8666385611724854, + 1.8668112030792237, + 1.8644982721710206, + 1.8628531475448609, + 1.8602032104492188, + 1.859476708946228, + 1.8544428533554078, + 1.8534636458969116, + 1.8551011206054688, + 1.854274546432495, + 1.850538496170044, + 1.8506593602752686, + 1.849616947631836, + 1.8474625555419921, + 1.8434547743988037, + 1.8423766018676757, + 1.8429830319976808, + 1.8445982418823241, + 1.842038772354126, + 1.8427192529296874, + 1.8390978100585937 + ], + "train_acc": [ + 0.26002, + 0.30074, + 0.31632, + 0.32608, + 0.33058, + 0.3327, + 0.33324, + 0.3331, + 0.33306, + 0.3358, + 0.33708, + 0.33474, + 0.33836, + 0.33936, + 0.34254, + 0.34292, + 0.34406, + 0.34572, + 0.34532, + 0.34724, + 0.34686, + 0.35018, + 0.34834, + 0.35062, + 0.35238, + 0.35146, + 0.35322, + 0.3507, + 0.35174, + 0.35298 + ], + "test_acc": [ + 0.3099, + 0.3371, + 0.35, + 0.3548, + 0.3568, + 0.3543, + 0.3595, + 0.3565, + 0.3605, + 0.3532, + 0.3572, + 0.3574, + 0.3587, + 0.3635, + 0.3598, + 0.3716, + 0.3664, + 0.3641, + 0.3588, + 0.3685, + 0.3704, + 0.3738, + 0.3678, + 0.3716, + 0.3726, + 0.3706, + 0.3715, + 0.3711, + 0.3718, + 0.3725 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.12851236760616302, + 0.0212344229221344, + 0.06850548088550568, + 0.912018895149231 + ], + "perturbation_rho": [ + 0.1286340206861496, + 0.05542958900332451, + 0.095004141330719, + 0.5912511944770813 + ], + "nudging": { + "0.001": [ + -1.2503878679126501e-05, + -2.949964255094528e-06, + -4.535817424766719e-06, + -4.0970538975670934e-05 + ], + "0.003": [ + -3.755756188184023e-05, + -8.84209293872118e-06, + -1.3517230399884284e-05, + -0.00012284089461900294 + ], + "0.01": [ + -0.00012522244651336223, + -2.9436778277158737e-05, + -4.5000226236879826e-05, + -0.0004094060859642923 + ] + }, + "hidden_norms_per_layer": [ + 8440.2509765625, + 8675.947265625, + 8919.455078125, + 9151.62890625, + 9001.966796875 + ], + "bp_grad_norms_per_layer": [ + 2.2785976398154162e-05, + 1.9475846784189343e-05, + 1.76876437762985e-05, + 1.6414065612480044e-05, + 1.2445364518498536e-05 + ] + }, + "drift": { + "embed.weight": 58.570146595416965, + "embed.bias": 129.66757192630527, + "blocks.0.ln.weight": 0.506428599357605, + "blocks.0.w1.weight": 6.100287737701914, + "blocks.0.w1.bias": 4.352361447004298, + "blocks.0.w2.weight": 29.053039362183725, + "blocks.1.ln.weight": 0.48886165022850037, + "blocks.1.w1.weight": 6.289397911525807, + "blocks.1.w1.bias": 4.491060429115057, + "blocks.1.w2.weight": 31.966204529299326, + "blocks.2.ln.weight": 0.47751307487487793, + "blocks.2.w1.weight": 6.165341672963252, + "blocks.2.w1.bias": 4.204746402092476, + "blocks.2.w2.weight": 31.785153220803842, + "blocks.3.ln.weight": 0.522526741027832, + "blocks.3.w1.weight": 6.2976831221121925, + "blocks.3.w1.bias": 3.31165977931123, + "blocks.3.w2.weight": 29.399820039375125, + "out_ln.weight": 0.12725675106048584, + "out_head.weight": 2.171575181004019, + "out_head.bias": 1.7024717076770008 + } + } + }, + "456": { + "fa": { + "log": { + "train_loss": [ + 2.0370823514556884, + 1.9467987035751342, + 1.912523896484375, + 1.8945044506072999, + 1.881802406349182, + 1.8781717306137085, + 1.8688158060073852, + 1.8661776677703859, + 1.8603027975845337, + 1.8572819149017334, + 1.8532151040267943, + 1.8534327938461304, + 1.8522534008407592, + 1.8507964714050293, + 1.8465819549179077, + 1.8432143920135498, + 1.8410576669311522, + 1.8371334344863892, + 1.8372844079208375, + 1.8335014197540282, + 1.8299405459213256, + 1.8304111400985719, + 1.8290630575561524, + 1.8247105368041991, + 1.8245959228515625, + 1.825667812576294, + 1.8260319690322877, + 1.8243235848999024, + 1.8212057236480712, + 1.8206781775283813 + ], + "train_acc": [ + 0.25624, + 0.29612, + 0.3112, + 0.31836, + 0.32406, + 0.32822, + 0.33338, + 0.3358, + 0.3376, + 0.33728, + 0.34174, + 0.34368, + 0.34628, + 0.34296, + 0.34426, + 0.34552, + 0.34848, + 0.35006, + 0.34902, + 0.34998, + 0.35384, + 0.35252, + 0.35216, + 0.35542, + 0.35508, + 0.35538, + 0.35446, + 0.35524, + 0.3556, + 0.35744 + ], + "test_acc": [ + 0.2999, + 0.3434, + 0.3434, + 0.364, + 0.3546, + 0.3612, + 0.3581, + 0.3492, + 0.367, + 0.3567, + 0.3655, + 0.3723, + 0.3761, + 0.3771, + 0.3778, + 0.3763, + 0.3825, + 0.3744, + 0.3812, + 0.3831, + 0.3751, + 0.3821, + 0.3809, + 0.3833, + 0.3812, + 0.3832, + 0.3835, + 0.3836, + 0.3841, + 0.3837 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.11049995571374893, + 0.014905610121786594, + -0.0519559383392334, + 0.861151933670044 + ], + "perturbation_rho": [ + 0.058121487498283386, + 0.011935144662857056, + -0.056115295737981796, + 0.5436498522758484 + ], + "nudging": { + "0.001": [ + -7.875027222326025e-06, + -1.205597072839737e-06, + 2.052285708487034e-06, + -3.838281554635614e-05 + ], + "0.003": [ + -2.359108839300461e-05, + -3.5760422179009765e-06, + 6.082700565457344e-06, + -0.00011519025429151952 + ], + "0.01": [ + -7.864644430810586e-05, + -1.1975058441748843e-05, + 2.0268842490622774e-05, + -0.000383934035198763 + ] + }, + "hidden_norms_per_layer": [ + 8074.6318359375, + 8344.6298828125, + 8543.16796875, + 8806.9365234375, + 8809.208984375 + ], + "bp_grad_norms_per_layer": [ + 2.0788113033631817e-05, + 1.6527425032109022e-05, + 1.6617635992588475e-05, + 1.6509349734405987e-05, + 1.1822515261883382e-05 + ] + }, + "drift": { + "embed.weight": 55.0795347886669, + "embed.bias": 104.1791057670674, + "blocks.0.ln.weight": 0.5131628513336182, + "blocks.0.w1.weight": 6.423288157104268, + "blocks.0.w1.bias": 5.260214874942604, + "blocks.0.w2.weight": 28.84901365790228, + "blocks.1.ln.weight": 0.5011720657348633, + "blocks.1.w1.weight": 6.239148515891604, + "blocks.1.w1.bias": 3.694106675391347, + "blocks.1.w2.weight": 28.607867363928534, + "blocks.2.ln.weight": 0.46569541096687317, + "blocks.2.w1.weight": 6.112045116014977, + "blocks.2.w1.bias": 4.730623150261222, + "blocks.2.w2.weight": 28.99578369272475, + "blocks.3.ln.weight": 0.5072412490844727, + "blocks.3.w1.weight": 6.376723566598171, + "blocks.3.w1.bias": 4.743548803408704, + "blocks.3.w2.weight": 30.777217385288502, + "out_ln.weight": 0.1257992684841156, + "out_head.weight": 2.0103689615464178, + "out_head.bias": 1.8804179129019218 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42, + 123, + 456 + ], + "gpu": 0, + "output_dir": "results/fa_canonical_lam1e-4_30ep", + "methods": [ + "fa" + ], + "random_targets": false, + "penalty_lam": 0.0001, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/fa_canonical_penalty_sweep.log b/results/fa_canonical_penalty_sweep.log new file mode 100644 index 0000000..37e42d4 --- /dev/null +++ b/results/fa_canonical_penalty_sweep.log @@ -0,0 +1,76 @@ +=== FA canonical penalty sweep === +--- FA λ=1e-4 --- +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- FA --- + [FA] Epoch 1: loss=2.0346, train=0.2557, test=0.2909 + [FA] Epoch 10: loss=1.8700, train=0.3346, test=0.3635 + [FA] Epoch 20: loss=1.8495, train=0.3436, test=0.3682 + [FA] Epoch 30: loss=1.8430, train=0.3521, test=0.3759 + Final test acc: 0.3759 + +============================================================ +Seed 123 +============================================================ + +--- FA --- + [FA] Epoch 1: loss=2.0259, train=0.2600, test=0.3099 + [FA] Epoch 10: loss=1.8666, train=0.3358, test=0.3532 + [FA] Epoch 20: loss=1.8505, train=0.3472, test=0.3685 + [FA] Epoch 30: loss=1.8391, train=0.3530, test=0.3725 + Final test acc: 0.3725 + +============================================================ +Seed 456 +============================================================ + +--- FA --- + [FA] Epoch 1: loss=2.0371, train=0.2562, test=0.2999 + [FA] Epoch 10: loss=1.8573, train=0.3373, test=0.3567 + [FA] Epoch 20: loss=1.8335, train=0.3500, test=0.3831 + [FA] Epoch 30: loss=1.8207, train=0.3574, test=0.3837 + Final test acc: 0.3837 + +All results saved to results/fa_canonical_lam1e-4_30ep/results_cifar10.json +--- FA λ=1e-2 --- +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- FA --- + [FA] Epoch 1: loss=2.0011, train=0.2748, test=0.3237 + [FA] Epoch 10: loss=1.9015, train=0.3259, test=0.3462 + [FA] Epoch 20: loss=1.8762, train=0.3376, test=0.3620 + [FA] Epoch 30: loss=1.8683, train=0.3472, test=0.3713 + Final test acc: 0.3713 + +============================================================ +Seed 123 +============================================================ + +--- FA --- + [FA] Epoch 1: loss=1.9927, train=0.2807, test=0.3339 + [FA] Epoch 10: loss=1.9047, train=0.3250, test=0.3513 + [FA] Epoch 20: loss=1.8867, train=0.3368, test=0.3600 + [FA] Epoch 30: loss=1.8784, train=0.3428, test=0.3660 + Final test acc: 0.3660 + +============================================================ +Seed 456 +============================================================ + +--- FA --- + [FA] Epoch 1: loss=2.0075, train=0.2735, test=0.3312 + [FA] Epoch 10: loss=1.9005, train=0.3261, test=0.3561 + [FA] Epoch 20: loss=1.8808, train=0.3402, test=0.3682 + [FA] Epoch 30: loss=1.8698, train=0.3499, test=0.3695 + Final test acc: 0.3695 + +All results saved to results/fa_canonical_lam1e-2_30ep/results_cifar10.json +=== FA PENALTY SWEEP DONE === diff --git a/results/figures/figure_snapshot_resmlp.pdf b/results/figures/figure_snapshot_resmlp.pdf new file mode 100644 index 0000000..3724bca Binary files /dev/null and b/results/figures/figure_snapshot_resmlp.pdf differ diff --git a/results/figures/figure_snapshot_vit.pdf b/results/figures/figure_snapshot_vit.pdf new file mode 100644 index 0000000..b9a78dc Binary files /dev/null and b/results/figures/figure_snapshot_vit.pdf differ diff --git a/results/freeze_with_decay/freeze_with_decay_t5_s42.json b/results/freeze_with_decay/freeze_with_decay_t5_s42.json new file mode 100644 index 0000000..6f52855 --- /dev/null +++ b/results/freeze_with_decay/freeze_with_decay_t5_s42.json @@ -0,0 +1,5762 @@ +{ + "args": { + "num_blocks": 4, + "d_hidden": 256, + "batch_size": 128, + "epochs": 100, + "t0": 5, + "alpha": 0.75, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "M": 4, + "seed": 42, + "gpu": 2, + "output_dir": "/home/yurenh2/fa/results/freeze_with_decay" + }, + "dfa_ckpt_acc": 0.304, + "continue_DFA": { + "test_acc": [ + 0.2982, + 0.3109, + 0.3125, + 0.3038, + 0.3113, + 0.3135, + 0.302, + 0.3075, + 0.3097, + 0.3101, + 0.3029, + 0.3054, + 0.3108, + 0.3095, + 0.3047, + 0.3164, + 0.3031, + 0.3083, + 0.3171, + 0.3029, + 0.2979, + 0.2958, + 0.3099, + 0.2966, + 0.2959, + 0.3017, + 0.3082, + 0.3046, + 0.306, + 0.292, + 0.281, + 0.3129, + 0.3075, + 0.3115, + 0.3141, + 0.3111, + 0.3151, + 0.2969, + 0.3097, + 0.321, + 0.3058, + 0.3145, + 0.32, + 0.303, + 0.3093, + 0.3071, + 0.3118, + 0.3043, + 0.3104, + 0.3127, + 0.3148, + 0.3203, + 0.3112, + 0.3016, + 0.315, + 0.312, + 0.3134, + 0.3129, + 0.3049, + 0.3125, + 0.3142, + 0.3164, + 0.314, + 0.309, + 0.3142, + 0.3165, + 0.3125, + 0.3095, + 0.3104, + 0.3188, + 0.3149, + 0.3142, + 0.3119, + 0.3166, + 0.3118, + 0.3119, + 0.3127, + 0.311, + 0.3141, + 0.3164, + 0.3123, + 0.3128, + 0.3126, + 0.3091, + 0.3115, + 0.3127, + 0.3121, + 0.3123, + 0.3127, + 0.3132, + 0.3118, + 0.3118, + 0.3117, + 0.3114, + 0.3115 + ], + "train_loss": [ + 1.989790809059143, + 1.990307411880493, + 1.9905100513458251, + 1.9918334338378907, + 1.9863724251937867, + 1.9870153832244872, + 1.9874663953399658, + 1.9870845441055298, + 1.9880484677505492, + 1.9872064337539672, + 1.9897905487823486, + 1.9892820449066162, + 1.9874972410583496, + 1.9877921746444702, + 1.9876875100708007, + 1.9888226028060914, + 1.9874765905761718, + 1.9867966274642945, + 1.987537554550171, + 1.9880204120254517, + 1.9879772283935546, + 1.987797650413513, + 1.9874019779968262, + 1.9876940496063233, + 1.986886355819702, + 1.9884147914123536, + 1.9890670285797118, + 1.9873397811889648, + 1.9847210833740234, + 1.9871949213027955, + 1.9887558262634277, + 1.9838399686431885, + 1.9857967501068114, + 1.9860699237060546, + 1.9850847225952148, + 1.987654845123291, + 1.983670299758911, + 1.987481754837036, + 1.9858247266387938, + 1.9868243627166748, + 1.9862985388946532, + 1.984481724205017, + 1.9851255657958984, + 1.9881289917373657, + 1.9866780487442017, + 1.9885919563293457, + 1.9857788675308228, + 1.9890421838378907, + 1.9863371643066405, + 1.986637942276001, + 1.9849364169311523, + 1.9842691050720216, + 1.9856912046051025, + 1.988491299057007, + 1.9852929847717284, + 1.9856826776123047, + 1.9851847518920898, + 1.9835067967987061, + 1.9865730474853516, + 1.9850236835479735, + 1.9849657077789307, + 1.9844414936065673, + 1.9851242599105834, + 1.9842400899505614, + 1.9859014458847046, + 1.9850837426757812, + 1.985779475440979, + 1.985046662750244, + 1.9846652752685547, + 1.9845653623199462, + 1.984431827697754, + 1.9861651288223268, + 1.9833351360702514, + 1.9858753430175782, + 1.9859362523651123, + 1.9840349249649047, + 1.9841974882507325, + 1.9834141875457765, + 1.9854680131530762, + 1.9825797986221314, + 1.9835828475570678, + 1.9841230081176757, + 1.9844115731811522, + 1.9840126071548463, + 1.9844582679748535, + 1.9840802533340454, + 1.9842612131118775, + 1.984658988571167, + 1.9846206958770751, + 1.983520182762146, + 1.981859715309143, + 1.9833977752304077, + 1.9841900691986083, + 1.982843738861084, + 1.9838121879577637 + ], + "gamma": [ + [ + 6, + 0.0821653357706964 + ], + [ + 7, + 0.083711032057181 + ], + [ + 8, + 0.08393650152720511 + ], + [ + 9, + 0.08384976850356907 + ], + [ + 10, + 0.08560753799974918 + ], + [ + 13, + 0.0868276598630473 + ], + [ + 15, + 0.08848524722270668 + ], + [ + 20, + 0.08918609796091914 + ], + [ + 25, + 0.09372491284739226 + ], + [ + 35, + 0.09340126946335658 + ], + [ + 45, + 0.09817965375259519 + ], + [ + 55, + 0.09978153288830072 + ], + [ + 65, + 0.1001084745512344 + ], + [ + 75, + 0.1013008076697588 + ], + [ + 85, + 0.1014239476644434 + ], + [ + 95, + 0.10141936334548518 + ], + [ + 100, + 0.10145300498697907 + ] + ], + "rho": [ + [ + 6, + 0.019282110035419464 + ], + [ + 7, + 0.006952052121050656 + ], + [ + 8, + 0.008748143445700407 + ], + [ + 9, + 0.008938514394685626 + ], + [ + 10, + 0.01805932994466275 + ], + [ + 13, + 0.01803369668778032 + ], + [ + 15, + 0.0023002898087725043 + ], + [ + 20, + 0.012751705711707473 + ], + [ + 25, + 0.0011155498214066029 + ], + [ + 35, + 0.009300894802436233 + ], + [ + 45, + -0.0039156777784228325 + ], + [ + 55, + -0.007268198300153017 + ], + [ + 65, + 0.008430896326899529 + ], + [ + 75, + 0.004795442800968885 + ], + [ + 85, + -0.0030130266677588224 + ], + [ + 95, + 0.006304946728050709 + ], + [ + 100, + 0.004224925301969051 + ] + ], + "alpha_eff": [ + [ + 6, + 0.0 + ], + [ + 7, + 0.0 + ], + [ + 8, + 0.0 + ], + [ + 9, + 0.0 + ], + [ + 10, + 0.0 + ], + [ + 11, + 0.0 + ], + [ + 12, + 0.0 + ], + [ + 13, + 0.0 + ], + [ + 14, + 0.0 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + }, + "blend_random_trainable_alpha075": { + "test_acc": [ + 0.3057, + 0.313, + 0.3159, + 0.3074, + 0.3127, + 0.3075, + 0.2992, + 0.3017, + 0.2934, + 0.3036, + 0.3107, + 0.3157, + 0.3175, + 0.3067, + 0.3038, + 0.3036, + 0.3188, + 0.3151, + 0.3159, + 0.306, + 0.3065, + 0.3211, + 0.3101, + 0.3111, + 0.3086, + 0.3114, + 0.315, + 0.3177, + 0.3148, + 0.3155, + 0.3192, + 0.315, + 0.314, + 0.3112, + 0.3237, + 0.3152, + 0.3232, + 0.3246, + 0.315, + 0.322, + 0.3147, + 0.3138, + 0.3184, + 0.3186, + 0.3112, + 0.3167, + 0.3203, + 0.3108, + 0.3149, + 0.32, + 0.3166, + 0.319, + 0.3187, + 0.3122, + 0.3185, + 0.3175, + 0.3226, + 0.3188, + 0.3184, + 0.3178, + 0.3234, + 0.322, + 0.3222, + 0.3306, + 0.313, + 0.3163, + 0.3231, + 0.3259, + 0.3243, + 0.3182, + 0.3185, + 0.3235, + 0.3219, + 0.3217, + 0.317, + 0.324, + 0.3179, + 0.3234, + 0.3202, + 0.3218, + 0.3251, + 0.3246, + 0.3246, + 0.3222, + 0.3217, + 0.3228, + 0.3219, + 0.3212, + 0.3214, + 0.3226, + 0.3219, + 0.3226, + 0.3226, + 0.3224, + 0.3224 + ], + "train_loss": [ + 1.9863584661102296, + 1.9901082321166992, + 1.9899895672607422, + 1.9905559247207643, + 1.9933388582992553, + 1.9831242485809326, + 1.9819840459823608, + 1.9838320283508302, + 1.9812498509216308, + 1.980695964202881, + 1.9775935582733155, + 1.9746784218597413, + 1.9758756914520264, + 1.9731443271255493, + 1.9735053044128419, + 1.9710882552337647, + 1.9679033090591431, + 1.9719498504257202, + 1.96802033203125, + 1.9680989447021484, + 1.9678990168762207, + 1.9670032351303102, + 1.9651213776016236, + 1.9671727653503417, + 1.9690395525741577, + 1.9632393447494507, + 1.9625915707778931, + 1.9642795868301393, + 1.962284288253784, + 1.9620551160430908, + 1.9625657203674316, + 1.9611133654403687, + 1.9630646159362792, + 1.960646312789917, + 1.9632540558242797, + 1.9595271733093262, + 1.96106090385437, + 1.9597418651580811, + 1.9601698782730101, + 1.9627716778945923, + 1.960522246322632, + 1.9592057704925536, + 1.9605137160873414, + 1.9641116384506225, + 1.9620838027954102, + 1.9584725994873047, + 1.9602987656402588, + 1.9586591900253296, + 1.9589158935165405, + 1.9596970495605468, + 1.9598131320571899, + 1.9568223999023437, + 1.96024339012146, + 1.9578165494155884, + 1.9596277838134766, + 1.9579522448730469, + 1.9601750942230225, + 1.9571070608520509, + 1.9577818801116944, + 1.9579749005508422, + 1.958904959487915, + 1.9588295747375488, + 1.9592107725524903, + 1.9556558278656007, + 1.9566347140502929, + 1.9571185677337646, + 1.9556720935058594, + 1.960075058364868, + 1.9572499262237548, + 1.9573225322723389, + 1.9572704486465453, + 1.956118627243042, + 1.9577359083557129, + 1.9548047360229492, + 1.9568554579925537, + 1.9560601205444337, + 1.9569705477905273, + 1.9573911285018921, + 1.9555766596984863, + 1.9534356274032594, + 1.9576097611236571, + 1.9529308759307862, + 1.956716926498413, + 1.9529449435043336, + 1.9519823665618896, + 1.9550598822021485, + 1.95468404838562, + 1.9547595784759522, + 1.9551029265975952, + 1.9516690326690673, + 1.9553640102386474, + 1.9570171786880493, + 1.9546185680770873, + 1.9530967560577392, + 1.9577186687469483 + ], + "gamma": [ + [ + 6, + 0.02217397012282163 + ], + [ + 7, + 0.03206559922546148 + ], + [ + 8, + 0.026470738579519093 + ], + [ + 9, + 0.03263817366678268 + ], + [ + 10, + 0.021615365520119667 + ], + [ + 13, + 0.02192097995430231 + ], + [ + 15, + 0.024044587509706616 + ], + [ + 20, + 0.03487626521382481 + ], + [ + 25, + 0.02460204972885549 + ], + [ + 35, + 0.01627764804288745 + ], + [ + 45, + 0.027334752143360674 + ], + [ + 55, + 0.018939002882689238 + ], + [ + 65, + 0.022531974245794117 + ], + [ + 75, + 0.024030609405599535 + ], + [ + 85, + 0.030015499010914937 + ], + [ + 95, + 0.027055976912379265 + ], + [ + 100, + 0.02679809636902064 + ] + ], + "rho": [ + [ + 6, + -0.0035915356129407883 + ], + [ + 7, + 0.0014759176410734653 + ], + [ + 8, + 0.022930681821890175 + ], + [ + 9, + -0.0021478012204170227 + ], + [ + 10, + 0.0070319639053195715 + ], + [ + 13, + 0.011672343825921416 + ], + [ + 15, + 0.001020955154672265 + ], + [ + 20, + 0.009278092067688704 + ], + [ + 25, + 0.015854547498747706 + ], + [ + 35, + 0.014141641091555357 + ], + [ + 45, + 0.006546026677824557 + ], + [ + 55, + -0.019327251007780433 + ], + [ + 65, + -0.004201943869702518 + ], + [ + 75, + 0.020702308975160122 + ], + [ + 85, + 0.003142602858133614 + ], + [ + 95, + 0.0026063444674946368 + ], + [ + 100, + 0.0022612916654907167 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499216896909023 + ], + [ + 7, + 0.7498440373042877 + ], + [ + 8, + 0.749787791792374 + ], + [ + 9, + 0.7497660312647594 + ], + [ + 10, + 0.7496698512243913 + ], + [ + 11, + 0.7496028887524708 + ], + [ + 12, + 0.7495682025386097 + ], + [ + 13, + 0.7495497796575948 + ], + [ + 14, + 0.7495278946529158 + ], + [ + 15, + 0.7495465922369274 + ], + [ + 16, + 0.7494974732165709 + ], + [ + 17, + 0.7494886637697328 + ], + [ + 18, + 0.749446088982838 + ], + [ + 19, + 0.7494274087356515 + ], + [ + 20, + 0.7494273452819361 + ], + [ + 21, + 0.7494116633638669 + ], + [ + 22, + 0.7494229551569503 + ], + [ + 23, + 0.7494157627578178 + ], + [ + 24, + 0.7494041680686359 + ], + [ + 25, + 0.7494067179442755 + ], + [ + 26, + 0.7493968180240337 + ], + [ + 27, + 0.749388494671204 + ], + [ + 28, + 0.749378866029789 + ], + [ + 29, + 0.7493964109696862 + ], + [ + 30, + 0.7494099349639679 + ], + [ + 31, + 0.7493784143534457 + ], + [ + 32, + 0.7493838745706526 + ], + [ + 33, + 0.7493904517206977 + ], + [ + 34, + 0.7493914742706692 + ], + [ + 35, + 0.7493781312951258 + ], + [ + 36, + 0.7493907587768501 + ], + [ + 37, + 0.749394500246949 + ], + [ + 38, + 0.7493778587931351 + ], + [ + 39, + 0.7493688891732854 + ], + [ + 40, + 0.7493823741113532 + ], + [ + 41, + 0.74938731356516 + ], + [ + 42, + 0.749384416847116 + ], + [ + 43, + 0.749379162241639 + ], + [ + 44, + 0.7494005355837596 + ], + [ + 45, + 0.7493878339718874 + ], + [ + 46, + 0.7493878727291137 + ], + [ + 47, + 0.7493848747913123 + ], + [ + 48, + 0.7493798828813794 + ], + [ + 49, + 0.7494170256811937 + ], + [ + 50, + 0.7493987277579729 + ], + [ + 51, + 0.7493867453013181 + ], + [ + 52, + 0.7493837198444278 + ], + [ + 53, + 0.7493890335665235 + ], + [ + 54, + 0.7493956779966846 + ], + [ + 55, + 0.7494003459618025 + ], + [ + 56, + 0.7494051709629193 + ], + [ + 57, + 0.7494082200830192 + ], + [ + 58, + 0.7494020402310835 + ], + [ + 59, + 0.7493862054413847 + ], + [ + 60, + 0.7493973855755164 + ], + [ + 61, + 0.7493973882263439 + ], + [ + 62, + 0.7494149261184524 + ], + [ + 63, + 0.7493854416261437 + ], + [ + 64, + 0.7493889765743919 + ], + [ + 65, + 0.7494028563344639 + ], + [ + 66, + 0.7493849269122205 + ], + [ + 67, + 0.7493880154634703 + ], + [ + 68, + 0.7493916026439615 + ], + [ + 69, + 0.7494058526428821 + ], + [ + 70, + 0.7493947824045847 + ], + [ + 71, + 0.749390175876749 + ], + [ + 72, + 0.7493922810752203 + ], + [ + 73, + 0.749384920194829 + ], + [ + 74, + 0.7494043041760992 + ], + [ + 75, + 0.7494011851269835 + ], + [ + 76, + 0.7493994055097649 + ], + [ + 77, + 0.749404380057707 + ], + [ + 78, + 0.7494041466149483 + ], + [ + 79, + 0.7494322935583441 + ], + [ + 80, + 0.7494012188470695 + ], + [ + 81, + 0.7493911152990194 + ], + [ + 82, + 0.7493913151652338 + ], + [ + 83, + 0.7493844626120792 + ], + [ + 84, + 0.7493761067751588 + ], + [ + 85, + 0.7493730743526231 + ], + [ + 86, + 0.7493879622325962 + ], + [ + 87, + 0.7493956231730691 + ], + [ + 88, + 0.7494007786848756 + ], + [ + 89, + 0.749378023795819 + ], + [ + 90, + 0.7493771370629041 + ], + [ + 91, + 0.7493743269328277 + ], + [ + 92, + 0.7493712575432526 + ], + [ + 93, + 0.749394418601039 + ], + [ + 94, + 0.7494010172300447 + ], + [ + 95, + 0.7494063411107746 + ], + [ + 96, + 0.7493997325774271 + ], + [ + 97, + 0.7493922172034428 + ], + [ + 98, + 0.7493986014625239 + ], + [ + 99, + 0.7493954058535361 + ], + [ + 100, + 0.7493942121735473 + ] + ] + }, + "freeze_after_1_fixed075": { + "test_acc": [ + 0.3057, + 0.2045, + 0.1305, + 0.1437, + 0.1215, + 0.1397, + 0.1243, + 0.1398, + 0.1417, + 0.1276, + 0.1214, + 0.1482, + 0.1262, + 0.1384, + 0.1293, + 0.1318, + 0.1206, + 0.1194, + 0.1399, + 0.1217, + 0.1127, + 0.1239, + 0.1435, + 0.1444, + 0.1318, + 0.1395, + 0.1269, + 0.1229, + 0.1453, + 0.1207, + 0.131, + 0.143, + 0.1326, + 0.1469, + 0.1292, + 0.1237, + 0.142, + 0.144, + 0.1332, + 0.1308, + 0.141, + 0.1356, + 0.1296, + 0.1429, + 0.1458, + 0.1489, + 0.1352, + 0.1446, + 0.1188, + 0.1201, + 0.1389, + 0.1247, + 0.126, + 0.1452, + 0.1453, + 0.124, + 0.1482, + 0.1322, + 0.1481, + 0.127, + 0.1464, + 0.1342, + 0.1244, + 0.1324, + 0.1426, + 0.1435, + 0.1219, + 0.1346, + 0.1428, + 0.1478, + 0.1444, + 0.1351, + 0.1382, + 0.147, + 0.1454, + 0.1399, + 0.1483, + 0.1449, + 0.1455, + 0.1449, + 0.1375, + 0.1381, + 0.1379, + 0.142, + 0.1375, + 0.1465, + 0.1457, + 0.1443, + 0.1444, + 0.1465, + 0.1454, + 0.1453, + 0.1457, + 0.1458, + 0.1457 + ], + "train_loss": [ + 1.9906995290374756, + 2.0737685120391847, + 2.2155820433044435, + 2.2721241608428957, + 2.2924982513427734, + 2.29488955909729, + 2.2970185789489745, + 2.2986293141174317, + 2.294429828338623, + 2.296617165603638, + 2.29678421836853, + 2.295137005081177, + 2.294201057739258, + 2.294304957885742, + 2.2925959534454345, + 2.2927727430725096, + 2.2926478660583496, + 2.2941555421447752, + 2.2922998066711426, + 2.2922051114654542, + 2.291230871047974, + 2.2909607197570803, + 2.290787425079346, + 2.289492441482544, + 2.2906497711944582, + 2.2900892761230467, + 2.289130498123169, + 2.288355968475342, + 2.287702822418213, + 2.288278614883423, + 2.2896552796936036, + 2.289241484832764, + 2.2869311714172365, + 2.286889280548096, + 2.287323820877075, + 2.2864588946533204, + 2.287139986495972, + 2.2864987995147703, + 2.2848596308898927, + 2.2853628147888183, + 2.2857934356689453, + 2.285166664352417, + 2.285637107772827, + 2.2866209410095215, + 2.2844921535491944, + 2.2842216230773924, + 2.2845423082733154, + 2.283267167892456, + 2.2844598588562013, + 2.2829305644226072, + 2.283300087814331, + 2.282644022369385, + 2.281965013961792, + 2.2826355504608156, + 2.281901387939453, + 2.282285031661987, + 2.282372682952881, + 2.281888911819458, + 2.2809345600891113, + 2.2809602374267577, + 2.281319549102783, + 2.2817195971679687, + 2.280134122848511, + 2.281717905654907, + 2.280990512542725, + 2.2795736303710936, + 2.2796770709991456, + 2.280508980102539, + 2.2805651750183107, + 2.280122625579834, + 2.2804177006530764, + 2.2795247370147704, + 2.2803760807800293, + 2.278886136932373, + 2.2790786742401123, + 2.2791181636810305, + 2.279737799835205, + 2.27865718788147, + 2.279473173675537, + 2.2787302172088624, + 2.278779428024292, + 2.2784378577423094, + 2.2783523303222655, + 2.278849890823364, + 2.2790181679534913, + 2.2783080220794676, + 2.279018676223755, + 2.278016226654053, + 2.2786078874969484, + 2.2791138971710203, + 2.2777640832519532, + 2.2778554022216797, + 2.2784366593933107, + 2.2778875938415526, + 2.2782850380706785 + ], + "gamma": [ + [ + 6, + 0.029229389503598213 + ], + [ + 7, + 0.022255003335885704 + ], + [ + 8, + 0.022101536189438775 + ], + [ + 9, + 0.02245766983833164 + ], + [ + 10, + 0.02511510974727571 + ], + [ + 13, + 0.007977887464221567 + ], + [ + 15, + 0.005509988921403419 + ], + [ + 20, + 0.0035846279861289077 + ], + [ + 25, + 0.0045192451416369295 + ], + [ + 35, + 0.004759672311593022 + ], + [ + 45, + 0.006429436665939647 + ], + [ + 55, + 0.006245920291348739 + ], + [ + 65, + 0.005974134820235122 + ], + [ + 75, + 0.0057584647736348415 + ], + [ + 85, + 0.005155308514304124 + ], + [ + 95, + 0.00543625851150864 + ], + [ + 100, + 0.005401106335625627 + ] + ], + "rho": [ + [ + 6, + -0.004526643548160791 + ], + [ + 7, + 0.006596404826268554 + ], + [ + 8, + -0.005334540968760848 + ], + [ + 9, + 0.015801534289494157 + ], + [ + 10, + -0.0070290109142661095 + ], + [ + 13, + 0.014296236913651228 + ], + [ + 15, + -0.0012522098841145635 + ], + [ + 20, + -0.0065160891972482204 + ], + [ + 25, + 0.003924963064491749 + ], + [ + 35, + -0.0048978012055158615 + ], + [ + 45, + -0.003648596117272973 + ], + [ + 55, + 0.004803311545401812 + ], + [ + 65, + -0.003128552343696356 + ], + [ + 75, + 0.0007290660869330168 + ], + [ + 85, + -0.010232515633106232 + ], + [ + 95, + 0.00676717609167099 + ], + [ + 100, + -0.003135102801024914 + ] + ], + "alpha_eff": [ + [ + 6, + 0.749923294977622 + ], + [ + 7, + 0.749905672226397 + ], + [ + 8, + 0.7499356070495369 + ], + [ + 9, + 0.7499492318105373 + ], + [ + 10, + 0.7499561113658882 + ], + [ + 11, + 0.7499592320476945 + ], + [ + 12, + 0.7499606817947195 + ], + [ + 13, + 0.7499613785850733 + ], + [ + 14, + 0.7499616792301997 + ], + [ + 15, + 0.7499617264427558 + ], + [ + 16, + 0.7499616305173084 + ], + [ + 17, + 0.749961421920658 + ], + [ + 18, + 0.749961138829684 + ], + [ + 19, + 0.7499608219196955 + ], + [ + 20, + 0.7499604845040225 + ], + [ + 21, + 0.7499601619924307 + ], + [ + 22, + 0.7499598537310682 + ], + [ + 23, + 0.7499595938790594 + ], + [ + 24, + 0.7499593658764514 + ], + [ + 25, + 0.7499591768673664 + ], + [ + 26, + 0.7499590363427018 + ], + [ + 27, + 0.7499589173882474 + ], + [ + 28, + 0.7499588217775399 + ], + [ + 29, + 0.749958747288934 + ], + [ + 30, + 0.7499586755412131 + ], + [ + 31, + 0.749958612839054 + ], + [ + 32, + 0.7499585615289758 + ], + [ + 33, + 0.749958508492663 + ], + [ + 34, + 0.7499584651594168 + ], + [ + 35, + 0.74995841130046 + ], + [ + 36, + 0.7499583685606458 + ], + [ + 37, + 0.7499583289325864 + ], + [ + 38, + 0.7499582876827926 + ], + [ + 39, + 0.7499582574778539 + ], + [ + 40, + 0.7499582279911792 + ], + [ + 41, + 0.7499581946541439 + ], + [ + 42, + 0.7499581739635384 + ], + [ + 43, + 0.7499581524165019 + ], + [ + 44, + 0.7499581320832189 + ], + [ + 45, + 0.7499581102362035 + ], + [ + 46, + 0.7499580982742708 + ], + [ + 47, + 0.7499580923809621 + ], + [ + 48, + 0.7499580815652703 + ], + [ + 49, + 0.749958067357978 + ], + [ + 50, + 0.7499580530157078 + ], + [ + 51, + 0.749958048069753 + ], + [ + 52, + 0.7499580363606989 + ], + [ + 53, + 0.749958029240193 + ], + [ + 54, + 0.7499580162128252 + ], + [ + 55, + 0.7499580007917895 + ], + [ + 56, + 0.7499580021673148 + ], + [ + 57, + 0.7499579822925718 + ], + [ + 58, + 0.7499579734694033 + ], + [ + 59, + 0.7499579618850298 + ], + [ + 60, + 0.7499579621312126 + ], + [ + 61, + 0.7499579521347911 + ], + [ + 62, + 0.7499579480991593 + ], + [ + 63, + 0.7499579435307815 + ], + [ + 64, + 0.7499579342626495 + ], + [ + 65, + 0.7499579337433985 + ], + [ + 66, + 0.7499579322364557 + ], + [ + 67, + 0.7499579328837135 + ], + [ + 68, + 0.7499579263127302 + ], + [ + 69, + 0.7499579250618643 + ], + [ + 70, + 0.7499579235953246 + ], + [ + 71, + 0.749957920732971 + ], + [ + 72, + 0.7499579202710053 + ], + [ + 73, + 0.7499579181503966 + ], + [ + 74, + 0.7499579123177976 + ], + [ + 75, + 0.7499579137641768 + ], + [ + 76, + 0.7499579142260154 + ], + [ + 77, + 0.7499579142091058 + ], + [ + 78, + 0.7499579169805186 + ], + [ + 79, + 0.749957916205036 + ], + [ + 80, + 0.7499579182178123 + ], + [ + 81, + 0.7499579091148644 + ], + [ + 82, + 0.7499579113737009 + ], + [ + 83, + 0.7499579126616054 + ], + [ + 84, + 0.7499579107432754 + ], + [ + 85, + 0.7499579087406157 + ], + [ + 86, + 0.7499579139191689 + ], + [ + 87, + 0.7499579105578154 + ], + [ + 88, + 0.7499579109522972 + ], + [ + 89, + 0.7499579126211704 + ], + [ + 90, + 0.7499579089698573 + ], + [ + 91, + 0.7499579074897771 + ], + [ + 92, + 0.7499579114917091 + ], + [ + 93, + 0.7499579054028283 + ], + [ + 94, + 0.749957910722974 + ], + [ + 95, + 0.7499579117951909 + ], + [ + 96, + 0.7499579089563578 + ], + [ + 97, + 0.7499579072572299 + ], + [ + 98, + 0.7499579098599333 + ], + [ + 99, + 0.749957915638598 + ], + [ + 100, + 0.7499579170546363 + ] + ] + }, + "freeze_after_5_fixed075": { + "test_acc": [ + 0.3068, + 0.3108, + 0.3075, + 0.2962, + 0.3064, + 0.2256, + 0.1503, + 0.1093, + 0.1576, + 0.0999, + 0.1164, + 0.142, + 0.1179, + 0.1338, + 0.1269, + 0.1257, + 0.1182, + 0.1183, + 0.1323, + 0.1186, + 0.1142, + 0.1362, + 0.1396, + 0.1419, + 0.1293, + 0.1309, + 0.125, + 0.1202, + 0.1429, + 0.1173, + 0.1289, + 0.1405, + 0.1243, + 0.1438, + 0.1251, + 0.1217, + 0.1388, + 0.1397, + 0.1309, + 0.1286, + 0.1361, + 0.1235, + 0.1284, + 0.1401, + 0.1427, + 0.1471, + 0.133, + 0.1262, + 0.1176, + 0.1175, + 0.1316, + 0.1188, + 0.1251, + 0.1443, + 0.1442, + 0.1226, + 0.144, + 0.1168, + 0.1276, + 0.126, + 0.1431, + 0.1326, + 0.1235, + 0.1229, + 0.1398, + 0.1425, + 0.1179, + 0.1323, + 0.1406, + 0.1434, + 0.1428, + 0.1334, + 0.1334, + 0.1461, + 0.1421, + 0.134, + 0.1426, + 0.141, + 0.1422, + 0.1166, + 0.134, + 0.1349, + 0.1338, + 0.1376, + 0.1347, + 0.1452, + 0.1437, + 0.1423, + 0.1419, + 0.1402, + 0.1419, + 0.1423, + 0.1425, + 0.1427, + 0.1429 + ], + "train_loss": [ + 1.9893489678192138, + 1.985487917022705, + 1.9859093509292602, + 1.983449199180603, + 1.9827121502685547, + 2.0594376360321043, + 2.207141205444336, + 2.2714959971618653, + 2.2873566510772707, + 2.2961153761291504, + 2.2985075205993653, + 2.2977035494995115, + 2.2974455174255373, + 2.2976522528076173, + 2.296003302154541, + 2.2963047105407717, + 2.2965452262115478, + 2.297999372329712, + 2.2962898539733887, + 2.2960005585479735, + 2.2950949415588378, + 2.2948854180908205, + 2.2944784745025633, + 2.29330205947876, + 2.2943646950531007, + 2.2941731243896486, + 2.293124954071045, + 2.2922902240753174, + 2.2919424175262453, + 2.29253370513916, + 2.294221692428589, + 2.2934059229278563, + 2.2912623796844485, + 2.291140076522827, + 2.291435696258545, + 2.2908271159362794, + 2.291476573486328, + 2.2907359911346434, + 2.289365125808716, + 2.2899449461364747, + 2.2903112524414064, + 2.2897306018066406, + 2.2900110057067873, + 2.2913283332824705, + 2.2890629961395264, + 2.288549022140503, + 2.288963945159912, + 2.287618798675537, + 2.289065319366455, + 2.287497896575928, + 2.2880995404815674, + 2.2870908855438232, + 2.2864917352294922, + 2.2871037657928466, + 2.2865074630737303, + 2.28678498550415, + 2.2870698027038574, + 2.2863846828460694, + 2.285519721069336, + 2.2854560637664796, + 2.2857414881134033, + 2.286112783050537, + 2.2844998125457763, + 2.286092988128662, + 2.2855831603240966, + 2.2841854079437254, + 2.284118550491333, + 2.2851279951477053, + 2.2849759539031984, + 2.2846845874023436, + 2.2848418711090086, + 2.28398831489563, + 2.2847050997924803, + 2.2832656199645998, + 2.283573601608276, + 2.283536388168335, + 2.2839898639678955, + 2.2829865564727783, + 2.283732427444458, + 2.2832025003051757, + 2.283129920578003, + 2.2828851631164553, + 2.282600374755859, + 2.283195795211792, + 2.2834493016815185, + 2.2826498027038573, + 2.2833422844696045, + 2.2822403409576415, + 2.2830539070129396, + 2.2833374087524416, + 2.282107705001831, + 2.2822584789276124, + 2.2828566105651857, + 2.2821592779541016, + 2.282512705154419 + ], + "gamma": [ + [ + 6, + 0.02705257706111297 + ], + [ + 7, + 0.028260178864002228 + ], + [ + 8, + 0.03390599135309458 + ], + [ + 9, + 0.04262567771365866 + ], + [ + 10, + 0.039130375924287364 + ], + [ + 13, + 0.015935751143842936 + ], + [ + 15, + 0.020201866049319506 + ], + [ + 20, + 0.016146464011399075 + ], + [ + 25, + 0.01891520711069461 + ], + [ + 35, + 0.015422215528815286 + ], + [ + 45, + 0.02083021820931208 + ], + [ + 55, + 0.020073247775201253 + ], + [ + 65, + 0.019591293325447623 + ], + [ + 75, + 0.019224833375290018 + ], + [ + 85, + 0.017693829966447083 + ], + [ + 95, + 0.01843330923713893 + ], + [ + 100, + 0.01831494387300836 + ] + ], + "rho": [ + [ + 6, + 0.019902817904949188 + ], + [ + 7, + -0.005045581376180053 + ], + [ + 8, + 0.01920311595313251 + ], + [ + 9, + 0.013431413099169731 + ], + [ + 10, + 0.015046576038002968 + ], + [ + 13, + 0.005307852290570736 + ], + [ + 15, + 0.003655511813121848 + ], + [ + 20, + -0.0007810932584106922 + ], + [ + 25, + -0.0020412285812199116 + ], + [ + 35, + -0.0052429186180233955 + ], + [ + 45, + 0.0074201589450240135 + ], + [ + 55, + 0.0018254606984555721 + ], + [ + 65, + 0.001219858299009502 + ], + [ + 75, + 0.004192978609353304 + ], + [ + 85, + -0.007369007915258408 + ], + [ + 95, + 0.00039116619154810905 + ], + [ + 100, + -0.0015693700406700373 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499202477378032 + ], + [ + 7, + 0.7498463447134337 + ], + [ + 8, + 0.7497995274555987 + ], + [ + 9, + 0.749756139810235 + ], + [ + 10, + 0.7496929019618472 + ], + [ + 11, + 0.7496816831117289 + ], + [ + 12, + 0.7497748903839642 + ], + [ + 13, + 0.7498041658227375 + ], + [ + 14, + 0.7498150362468194 + ], + [ + 15, + 0.7498202200942068 + ], + [ + 16, + 0.7498227834360003 + ], + [ + 17, + 0.7498240283191057 + ], + [ + 18, + 0.7498245421262388 + ], + [ + 19, + 0.7498246437120061 + ], + [ + 20, + 0.7498246045407647 + ], + [ + 21, + 0.7498244894883069 + ], + [ + 22, + 0.7498244285921248 + ], + [ + 23, + 0.7498244377216693 + ], + [ + 24, + 0.7498245354700839 + ], + [ + 25, + 0.7498246065422424 + ], + [ + 26, + 0.7498247640764162 + ], + [ + 27, + 0.7498249075535127 + ], + [ + 28, + 0.7498250394874728 + ], + [ + 29, + 0.749825150388344 + ], + [ + 30, + 0.7498252206431467 + ], + [ + 31, + 0.749825294617509 + ], + [ + 32, + 0.7498253178038817 + ], + [ + 33, + 0.7498253219144003 + ], + [ + 34, + 0.7498253056198279 + ], + [ + 35, + 0.7498252652410382 + ], + [ + 36, + 0.7498252317435838 + ], + [ + 37, + 0.7498252206297409 + ], + [ + 38, + 0.7498252004636857 + ], + [ + 39, + 0.7498252599755928 + ], + [ + 40, + 0.7498253018903019 + ], + [ + 41, + 0.7498253724084616 + ], + [ + 42, + 0.7498254763600888 + ], + [ + 43, + 0.7498255577080846 + ], + [ + 44, + 0.7498256766308641 + ], + [ + 45, + 0.7498257966368489 + ], + [ + 46, + 0.7498259134263283 + ], + [ + 47, + 0.7498260170496108 + ], + [ + 48, + 0.7498261211891766 + ], + [ + 49, + 0.7498262231826883 + ], + [ + 50, + 0.7498263280341823 + ], + [ + 51, + 0.7498263991728029 + ], + [ + 52, + 0.749826493490658 + ], + [ + 53, + 0.749826597346364 + ], + [ + 54, + 0.7498266555449464 + ], + [ + 55, + 0.7498267398731024 + ], + [ + 56, + 0.7498268404379499 + ], + [ + 57, + 0.7498268989263888 + ], + [ + 58, + 0.7498269682220481 + ], + [ + 59, + 0.7498270369841208 + ], + [ + 60, + 0.7498270918177319 + ], + [ + 61, + 0.7498271469011805 + ], + [ + 62, + 0.7498272115254345 + ], + [ + 63, + 0.7498272387579276 + ], + [ + 64, + 0.7498273027242259 + ], + [ + 65, + 0.7498273423498409 + ], + [ + 66, + 0.749827357665683 + ], + [ + 67, + 0.7498274131169155 + ], + [ + 68, + 0.749827438543571 + ], + [ + 69, + 0.7498274592696411 + ], + [ + 70, + 0.749827484794581 + ], + [ + 71, + 0.7498275174678041 + ], + [ + 72, + 0.7498275337586687 + ], + [ + 73, + 0.749827543715034 + ], + [ + 74, + 0.749827559013781 + ], + [ + 75, + 0.7498275711368638 + ], + [ + 76, + 0.7498275865097452 + ], + [ + 77, + 0.7498276108062035 + ], + [ + 78, + 0.7498276224432655 + ], + [ + 79, + 0.7498276336244346 + ], + [ + 80, + 0.7498276402496034 + ], + [ + 81, + 0.7498276470536364 + ], + [ + 82, + 0.7498276455109267 + ], + [ + 83, + 0.7498276600473064 + ], + [ + 84, + 0.7498276680286947 + ], + [ + 85, + 0.7498276733984254 + ], + [ + 86, + 0.7498276956736362 + ], + [ + 87, + 0.7498276915661669 + ], + [ + 88, + 0.7498276801686883 + ], + [ + 89, + 0.7498276945159164 + ], + [ + 90, + 0.7498276797773024 + ], + [ + 91, + 0.7498277005874554 + ], + [ + 92, + 0.7498276913637241 + ], + [ + 93, + 0.7498276957441666 + ], + [ + 94, + 0.7498277056531762 + ], + [ + 95, + 0.7498276953192542 + ], + [ + 96, + 0.7498277054741631 + ], + [ + 97, + 0.7498277021465464 + ], + [ + 98, + 0.7498276917989567 + ], + [ + 99, + 0.7498276940634648 + ], + [ + 100, + 0.7498277162777363 + ] + ] + }, + "freeze_after_1_decay_to_025": { + "test_acc": [ + 0.3054, + 0.2227, + 0.1452, + 0.136, + 0.1258, + 0.1263, + 0.1174, + 0.1035, + 0.1602, + 0.1073, + 0.1203, + 0.1415, + 0.104, + 0.1321, + 0.1003, + 0.1152, + 0.1148, + 0.1199, + 0.1263, + 0.1152, + 0.1164, + 0.1345, + 0.1286, + 0.1241, + 0.1253, + 0.1248, + 0.1227, + 0.1174, + 0.1408, + 0.1181, + 0.1275, + 0.1328, + 0.1189, + 0.1426, + 0.1265, + 0.1183, + 0.1377, + 0.138, + 0.1293, + 0.1281, + 0.1308, + 0.1236, + 0.1282, + 0.1349, + 0.1407, + 0.1473, + 0.1306, + 0.1269, + 0.115, + 0.1113, + 0.1331, + 0.1191, + 0.1231, + 0.1416, + 0.1428, + 0.1213, + 0.143, + 0.1122, + 0.115, + 0.1254, + 0.1404, + 0.1307, + 0.1203, + 0.1155, + 0.1389, + 0.1395, + 0.1173, + 0.1337, + 0.1389, + 0.1361, + 0.1393, + 0.1311, + 0.1297, + 0.1419, + 0.1404, + 0.1325, + 0.135, + 0.1369, + 0.1375, + 0.1133, + 0.1271, + 0.1297, + 0.1301, + 0.1279, + 0.1296, + 0.1423, + 0.1392, + 0.1393, + 0.1397, + 0.1327, + 0.1379, + 0.139, + 0.1402, + 0.1392, + 0.1392 + ], + "train_loss": [ + 1.9895063690948487, + 2.0717621327209472, + 2.189962035522461, + 2.2329315424346925, + 2.260052084579468, + 2.2688772117614744, + 2.2779186013793944, + 2.2852122827148436, + 2.2846843614196777, + 2.291246020050049, + 2.2944116230010985, + 2.294942557373047, + 2.29667289352417, + 2.298328145904541, + 2.297607911529541, + 2.2989455223083497, + 2.299919396362305, + 2.3013042308044436, + 2.3001043883514405, + 2.29936297706604, + 2.298790442123413, + 2.2988700410461425, + 2.297741695022583, + 2.296872480621338, + 2.29784930770874, + 2.2974551319885252, + 2.2960880307769775, + 2.295343821411133, + 2.2947800379180907, + 2.2954108971405027, + 2.296628145904541, + 2.2958906733703612, + 2.29336536026001, + 2.2930805914306642, + 2.2929298010253905, + 2.2927328889465333, + 2.293177236251831, + 2.292220322189331, + 2.290796268234253, + 2.291155597076416, + 2.2914103716278076, + 2.2908911601257325, + 2.2909919847106934, + 2.2923007972717286, + 2.289861133880615, + 2.2892761711120606, + 2.289645308380127, + 2.2883711812591554, + 2.2895432438659666, + 2.287957716674805, + 2.2885722449493406, + 2.287502489776611, + 2.286777231903076, + 2.28740978805542, + 2.2868827954864503, + 2.2870309147644043, + 2.2870197551727296, + 2.2863273274230957, + 2.2856398780059815, + 2.2856489250183105, + 2.2856975270080566, + 2.2862225410461425, + 2.2844740558624266, + 2.2859574056243894, + 2.2855120135498046, + 2.2841620223236085, + 2.2840080644989014, + 2.284847536087036, + 2.284840629043579, + 2.284350129470825, + 2.2846198870849608, + 2.283844443511963, + 2.284575237045288, + 2.28322234664917, + 2.283361275177002, + 2.283530992126465, + 2.283763175811768, + 2.282791965713501, + 2.283448165206909, + 2.2828492040252684, + 2.283028067550659, + 2.2826764515686033, + 2.2823099598693846, + 2.283018860397339, + 2.283153437652588, + 2.282438748855591, + 2.283022185211182, + 2.281942760696411, + 2.282656005859375, + 2.283106033554077, + 2.2819691327667235, + 2.281947142944336, + 2.282431115036011, + 2.28206281791687, + 2.282211386566162 + ], + "gamma": [ + [ + 6, + 0.029319611843675375 + ], + [ + 7, + 0.03185648733051494 + ], + [ + 8, + 0.04233608162030578 + ], + [ + 9, + 0.04189345566555858 + ], + [ + 10, + 0.047544537112116814 + ], + [ + 13, + 0.03297986194957048 + ], + [ + 15, + 0.026738733984529972 + ], + [ + 20, + 0.016979411127977073 + ], + [ + 25, + 0.01216340645623859 + ], + [ + 35, + -0.0019454771036180318 + ], + [ + 45, + -0.0024222739907600044 + ], + [ + 55, + -0.002981824864036753 + ], + [ + 65, + -0.0023194947486899764 + ], + [ + 75, + -0.002351447182263655 + ], + [ + 85, + -0.0024025850020166217 + ], + [ + 95, + -0.002344829682783711 + ], + [ + 100, + -0.0023605154200367906 + ] + ], + "rho": [ + [ + 6, + 0.024813755182549357 + ], + [ + 7, + 0.02137202536687255 + ], + [ + 8, + -0.008550406782887876 + ], + [ + 9, + -0.014014755026437342 + ], + [ + 10, + 0.003713869256898761 + ], + [ + 13, + -0.00019413704285398126 + ], + [ + 15, + -0.004616216290742159 + ], + [ + 20, + 0.004534890875220299 + ], + [ + 25, + -0.0003467597998678684 + ], + [ + 35, + -0.013164100237190723 + ], + [ + 45, + -0.004108893685042858 + ], + [ + 55, + -0.005393396131694317 + ], + [ + 65, + 0.0037673721089959145 + ], + [ + 75, + 0.002991759218275547 + ], + [ + 85, + 0.0030559878796339035 + ], + [ + 95, + 0.0011144964955747128 + ], + [ + 100, + -0.00562389986589551 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499215605640026 + ], + [ + 7, + 0.6498885895229987 + ], + [ + 8, + 0.5499278178579371 + ], + [ + 9, + 0.4499412865798823 + ], + [ + 10, + 0.3499508856541087 + ], + [ + 11, + 0.24996128541858828 + ], + [ + 12, + 0.2499621277638252 + ], + [ + 13, + 0.24996268584560855 + ], + [ + 14, + 0.2499630643239716 + ], + [ + 15, + 0.2499633203326066 + ], + [ + 16, + 0.24996357761505564 + ], + [ + 17, + 0.24996378587101792 + ], + [ + 18, + 0.24996401189373949 + ], + [ + 19, + 0.2499642051366507 + ], + [ + 20, + 0.24996440432532102 + ], + [ + 21, + 0.24996460811141474 + ], + [ + 22, + 0.24996479507118088 + ], + [ + 23, + 0.24996493590356497 + ], + [ + 24, + 0.2499650811884471 + ], + [ + 25, + 0.24996520118670035 + ], + [ + 26, + 0.24996530426771693 + ], + [ + 27, + 0.24996540318596389 + ], + [ + 28, + 0.24996546582591034 + ], + [ + 29, + 0.24996552319418933 + ], + [ + 30, + 0.24996555460521513 + ], + [ + 31, + 0.2499656046693103 + ], + [ + 32, + 0.24996562179889437 + ], + [ + 33, + 0.24996564218791698 + ], + [ + 34, + 0.24996565128189985 + ], + [ + 35, + 0.2499656640801942 + ], + [ + 36, + 0.249965671182188 + ], + [ + 37, + 0.2499656635678768 + ], + [ + 38, + 0.24996566751146188 + ], + [ + 39, + 0.24996565557938735 + ], + [ + 40, + 0.2499656398790017 + ], + [ + 41, + 0.24996562954120802 + ], + [ + 42, + 0.24996561563060876 + ], + [ + 43, + 0.24996559801562257 + ], + [ + 44, + 0.2499655778322152 + ], + [ + 45, + 0.24996555878137158 + ], + [ + 46, + 0.2499655444965953 + ], + [ + 47, + 0.24996551827972838 + ], + [ + 48, + 0.24996550263323514 + ], + [ + 49, + 0.24996548777208452 + ], + [ + 50, + 0.24996546920322563 + ], + [ + 51, + 0.24996543994936327 + ], + [ + 52, + 0.24996543582032632 + ], + [ + 53, + 0.24996539768484524 + ], + [ + 54, + 0.24996538297205342 + ], + [ + 55, + 0.24996539272334395 + ], + [ + 56, + 0.2499653540216129 + ], + [ + 57, + 0.24996533929186665 + ], + [ + 58, + 0.24996531687037848 + ], + [ + 59, + 0.24996531187167323 + ], + [ + 60, + 0.24996528421891845 + ], + [ + 61, + 0.24996527040606908 + ], + [ + 62, + 0.24996524750259488 + ], + [ + 63, + 0.2499652417994367 + ], + [ + 64, + 0.24996522915611907 + ], + [ + 65, + 0.24996520556498233 + ], + [ + 66, + 0.24996518516584246 + ], + [ + 67, + 0.24996518126601272 + ], + [ + 68, + 0.24996517745044652 + ], + [ + 69, + 0.24996517611567165 + ], + [ + 70, + 0.24996515297285476 + ], + [ + 71, + 0.2499651448967178 + ], + [ + 72, + 0.2499651331466676 + ], + [ + 73, + 0.24996512179775632 + ], + [ + 74, + 0.24996512290329126 + ], + [ + 75, + 0.24996511244085787 + ], + [ + 76, + 0.249965101273893 + ], + [ + 77, + 0.2499651004918571 + ], + [ + 78, + 0.24996508772048512 + ], + [ + 79, + 0.24996507751418334 + ], + [ + 80, + 0.24996506879773767 + ], + [ + 81, + 0.24996508152526425 + ], + [ + 82, + 0.24996508364200018 + ], + [ + 83, + 0.24996506643488683 + ], + [ + 84, + 0.24996507066164142 + ], + [ + 85, + 0.24996507105268392 + ], + [ + 86, + 0.24996506060701437 + ], + [ + 87, + 0.249965055918445 + ], + [ + 88, + 0.2499650537713543 + ], + [ + 89, + 0.24996505500845378 + ], + [ + 90, + 0.2499650492917446 + ], + [ + 91, + 0.24996504976698292 + ], + [ + 92, + 0.24996505515333245 + ], + [ + 93, + 0.24996506002726224 + ], + [ + 94, + 0.24996505054233178 + ], + [ + 95, + 0.2499650415224445 + ], + [ + 96, + 0.24996505113215065 + ], + [ + 97, + 0.2499650620260496 + ], + [ + 98, + 0.24996504605931247 + ], + [ + 99, + 0.24996503486876115 + ], + [ + 100, + 0.2499650427021916 + ] + ] + }, + "freeze_after_5_decay_to_025": { + "test_acc": [ + 0.3052, + 0.3121, + 0.3135, + 0.2994, + 0.3083, + 0.2037, + 0.1368, + 0.1231, + 0.1271, + 0.1138, + 0.1191, + 0.1163, + 0.1162, + 0.1135, + 0.1155, + 0.0967, + 0.109, + 0.1051, + 0.1075, + 0.0935, + 0.0996, + 0.1119, + 0.1027, + 0.1278, + 0.1004, + 0.1091, + 0.1141, + 0.113, + 0.1348, + 0.1194, + 0.1242, + 0.1191, + 0.1192, + 0.1349, + 0.1207, + 0.1144, + 0.1316, + 0.1325, + 0.1241, + 0.1237, + 0.1276, + 0.1121, + 0.1233, + 0.122, + 0.1335, + 0.1379, + 0.1264, + 0.1214, + 0.1121, + 0.108, + 0.1317, + 0.1181, + 0.1162, + 0.1366, + 0.1369, + 0.1254, + 0.1211, + 0.106, + 0.1075, + 0.1227, + 0.1201, + 0.1274, + 0.1188, + 0.1102, + 0.1313, + 0.1336, + 0.1129, + 0.1283, + 0.1301, + 0.1152, + 0.1325, + 0.1278, + 0.1247, + 0.1357, + 0.134, + 0.1224, + 0.1093, + 0.1188, + 0.1325, + 0.1097, + 0.1196, + 0.1272, + 0.1253, + 0.1126, + 0.1238, + 0.1224, + 0.1263, + 0.1342, + 0.1111, + 0.1095, + 0.1089, + 0.1191, + 0.1143, + 0.1131, + 0.1131 + ], + "train_loss": [ + 1.9889914673614502, + 1.9853284645080567, + 1.9883257375717163, + 1.9826136252593993, + 1.985386326980591, + 2.068510132598877, + 2.2071184797668457, + 2.252070314407349, + 2.262799511871338, + 2.271883014907837, + 2.276685047454834, + 2.2789263591766358, + 2.2829609899139403, + 2.2874077117156983, + 2.289303440246582, + 2.293695969619751, + 2.2960100469207765, + 2.299179527053833, + 2.299998391647339, + 2.2999639778137206, + 2.301144305267334, + 2.3016930992889404, + 2.3010191550445556, + 2.301623288574219, + 2.3021187420654297, + 2.30279943107605, + 2.3010086586761473, + 2.3007896277618407, + 2.3004655308532715, + 2.3013855320739744, + 2.3028329793548585, + 2.3016249320983886, + 2.2996341718292235, + 2.299152314529419, + 2.298686719970703, + 2.2991080980682375, + 2.2990331848907473, + 2.298325881500244, + 2.29721604927063, + 2.297458392868042, + 2.297814186630249, + 2.297540751800537, + 2.2971647343444825, + 2.298780792694092, + 2.296483359832764, + 2.2955091331481934, + 2.296101309814453, + 2.294827574005127, + 2.2959980039978025, + 2.2944129446411132, + 2.2954401092529295, + 2.293963470993042, + 2.293216000289917, + 2.2939060804748537, + 2.293471497955322, + 2.2934607655334474, + 2.2936269941711425, + 2.2927763636779783, + 2.292233616256714, + 2.29233764793396, + 2.2921327173614503, + 2.292641021270752, + 2.290940444793701, + 2.292282715377808, + 2.2920145623779296, + 2.290925247039795, + 2.2905999392700194, + 2.291516679534912, + 2.291281402359009, + 2.2909249305725097, + 2.2908486936950685, + 2.290478879928589, + 2.291001184539795, + 2.28960931350708, + 2.2898020780944823, + 2.2898542040252687, + 2.2900171630859374, + 2.289037522201538, + 2.289808230667114, + 2.2894698133850095, + 2.2893528965759278, + 2.289201781158447, + 2.2886661543273927, + 2.289276965789795, + 2.2895079779052736, + 2.28888594833374, + 2.289304996032715, + 2.2882724632263183, + 2.289115521774292, + 2.2893903966522218, + 2.288375448074341, + 2.2882951035308836, + 2.28868325088501, + 2.288313069458008, + 2.288534205932617 + ], + "gamma": [ + [ + 6, + 0.030998411762993783 + ], + [ + 7, + 0.02042932203039527 + ], + [ + 8, + 0.025238439673557878 + ], + [ + 9, + 0.024348934122826904 + ], + [ + 10, + 0.02691327966749668 + ], + [ + 13, + 0.04581431741826236 + ], + [ + 15, + 0.05122767586726695 + ], + [ + 20, + 0.028180050187074812 + ], + [ + 25, + 0.004695354848081479 + ], + [ + 35, + 0.003258639584601042 + ], + [ + 45, + 0.0060973436638960266 + ], + [ + 55, + 0.0026502537202759413 + ], + [ + 65, + 0.0019636713411728124 + ], + [ + 75, + 0.0013042573217489917 + ], + [ + 85, + 0.0007217170104922843 + ], + [ + 95, + 0.0009432140236640407 + ], + [ + 100, + 0.0008838386715979141 + ] + ], + "rho": [ + [ + 6, + 0.01131400465965271 + ], + [ + 7, + 0.0169760164571926 + ], + [ + 8, + -0.01151197380386293 + ], + [ + 9, + 0.007203209912404418 + ], + [ + 10, + -4.300149157643318e-05 + ], + [ + 13, + -0.0012576030567288399 + ], + [ + 15, + -0.0009340029209852219 + ], + [ + 20, + -0.0016878610476851463 + ], + [ + 25, + -0.003051650244742632 + ], + [ + 35, + -0.005875409580767155 + ], + [ + 45, + -0.0018643303774297237 + ], + [ + 55, + 0.0009776366641744971 + ], + [ + 65, + 0.0013682227581739426 + ], + [ + 75, + 0.003012792905792594 + ], + [ + 85, + -0.01262329239398241 + ], + [ + 95, + -0.0034377884585410357 + ], + [ + 100, + 0.005971882026642561 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499221587332795 + ], + [ + 7, + 0.7498518854867786 + ], + [ + 8, + 0.7498149497377955 + ], + [ + 9, + 0.7497333518679905 + ], + [ + 10, + 0.7496576925518745 + ], + [ + 11, + 0.649646096496131 + ], + [ + 12, + 0.5497254744391575 + ], + [ + 13, + 0.4497598983126942 + ], + [ + 14, + 0.3497929197623351 + ], + [ + 15, + 0.24983518768582047 + ], + [ + 16, + 0.24983892424235482 + ], + [ + 17, + 0.2498417139676731 + ], + [ + 18, + 0.24984401479168628 + ], + [ + 19, + 0.24984593508981487 + ], + [ + 20, + 0.24984749999759318 + ], + [ + 21, + 0.2498488692465181 + ], + [ + 22, + 0.2498499398578784 + ], + [ + 23, + 0.24985075457954833 + ], + [ + 24, + 0.24985142408517985 + ], + [ + 25, + 0.24985192621001853 + ], + [ + 26, + 0.24985235355814475 + ], + [ + 27, + 0.24985268752743725 + ], + [ + 28, + 0.2498529223564429 + ], + [ + 29, + 0.2498530995331157 + ], + [ + 30, + 0.24985317803507076 + ], + [ + 31, + 0.24985332962472304 + ], + [ + 32, + 0.24985336584290696 + ], + [ + 33, + 0.24985339268117196 + ], + [ + 34, + 0.24985340836624917 + ], + [ + 35, + 0.24985343280065775 + ], + [ + 36, + 0.24985343479985006 + ], + [ + 37, + 0.24985338171996366 + ], + [ + 38, + 0.24985338190189033 + ], + [ + 39, + 0.24985336549546372 + ], + [ + 40, + 0.24985329346337362 + ], + [ + 41, + 0.24985323826291034 + ], + [ + 42, + 0.24985321131998126 + ], + [ + 43, + 0.24985317168636909 + ], + [ + 44, + 0.2498531187479913 + ], + [ + 45, + 0.24985305580921366 + ], + [ + 46, + 0.24985302543067442 + ], + [ + 47, + 0.24985298309286144 + ], + [ + 48, + 0.2498529583618077 + ], + [ + 49, + 0.24985293710674641 + ], + [ + 50, + 0.24985288952612472 + ], + [ + 51, + 0.24985283885329918 + ], + [ + 52, + 0.24985284015502204 + ], + [ + 53, + 0.24985275224582726 + ], + [ + 54, + 0.24985271617612245 + ], + [ + 55, + 0.24985278660278676 + ], + [ + 56, + 0.24985270413912475 + ], + [ + 57, + 0.24985267867606448 + ], + [ + 58, + 0.24985261926432437 + ], + [ + 59, + 0.24985265660538555 + ], + [ + 60, + 0.2498525589688618 + ], + [ + 61, + 0.2498525948263581 + ], + [ + 62, + 0.24985250615215845 + ], + [ + 63, + 0.24985253626419848 + ], + [ + 64, + 0.24985252458806803 + ], + [ + 65, + 0.24985244966970346 + ], + [ + 66, + 0.24985243633144938 + ], + [ + 67, + 0.2498524231990304 + ], + [ + 68, + 0.24985243464573753 + ], + [ + 69, + 0.24985244959899414 + ], + [ + 70, + 0.2498523964585009 + ], + [ + 71, + 0.24985237284663436 + ], + [ + 72, + 0.2498523581157608 + ], + [ + 73, + 0.2498523440457847 + ], + [ + 74, + 0.24985236879381156 + ], + [ + 75, + 0.2498523393358387 + ], + [ + 76, + 0.24985232552208136 + ], + [ + 77, + 0.2498523213984054 + ], + [ + 78, + 0.24985232647951547 + ], + [ + 79, + 0.24985228393588338 + ], + [ + 80, + 0.24985225037440933 + ], + [ + 81, + 0.24985230778709028 + ], + [ + 82, + 0.2498523135425587 + ], + [ + 83, + 0.24985228212536653 + ], + [ + 84, + 0.24985226981544117 + ], + [ + 85, + 0.2498522997423083 + ], + [ + 86, + 0.24985229817429594 + ], + [ + 87, + 0.24985227304543167 + ], + [ + 88, + 0.2498522585136201 + ], + [ + 89, + 0.24985226070861766 + ], + [ + 90, + 0.2498522775804293 + ], + [ + 91, + 0.24985226001407726 + ], + [ + 92, + 0.2498522820512644 + ], + [ + 93, + 0.24985229769889214 + ], + [ + 94, + 0.24985227341291588 + ], + [ + 95, + 0.24985225233689 + ], + [ + 96, + 0.24985227483207073 + ], + [ + 97, + 0.2498522931573161 + ], + [ + 98, + 0.2498522616626271 + ], + [ + 99, + 0.24985222919720057 + ], + [ + 100, + 0.24985224068443718 + ] + ] + }, + "freeze_after_1_decay_to_000": { + "test_acc": [ + 0.2964, + 0.237, + 0.1462, + 0.1483, + 0.1289, + 0.1903, + 0.1958, + 0.2135, + 0.2011, + 0.2192, + 0.2116, + 0.2301, + 0.2391, + 0.2394, + 0.237, + 0.2294, + 0.2425, + 0.246, + 0.2468, + 0.2519, + 0.2479, + 0.2676, + 0.2501, + 0.2636, + 0.2442, + 0.2687, + 0.2567, + 0.2665, + 0.2696, + 0.2726, + 0.2687, + 0.2636, + 0.2726, + 0.2668, + 0.2727, + 0.2694, + 0.2835, + 0.2876, + 0.2757, + 0.2806, + 0.2708, + 0.2622, + 0.2749, + 0.2794, + 0.2698, + 0.2708, + 0.2751, + 0.2702, + 0.2741, + 0.2795, + 0.2744, + 0.28, + 0.2784, + 0.2751, + 0.2708, + 0.2808, + 0.2811, + 0.2814, + 0.2776, + 0.2787, + 0.2839, + 0.288, + 0.2859, + 0.2879, + 0.2706, + 0.274, + 0.2812, + 0.2848, + 0.2847, + 0.2827, + 0.2817, + 0.2861, + 0.2814, + 0.2819, + 0.2768, + 0.2875, + 0.2848, + 0.2837, + 0.281, + 0.2839, + 0.2851, + 0.2851, + 0.2874, + 0.2822, + 0.2854, + 0.2857, + 0.2838, + 0.283, + 0.2827, + 0.2853, + 0.2855, + 0.2853, + 0.2849, + 0.285, + 0.2848 + ], + "train_loss": [ + 1.987770098953247, + 2.058148936920166, + 2.1742564457702636, + 2.227886661987305, + 2.2489118286895753, + 2.215499964141846, + 2.172080729522705, + 2.1515315755462647, + 2.1322266635131837, + 2.1219937451171873, + 2.1115163373565675, + 2.10087213760376, + 2.094084821090698, + 2.0881656538391113, + 2.0830307551574707, + 2.0793406107330323, + 2.0741417255401613, + 2.071706746520996, + 2.0672668325805663, + 2.061994496154785, + 2.0583461866760255, + 2.0575141161346435, + 2.0518029474639894, + 2.0522982623291015, + 2.048578759384155, + 2.0465751447296143, + 2.0437594219589235, + 2.044029693031311, + 2.0412700551605223, + 2.0405831239318846, + 2.04130356338501, + 2.0393758958435058, + 2.039224354324341, + 2.038326994972229, + 2.038590117645264, + 2.0370230613708498, + 2.035887234573364, + 2.0349106960296632, + 2.0352816369247435, + 2.0349522632598878, + 2.0344653484344484, + 2.0331574398040773, + 2.033610480079651, + 2.0358019441986084, + 2.0341035528182982, + 2.030207544937134, + 2.032771106109619, + 2.0311163373565675, + 2.0296363953399656, + 2.0308212451171874, + 2.0306940715789796, + 2.028369594345093, + 2.029138938446045, + 2.029238699264526, + 2.0298833404541017, + 2.0294783560943603, + 2.027595551223755, + 2.027595431060791, + 2.027459530296326, + 2.028411672706604, + 2.0279053328704832, + 2.0280695262908934, + 2.027787509765625, + 2.025281623840332, + 2.0254185902404784, + 2.026019370727539, + 2.0258047150421143, + 2.0285882577514647, + 2.0261368878555297, + 2.026999177932739, + 2.0256639764404296, + 2.025425854759216, + 2.0266070795440676, + 2.0237192176055907, + 2.025412853469849, + 2.0240610698699952, + 2.0247360014343263, + 2.0249295909118654, + 2.0255611853790283, + 2.0232094157409666, + 2.024681177215576, + 2.02321795753479, + 2.024663003501892, + 2.02217747467041, + 2.022007664833069, + 2.023817197189331, + 2.0230373464584352, + 2.022435458984375, + 2.022840128860474, + 2.0205608460998534, + 2.0236412183380126, + 2.024272792053223, + 2.022964626312256, + 2.0220273933410646, + 2.025426727218628 + ], + "gamma": [ + [ + 6, + 0.02804319025017321 + ], + [ + 7, + 0.04006533604115248 + ], + [ + 8, + 0.05339363403618336 + ], + [ + 9, + 0.05600978480651975 + ], + [ + 10, + 0.057343464344739914 + ], + [ + 13, + 0.055115228053182364 + ], + [ + 15, + 0.057215953478589654 + ], + [ + 20, + 0.06352227658499032 + ], + [ + 25, + 0.07144864764995873 + ], + [ + 35, + 0.080837985384278 + ], + [ + 45, + 0.08100816144724376 + ], + [ + 55, + 0.08169284932955634 + ], + [ + 65, + 0.0816943283425644 + ], + [ + 75, + 0.08262447686865926 + ], + [ + 85, + 0.08246231166413054 + ], + [ + 95, + 0.0823301882337546 + ], + [ + 100, + 0.08231175330001861 + ] + ], + "rho": [ + [ + 6, + 0.0330923511646688 + ], + [ + 7, + 0.0015333815244957805 + ], + [ + 8, + 0.012843782315030694 + ], + [ + 9, + 0.0005663076881319284 + ], + [ + 10, + 0.013773382874205709 + ], + [ + 13, + 0.014525709673762321 + ], + [ + 15, + 0.01487097516655922 + ], + [ + 20, + 0.009759962151292711 + ], + [ + 25, + 0.0005541914142668247 + ], + [ + 35, + 0.006065825931727886 + ], + [ + 45, + 0.006206185091286898 + ], + [ + 55, + -0.007286409847438335 + ], + [ + 65, + -0.005138644948601723 + ], + [ + 75, + 0.0040618120692670345 + ], + [ + 85, + 0.005303684622049332 + ], + [ + 95, + -0.008256135508418083 + ], + [ + 100, + 0.009820420295000076 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499214508544367 + ], + [ + 7, + 0.5998742841330391 + ], + [ + 8, + 0.4499106979272932 + ], + [ + 9, + 0.2999343237198726 + ], + [ + 10, + 0.14996251856344525 + ], + [ + 11, + 0.0 + ], + [ + 12, + 0.0 + ], + [ + 13, + 0.0 + ], + [ + 14, + 0.0 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + }, + "freeze_after_5_decay_to_000": { + "test_acc": [ + 0.3059, + 0.3107, + 0.3158, + 0.3049, + 0.308, + 0.2218, + 0.1488, + 0.1368, + 0.1427, + 0.1562, + 0.1782, + 0.2205, + 0.2149, + 0.2366, + 0.2259, + 0.2238, + 0.2374, + 0.2428, + 0.2421, + 0.2512, + 0.2405, + 0.2665, + 0.2442, + 0.2657, + 0.2365, + 0.2686, + 0.2529, + 0.2656, + 0.2638, + 0.2685, + 0.273, + 0.2656, + 0.2688, + 0.263, + 0.275, + 0.2675, + 0.2766, + 0.2782, + 0.2783, + 0.2806, + 0.2722, + 0.2575, + 0.2719, + 0.2764, + 0.2681, + 0.2693, + 0.2764, + 0.2703, + 0.272, + 0.2768, + 0.2742, + 0.2809, + 0.2811, + 0.2775, + 0.2726, + 0.2794, + 0.2766, + 0.2812, + 0.2741, + 0.2789, + 0.2803, + 0.2877, + 0.2835, + 0.2879, + 0.2717, + 0.2757, + 0.2818, + 0.2853, + 0.2831, + 0.2803, + 0.2818, + 0.285, + 0.2807, + 0.282, + 0.2793, + 0.288, + 0.2827, + 0.2853, + 0.2842, + 0.282, + 0.2856, + 0.2865, + 0.2879, + 0.285, + 0.2861, + 0.2859, + 0.2853, + 0.2856, + 0.2844, + 0.2857, + 0.2853, + 0.2854, + 0.2852, + 0.2852, + 0.2853 + ], + "train_loss": [ + 1.989389101486206, + 1.9903729549407958, + 1.99436337348938, + 1.9900701868438722, + 1.9933015954589843, + 2.058371421661377, + 2.1906161418151857, + 2.2348922942352294, + 2.2343787562561035, + 2.2099864021301268, + 2.177866358795166, + 2.1560395417022704, + 2.1391963284301756, + 2.1252468937683107, + 2.113511488494873, + 2.1054030198669436, + 2.0950439585876466, + 2.0904504656982423, + 2.084099229812622, + 2.07674031211853, + 2.0714124299621584, + 2.0692392198181153, + 2.062705947227478, + 2.062638821334839, + 2.057503818359375, + 2.0546474283218386, + 2.051254558944702, + 2.0508053442764282, + 2.047545058441162, + 2.046349447784424, + 2.0467114446258545, + 2.0441762962341308, + 2.043712628707886, + 2.042656667137146, + 2.0426513220977784, + 2.040860073852539, + 2.0394876539611815, + 2.0385328398895264, + 2.0384585528564454, + 2.0381276249694826, + 2.037917250213623, + 2.0360237339019776, + 2.036692409439087, + 2.038358888168335, + 2.0366346838378906, + 2.032973290939331, + 2.035324615478516, + 2.0334486687469484, + 2.031794991760254, + 2.0330240043640138, + 2.0328360440063475, + 2.030444066390991, + 2.0312890017700194, + 2.031069114303589, + 2.0315731324005126, + 2.031455577163696, + 2.029421018714905, + 2.02938812789917, + 2.029021885147095, + 2.030032192955017, + 2.0296973515319823, + 2.029736637649536, + 2.029366349105835, + 2.026800500488281, + 2.026819801712036, + 2.027790601730347, + 2.027446739730835, + 2.0302554197692873, + 2.028049821205139, + 2.0287723950958254, + 2.027235142593384, + 2.027090040016174, + 2.028121824874878, + 2.0253573878479005, + 2.026976574707031, + 2.025492007293701, + 2.026246927947998, + 2.026515454330444, + 2.0273433531951905, + 2.02479778503418, + 2.026230363616943, + 2.024716327896118, + 2.0262912517547607, + 2.023776498374939, + 2.023611107559204, + 2.0255411886978147, + 2.0247430859375, + 2.024035308227539, + 2.0245019944763185, + 2.0221999503326415, + 2.0252691249084473, + 2.0261188220596313, + 2.0245826667022704, + 2.023685280380249, + 2.0271104919433593 + ], + "gamma": [ + [ + 6, + 0.019172905129380524 + ], + [ + 7, + 0.03231109178159386 + ], + [ + 8, + 0.026423632371006534 + ], + [ + 9, + 0.027440774225397035 + ], + [ + 10, + 0.03383389429654926 + ], + [ + 13, + 0.05179026070982218 + ], + [ + 15, + 0.05204801121726632 + ], + [ + 20, + 0.06441549817100167 + ], + [ + 25, + 0.06984315533190966 + ], + [ + 35, + 0.07725038478383794 + ], + [ + 45, + 0.07803186881938018 + ], + [ + 55, + 0.07950649873237126 + ], + [ + 65, + 0.08030074625276029 + ], + [ + 75, + 0.08146566100185737 + ], + [ + 85, + 0.08145827654516324 + ], + [ + 95, + 0.08135411059629405 + ], + [ + 100, + 0.08133506249578204 + ] + ], + "rho": [ + [ + 6, + -0.011272484320215881 + ], + [ + 7, + -0.008410613983869553 + ], + [ + 8, + 0.0019524102099239826 + ], + [ + 9, + 0.01624949974939227 + ], + [ + 10, + 0.0026425524847581983 + ], + [ + 13, + -0.005179970525205135 + ], + [ + 15, + 0.011054718401283026 + ], + [ + 20, + 0.009675369132310152 + ], + [ + 25, + 0.003612063592299819 + ], + [ + 35, + -0.0011477797525003552 + ], + [ + 45, + 0.003364500356838107 + ], + [ + 55, + 0.012593701481819153 + ], + [ + 65, + 0.001831691013649106 + ], + [ + 75, + -0.007136601954698563 + ], + [ + 85, + 0.0028698681853711605 + ], + [ + 95, + -0.011590876616537571 + ], + [ + 100, + 0.002832313533872366 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499220515540377 + ], + [ + 7, + 0.7498463189979196 + ], + [ + 8, + 0.7498030222548633 + ], + [ + 9, + 0.749731526257939 + ], + [ + 10, + 0.7496986720865624 + ], + [ + 11, + 0.5997941301463895 + ], + [ + 12, + 0.44988347044785837 + ], + [ + 13, + 0.2999062167738669 + ], + [ + 14, + 0.14994115019086857 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + } +} \ No newline at end of file diff --git a/results/frozen_baselines_crossarch.json b/results/frozen_baselines_crossarch.json new file mode 100644 index 0000000..382fc4f --- /dev/null +++ b/results/frozen_baselines_crossarch.json @@ -0,0 +1,14 @@ +{ + "vit_frozen_s42": 0.5678, + "vit_shallow_s42": 0.1, + "vit_frozen_s123": 0.5728, + "vit_shallow_s123": 0.1, + "vit_frozen_s456": 0.5681, + "vit_shallow_s456": 0.1, + "student_frozen_s42": 0.9005, + "student_shallow_s42": 0.9165, + "student_frozen_s123": 0.906, + "student_shallow_s123": 0.9135, + "student_frozen_s456": 0.9175, + "student_shallow_s456": 0.9225 +} \ No newline at end of file diff --git a/results/frozen_baselines_crossarch.log b/results/frozen_baselines_crossarch.log new file mode 100644 index 0000000..7c2efc8 --- /dev/null +++ b/results/frozen_baselines_crossarch.log @@ -0,0 +1,120 @@ + +=== ViT-Mini frozen baselines === + +--- ViT-Mini seed=42 --- + ViT-Mini frozen: 16266/809354 trainable params + [ViT-frozen] s=42 ep 10: acc=0.5014 + [ViT-frozen] s=42 ep 20: acc=0.5297 + [ViT-frozen] s=42 ep 30: acc=0.5375 + [ViT-frozen] s=42 ep 40: acc=0.5554 + [ViT-frozen] s=42 ep 50: acc=0.5619 + [ViT-frozen] s=42 ep 60: acc=0.5678 + ViT-Mini shallow: 16266 params (no blocks) + [ViT-shallow] s=42 ep 10: acc=0.1000 + [ViT-shallow] s=42 ep 20: acc=0.1000 + [ViT-shallow] s=42 ep 30: acc=0.1000 + [ViT-shallow] s=42 ep 40: acc=0.1000 + [ViT-shallow] s=42 ep 50: acc=0.1000 + [ViT-shallow] s=42 ep 60: acc=0.1000 + FINAL ViT s=42: frozen=0.5678, shallow=0.1000 + +--- ViT-Mini seed=123 --- + ViT-Mini frozen: 16266/809354 trainable params + [ViT-frozen] s=123 ep 10: acc=0.5249 + [ViT-frozen] s=123 ep 20: acc=0.5421 + [ViT-frozen] s=123 ep 30: acc=0.5545 + [ViT-frozen] s=123 ep 40: acc=0.5621 + [ViT-frozen] s=123 ep 50: acc=0.5680 + [ViT-frozen] s=123 ep 60: acc=0.5728 + ViT-Mini shallow: 16266 params (no blocks) + [ViT-shallow] s=123 ep 10: acc=0.1000 + [ViT-shallow] s=123 ep 20: acc=0.1000 + [ViT-shallow] s=123 ep 30: acc=0.1000 + [ViT-shallow] s=123 ep 40: acc=0.1000 + [ViT-shallow] s=123 ep 50: acc=0.1000 + [ViT-shallow] s=123 ep 60: acc=0.1000 + FINAL ViT s=123: frozen=0.5728, shallow=0.1000 + +--- ViT-Mini seed=456 --- + ViT-Mini frozen: 16266/809354 trainable params + [ViT-frozen] s=456 ep 10: acc=0.5166 + [ViT-frozen] s=456 ep 20: acc=0.5342 + [ViT-frozen] s=456 ep 30: acc=0.5414 + [ViT-frozen] s=456 ep 40: acc=0.5545 + [ViT-frozen] s=456 ep 50: acc=0.5615 + [ViT-frozen] s=456 ep 60: acc=0.5681 + ViT-Mini shallow: 16266 params (no blocks) + [ViT-shallow] s=456 ep 10: acc=0.1000 + [ViT-shallow] s=456 ep 20: acc=0.1000 + [ViT-shallow] s=456 ep 30: acc=0.1000 + [ViT-shallow] s=456 ep 40: acc=0.1000 + [ViT-shallow] s=456 ep 50: acc=0.1000 + [ViT-shallow] s=456 ep 60: acc=0.1000 + FINAL ViT s=456: frozen=0.5681, shallow=0.1000 + +=== StudentNet frozen baselines === + +--- StudentNet seed=42 --- + StudentNet frozen: 1290/67850 trainable params + [Student-frozen] s=42 ep 10: acc=0.8405 + [Student-frozen] s=42 ep 20: acc=0.8860 + [Student-frozen] s=42 ep 30: acc=0.8990 + [Student-frozen] s=42 ep 40: acc=0.8990 + [Student-frozen] s=42 ep 50: acc=0.9015 + [Student-frozen] s=42 ep 60: acc=0.9005 + [Student-frozen] s=42 ep 70: acc=0.9005 + [Student-frozen] s=42 ep 80: acc=0.9005 + StudentNet shallow: 1290 params (no blocks) + [Student-shallow] s=42 ep 10: acc=0.8555 + [Student-shallow] s=42 ep 20: acc=0.8990 + [Student-shallow] s=42 ep 30: acc=0.9085 + [Student-shallow] s=42 ep 40: acc=0.9140 + [Student-shallow] s=42 ep 50: acc=0.9140 + [Student-shallow] s=42 ep 60: acc=0.9155 + [Student-shallow] s=42 ep 70: acc=0.9165 + [Student-shallow] s=42 ep 80: acc=0.9165 + FINAL Student s=42: frozen=0.9005, shallow=0.9165 + +--- StudentNet seed=123 --- + StudentNet frozen: 1290/67850 trainable params + [Student-frozen] s=123 ep 10: acc=0.8505 + [Student-frozen] s=123 ep 20: acc=0.8915 + [Student-frozen] s=123 ep 30: acc=0.9030 + [Student-frozen] s=123 ep 40: acc=0.9050 + [Student-frozen] s=123 ep 50: acc=0.9050 + [Student-frozen] s=123 ep 60: acc=0.9060 + [Student-frozen] s=123 ep 70: acc=0.9060 + [Student-frozen] s=123 ep 80: acc=0.9060 + StudentNet shallow: 1290 params (no blocks) + [Student-shallow] s=123 ep 10: acc=0.8495 + [Student-shallow] s=123 ep 20: acc=0.8900 + [Student-shallow] s=123 ep 30: acc=0.9050 + [Student-shallow] s=123 ep 40: acc=0.9080 + [Student-shallow] s=123 ep 50: acc=0.9105 + [Student-shallow] s=123 ep 60: acc=0.9125 + [Student-shallow] s=123 ep 70: acc=0.9130 + [Student-shallow] s=123 ep 80: acc=0.9135 + FINAL Student s=123: frozen=0.9060, shallow=0.9135 + +--- StudentNet seed=456 --- + StudentNet frozen: 1290/67850 trainable params + [Student-frozen] s=456 ep 10: acc=0.8300 + [Student-frozen] s=456 ep 20: acc=0.8900 + [Student-frozen] s=456 ep 30: acc=0.9025 + [Student-frozen] s=456 ep 40: acc=0.9115 + [Student-frozen] s=456 ep 50: acc=0.9150 + [Student-frozen] s=456 ep 60: acc=0.9165 + [Student-frozen] s=456 ep 70: acc=0.9180 + [Student-frozen] s=456 ep 80: acc=0.9175 + StudentNet shallow: 1290 params (no blocks) + [Student-shallow] s=456 ep 10: acc=0.8615 + [Student-shallow] s=456 ep 20: acc=0.9050 + [Student-shallow] s=456 ep 30: acc=0.9160 + [Student-shallow] s=456 ep 40: acc=0.9200 + [Student-shallow] s=456 ep 50: acc=0.9235 + [Student-shallow] s=456 ep 60: acc=0.9225 + [Student-shallow] s=456 ep 70: acc=0.9225 + [Student-shallow] s=456 ep 80: acc=0.9225 + FINAL Student s=456: frozen=0.9175, shallow=0.9225 + +Saved: results/frozen_baselines_crossarch.json diff --git a/results/frozen_cifar/frozen_L4_d256_s42.json b/results/frozen_cifar/frozen_L4_d256_s42.json new file mode 100644 index 0000000..2fb0bd3 --- /dev/null +++ b/results/frozen_cifar/frozen_L4_d256_s42.json @@ -0,0 +1,174 @@ +{ + "config": { + "num_blocks": 4, + "d_hidden": 256, + "seed": 42, + "bp_epochs": 100, + "estimator_epochs": 100, + "lr_fb": 0.001, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0 + }, + "bp_acc": 0.6173, + "summary": { + "dfa": { + "mean_gamma": 0.005605479117366485, + "mean_rho": 0.005194449331611395, + "mean_nudge": -2.151036460418254e-05 + }, + "sb_eT": { + "mean_gamma": 0.2866372682154179, + "mean_rho": 0.24588057771325111, + "mean_nudge": -0.0009568915702402592 + }, + "cb_eT": { + "mean_gamma": 0.11484479499049485, + "mean_rho": 0.125152001157403, + "mean_nudge": -0.00036998098585172556 + }, + "cb_deltaL": { + "mean_gamma": 0.06995358848944307, + "mean_rho": 0.06243711616843939, + "mean_nudge": -0.00015994706336641684 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + 0.01097307917661965, + -0.00982702277833596, + 0.004532583430409432, + 0.016743276640772818 + ], + "perturbation_rho": [ + 0.0032103070989251137, + -0.030966611579060555, + 0.06208299845457077, + -0.01354889664798975 + ], + "nudging_0.001": [ + -3.2122152333613485e-06, + 7.709997589699924e-06, + -2.053854950645473e-05, + -1.2655042155529372e-05 + ], + "nudging_0.003": [ + -9.568146197125316e-06, + 2.312526703462936e-05, + -6.160693010315299e-05, + -3.799164915108122e-05 + ], + "nudging_0.01": [ + -3.1933166610542685e-05, + 7.745913171675056e-05, + -0.0002052279596682638, + -0.00012646839604713023 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.19993784725666047, + 0.2704531639814377, + 0.3183140277862549, + 0.35784403383731844 + ], + "perturbation_rho": [ + 0.14796550571918488, + 0.23224923014640808, + 0.27324193716049194, + 0.33006563782691956 + ], + "nudging_0.001": [ + -0.00020024771220050752, + -0.00030526291811838746, + -0.0003735219652298838, + -0.0003972915874328464 + ], + "nudging_0.003": [ + -0.0006005102768540382, + -0.0009154834551736712, + -0.001120006782002747, + -0.0011915657669305801 + ], + "nudging_0.01": [ + -0.002000064356252551, + -0.0030484027229249477, + -0.0037288377061486244, + -0.0039670998230576515 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.045131212659180166, + 0.06221269443631172, + 0.1209193505346775, + 0.23111592233181 + ], + "perturbation_rho": [ + 0.05690425634384155, + 0.10793692618608475, + 0.10616493225097656, + 0.2296018898487091 + ], + "nudging_0.001": [ + -5.6506225519115105e-05, + -8.837308996589854e-05, + -0.00011208542855456471, + -0.00023653265088796616 + ], + "nudging_0.003": [ + -0.00016947659605648369, + -0.00026502960827201605, + -0.0003360719420015812, + -0.0007093457970768213 + ], + "nudging_0.01": [ + -0.0005644541233778, + -0.0008825073018670082, + -0.0011192080564796925, + -0.0023615544196218252 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.03819061610847711, + 0.05208469983190298, + 0.06935825981199742, + 0.12018077820539474 + ], + "perturbation_rho": [ + 0.047517478466033936, + 0.013643201440572739, + 0.04729664325714111, + 0.14129114151000977 + ], + "nudging_0.001": [ + -2.239555396954529e-05, + -2.458264680171851e-05, + -4.0700091631151736e-05, + -0.0001256012765225023 + ], + "nudging_0.003": [ + -6.710628804285079e-05, + -7.37799855414778e-05, + -0.00012205714301671833, + -0.00037684483686462045 + ], + "nudging_0.01": [ + -0.0002235029242001474, + -0.00024507055059075356, + -0.00040636284393258393, + -0.0012548293452709913 + ] + } + }, + "sb_pred_error": [ + 9093.49886875, + 3872.840365234375, + 2899.67371015625, + 2407.756592578125 + ] +} \ No newline at end of file diff --git a/results/frozen_cifar/frozen_L4_d512_s42.json b/results/frozen_cifar/frozen_L4_d512_s42.json new file mode 100644 index 0000000..025eea9 --- /dev/null +++ b/results/frozen_cifar/frozen_L4_d512_s42.json @@ -0,0 +1,174 @@ +{ + "config": { + "num_blocks": 4, + "d_hidden": 512, + "seed": 42, + "bp_epochs": 100, + "estimator_epochs": 100, + "lr_fb": 0.001, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0 + }, + "bp_acc": 0.6046, + "summary": { + "dfa": { + "mean_gamma": 0.00014940524997655283, + "mean_rho": 0.0021846434101462364, + "mean_nudge": 9.80043569143163e-06 + }, + "sb_eT": { + "mean_gamma": 0.16364388447254896, + "mean_rho": 0.1367498729377985, + "mean_nudge": -0.0008324724767589942 + }, + "cb_eT": { + "mean_gamma": 0.05695507084019482, + "mean_rho": 0.10538733564317226, + "mean_nudge": -0.00041578355740057305 + }, + "cb_deltaL": { + "mean_gamma": 0.03857357995584607, + "mean_rho": 0.02690578391775489, + "mean_nudge": -0.00015572691336274147 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + 0.0003761224914342165, + 0.0014630826306529343, + 0.0025856316089630125, + -0.0038272157311439515 + ], + "perturbation_rho": [ + 0.041057292371988297, + 0.04760625958442688, + -0.04939739778637886, + -0.03052758052945137 + ], + "nudging_0.001": [ + -6.823556759627536e-07, + 5.570012035605032e-06, + 7.243079380714335e-07, + 7.61153205530718e-06 + ], + "nudging_0.003": [ + -2.2219755919650197e-06, + 1.6406695067416877e-05, + 2.2961030481383204e-06, + 2.2720920242136344e-05 + ], + "nudging_0.01": [ + -7.2418697527609766e-06, + 5.4833959438838065e-05, + 7.364731573034078e-06, + 7.559901860076934e-05 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.11779971644282342, + 0.15058264434337615, + 0.1757924109697342, + 0.2104007661342621 + ], + "perturbation_rho": [ + 0.05106552690267563, + 0.14929687976837158, + 0.1366019994020462, + 0.21003508567810059 + ], + "nudging_0.001": [ + -0.00020435426267795265, + -0.000274428486591205, + -0.0003065963101107627, + -0.0003246065170969814 + ], + "nudging_0.003": [ + -0.0006134338327683508, + -0.0008232325781136751, + -0.0009195499587804079, + -0.0009736735373735428 + ], + "nudging_0.01": [ + -0.0020439010113477707, + -0.0027431542985141277, + -0.0030633914284408092, + -0.003243957180529833 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.028400307334959508, + 0.030753960087895393, + 0.04988271631300449, + 0.11878329962491989 + ], + "perturbation_rho": [ + 0.06698533892631531, + 0.07322317361831665, + 0.11097840219736099, + 0.1703624278306961 + ], + "nudging_0.001": [ + -8.199035073630512e-05, + -9.967104415409267e-05, + -0.00014070692122913897, + -0.00023186377075035125 + ], + "nudging_0.003": [ + -0.000246370182139799, + -0.000298988597933203, + -0.0004220257396809757, + -0.0006957497098483145 + ], + "nudging_0.01": [ + -0.0008211369859054685, + -0.0009962331969290972, + -0.0014064292190596461, + -0.0023175508249551058 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.019338275119662286, + 0.03327283784747124, + 0.040172213315963747, + 0.061510993540287016 + ], + "perturbation_rho": [ + -0.0003883522003889084, + 0.029364485293626785, + 0.04492279514670372, + 0.03372420743107796 + ], + "nudging_0.001": [ + -2.7410198526922613e-05, + -5.19197310495656e-05, + -6.934596603969112e-05, + -5.898199015064165e-05 + ], + "nudging_0.003": [ + -8.237811562139541e-05, + -0.00015559815801680088, + -0.00020809093257412314, + -0.00017684044723864645 + ], + "nudging_0.01": [ + -0.00027475334354676306, + -0.000518541899509728, + -0.0006934736738912761, + -0.0005893784109503031 + ] + } + }, + "sb_pred_error": [ + 32627.8307125, + 17715.490584375, + 13710.30735, + 10994.33838125 + ] +} \ No newline at end of file diff --git a/results/frozen_cifar/frozen_L6_d256_s42.json b/results/frozen_cifar/frozen_L6_d256_s42.json new file mode 100644 index 0000000..703dd5a --- /dev/null +++ b/results/frozen_cifar/frozen_L6_d256_s42.json @@ -0,0 +1,216 @@ +{ + "config": { + "num_blocks": 6, + "d_hidden": 256, + "seed": 42, + "bp_epochs": 100, + "estimator_epochs": 100, + "lr_fb": 0.001, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0 + }, + "bp_acc": 0.6172, + "summary": { + "dfa": { + "mean_gamma": 0.008224744617473334, + "mean_rho": -0.007729481750478347, + "mean_nudge": -1.4484473164581383e-05 + }, + "sb_eT": { + "mean_gamma": 0.28419415106376006, + "mean_rho": 0.24331255008776984, + "mean_nudge": -0.0010212107930177201 + }, + "cb_eT": { + "mean_gamma": 0.1356087997245292, + "mean_rho": 0.11836575530469418, + "mean_nudge": -0.000398846738486706 + }, + "cb_deltaL": { + "mean_gamma": 0.06269844393245876, + "mean_rho": 0.07167995596925418, + "mean_nudge": -0.000200468028197065 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + -0.010780696198344231, + -0.0024464363697916268, + 0.006427376973442733, + 0.023271656595170498, + 0.017338427528738976, + 0.015538139175623656 + ], + "perturbation_rho": [ + -0.018140554428100586, + 0.003606993705034256, + -0.045406848192214966, + 0.023949457332491875, + -0.016462121158838272, + 0.00607618223875761 + ], + "nudging_0.001": [ + 3.0692412110511214e-05, + 7.64157812227495e-06, + -9.760969987837598e-08, + -3.085116622969508e-05, + -1.6509711713297293e-05, + -1.9992370653199032e-05 + ], + "nudging_0.003": [ + 9.20678285183385e-05, + 2.31226204050472e-05, + -2.7300666260998696e-07, + -9.241211228072643e-05, + -4.9478214350529015e-05, + -5.993395461700857e-05 + ], + "nudging_0.01": [ + 0.0003075606073252857, + 7.720924622844905e-05, + -5.05835487274453e-07, + -0.0003076052526012063, + -0.00016470525588374585, + -0.00019945789244957268 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.1685526818037033, + 0.23167533278465272, + 0.2697907418012619, + 0.30822172164916994, + 0.3446090370416641, + 0.3823153913021088 + ], + "perturbation_rho": [ + 0.07154904305934906, + 0.19288617372512817, + 0.2876003682613373, + 0.27649810910224915, + 0.3115084767341614, + 0.3198331296443939 + ], + "nudging_0.001": [ + -0.00018972528050653636, + -0.0002750377752818167, + -0.00032653682865202427, + -0.00039390879101119936, + -0.00042474071960896254, + -0.00043361991993151605 + ], + "nudging_0.003": [ + -0.0005688090459443629, + -0.0008246920770034194, + -0.0009791019838303328, + -0.00118098477832973, + -0.001273483969271183, + -0.001300192903727293 + ], + "nudging_0.01": [ + -0.0018940127920359373, + -0.0027450949419289827, + -0.0032586848828941584, + -0.003929748199880123, + -0.004237486980855465, + -0.004327159374952316 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.045225401408970356, + 0.053792066499590875, + 0.08010791838169098, + 0.12435948699712754, + 0.19471128135919571, + 0.31545664370059967 + ], + "perturbation_rho": [ + 0.024685420095920563, + -0.01572572812438011, + 0.08793376386165619, + 0.11664978414773941, + 0.1602637767791748, + 0.3363875150680542 + ], + "nudging_0.001": [ + -2.2263082428253256e-05, + -5.150778451934457e-05, + -7.369300146820024e-05, + -0.00012175041774753481, + -0.00019730909843929112, + -0.000331797928083688 + ], + "nudging_0.003": [ + -6.678207137156278e-05, + -0.00015438658010680228, + -0.0002208092628279701, + -0.00036489206831902266, + -0.0005915500223636627, + -0.0009946604259312153 + ], + "nudging_0.01": [ + -0.00022176679340191185, + -0.0005135145038366318, + -0.0007348398794420063, + -0.0012142673367634416, + -0.0019682790152728558, + -0.0033080100547522306 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.01903119832277298, + 0.03658499242737889, + 0.04136112704873085, + 0.05426537357270718, + 0.07572877742350101, + 0.14921919479966164 + ], + "perturbation_rho": [ + -0.004729617387056351, + 0.06955375522375107, + 0.07996401935815811, + 0.11149539798498154, + 0.055956777185201645, + 0.11783940345048904 + ], + "nudging_0.001": [ + -3.080447640968487e-05, + -4.9154667067341506e-05, + -5.3297979320632294e-05, + -5.973243969492614e-05, + -7.465035014320165e-05, + -0.00013362003664951771 + ], + "nudging_0.003": [ + -9.23606421565637e-05, + -0.00014715960423927754, + -0.00015975572750903666, + -0.00017912944895215333, + -0.00022374786203727126, + -0.0004006548842880875 + ], + "nudging_0.01": [ + -0.00030725268879905343, + -0.0004887805553153157, + -0.0005310464184731245, + -0.0005952278152108192, + -0.0007444550283253193, + -0.0013336975825950503 + ] + } + }, + "sb_pred_error": [ + 8914.44174921875, + 5038.8783640625, + 4058.455402734375, + 3433.17113046875, + 2884.829894921875, + 2573.41313515625 + ] +} \ No newline at end of file diff --git a/results/frozen_cifar_vec/frozen_vec_L4_d256_s42.json b/results/frozen_cifar_vec/frozen_vec_L4_d256_s42.json new file mode 100644 index 0000000..f9f4ec8 --- /dev/null +++ b/results/frozen_cifar_vec/frozen_vec_L4_d256_s42.json @@ -0,0 +1,188 @@ +{ + "config": { + "num_blocks": 4, + "d_hidden": 256, + "seed": 42, + "bp_acc": 0.6173, + "estimator_epochs": 100 + }, + "summary": { + "dfa": { + "mean_gamma": 0.004863154428312555, + "mean_rho": 0.0046705943532288074, + "mean_nudge": -5.86726059736975e-06 + }, + "sb_eT": { + "mean_gamma": 0.2866372682154179, + "mean_rho": 0.2637173905968666, + "mean_nudge": -0.0009568915702402592 + }, + "cb_eT": { + "mean_gamma": 0.11484479499049485, + "mean_rho": 0.1202746294438839, + "mean_nudge": -0.00036998098585172556 + }, + "cb_deltaL": { + "mean_gamma": 0.06995358848944307, + "mean_rho": 0.034168413607403636, + "mean_nudge": -0.00015994706336641684 + }, + "vec_eT_M4": { + "mean_gamma": 0.3634969729930162, + "mean_rho": 0.42595484107732773, + "mean_nudge": -0.0014062844711588696 + }, + "vec_eT_M8": { + "mean_gamma": 0.3636624652892351, + "mean_rho": 0.3955033980309963, + "mean_nudge": -0.0013793499529128894 + }, + "vec_eT_M16": { + "mean_gamma": 0.3677208840847015, + "mean_rho": 0.42224912345409393, + "mean_nudge": -0.001392927297274582 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + 0.0033329044468700885, + -0.007507461798377335, + 0.022020796407014133, + 0.0016063786577433347 + ], + "perturbation_rho": [ + -0.0401616208255291, + -0.018128124997019768, + 0.04789097607135773, + 0.02908114716410637 + ], + "nudging_0.003": [ + 4.354264819994569e-05, + 3.3159449230879545e-05, + -9.052902169059962e-05, + -9.642118129704613e-06 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.19993784725666047, + 0.2704531639814377, + 0.3183140277862549, + 0.35784403383731844 + ], + "perturbation_rho": [ + 0.1395200788974762, + 0.2829156517982483, + 0.2831076979637146, + 0.34932613372802734 + ], + "nudging_0.003": [ + -0.0006005102768540382, + -0.0009154834551736712, + -0.001120006782002747, + -0.0011915657669305801 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.045131212659180166, + 0.06221269443631172, + 0.1209193505346775, + 0.23111592233181 + ], + "perturbation_rho": [ + 0.03551628440618515, + 0.11640645563602448, + 0.07594657689332962, + 0.25322920083999634 + ], + "nudging_0.003": [ + -0.00016947659605648369, + -0.00026502960827201605, + -0.0003360719420015812, + -0.0007093457970768213 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.03819061610847711, + 0.05208469983190298, + 0.06935825981199742, + 0.12018077820539474 + ], + "perturbation_rho": [ + -0.01345862727612257, + -0.014757020398974419, + 0.03974407538771629, + 0.12514522671699524 + ], + "nudging_0.003": [ + -6.710628804285079e-05, + -7.37799855414778e-05, + -0.00012205714301671833, + -0.00037684483686462045 + ] + }, + "vec_eT_M4": { + "bp_cosine": [ + 0.16388139724731446, + 0.26098581701517104, + 0.41548662185668944, + 0.61363405585289 + ], + "perturbation_rho": [ + 0.22898420691490173, + 0.339008092880249, + 0.4533805847167969, + 0.6824464797973633 + ], + "nudging_0.003": [ + -0.0007082110387273133, + -0.0010581386741250753, + -0.0016506186220794916, + -0.002208169549703598 + ] + }, + "vec_eT_M8": { + "bp_cosine": [ + 0.17386804670095443, + 0.268336746096611, + 0.406103777885437, + 0.606341290473938 + ], + "perturbation_rho": [ + 0.19708333909511566, + 0.2918933629989624, + 0.4379217028617859, + 0.6551151871681213 + ], + "nudging_0.003": [ + -0.0007086814730428159, + -0.0010243982542306185, + -0.0016026028897613287, + -0.0021817171946167946 + ] + }, + "vec_eT_M16": { + "bp_cosine": [ + 0.17664430439472198, + 0.27206156253814695, + 0.41649516522884367, + 0.6056825041770935 + ], + "perturbation_rho": [ + 0.20988652110099792, + 0.3382995128631592, + 0.469192236661911, + 0.6716182231903076 + ], + "nudging_0.003": [ + -0.0007140585803426802, + -0.0010502493241801858, + -0.0016202025581151247, + -0.0021871987264603376 + ] + } + } +} \ No newline at end of file diff --git a/results/h2_no_residual_full_s123.log b/results/h2_no_residual_full_s123.log new file mode 100644 index 0000000..c02879b --- /dev/null +++ b/results/h2_no_residual_full_s123.log @@ -0,0 +1,107 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=123 +eval buffer: torch.Size([1024, 3072]) + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.690464973449707, 42.59831619262695, 44.3453369140625, 42.22452926635742, 42.9206428527832] ||g||_med=[0.001107031712308526, 0.00020295626018196344, 0.00014012052270118147, 0.00011155186803080142, 9.737444634083658e-05] acc=0.1025 + [DFA] Ep 1: ||h_L||=4.633e+03 ||g_2||=6.313e-07 acc=0.0889 gamma_dfa=0.0291 + [DFA] Ep 2: ||h_L||=2.086e+04 ||g_2||=1.040e-07 acc=0.0850 gamma_dfa=0.0262 + [DFA] Ep 3: ||h_L||=4.860e+04 ||g_2||=3.898e-08 acc=0.1299 gamma_dfa=0.0251 + [DFA] Ep 4: ||h_L||=9.117e+04 ||g_2||=2.015e-08 acc=0.1250 gamma_dfa=0.0267 + [DFA] Ep 5: ||h_L||=1.457e+05 ||g_2||=1.234e-08 acc=0.1152 gamma_dfa=0.0230 + [DFA] Ep 6: ||h_L||=2.115e+05 ||g_2||=8.721e-09 acc=0.1094 gamma_dfa=0.0167 + [DFA] Ep 7: ||h_L||=2.991e+05 ||g_2||=6.664e-09 acc=0.1104 gamma_dfa=0.0098 + [DFA] Ep 8: ||h_L||=4.055e+05 ||g_2||=5.241e-09 acc=0.1084 gamma_dfa=0.0026 + [DFA] Ep 9: ||h_L||=5.148e+05 ||g_2||=4.316e-09 acc=0.0879 gamma_dfa=-0.0046 + [DFA] Ep 10: ||h_L||=6.453e+05 ||g_2||=3.792e-09 acc=0.0771 gamma_dfa=-0.0082 + [DFA] Ep 11: ||h_L||=8.114e+05 ||g_2||=3.485e-09 acc=0.1074 gamma_dfa=-0.0135 + [DFA] Ep 12: ||h_L||=9.868e+05 ||g_2||=3.308e-09 acc=0.1006 gamma_dfa=-0.0171 + [DFA] Ep 13: ||h_L||=1.184e+06 ||g_2||=3.072e-09 acc=0.0889 gamma_dfa=-0.0225 + [DFA] Ep 14: ||h_L||=1.390e+06 ||g_2||=3.024e-09 acc=0.0830 gamma_dfa=-0.0248 + [DFA] Ep 15: ||h_L||=1.619e+06 ||g_2||=2.885e-09 acc=0.0977 gamma_dfa=-0.0281 + [DFA] Ep 16: ||h_L||=1.861e+06 ||g_2||=2.708e-09 acc=0.1055 gamma_dfa=-0.0306 + [DFA] Ep 17: ||h_L||=2.124e+06 ||g_2||=2.520e-09 acc=0.1064 gamma_dfa=-0.0322 + [DFA] Ep 18: ||h_L||=2.399e+06 ||g_2||=2.367e-09 acc=0.1064 gamma_dfa=-0.0333 + [DFA] Ep 19: ||h_L||=2.733e+06 ||g_2||=2.217e-09 acc=0.1064 gamma_dfa=-0.0335 + [DFA] Ep 20: ||h_L||=3.105e+06 ||g_2||=2.069e-09 acc=0.1045 gamma_dfa=-0.0344 + [DFA] Ep 21: ||h_L||=3.456e+06 ||g_2||=1.932e-09 acc=0.1045 gamma_dfa=-0.0352 + [DFA] Ep 22: ||h_L||=3.835e+06 ||g_2||=1.813e-09 acc=0.1045 gamma_dfa=-0.0362 + [DFA] Ep 23: ||h_L||=4.269e+06 ||g_2||=1.670e-09 acc=0.1045 gamma_dfa=-0.0372 + [DFA] Ep 24: ||h_L||=4.714e+06 ||g_2||=1.561e-09 acc=0.1045 gamma_dfa=-0.0378 + [DFA] Ep 25: ||h_L||=5.140e+06 ||g_2||=1.458e-09 acc=0.1045 gamma_dfa=-0.0386 + [DFA] Ep 26: ||h_L||=5.621e+06 ||g_2||=1.359e-09 acc=0.1045 gamma_dfa=-0.0396 + [DFA] Ep 27: ||h_L||=6.045e+06 ||g_2||=1.279e-09 acc=0.1045 gamma_dfa=-0.0402 + [DFA] Ep 28: ||h_L||=6.541e+06 ||g_2||=1.201e-09 acc=0.1045 gamma_dfa=-0.0409 + [DFA] Ep 29: ||h_L||=6.999e+06 ||g_2||=1.132e-09 acc=0.1045 gamma_dfa=-0.0414 + [DFA] Ep 30: ||h_L||=7.506e+06 ||g_2||=1.061e-09 acc=0.1045 gamma_dfa=-0.0423 + [DFA] Ep 31: ||h_L||=7.924e+06 ||g_2||=1.003e-09 acc=0.1045 gamma_dfa=-0.0428 + [DFA] Ep 32: ||h_L||=8.527e+06 ||g_2||=9.494e-10 acc=0.1045 gamma_dfa=-0.0438 + [DFA] Ep 33: ||h_L||=9.051e+06 ||g_2||=8.977e-10 acc=0.1045 gamma_dfa=-0.0442 + [DFA] Ep 34: ||h_L||=9.560e+06 ||g_2||=8.499e-10 acc=0.1064 gamma_dfa=-0.0447 + [DFA] Ep 35: ||h_L||=1.015e+07 ||g_2||=8.131e-10 acc=0.1064 gamma_dfa=-0.0450 + [DFA] Ep 36: ||h_L||=1.072e+07 ||g_2||=7.740e-10 acc=0.1035 gamma_dfa=-0.0455 + [DFA] Ep 37: ||h_L||=1.138e+07 ||g_2||=7.381e-10 acc=0.1055 gamma_dfa=-0.0458 + [DFA] Ep 38: ||h_L||=1.195e+07 ||g_2||=7.013e-10 acc=0.1055 gamma_dfa=-0.0464 + [DFA] Ep 39: ||h_L||=1.254e+07 ||g_2||=6.774e-10 acc=0.1055 gamma_dfa=-0.0464 + [DFA] Ep 40: ||h_L||=1.310e+07 ||g_2||=6.487e-10 acc=0.1055 gamma_dfa=-0.0468 + [DFA] Ep 41: ||h_L||=1.374e+07 ||g_2||=6.225e-10 acc=0.1055 gamma_dfa=-0.0472 + [DFA] Ep 42: ||h_L||=1.425e+07 ||g_2||=5.996e-10 acc=0.1045 gamma_dfa=-0.0476 + [DFA] Ep 43: ||h_L||=1.481e+07 ||g_2||=5.769e-10 acc=0.1064 gamma_dfa=-0.0479 + [DFA] Ep 44: ||h_L||=1.541e+07 ||g_2||=5.581e-10 acc=0.1055 gamma_dfa=-0.0478 + [DFA] Ep 45: ||h_L||=1.599e+07 ||g_2||=5.421e-10 acc=0.0996 gamma_dfa=-0.0483 + [DFA] Ep 46: ||h_L||=1.666e+07 ||g_2||=5.243e-10 acc=0.0986 gamma_dfa=-0.0485 + [DFA] Ep 47: ||h_L||=1.729e+07 ||g_2||=5.089e-10 acc=0.1016 gamma_dfa=-0.0487 + [DFA] Ep 48: ||h_L||=1.781e+07 ||g_2||=4.924e-10 acc=0.1025 gamma_dfa=-0.0493 + [DFA] Ep 49: ||h_L||=1.843e+07 ||g_2||=4.781e-10 acc=0.0986 gamma_dfa=-0.0491 + [DFA] Ep 50: ||h_L||=1.904e+07 ||g_2||=4.645e-10 acc=0.0967 gamma_dfa=-0.0492 + [DFA] Ep 51: ||h_L||=1.963e+07 ||g_2||=4.525e-10 acc=0.0986 gamma_dfa=-0.0493 + [DFA] Ep 52: ||h_L||=2.018e+07 ||g_2||=4.412e-10 acc=0.1016 gamma_dfa=-0.0493 + [DFA] Ep 53: ||h_L||=2.075e+07 ||g_2||=4.318e-10 acc=0.1016 gamma_dfa=-0.0495 + [DFA] Ep 54: ||h_L||=2.129e+07 ||g_2||=4.220e-10 acc=0.1025 gamma_dfa=-0.0497 + [DFA] Ep 55: ||h_L||=2.177e+07 ||g_2||=4.106e-10 acc=0.0986 gamma_dfa=-0.0498 + [DFA] Ep 56: ||h_L||=2.230e+07 ||g_2||=4.025e-10 acc=0.0977 gamma_dfa=-0.0499 + [DFA] Ep 57: ||h_L||=2.282e+07 ||g_2||=3.926e-10 acc=0.0986 gamma_dfa=-0.0499 + [DFA] Ep 58: ||h_L||=2.332e+07 ||g_2||=3.848e-10 acc=0.1016 gamma_dfa=-0.0502 + [DFA] Ep 59: ||h_L||=2.377e+07 ||g_2||=3.788e-10 acc=0.1016 gamma_dfa=-0.0503 + [DFA] Ep 60: ||h_L||=2.424e+07 ||g_2||=3.706e-10 acc=0.0957 gamma_dfa=-0.0505 + [DFA] Ep 61: ||h_L||=2.478e+07 ||g_2||=3.645e-10 acc=0.0986 gamma_dfa=-0.0505 + [DFA] Ep 62: ||h_L||=2.525e+07 ||g_2||=3.598e-10 acc=0.0918 gamma_dfa=-0.0508 + [DFA] Ep 63: ||h_L||=2.563e+07 ||g_2||=3.525e-10 acc=0.0957 gamma_dfa=-0.0507 + [DFA] Ep 64: ||h_L||=2.602e+07 ||g_2||=3.496e-10 acc=0.0908 gamma_dfa=-0.0509 + [DFA] Ep 65: ||h_L||=2.647e+07 ||g_2||=3.439e-10 acc=0.0889 gamma_dfa=-0.0510 + [DFA] Ep 66: ||h_L||=2.684e+07 ||g_2||=3.379e-10 acc=0.0918 gamma_dfa=-0.0510 + [DFA] Ep 67: ||h_L||=2.722e+07 ||g_2||=3.349e-10 acc=0.0889 gamma_dfa=-0.0510 + [DFA] Ep 68: ||h_L||=2.761e+07 ||g_2||=3.320e-10 acc=0.0879 gamma_dfa=-0.0509 + [DFA] Ep 69: ||h_L||=2.793e+07 ||g_2||=3.263e-10 acc=0.0918 gamma_dfa=-0.0509 + [DFA] Ep 70: ||h_L||=2.820e+07 ||g_2||=3.249e-10 acc=0.0889 gamma_dfa=-0.0508 + [DFA] Ep 71: ||h_L||=2.855e+07 ||g_2||=3.204e-10 acc=0.0850 gamma_dfa=-0.0510 + [DFA] Ep 72: ||h_L||=2.879e+07 ||g_2||=3.177e-10 acc=0.0879 gamma_dfa=-0.0509 + [DFA] Ep 73: ||h_L||=2.909e+07 ||g_2||=3.147e-10 acc=0.0859 gamma_dfa=-0.0510 + [DFA] Ep 74: ||h_L||=2.932e+07 ||g_2||=3.129e-10 acc=0.0850 gamma_dfa=-0.0510 + [DFA] Ep 75: ||h_L||=2.950e+07 ||g_2||=3.108e-10 acc=0.0840 gamma_dfa=-0.0510 + [DFA] Ep 76: ||h_L||=2.974e+07 ||g_2||=3.089e-10 acc=0.0879 gamma_dfa=-0.0510 + [DFA] Ep 77: ||h_L||=2.992e+07 ||g_2||=3.063e-10 acc=0.0889 gamma_dfa=-0.0509 + [DFA] Ep 78: ||h_L||=3.012e+07 ||g_2||=3.051e-10 acc=0.0889 gamma_dfa=-0.0510 + [DFA] Ep 79: ||h_L||=3.032e+07 ||g_2||=3.036e-10 acc=0.0879 gamma_dfa=-0.0511 + [DFA] Ep 80: ||h_L||=3.045e+07 ||g_2||=3.023e-10 acc=0.0889 gamma_dfa=-0.0511 + [DFA] Ep 81: ||h_L||=3.059e+07 ||g_2||=3.010e-10 acc=0.0879 gamma_dfa=-0.0511 + [DFA] Ep 82: ||h_L||=3.073e+07 ||g_2||=3.001e-10 acc=0.0889 gamma_dfa=-0.0511 + [DFA] Ep 83: ||h_L||=3.085e+07 ||g_2||=2.991e-10 acc=0.0850 gamma_dfa=-0.0512 + [DFA] Ep 84: ||h_L||=3.096e+07 ||g_2||=2.982e-10 acc=0.0840 gamma_dfa=-0.0512 + [DFA] Ep 85: ||h_L||=3.104e+07 ||g_2||=2.976e-10 acc=0.0889 gamma_dfa=-0.0512 + [DFA] Ep 86: ||h_L||=3.113e+07 ||g_2||=2.967e-10 acc=0.0850 gamma_dfa=-0.0512 + [DFA] Ep 87: ||h_L||=3.120e+07 ||g_2||=2.966e-10 acc=0.0889 gamma_dfa=-0.0512 + [DFA] Ep 88: ||h_L||=3.126e+07 ||g_2||=2.957e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 89: ||h_L||=3.132e+07 ||g_2||=2.956e-10 acc=0.0889 gamma_dfa=-0.0512 + [DFA] Ep 90: ||h_L||=3.137e+07 ||g_2||=2.949e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 91: ||h_L||=3.140e+07 ||g_2||=2.945e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 92: ||h_L||=3.144e+07 ||g_2||=2.947e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 93: ||h_L||=3.146e+07 ||g_2||=2.945e-10 acc=0.0889 gamma_dfa=-0.0512 + [DFA] Ep 94: ||h_L||=3.148e+07 ||g_2||=2.944e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 95: ||h_L||=3.149e+07 ||g_2||=2.942e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 96: ||h_L||=3.150e+07 ||g_2||=2.942e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 97: ||h_L||=3.151e+07 ||g_2||=2.941e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 98: ||h_L||=3.151e+07 ||g_2||=2.941e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 99: ||h_L||=3.151e+07 ||g_2||=2.941e-10 acc=0.0879 gamma_dfa=-0.0512 + [DFA] Ep 100: ||h_L||=3.151e+07 ||g_2||=2.941e-10 acc=0.0879 gamma_dfa=-0.0512 + +Saved results/h2_no_residual_full_s123/snapshot_evolution_s123.json diff --git a/results/h2_no_residual_full_s123/snapshot_evolution_s123.json b/results/h2_no_residual_full_s123/snapshot_evolution_s123.json new file mode 100644 index 0000000..cbad0e4 --- /dev/null +++ b/results/h2_no_residual_full_s123/snapshot_evolution_s123.json @@ -0,0 +1,2749 @@ +{ + "config": { + "output_dir": "results/h2_no_residual_full_s123", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5, + "random_targets": false, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 42.59831619262695, + 44.3453369140625, + 42.22452926635742, + 42.9206428527832 + ], + "bp_grad_norms_per_sample_med": [ + 0.001107031712308526, + 0.00020295626018196344, + 0.00014012052270118147, + 0.00011155186803080142, + 9.737444634083658e-05 + ], + "bp_grad_norms_F": [ + 0.03999145328998566, + 0.006603884976357222, + 0.004542526323348284, + 0.0036035836674273014, + 0.003130683209747076 + ], + "gamma_dfa": 0.014937716419808567, + "acc_eval": 0.1025390625, + "loss_eval": 2.4329679012298584, + "epoch": 0 + }, + { + "hidden_norms": [ + 1439.9598388671875, + 6195.9453125, + 9461.9462890625, + 7636.810546875, + 4633.29296875 + ], + "bp_grad_norms_per_sample_med": [ + 9.333700745628448e-07, + 6.382089736689522e-07, + 6.313390485956916e-07, + 6.29996520729037e-07, + 6.307979560915555e-07 + ], + "bp_grad_norms_F": [ + 5.84688204980921e-05, + 4.571088356897235e-05, + 4.522907693171874e-05, + 4.505911419983022e-05, + 4.481491123442538e-05 + ], + "gamma_dfa": 0.029066061251796782, + "acc_eval": 0.0888671875, + "loss_eval": 2.4298276901245117, + "epoch": 1 + }, + { + "hidden_norms": [ + 3191.640380859375, + 44469.08984375, + 64403.30859375, + 40298.74609375, + 20860.859375 + ], + "bp_grad_norms_per_sample_med": [ + 2.3425519657394034e-07, + 1.0419660867455605e-07, + 1.0399938332739112e-07, + 1.0393744531711491e-07, + 1.040296524479345e-07 + ], + "bp_grad_norms_F": [ + 2.9355647711781785e-05, + 1.3215229955676477e-05, + 1.2938599866174627e-05, + 1.2853749467467424e-05, + 1.2806296581402421e-05 + ], + "gamma_dfa": 0.026177803985774517, + "acc_eval": 0.0849609375, + "loss_eval": 2.450077533721924, + "epoch": 2 + }, + { + "hidden_norms": [ + 5072.8369140625, + 136290.921875, + 174667.984375, + 99872.765625, + 48604.14453125 + ], + "bp_grad_norms_per_sample_med": [ + 1.2239583213613514e-07, + 3.922263758227018e-08, + 3.8977361782599473e-08, + 3.902984602177639e-08, + 3.902538381339582e-08 + ], + "bp_grad_norms_F": [ + 2.021085128944833e-05, + 5.516366400115658e-06, + 5.3598869271809235e-06, + 5.317293016560143e-06, + 5.302062618284253e-06 + ], + "gamma_dfa": 0.025070607429370284, + "acc_eval": 0.1298828125, + "loss_eval": 2.470280170440674, + "epoch": 3 + }, + { + "hidden_norms": [ + 6908.81494140625, + 300140.625, + 335781.1875, + 194737.578125, + 91168.953125 + ], + "bp_grad_norms_per_sample_med": [ + 8.2960639247176e-08, + 2.020572686944888e-08, + 2.0147625789945778e-08, + 2.017927869246705e-08, + 2.0169572678696568e-08 + ], + "bp_grad_norms_F": [ + 1.5067237654875498e-05, + 3.154973455821164e-06, + 2.890229097829433e-06, + 2.8368178845994407e-06, + 2.826985564752249e-06 + ], + "gamma_dfa": 0.0266711818985641, + "acc_eval": 0.125, + "loss_eval": 2.5050950050354004, + "epoch": 4 + }, + { + "hidden_norms": [ + 8695.44140625, + 543316.5625, + 567899.375, + 335584.25, + 145692.765625 + ], + "bp_grad_norms_per_sample_med": [ + 6.380926009796895e-08, + 1.238302882455855e-08, + 1.2337157073716298e-08, + 1.2354545830817187e-08, + 1.2352338707444233e-08 + ], + "bp_grad_norms_F": [ + 1.2898051863885485e-05, + 1.8491266473574797e-06, + 1.7919940091815079e-06, + 1.7602286561668734e-06, + 1.7506840777059551e-06 + ], + "gamma_dfa": 0.022991596721112728, + "acc_eval": 0.115234375, + "loss_eval": 2.5430097579956055, + "epoch": 5 + }, + { + "hidden_norms": [ + 10453.0947265625, + 880568.0625, + 851994.125, + 518617.03125, + 211486.65625 + ], + "bp_grad_norms_per_sample_med": [ + 5.6784926982800243e-08, + 8.739263535062491e-09, + 8.721374733511311e-09, + 8.72691785502866e-09, + 8.722811806194386e-09 + ], + "bp_grad_norms_F": [ + 1.2415013770805672e-05, + 1.2789794254786102e-06, + 1.2444495496310992e-06, + 1.2192489293738618e-06, + 1.2128068647143664e-06 + ], + "gamma_dfa": 0.01671441923826933, + "acc_eval": 0.109375, + "loss_eval": 2.6205759048461914, + "epoch": 6 + }, + { + "hidden_norms": [ + 12133.5908203125, + 1301136.875, + 1213412.0, + 761869.4375, + 299099.96875 + ], + "bp_grad_norms_per_sample_med": [ + 5.181741613569102e-08, + 6.701867505398695e-09, + 6.663806839668496e-09, + 6.668138485821373e-09, + 6.665318963428035e-09 + ], + "bp_grad_norms_F": [ + 1.4586516044801101e-05, + 9.615758926884155e-07, + 9.358571446682618e-07, + 9.15065527351544e-07, + 9.087396506402001e-07 + ], + "gamma_dfa": 0.009791500167921185, + "acc_eval": 0.1103515625, + "loss_eval": 2.687662363052368, + "epoch": 7 + }, + { + "hidden_norms": [ + 13778.3701171875, + 1831990.625, + 1660265.5, + 1070697.0, + 405510.90625 + ], + "bp_grad_norms_per_sample_med": [ + 4.950679510784539e-08, + 5.247439816002952e-09, + 5.240861966626653e-09, + 5.241989065041253e-09, + 5.2364685920736065e-09 + ], + "bp_grad_norms_F": [ + 2.731455424509477e-05, + 7.950770282150188e-07, + 7.47014951230085e-07, + 7.077854888848378e-07, + 7.019767735982896e-07 + ], + "gamma_dfa": 0.002645118860527873, + "acc_eval": 0.1083984375, + "loss_eval": 2.749309539794922, + "epoch": 8 + }, + { + "hidden_norms": [ + 15423.7236328125, + 2441876.0, + 2156981.0, + 1456388.625, + 514814.78125 + ], + "bp_grad_norms_per_sample_med": [ + 4.9704105720138614e-08, + 4.314747670264296e-09, + 4.316281554395118e-09, + 4.3085655043739735e-09, + 4.306641265827693e-09 + ], + "bp_grad_norms_F": [ + 1.53065484482795e-05, + 5.914198482059874e-07, + 5.698148015653715e-07, + 5.564911020883301e-07, + 5.521175125977607e-07 + ], + "gamma_dfa": -0.004648297093808651, + "acc_eval": 0.087890625, + "loss_eval": 2.819417953491211, + "epoch": 9 + }, + { + "hidden_norms": [ + 17014.275390625, + 3299996.25, + 2739406.75, + 1924564.5, + 645257.125 + ], + "bp_grad_norms_per_sample_med": [ + 5.217410503632891e-08, + 3.7931444651917445e-09, + 3.791894354066017e-09, + 3.787997471249582e-09, + 3.786980062869816e-09 + ], + "bp_grad_norms_F": [ + 1.8386483134236187e-05, + 5.170510917196225e-07, + 4.828122541766788e-07, + 4.6214248072828923e-07, + 4.5809062498847197e-07 + ], + "gamma_dfa": -0.008237186702899635, + "acc_eval": 0.0771484375, + "loss_eval": 2.8880226612091064, + "epoch": 10 + }, + { + "hidden_norms": [ + 18615.341796875, + 4327781.5, + 3460663.0, + 2493429.0, + 811358.25 + ], + "bp_grad_norms_per_sample_med": [ + 5.4753250822159316e-08, + 3.4849005903225816e-09, + 3.4845948349016e-09, + 3.4844236385112026e-09, + 3.4833074202822445e-09 + ], + "bp_grad_norms_F": [ + 1.760143095452804e-05, + 4.3398881643952336e-07, + 4.0691622871236177e-07, + 3.9397295381604636e-07, + 3.9136793361649325e-07 + ], + "gamma_dfa": -0.013480214809533209, + "acc_eval": 0.107421875, + "loss_eval": 3.0378975868225098, + "epoch": 11 + }, + { + "hidden_norms": [ + 20197.244140625, + 5361947.0, + 4309913.5, + 3117389.0, + 986810.625 + ], + "bp_grad_norms_per_sample_med": [ + 6.110099803890989e-08, + 3.3039087021791147e-09, + 3.3079554651038734e-09, + 3.309411411578367e-09, + 3.3057334647423886e-09 + ], + "bp_grad_norms_F": [ + 1.7853921235655434e-05, + 3.920526410183811e-07, + 3.4606765098033065e-07, + 3.4065161003127287e-07, + 3.3874636073960573e-07 + ], + "gamma_dfa": -0.017087776213884354, + "acc_eval": 0.1005859375, + "loss_eval": 3.226945161819458, + "epoch": 12 + }, + { + "hidden_norms": [ + 21745.060546875, + 6626533.5, + 5288037.5, + 3845802.25, + 1183958.5 + ], + "bp_grad_norms_per_sample_med": [ + 6.904146232500352e-08, + 3.0698867892198223e-09, + 3.072165188910958e-09, + 3.0722313582032257e-09, + 3.0718891874670362e-09 + ], + "bp_grad_norms_F": [ + 9.694533218862489e-05, + 1.2521383041530498e-06, + 3.6304524542174477e-07, + 3.428452259868209e-07, + 3.3693893897179805e-07 + ], + "gamma_dfa": -0.02254341426305473, + "acc_eval": 0.0888671875, + "loss_eval": 3.4535317420959473, + "epoch": 13 + }, + { + "hidden_norms": [ + 23268.326171875, + 8059270.5, + 6347708.5, + 4634334.0, + 1389795.375 + ], + "bp_grad_norms_per_sample_med": [ + 7.468641882724114e-08, + 3.0219813318410615e-09, + 3.0241904536154607e-09, + 3.0243862969570046e-09, + 3.0241051884871695e-09 + ], + "bp_grad_norms_F": [ + 3.818523691734299e-05, + 3.265660666329495e-07, + 2.885882395275985e-07, + 2.7603223884398176e-07, + 2.7437968697086035e-07 + ], + "gamma_dfa": -0.024787384318187833, + "acc_eval": 0.0830078125, + "loss_eval": 3.7082602977752686, + "epoch": 14 + }, + { + "hidden_norms": [ + 24769.162109375, + 9503637.0, + 7524496.0, + 5577708.5, + 1619056.75 + ], + "bp_grad_norms_per_sample_med": [ + 8.079865665422403e-08, + 2.885043093314721e-09, + 2.8850699607119168e-09, + 2.885329752899679e-09, + 2.885090166770965e-09 + ], + "bp_grad_norms_F": [ + 3.172496144543402e-05, + 2.7863097784575075e-07, + 2.5604617803764995e-07, + 2.4778245233392227e-07, + 2.465397699324967e-07 + ], + "gamma_dfa": -0.028090000618249178, + "acc_eval": 0.09765625, + "loss_eval": 3.9940719604492188, + "epoch": 15 + }, + { + "hidden_norms": [ + 26297.634765625, + 11348280.0, + 8835018.0, + 6709572.0, + 1860997.375 + ], + "bp_grad_norms_per_sample_med": [ + 8.416654395659862e-08, + 2.716076252795574e-09, + 2.708202995194142e-09, + 2.713108182561541e-09, + 2.710037305675428e-09 + ], + "bp_grad_norms_F": [ + 6.21284925728105e-05, + 2.910503269504261e-07, + 2.3999916720640613e-07, + 2.286197116063704e-07, + 2.275272947827034e-07 + ], + "gamma_dfa": -0.0305853869067505, + "acc_eval": 0.10546875, + "loss_eval": 4.280234336853027, + "epoch": 16 + }, + { + "hidden_norms": [ + 27796.267578125, + 13131638.0, + 10275209.0, + 7908104.0, + 2124187.75 + ], + "bp_grad_norms_per_sample_med": [ + 8.618104629931622e-08, + 2.527688947040474e-09, + 2.5195041608583324e-09, + 2.5170519002415404e-09, + 2.5167292694305843e-09 + ], + "bp_grad_norms_F": [ + 2.9607001124531962e-05, + 2.280380755337319e-07, + 2.1368994396198104e-07, + 2.0886261609120993e-07, + 2.0800932531983563e-07 + ], + "gamma_dfa": -0.032157177105546, + "acc_eval": 0.1064453125, + "loss_eval": 4.584749221801758, + "epoch": 17 + }, + { + "hidden_norms": [ + 29261.162109375, + 15093201.0, + 11924527.0, + 9201859.0, + 2398880.25 + ], + "bp_grad_norms_per_sample_med": [ + 8.982802057744266e-08, + 2.362436024583303e-09, + 2.3667561244167246e-09, + 2.3683257577289396e-09, + 2.3661459458423906e-09 + ], + "bp_grad_norms_F": [ + 1.4750239643035457e-05, + 2.0303163239532296e-07, + 1.9652848948226165e-07, + 1.9512303595092817e-07, + 1.9424047081884055e-07 + ], + "gamma_dfa": -0.033276769798249006, + "acc_eval": 0.1064453125, + "loss_eval": 4.833416938781738, + "epoch": 18 + }, + { + "hidden_norms": [ + 30654.640625, + 17198064.0, + 13711921.0, + 10622219.0, + 2733435.75 + ], + "bp_grad_norms_per_sample_med": [ + 9.140238432792103e-08, + 2.218417227695113e-09, + 2.217410255411778e-09, + 2.2205985938938966e-09, + 2.2187365278369953e-09 + ], + "bp_grad_norms_F": [ + 2.2792535673943348e-05, + 2.101570970580724e-07, + 1.8281718894286314e-07, + 1.770977462456358e-07, + 1.7618602043967257e-07 + ], + "gamma_dfa": -0.0334639239590615, + "acc_eval": 0.1064453125, + "loss_eval": 5.091382026672363, + "epoch": 19 + }, + { + "hidden_norms": [ + 32095.28125, + 19561478.0, + 15722807.0, + 12287095.0, + 3104931.75 + ], + "bp_grad_norms_per_sample_med": [ + 9.42815958637766e-08, + 2.0783239573773926e-09, + 2.0685115842411506e-09, + 2.072532145902528e-09, + 2.069893811906809e-09 + ], + "bp_grad_norms_F": [ + 2.035827492363751e-05, + 1.7020983023030567e-07, + 1.504546105479676e-07, + 1.4846344242869236e-07, + 1.4791994829010946e-07 + ], + "gamma_dfa": -0.03437755152117461, + "acc_eval": 0.1044921875, + "loss_eval": 5.338113784790039, + "epoch": 20 + }, + { + "hidden_norms": [ + 33549.3515625, + 22241236.0, + 17865768.0, + 13953577.0, + 3455886.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.694593927633832e-08, + 1.9436505738212873e-09, + 1.932475734989225e-09, + 1.9355790303876574e-09, + 1.9334791545588814e-09 + ], + "bp_grad_norms_F": [ + 1.946108568517957e-05, + 1.476916224874003e-07, + 1.3395830933404795e-07, + 1.3276194010813924e-07, + 1.323410430131844e-07 + ], + "gamma_dfa": -0.035225782776251435, + "acc_eval": 0.1044921875, + "loss_eval": 5.639235496520996, + "epoch": 21 + }, + { + "hidden_norms": [ + 35003.625, + 25199516.0, + 20151382.0, + 15868719.0, + 3834722.75 + ], + "bp_grad_norms_per_sample_med": [ + 9.815706647486877e-08, + 1.8191292916469592e-09, + 1.812876404549968e-09, + 1.8141808055816e-09, + 1.813302730191424e-09 + ], + "bp_grad_norms_F": [ + 1.900309871416539e-05, + 1.3126974351962417e-07, + 1.2148075256845914e-07, + 1.204552404487913e-07, + 1.2008344185687747e-07 + ], + "gamma_dfa": -0.036192891420796514, + "acc_eval": 0.1044921875, + "loss_eval": 5.912903785705566, + "epoch": 22 + }, + { + "hidden_norms": [ + 36385.25390625, + 28323954.0, + 22925044.0, + 17971546.0, + 4269257.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.902030484454372e-08, + 1.6868005880965597e-09, + 1.6695808069400186e-09, + 1.6706477312666834e-09, + 1.6698925575653334e-09 + ], + "bp_grad_norms_F": [ + 1.7624819520278834e-05, + 1.1903176755367895e-07, + 1.1061406013368469e-07, + 1.0976869191381411e-07, + 1.094643096166692e-07 + ], + "gamma_dfa": -0.037227407563477755, + "acc_eval": 0.1044921875, + "loss_eval": 6.16106653213501, + "epoch": 23 + }, + { + "hidden_norms": [ + 37805.91796875, + 31593894.0, + 25615532.0, + 20113868.0, + 4713793.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.859636662667981e-08, + 1.5704177958042465e-09, + 1.5608032644109926e-09, + 1.5628717209281717e-09, + 1.5616322679434802e-09 + ], + "bp_grad_norms_F": [ + 1.6187867004191503e-05, + 1.0865824151551351e-07, + 1.0160825070215651e-07, + 1.008768109045377e-07, + 1.0061884125889264e-07 + ], + "gamma_dfa": -0.03782000340288505, + "acc_eval": 0.1044921875, + "loss_eval": 6.406368732452393, + "epoch": 24 + }, + { + "hidden_norms": [ + 39138.39453125, + 34956036.0, + 28542170.0, + 22404560.0, + 5139918.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.837745551521948e-08, + 1.4733757547347182e-09, + 1.4583911855936549e-09, + 1.4602866693635974e-09, + 1.4591743369152255e-09 + ], + "bp_grad_norms_F": [ + 1.768167749105487e-05, + 1.015666910575419e-07, + 9.354967289709748e-08, + 9.288694968745403e-08, + 9.264899603067533e-08 + ], + "gamma_dfa": -0.03860464284662157, + "acc_eval": 0.1044921875, + "loss_eval": 6.634061813354492, + "epoch": 25 + }, + { + "hidden_norms": [ + 40505.18359375, + 38650996.0, + 31492410.0, + 24792780.0, + 5620949.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.942911560756329e-08, + 1.3685884647784974e-09, + 1.3593203229689266e-09, + 1.3602377002541743e-09, + 1.3594056991195202e-09 + ], + "bp_grad_norms_F": [ + 2.0700817913166247e-05, + 9.837697945158652e-08, + 8.757055525165924e-08, + 8.689728048238976e-08, + 8.669941564676265e-08 + ], + "gamma_dfa": -0.03959248901810497, + "acc_eval": 0.1044921875, + "loss_eval": 6.7737202644348145, + "epoch": 26 + }, + { + "hidden_norms": [ + 41849.203125, + 42830568.0, + 34648896.0, + 27355716.0, + 6044684.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.865106420647862e-08, + 1.28658228515377e-09, + 1.2788612391290144e-09, + 1.2804906024399543e-09, + 1.2795147164013088e-09 + ], + "bp_grad_norms_F": [ + 2.3165159291238524e-05, + 9.389359689748744e-08, + 8.146788132989968e-08, + 8.082054137048544e-08, + 8.063241097033824e-08 + ], + "gamma_dfa": -0.040185014018788934, + "acc_eval": 0.1044921875, + "loss_eval": 6.946921348571777, + "epoch": 27 + }, + { + "hidden_norms": [ + 43129.56640625, + 47054352.0, + 37982196.0, + 29955390.0, + 6540964.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0036384878731042e-07, + 1.2043249730808725e-09, + 1.2007507210753943e-09, + 1.2010574756970982e-09, + 1.2009065963880516e-09 + ], + "bp_grad_norms_F": [ + 2.413927359157242e-05, + 8.847878518736252e-08, + 7.592807094169984e-08, + 7.532069901117211e-08, + 7.515143352065934e-08 + ], + "gamma_dfa": -0.04085268918424845, + "acc_eval": 0.1044921875, + "loss_eval": 7.133134841918945, + "epoch": 28 + }, + { + "hidden_norms": [ + 44368.93359375, + 51374800.0, + 41470788.0, + 32761826.0, + 6998702.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.0049345178231306e-07, + 1.1348291195645288e-09, + 1.132080207355557e-09, + 1.1335333782724888e-09, + 1.1326910520637057e-09 + ], + "bp_grad_norms_F": [ + 2.53067773883231e-05, + 8.518416905189952e-08, + 7.111059119324636e-08, + 7.048716810231781e-08, + 7.034290661067644e-08 + ], + "gamma_dfa": -0.04143569804728031, + "acc_eval": 0.1044921875, + "loss_eval": 7.306489944458008, + "epoch": 29 + }, + { + "hidden_norms": [ + 45540.84375, + 55799284.0, + 44925840.0, + 35576004.0, + 7506460.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.999683214800825e-08, + 1.0682152939978096e-09, + 1.0609697564945009e-09, + 1.0612235534779302e-09, + 1.0610903267149752e-09 + ], + "bp_grad_norms_F": [ + 1.843971222115215e-05, + 8.002744067425738e-08, + 6.616264869307997e-08, + 6.571565336344065e-08, + 6.558265397416108e-08 + ], + "gamma_dfa": -0.04231115654692985, + "acc_eval": 0.1044921875, + "loss_eval": 7.393707752227783, + "epoch": 30 + }, + { + "hidden_norms": [ + 46740.3125, + 60156548.0, + 48609568.0, + 38622656.0, + 7923887.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.801681954968444e-08, + 1.007545269438026e-09, + 1.0030560826379542e-09, + 1.0032202846232963e-09, + 1.003132132915141e-09 + ], + "bp_grad_norms_F": [ + 2.0189601855236106e-05, + 7.754985631436284e-08, + 6.295730514693787e-08, + 6.247479689136526e-08, + 6.235500649154346e-08 + ], + "gamma_dfa": -0.042783402430359274, + "acc_eval": 0.1044921875, + "loss_eval": 7.513785362243652, + "epoch": 31 + }, + { + "hidden_norms": [ + 47946.2578125, + 65027368.0, + 52475872.0, + 41636652.0, + 8527125.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.764004715862029e-08, + 9.540165324395389e-10, + 9.49443301756503e-10, + 9.49665124316823e-10, + 9.49536671512874e-10 + ], + "bp_grad_norms_F": [ + 2.2026428268873133e-05, + 7.400986135053245e-08, + 5.9516974459938865e-08, + 5.903561017817083e-08, + 5.892941956631148e-08 + ], + "gamma_dfa": -0.04377710592234507, + "acc_eval": 0.1044921875, + "loss_eval": 7.666411876678467, + "epoch": 32 + }, + { + "hidden_norms": [ + 49101.84765625, + 70129512.0, + 56707888.0, + 44883068.0, + 9051192.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.715147086808429e-08, + 9.088669261636539e-10, + 8.977363297191232e-10, + 8.978853771601791e-10, + 8.978119914182514e-10 + ], + "bp_grad_norms_F": [ + 2.6852110750041902e-05, + 7.312536354220356e-08, + 5.6589971819676066e-08, + 5.605170372291468e-08, + 5.593761187583368e-08 + ], + "gamma_dfa": -0.04420170868979767, + "acc_eval": 0.1044921875, + "loss_eval": 7.917013645172119, + "epoch": 33 + }, + { + "hidden_norms": [ + 50205.94921875, + 75218112.0, + 61038472.0, + 48316120.0, + 9560446.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.637748377144817e-08, + 8.535361861738977e-10, + 8.499229653402551e-10, + 8.501254145087955e-10, + 8.500238846131936e-10 + ], + "bp_grad_norms_F": [ + 2.704818507481832e-05, + 6.82247573990935e-08, + 5.427460791906924e-08, + 5.371628120087735e-08, + 5.360957899824825e-08 + ], + "gamma_dfa": -0.0447281262895558, + "acc_eval": 0.1064453125, + "loss_eval": 7.9629034996032715, + "epoch": 34 + }, + { + "hidden_norms": [ + 51283.7109375, + 79971480.0, + 65131160.0, + 51675436.0, + 10150061.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.52169543211312e-08, + 8.244336879847936e-10, + 8.130549011831079e-10, + 8.13186962211887e-10, + 8.13120237808107e-10 + ], + "bp_grad_norms_F": [ + 3.043289871129673e-05, + 6.438099831029831e-08, + 5.208626419062057e-08, + 5.1470838258182994e-08, + 5.136259773053098e-08 + ], + "gamma_dfa": -0.04496103324345313, + "acc_eval": 0.1064453125, + "loss_eval": 8.225072860717773, + "epoch": 35 + }, + { + "hidden_norms": [ + 52391.31640625, + 85212368.0, + 69690088.0, + 54922688.0, + 10724330.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.460915606496201e-08, + 7.854291661502089e-10, + 7.73968722445062e-10, + 7.748673369611936e-10, + 7.740979524051284e-10 + ], + "bp_grad_norms_F": [ + 3.253111935919151e-05, + 6.160666288224093e-08, + 5.0236756976573815e-08, + 4.957355770329741e-08, + 4.9483450226261994e-08 + ], + "gamma_dfa": -0.04545678128488362, + "acc_eval": 0.103515625, + "loss_eval": 8.447563171386719, + "epoch": 36 + }, + { + "hidden_norms": [ + 53471.4609375, + 90755416.0, + 74424576.0, + 58527500.0, + 11383908.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.481268392619313e-08, + 7.485803088513876e-10, + 7.380538402657066e-10, + 7.38905825414804e-10, + 7.384990952097326e-10 + ], + "bp_grad_norms_F": [ + 2.8782606023014523e-05, + 5.679364178945434e-08, + 4.747649740011184e-08, + 4.686737042902678e-08, + 4.6776307272011763e-08 + ], + "gamma_dfa": -0.04577424196759239, + "acc_eval": 0.10546875, + "loss_eval": 8.63510513305664, + "epoch": 37 + }, + { + "hidden_norms": [ + 54526.26171875, + 96224200.0, + 79402688.0, + 62338148.0, + 11946441.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.414058155243765e-08, + 7.102119448099131e-10, + 7.013249980758474e-10, + 7.021335179935306e-10, + 7.017796899155826e-10 + ], + "bp_grad_norms_F": [ + 2.6797888494911604e-05, + 5.262990754317798e-08, + 4.363804251283909e-08, + 4.31665583278118e-08, + 4.308598633429028e-08 + ], + "gamma_dfa": -0.04641679968335666, + "acc_eval": 0.10546875, + "loss_eval": 8.730607986450195, + "epoch": 38 + }, + { + "hidden_norms": [ + 55583.125, + 101480040.0, + 83697192.0, + 66218348.0, + 12538905.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.47181035826361e-08, + 6.868624002898116e-10, + 6.774021343858294e-10, + 6.77987721520168e-10, + 6.776118000040299e-10 + ], + "bp_grad_norms_F": [ + 2.6024237740784883e-05, + 5.0800426976138624e-08, + 4.1874233858152365e-08, + 4.15037817447228e-08, + 4.1430755715055056e-08 + ], + "gamma_dfa": -0.04637146886670962, + "acc_eval": 0.10546875, + "loss_eval": 8.87772274017334, + "epoch": 39 + }, + { + "hidden_norms": [ + 56556.95703125, + 107073544.0, + 88369376.0, + 69716112.0, + 13102132.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.377198040283474e-08, + 6.585805234493591e-10, + 6.487251291709129e-10, + 6.49616194170477e-10, + 6.491358561788729e-10 + ], + "bp_grad_norms_F": [ + 3.484269473119639e-05, + 7.467966156582406e-08, + 4.40217604591453e-08, + 4.3712645947380224e-08, + 4.352901683546406e-08 + ], + "gamma_dfa": -0.04681209813861642, + "acc_eval": 0.10546875, + "loss_eval": 9.053573608398438, + "epoch": 40 + }, + { + "hidden_norms": [ + 57504.6875, + 113131968.0, + 93389736.0, + 73651392.0, + 13735091.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.427740366163562e-08, + 6.312518285866986e-10, + 6.225254756131449e-10, + 6.232416249751793e-10, + 6.229293747495035e-10 + ], + "bp_grad_norms_F": [ + 0.00021013167861383408, + 5.526797508537129e-07, + 5.349095744122678e-08, + 4.9017671699402854e-08, + 4.773081840880877e-08 + ], + "gamma_dfa": -0.047232568118488416, + "acc_eval": 0.10546875, + "loss_eval": 9.214558601379395, + "epoch": 41 + }, + { + "hidden_norms": [ + 58472.46875, + 118762648.0, + 98279872.0, + 77365656.0, + 14248840.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.310819137908766e-08, + 6.046827483174866e-10, + 5.995566820793385e-10, + 6.004566288630997e-10, + 5.99891414321263e-10 + ], + "bp_grad_norms_F": [ + 0.00010149624722544104, + 2.533984684305324e-07, + 4.4013567901401984e-08, + 4.291897326424987e-08, + 4.2505401864900705e-08 + ], + "gamma_dfa": -0.04764813384099398, + "acc_eval": 0.1044921875, + "loss_eval": 9.217700958251953, + "epoch": 42 + }, + { + "hidden_norms": [ + 59401.03125, + 124607344.0, + 103250600.0, + 81130456.0, + 14810775.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.245275833791311e-08, + 5.824435378443127e-10, + 5.769146271816794e-10, + 5.777631706394004e-10, + 5.772260447400868e-10 + ], + "bp_grad_norms_F": [ + 4.0584909584140405e-05, + 9.203435524796078e-08, + 3.4605545096155765e-08, + 3.4145575256161464e-08, + 3.4092256129270027e-08 + ], + "gamma_dfa": -0.04794895404484123, + "acc_eval": 0.1064453125, + "loss_eval": 9.390031814575195, + "epoch": 43 + }, + { + "hidden_norms": [ + 60278.7890625, + 130581952.0, + 108096264.0, + 85136336.0, + 15405965.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.3390447375441e-08, + 5.630300670134147e-10, + 5.5805338128323e-10, + 5.588779439236191e-10, + 5.583465911840335e-10 + ], + "bp_grad_norms_F": [ + 4.781157258548774e-05, + 1.0881421275144021e-07, + 3.3062310222931046e-08, + 3.248984370429753e-08, + 3.2446724418377926e-08 + ], + "gamma_dfa": -0.04778411969891749, + "acc_eval": 0.10546875, + "loss_eval": 9.621635437011719, + "epoch": 44 + }, + { + "hidden_norms": [ + 61138.51171875, + 136691760.0, + 113402280.0, + 88772512.0, + 15993850.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.273151135857916e-08, + 5.43037670386326e-10, + 5.421059157129093e-10, + 5.42630551603196e-10, + 5.423762550194056e-10 + ], + "bp_grad_norms_F": [ + 2.6410325517645106e-05, + 4.767177586018079e-08, + 3.172428364450752e-08, + 3.129938974666402e-08, + 3.1260690036560845e-08 + ], + "gamma_dfa": -0.04829322246951051, + "acc_eval": 0.099609375, + "loss_eval": 9.733180046081543, + "epoch": 45 + }, + { + "hidden_norms": [ + 61988.87890625, + 142480176.0, + 118613440.0, + 92755400.0, + 16660659.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.238209486284177e-08, + 5.250901380371431e-10, + 5.242600242816309e-10, + 5.243941947341568e-10, + 5.243331879789537e-10 + ], + "bp_grad_norms_F": [ + 2.4320243028341793e-05, + 4.237628559167206e-08, + 3.048009489248216e-08, + 3.0116801497115375e-08, + 3.0080638424578865e-08 + ], + "gamma_dfa": -0.048452052724314854, + "acc_eval": 0.0986328125, + "loss_eval": 9.875200271606445, + "epoch": 46 + }, + { + "hidden_norms": [ + 62831.0078125, + 148088512.0, + 124018112.0, + 96570944.0, + 17294454.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.218231866725546e-08, + 5.094495381108288e-10, + 5.088939269981552e-10, + 5.090234345139777e-10, + 5.089637600264041e-10 + ], + "bp_grad_norms_F": [ + 2.273459904245101e-05, + 3.8132583313199575e-08, + 2.9463127049211835e-08, + 2.9154062275438264e-08, + 2.9119732403160015e-08 + ], + "gamma_dfa": -0.04870791392750107, + "acc_eval": 0.1015625, + "loss_eval": 9.965906143188477, + "epoch": 47 + }, + { + "hidden_norms": [ + 63619.36328125, + 153924256.0, + 129021120.0, + 100401856.0, + 17813234.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.170297232685698e-08, + 4.942196096813234e-10, + 4.92394736095747e-10, + 4.925179708514804e-10, + 4.924622931667955e-10 + ], + "bp_grad_norms_F": [ + 2.1741494492744096e-05, + 3.567927819858596e-08, + 2.843704471899855e-08, + 2.816011068773605e-08, + 2.812711485944419e-08 + ], + "gamma_dfa": -0.049255506150075234, + "acc_eval": 0.1025390625, + "loss_eval": 9.984619140625, + "epoch": 48 + }, + { + "hidden_norms": [ + 64400.26171875, + 159789408.0, + 134080160.0, + 104244408.0, + 18432430.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.070604534144877e-08, + 4.78996176056512e-10, + 4.780518758629171e-10, + 4.781712803492155e-10, + 4.781176565771261e-10 + ], + "bp_grad_norms_F": [ + 2.1263931557768956e-05, + 3.437593676380857e-08, + 2.7499025279098532e-08, + 2.7248480805042163e-08, + 2.7216600528845447e-08 + ], + "gamma_dfa": -0.04910894545173505, + "acc_eval": 0.0986328125, + "loss_eval": 10.146781921386719, + "epoch": 49 + }, + { + "hidden_norms": [ + 65147.40234375, + 165462976.0, + 138862000.0, + 107834176.0, + 19038348.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.061706407464953e-08, + 4.668093134263529e-10, + 4.645184237261901e-10, + 4.6463269343099967e-10, + 4.6457995783732997e-10 + ], + "bp_grad_norms_F": [ + 2.0052335457876325e-05, + 3.337338227993314e-08, + 2.6690587517919084e-08, + 2.646976504649956e-08, + 2.64381352366172e-08 + ], + "gamma_dfa": -0.04920872090588091, + "acc_eval": 0.0966796875, + "loss_eval": 10.281063079833984, + "epoch": 50 + }, + { + "hidden_norms": [ + 65863.96875, + 171261072.0, + 143810992.0, + 111834848.0, + 19625576.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.099313302840528e-08, + 4.5625103695101643e-10, + 4.524729202426414e-10, + 4.5258219394384014e-10, + 4.5253126246258546e-10 + ], + "bp_grad_norms_F": [ + 1.9101036741631106e-05, + 3.2813989747637606e-08, + 2.5957119120789685e-08, + 2.5756730082093782e-08, + 2.572607549211625e-08 + ], + "gamma_dfa": -0.04933306630846346, + "acc_eval": 0.0986328125, + "loss_eval": 10.349817276000977, + "epoch": 51 + }, + { + "hidden_norms": [ + 66593.8203125, + 176983552.0, + 149183712.0, + 115646976.0, + 20178866.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.1175948568889e-08, + 4.444306589412861e-10, + 4.412468168624173e-10, + 4.4135325949490323e-10, + 4.413052423490882e-10 + ], + "bp_grad_norms_F": [ + 1.852569039328955e-05, + 3.21252677792927e-08, + 2.5265682879194173e-08, + 2.5077683929453087e-08, + 2.5048496610224902e-08 + ], + "gamma_dfa": -0.04927207152650226, + "acc_eval": 0.1015625, + "loss_eval": 10.515829086303711, + "epoch": 52 + }, + { + "hidden_norms": [ + 67302.6328125, + 182834976.0, + 154352272.0, + 119312168.0, + 20747826.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.146700818973841e-08, + 4.3625753010090307e-10, + 4.31810531775767e-10, + 4.319128388274862e-10, + 4.3186304532483177e-10 + ], + "bp_grad_norms_F": [ + 1.817524571379181e-05, + 3.176044671704403e-08, + 2.468624060725233e-08, + 2.4515436791716638e-08, + 2.4487377459081472e-08 + ], + "gamma_dfa": -0.04947220539179398, + "acc_eval": 0.1015625, + "loss_eval": 10.631593704223633, + "epoch": 53 + }, + { + "hidden_norms": [ + 67943.6640625, + 188557808.0, + 159066528.0, + 122911296.0, + 21287842.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.120569188780792e-08, + 4.2657519183642023e-10, + 4.219723181986268e-10, + 4.220687410683155e-10, + 4.220172822311241e-10 + ], + "bp_grad_norms_F": [ + 1.8009301129495725e-05, + 3.077772348092367e-08, + 2.4100344830912945e-08, + 2.3935520232498675e-08, + 2.390864395351855e-08 + ], + "gamma_dfa": -0.04969306073326152, + "acc_eval": 0.1025390625, + "loss_eval": 10.66339111328125, + "epoch": 54 + }, + { + "hidden_norms": [ + 68579.2578125, + 193996528.0, + 163940560.0, + 126448000.0, + 21766094.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.058499728098468e-08, + 4.1539605089013776e-10, + 4.1060946309734447e-10, + 4.1091324787245753e-10, + 4.10790096383451e-10 + ], + "bp_grad_norms_F": [ + 1.5884443200775422e-05, + 2.8224185655290057e-08, + 2.346608596326405e-08, + 2.3316024666542035e-08, + 2.328991399735969e-08 + ], + "gamma_dfa": -0.04980730817624135, + "acc_eval": 0.0986328125, + "loss_eval": 10.783552169799805, + "epoch": 55 + }, + { + "hidden_norms": [ + 69203.796875, + 199460144.0, + 168890016.0, + 129780784.0, + 22302874.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.078585350152935e-08, + 4.0699738024230214e-10, + 4.025394462203735e-10, + 4.0283623659043144e-10, + 4.027146949248106e-10 + ], + "bp_grad_norms_F": [ + 1.5867637557676062e-05, + 2.8422073583556084e-08, + 2.300496149132414e-08, + 2.2864167448233275e-08, + 2.2838495539190262e-08 + ], + "gamma_dfa": -0.04992603903519921, + "acc_eval": 0.09765625, + "loss_eval": 10.859743118286133, + "epoch": 56 + }, + { + "hidden_norms": [ + 69791.453125, + 204736432.0, + 173582192.0, + 133232672.0, + 22820996.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.066331330132016e-08, + 3.96910615485524e-10, + 3.925613167865549e-10, + 3.926495240058614e-10, + 3.9260561468523747e-10 + ], + "bp_grad_norms_F": [ + 1.4505669241771102e-05, + 2.6905636829610557e-08, + 2.2510086239435623e-08, + 2.2376122288392253e-08, + 2.235119467286495e-08 + ], + "gamma_dfa": -0.04994637455092743, + "acc_eval": 0.0986328125, + "loss_eval": 10.989320755004883, + "epoch": 57 + }, + { + "hidden_norms": [ + 70371.9375, + 210191472.0, + 178149376.0, + 136544128.0, + 23324878.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.057572469828301e-08, + 3.849987550985645e-10, + 3.8476868913228657e-10, + 3.8500982957323515e-10, + 3.8497979804041904e-10 + ], + "bp_grad_norms_F": [ + 1.4466082575381733e-05, + 2.6583837353655326e-08, + 2.2064293503376575e-08, + 2.1934541294399423e-08, + 2.191077008717457e-08 + ], + "gamma_dfa": -0.05017502269765828, + "acc_eval": 0.1015625, + "loss_eval": 11.14348030090332, + "epoch": 58 + }, + { + "hidden_norms": [ + 70926.1171875, + 215072384.0, + 182463952.0, + 139682864.0, + 23765930.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.095985831208964e-08, + 3.789666913611711e-10, + 3.7876501934874796e-10, + 3.788162006301832e-10, + 3.7878628011966953e-10 + ], + "bp_grad_norms_F": [ + 1.5613211871823296e-05, + 2.6332656943850452e-08, + 2.168836488181114e-08, + 2.1559124263603735e-08, + 2.1535397465299866e-08 + ], + "gamma_dfa": -0.05026113349595107, + "acc_eval": 0.1015625, + "loss_eval": 11.245050430297852, + "epoch": 59 + }, + { + "hidden_norms": [ + 71444.5078125, + 220139504.0, + 186860912.0, + 142962752.0, + 24235874.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.007455048504198e-08, + 3.741315868222017e-10, + 3.7062136692966874e-10, + 3.705513118568149e-10, + 3.7064074032144845e-10 + ], + "bp_grad_norms_F": [ + 2.3456123017240316e-05, + 2.666844878262964e-08, + 2.1298749430798125e-08, + 2.1137482875133173e-08, + 2.1113727655119874e-08 + ], + "gamma_dfa": -0.050498483098635916, + "acc_eval": 0.095703125, + "loss_eval": 11.284198760986328, + "epoch": 60 + }, + { + "hidden_norms": [ + 71960.484375, + 225013808.0, + 190973296.0, + 145961232.0, + 24784322.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.034386749817713e-08, + 3.658137681661344e-10, + 3.6446287654534615e-10, + 3.645108936911612e-10, + 3.6448208340367216e-10 + ], + "bp_grad_norms_F": [ + 2.785225660772994e-05, + 2.5983931450923592e-08, + 2.1029784136317176e-08, + 2.0842044534674642e-08, + 2.0818688994950207e-08 + ], + "gamma_dfa": -0.05046346641029231, + "acc_eval": 0.0986328125, + "loss_eval": 11.392132759094238, + "epoch": 61 + }, + { + "hidden_norms": [ + 72430.8359375, + 229851040.0, + 195010560.0, + 149020912.0, + 25253220.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.096932984675732e-08, + 3.608093823714853e-10, + 3.5983932500371907e-10, + 3.600989784136033e-10, + 3.599919529140294e-10 + ], + "bp_grad_norms_F": [ + 2.763499469438102e-05, + 2.5544034443214514e-08, + 2.0638090347802063e-08, + 2.0451848214975143e-08, + 2.0428588598520037e-08 + ], + "gamma_dfa": -0.050787233689334244, + "acc_eval": 0.091796875, + "loss_eval": 11.378694534301758, + "epoch": 62 + }, + { + "hidden_norms": [ + 72896.0234375, + 234300800.0, + 198948976.0, + 152100720.0, + 25625868.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.0542243924574e-08, + 3.557290573219518e-10, + 3.5249042573681777e-10, + 3.5253552854719317e-10, + 3.5250652397067483e-10 + ], + "bp_grad_norms_F": [ + 2.9849852580809966e-05, + 2.5036932527200406e-08, + 2.0406586642707225e-08, + 2.020845712991104e-08, + 2.0186647020636883e-08 + ], + "gamma_dfa": -0.05070546226488659, + "acc_eval": 0.095703125, + "loss_eval": 11.479286193847656, + "epoch": 63 + }, + { + "hidden_norms": [ + 73328.34375, + 238316288.0, + 202586032.0, + 155039648.0, + 26024600.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.105094989081408e-08, + 3.510710333554101e-10, + 3.495781997209235e-10, + 3.500161271929869e-10, + 3.499118772509746e-10 + ], + "bp_grad_norms_F": [ + 2.91574870061595e-05, + 2.4413550292479158e-08, + 2.0145231260926266e-08, + 1.9952185681404444e-08, + 1.9931007955165114e-08 + ], + "gamma_dfa": -0.05086314045183826, + "acc_eval": 0.0908203125, + "loss_eval": 11.489895820617676, + "epoch": 64 + }, + { + "hidden_norms": [ + 73748.5859375, + 242733616.0, + 206386528.0, + 157821696.0, + 26465746.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.082241803071156e-08, + 3.460224329288053e-10, + 3.438662687926808e-10, + 3.4428762618610165e-10, + 3.442592599878225e-10 + ], + "bp_grad_norms_F": [ + 2.8733484214171767e-05, + 2.375874608162576e-08, + 1.9914560667189107e-08, + 1.971613627915758e-08, + 1.969561402859199e-08 + ], + "gamma_dfa": -0.05102878155594226, + "acc_eval": 0.0888671875, + "loss_eval": 11.548040390014648, + "epoch": 65 + }, + { + "hidden_norms": [ + 74135.421875, + 246595824.0, + 209988560.0, + 160289792.0, + 26835076.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.098909714566616e-08, + 3.4202959908746777e-10, + 3.378679835908116e-10, + 3.3727598491850586e-10, + 3.370834167348846e-10 + ], + "bp_grad_norms_F": [ + 2.7568949008127674e-05, + 2.2366455354472237e-08, + 1.9751842827986366e-08, + 1.955501183203978e-08, + 1.9534347472927038e-08 + ], + "gamma_dfa": -0.05096771135140443, + "acc_eval": 0.091796875, + "loss_eval": 11.69294548034668, + "epoch": 66 + }, + { + "hidden_norms": [ + 74519.4609375, + 250496496.0, + 213470016.0, + 163034096.0, + 27224026.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.081137619659785e-08, + 3.371838919186132e-10, + 3.34856059547306e-10, + 3.351785793359596e-10, + 3.353441968556581e-10 + ], + "bp_grad_norms_F": [ + 2.4417575332336128e-05, + 2.182440006492925e-08, + 1.9469752032819088e-08, + 1.9279319474208023e-08, + 1.925921822021337e-08 + ], + "gamma_dfa": -0.051001671119593084, + "acc_eval": 0.0888671875, + "loss_eval": 11.729022026062012, + "epoch": 67 + }, + { + "hidden_norms": [ + 74894.3515625, + 254264416.0, + 216871648.0, + 165452496.0, + 27605496.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.085709962164401e-08, + 3.3377053898497877e-10, + 3.3198219173691257e-10, + 3.3151825729049733e-10, + 3.3171596025560746e-10 + ], + "bp_grad_norms_F": [ + 2.2483380234916694e-05, + 2.14983302271321e-08, + 1.9263785233647468e-08, + 1.9080003355043118e-08, + 1.9060196976283805e-08 + ], + "gamma_dfa": -0.050941091212735046, + "acc_eval": 0.087890625, + "loss_eval": 11.798931121826172, + "epoch": 68 + }, + { + "hidden_norms": [ + 75242.4609375, + 257808672.0, + 219912720.0, + 167826688.0, + 27928376.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.091576913533572e-08, + 3.2881539158147177e-10, + 3.263028736100182e-10, + 3.2664609905808106e-10, + 3.264644665712524e-10 + ], + "bp_grad_norms_F": [ + 2.127209518221207e-05, + 2.0985540416518234e-08, + 1.9050151678356997e-08, + 1.8875326190936903e-08, + 1.8856361805319466e-08 + ], + "gamma_dfa": -0.05089846828195732, + "acc_eval": 0.091796875, + "loss_eval": 11.895479202270508, + "epoch": 69 + }, + { + "hidden_norms": [ + 75572.1171875, + 261119824.0, + 222742832.0, + 169876672.0, + 28198556.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.057247041255323e-08, + 3.278008420259937e-10, + 3.249100710700503e-10, + 3.242202339936995e-10, + 3.244049195938459e-10 + ], + "bp_grad_norms_F": [ + 1.884793528006412e-05, + 2.07159356335751e-08, + 1.889556244805135e-08, + 1.8724394479363582e-08, + 1.8705017978959404e-08 + ], + "gamma_dfa": -0.05079331841261592, + "acc_eval": 0.0888671875, + "loss_eval": 11.890766143798828, + "epoch": 70 + }, + { + "hidden_norms": [ + 75874.0546875, + 264210176.0, + 225470416.0, + 172025616.0, + 28547836.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.025038849586053e-08, + 3.2404043337486144e-10, + 3.204363163700208e-10, + 3.2077221434612113e-10, + 3.205906651260193e-10 + ], + "bp_grad_norms_F": [ + 1.7337119061267003e-05, + 2.020676426184309e-08, + 1.872472488173571e-08, + 1.8554693781425158e-08, + 1.853570097409829e-08 + ], + "gamma_dfa": -0.05096161225810647, + "acc_eval": 0.0849609375, + "loss_eval": 11.900531768798828, + "epoch": 71 + }, + { + "hidden_norms": [ + 76155.671875, + 267008752.0, + 228187344.0, + 173959248.0, + 28788394.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.046407711821303e-08, + 3.195448350368224e-10, + 3.1774499698045133e-10, + 3.1807836919917065e-10, + 3.179001784037183e-10 + ], + "bp_grad_norms_F": [ + 1.667224569246173e-05, + 2.00564560515204e-08, + 1.8585067707022063e-08, + 1.8417832592376726e-08, + 1.8399065382368462e-08 + ], + "gamma_dfa": -0.05094757055485388, + "acc_eval": 0.087890625, + "loss_eval": 11.944206237792969, + "epoch": 72 + }, + { + "hidden_norms": [ + 76421.0625, + 269839616.0, + 230674688.0, + 175791728.0, + 29094570.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.012642010475247e-08, + 3.166587547731581e-10, + 3.1469221672963954e-10, + 3.1502128683413844e-10, + 3.1484426177286196e-10 + ], + "bp_grad_norms_F": [ + 1.6745894754421897e-05, + 1.9875857404372255e-08, + 1.840698438115851e-08, + 1.8240543298020384e-08, + 1.822207096324746e-08 + ], + "gamma_dfa": -0.05100561307335738, + "acc_eval": 0.0859375, + "loss_eval": 11.99311637878418, + "epoch": 73 + }, + { + "hidden_norms": [ + 76664.2734375, + 272336768.0, + 232959216.0, + 177609664.0, + 29323556.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.990726030333462e-08, + 3.1504263087178686e-10, + 3.12906783817013e-10, + 3.131215564611267e-10, + 3.1305841252660116e-10 + ], + "bp_grad_norms_F": [ + 1.6934929590206593e-05, + 1.98417797747652e-08, + 1.8281056668456586e-08, + 1.8116447009219883e-08, + 1.8098068821359448e-08 + ], + "gamma_dfa": -0.05103835645422805, + "acc_eval": 0.0849609375, + "loss_eval": 12.02127456665039, + "epoch": 74 + }, + { + "hidden_norms": [ + 76888.4921875, + 274732928.0, + 235060816.0, + 179132768.0, + 29504610.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.986659594256707e-08, + 3.121746194878483e-10, + 3.1075714224115814e-10, + 3.1084415597071313e-10, + 3.1076746731528715e-10 + ], + "bp_grad_norms_F": [ + 1.7154834495158866e-05, + 1.9609577961432478e-08, + 1.816025729795001e-08, + 1.7994944201404905e-08, + 1.7976633515104368e-08 + ], + "gamma_dfa": -0.05099774348491337, + "acc_eval": 0.083984375, + "loss_eval": 12.060166358947754, + "epoch": 75 + }, + { + "hidden_norms": [ + 77091.2421875, + 277045280.0, + 237230640.0, + 180794320.0, + 29739022.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.99742147453253e-08, + 3.103251822178521e-10, + 3.08925968139917e-10, + 3.089623279439735e-10, + 3.0893596014713864e-10 + ], + "bp_grad_norms_F": [ + 1.679581509961281e-05, + 1.951891448470633e-08, + 1.803828730828627e-08, + 1.787446990419994e-08, + 1.785628889194868e-08 + ], + "gamma_dfa": -0.050966299066203646, + "acc_eval": 0.087890625, + "loss_eval": 12.12912654876709, + "epoch": 76 + }, + { + "hidden_norms": [ + 77280.328125, + 279085056.0, + 239194416.0, + 182229856.0, + 29919720.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.955728958426334e-08, + 3.0862179478674534e-10, + 3.06326686239089e-10, + 3.067510134791007e-10, + 3.0670044282032904e-10 + ], + "bp_grad_norms_F": [ + 1.6653601051075384e-05, + 1.913345748505435e-08, + 1.7934322471546693e-08, + 1.7773432503531694e-08, + 1.7755372283545512e-08 + ], + "gamma_dfa": -0.050885657081380486, + "acc_eval": 0.0888671875, + "loss_eval": 12.196252822875977, + "epoch": 77 + }, + { + "hidden_norms": [ + 77464.84375, + 281044160.0, + 241080400.0, + 183481632.0, + 30118970.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.968549281007654e-08, + 3.077238464044285e-10, + 3.0509625381647254e-10, + 3.05251185439559e-10, + 3.0514471505149743e-10 + ], + "bp_grad_norms_F": [ + 1.6696472812327556e-05, + 1.9041245025164244e-08, + 1.7839029808897067e-08, + 1.767946500308426e-08, + 1.766149004822637e-08 + ], + "gamma_dfa": -0.05102008958783699, + "acc_eval": 0.0888671875, + "loss_eval": 12.193323135375977, + "epoch": 78 + }, + { + "hidden_norms": [ + 77630.7734375, + 282858400.0, + 242823728.0, + 184645696.0, + 30321804.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.95526710564809e-08, + 3.0606236989250135e-10, + 3.0359312286343254e-10, + 3.0362826142216193e-10, + 3.0360203240320516e-10 + ], + "bp_grad_norms_F": [ + 1.670894562266767e-05, + 1.8970476745039377e-08, + 1.7750505065805555e-08, + 1.7592398648957897e-08, + 1.7574748767401616e-08 + ], + "gamma_dfa": -0.05112272154656239, + "acc_eval": 0.087890625, + "loss_eval": 12.226293563842773, + "epoch": 79 + }, + { + "hidden_norms": [ + 77779.6484375, + 284380192.0, + 244252416.0, + 185749600.0, + 30452270.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.966701159351942e-08, + 3.0471447587387956e-10, + 3.022795902474229e-10, + 3.0231497860633283e-10, + 3.022894989879177e-10 + ], + "bp_grad_norms_F": [ + 1.6740978026064113e-05, + 1.889440781610574e-08, + 1.7666355489609487e-08, + 1.7510158656364183e-08, + 1.749260469807723e-08 + ], + "gamma_dfa": -0.05107468220376177, + "acc_eval": 0.0888671875, + "loss_eval": 12.260065078735352, + "epoch": 80 + }, + { + "hidden_norms": [ + 77920.109375, + 285895104.0, + 245542864.0, + 186746576.0, + 30585936.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.98649830105569e-08, + 3.0335337020126474e-10, + 3.010065807718121e-10, + 3.0114838400763233e-10, + 3.010563187633153e-10 + ], + "bp_grad_norms_F": [ + 1.6312769730575383e-05, + 1.8841578963701977e-08, + 1.7605929159003608e-08, + 1.7449115929935033e-08, + 1.7431389665034658e-08 + ], + "gamma_dfa": -0.051095581700792536, + "acc_eval": 0.087890625, + "loss_eval": 12.283187866210938, + "epoch": 81 + }, + { + "hidden_norms": [ + 78045.9765625, + 287308480.0, + 246744592.0, + 187657408.0, + 30732464.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.991665367830137e-08, + 3.023456207618125e-10, + 3.001092707677344e-10, + 3.002506299143448e-10, + 3.001580373140911e-10 + ], + "bp_grad_norms_F": [ + 1.6261117707472295e-05, + 1.8763861575621377e-08, + 1.7538225094426707e-08, + 1.73831011807124e-08, + 1.7365564985993842e-08 + ], + "gamma_dfa": -0.05111259325349238, + "acc_eval": 0.0888671875, + "loss_eval": 12.312464714050293, + "epoch": 82 + }, + { + "hidden_norms": [ + 78157.4453125, + 288495296.0, + 247894048.0, + 188423328.0, + 30852564.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.983852950450455e-08, + 3.0117680571706273e-10, + 2.9906743748142617e-10, + 2.9920824151652425e-10, + 2.991159819831779e-10 + ], + "bp_grad_norms_F": [ + 1.6263733414234594e-05, + 1.8713789629032362e-08, + 1.7478631875178507e-08, + 1.7324792267459088e-08, + 1.730730758708887e-08 + ], + "gamma_dfa": -0.05116538004585891, + "acc_eval": 0.0849609375, + "loss_eval": 12.31210994720459, + "epoch": 83 + }, + { + "hidden_norms": [ + 78262.0234375, + 289603808.0, + 248882656.0, + 189149776.0, + 30956266.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.960672204239017e-08, + 3.0011432228249646e-10, + 2.9822597169548715e-10, + 2.9836624837464853e-10, + 2.9827409986360465e-10 + ], + "bp_grad_norms_F": [ + 1.631741542951204e-05, + 1.8692462688818523e-08, + 1.7431661447631086e-08, + 1.7277525188319487e-08, + 1.725989662304528e-08 + ], + "gamma_dfa": -0.05115435087645892, + "acc_eval": 0.083984375, + "loss_eval": 12.336039543151855, + "epoch": 84 + }, + { + "hidden_norms": [ + 78353.1171875, + 290648000.0, + 249810592.0, + 189809696.0, + 31040388.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.986083344098006e-08, + 2.995071968214802e-10, + 2.9758684405578606e-10, + 2.977268154236157e-10, + 2.9763422282336194e-10 + ], + "bp_grad_norms_F": [ + 1.6262692952295765e-05, + 1.849162600819909e-08, + 1.73968519590062e-08, + 1.7244063954535704e-08, + 1.7226579274165488e-08 + ], + "gamma_dfa": -0.05118084823334357, + "acc_eval": 0.0888671875, + "loss_eval": 12.381507873535156, + "epoch": 85 + }, + { + "hidden_norms": [ + 78431.15625, + 291523168.0, + 250644688.0, + 190386224.0, + 31126390.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.970421561116382e-08, + 2.984960056906516e-10, + 2.967268375453358e-10, + 2.968662538016531e-10, + 2.967753265359363e-10 + ], + "bp_grad_norms_F": [ + 1.6223337297560647e-05, + 1.8457278372352448e-08, + 1.7345271885460534e-08, + 1.7192725465520198e-08, + 1.717533315570563e-08 + ], + "gamma_dfa": -0.05117447574957623, + "acc_eval": 0.0849609375, + "loss_eval": 12.38785171508789, + "epoch": 86 + }, + { + "hidden_norms": [ + 78499.1484375, + 292312512.0, + 251365920.0, + 190918880.0, + 31200688.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.988487110173082e-08, + 2.980244662165177e-10, + 2.966143997085169e-10, + 2.96407148825395e-10, + 2.965439005464532e-10 + ], + "bp_grad_norms_F": [ + 1.627574602025561e-05, + 1.8460895034877467e-08, + 1.7314020439584965e-08, + 1.7161701393320072e-08, + 1.714437836142224e-08 + ], + "gamma_dfa": -0.05115793484583264, + "acc_eval": 0.0888671875, + "loss_eval": 12.419504165649414, + "epoch": 87 + }, + { + "hidden_norms": [ + 78560.8984375, + 292944192.0, + 251977760.0, + 191372272.0, + 31263360.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.973138676537928e-08, + 2.973402635220168e-10, + 2.9567431836241553e-10, + 2.958131239960693e-10, + 2.957224187749574e-10 + ], + "bp_grad_norms_F": [ + 1.628614336368628e-05, + 1.8427853021307783e-08, + 1.72794418773492e-08, + 1.7127625540069857e-08, + 1.7110302508172026e-08 + ], + "gamma_dfa": -0.0511754965664295, + "acc_eval": 0.087890625, + "loss_eval": 12.422038078308105, + "epoch": 88 + }, + { + "hidden_norms": [ + 78610.8515625, + 293507168.0, + 252467824.0, + 191746752.0, + 31315682.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.979492349681095e-08, + 2.9698124515142865e-10, + 2.9562619019429803e-10, + 2.9538149703967065e-10, + 2.9551999736199264e-10 + ], + "bp_grad_norms_F": [ + 1.631640589039307e-05, + 1.8418628400240777e-08, + 1.726077947239446e-08, + 1.710880859207009e-08, + 1.709145003303547e-08 + ], + "gamma_dfa": -0.051156919635104714, + "acc_eval": 0.0888671875, + "loss_eval": 12.428571701049805, + "epoch": 89 + }, + { + "hidden_norms": [ + 78652.9921875, + 293964640.0, + 252896208.0, + 192039472.0, + 31369200.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.969335141273405e-08, + 2.9646449184461687e-10, + 2.949255561990327e-10, + 2.949690214304468e-10, + 2.9487870478739353e-10 + ], + "bp_grad_norms_F": [ + 1.6324445823556744e-05, + 1.8399745727037953e-08, + 1.7238173555256253e-08, + 1.7086200898575044e-08, + 1.7068817470544673e-08 + ], + "gamma_dfa": -0.051174478845496196, + "acc_eval": 0.087890625, + "loss_eval": 12.429685592651367, + "epoch": 90 + }, + { + "hidden_norms": [ + 78686.6953125, + 294364864.0, + 253268672.0, + 192287472.0, + 31404650.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.964375552977799e-08, + 2.960394152040635e-10, + 2.9448907201690133e-10, + 2.9462729478346716e-10, + 2.9453686711811145e-10 + ], + "bp_grad_norms_F": [ + 1.5716021152911708e-05, + 1.8335738261043844e-08, + 1.7222946624428914e-08, + 1.7072181890398497e-08, + 1.7054745171662944e-08 + ], + "gamma_dfa": -0.05117890803012415, + "acc_eval": 0.087890625, + "loss_eval": 12.430795669555664, + "epoch": 91 + }, + { + "hidden_norms": [ + 78715.6640625, + 294704960.0, + 253580416.0, + 192507984.0, + 31439268.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.966816267275135e-08, + 2.9585070504545286e-10, + 2.9467184248233025e-10, + 2.944416099825986e-10, + 2.943854882087038e-10 + ], + "bp_grad_norms_F": [ + 1.575841633894015e-05, + 1.832342988450364e-08, + 1.7211402081329652e-08, + 1.7061056567513333e-08, + 1.704364827048721e-08 + ], + "gamma_dfa": -0.05119702904630685, + "acc_eval": 0.087890625, + "loss_eval": 12.439577102661133, + "epoch": 92 + }, + { + "hidden_norms": [ + 78736.21875, + 294950432.0, + 253812928.0, + 192667952.0, + 31460118.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.969291798166523e-08, + 2.956498934558738e-10, + 2.9448718463775947e-10, + 2.947934119035267e-10, + 2.946275168280721e-10 + ], + "bp_grad_norms_F": [ + 1.5731959138065577e-05, + 1.8296260506645012e-08, + 1.719953068857194e-08, + 1.7050359346626465e-08, + 1.703298835309397e-08 + ], + "gamma_dfa": -0.05120327511394862, + "acc_eval": 0.0888671875, + "loss_eval": 12.4466552734375, + "epoch": 93 + }, + { + "hidden_norms": [ + 78753.203125, + 295147232.0, + 253989200.0, + 192796160.0, + 31479312.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.963842645925979e-08, + 2.9541508128616556e-10, + 2.9437702275814104e-10, + 2.943085775086729e-10, + 2.9446245441988594e-10 + ], + "bp_grad_norms_F": [ + 1.573332519910764e-05, + 1.8288872638549947e-08, + 1.718973052788897e-08, + 1.7040525435163545e-08, + 1.7023159770701568e-08 + ], + "gamma_dfa": -0.051216166342783254, + "acc_eval": 0.087890625, + "loss_eval": 12.445267677307129, + "epoch": 94 + }, + { + "hidden_norms": [ + 78765.84375, + 295294944.0, + 254123440.0, + 192894032.0, + 31493604.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.965194098209395e-08, + 2.9531932455029164e-10, + 2.942409649264732e-10, + 2.945468868809087e-10, + 2.943810750721809e-10 + ], + "bp_grad_norms_F": [ + 1.5746687495266087e-05, + 1.8289329162257673e-08, + 1.7184650147328284e-08, + 1.703533136776514e-08, + 1.7017976361444198e-08 + ], + "gamma_dfa": -0.0512156481272541, + "acc_eval": 0.087890625, + "loss_eval": 12.449201583862305, + "epoch": 95 + }, + { + "hidden_norms": [ + 78774.0859375, + 295388160.0, + 254208896.0, + 192955280.0, + 31502434.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.963444741993953e-08, + 2.9521793343256775e-10, + 2.941772103692841e-10, + 2.944521015901813e-10, + 2.9431723724826497e-10 + ], + "bp_grad_norms_F": [ + 1.574558154970873e-05, + 1.8287312997244953e-08, + 1.7180775913061552e-08, + 1.7031513976917267e-08, + 1.7014160746953166e-08 + ], + "gamma_dfa": -0.051216532388934866, + "acc_eval": 0.087890625, + "loss_eval": 12.451032638549805, + "epoch": 96 + }, + { + "hidden_norms": [ + 78778.2109375, + 295438176.0, + 254253040.0, + 192987616.0, + 31507318.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.962313557958623e-08, + 2.951474897816553e-10, + 2.9410018864695076e-10, + 2.9431876380492383e-10, + 2.9424027103708283e-10 + ], + "bp_grad_norms_F": [ + 1.5746518329251558e-05, + 1.8286739233985827e-08, + 1.717829789527059e-08, + 1.7028938259500137e-08, + 1.7011583253179197e-08 + ], + "gamma_dfa": -0.051216747364378534, + "acc_eval": 0.087890625, + "loss_eval": 12.451074600219727, + "epoch": 97 + }, + { + "hidden_norms": [ + 78782.125, + 295481568.0, + 254291456.0, + 193016112.0, + 31511684.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.962148712043927e-08, + 2.9511454391339953e-10, + 2.9406876933535386e-10, + 2.942796561988814e-10, + 2.9420885172548594e-10 + ], + "bp_grad_norms_F": [ + 1.574746784172021e-05, + 1.8285794212147266e-08, + 1.7176807531882332e-08, + 1.7027431908900326e-08, + 1.7010076902579385e-08 + ], + "gamma_dfa": -0.05121716375651886, + "acc_eval": 0.087890625, + "loss_eval": 12.451665878295898, + "epoch": 98 + }, + { + "hidden_norms": [ + 78783.9921875, + 295502592.0, + 254310320.0, + 193029024.0, + 31513524.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.961931285966784e-08, + 2.950964195225225e-10, + 2.940539201023995e-10, + 2.942680543682741e-10, + 2.941940024925316e-10 + ], + "bp_grad_norms_F": [ + 1.5747409634059295e-05, + 1.8284790570533005e-08, + 1.717580744298175e-08, + 1.702643714907026e-08, + 1.700908214274932e-08 + ], + "gamma_dfa": -0.05121721836621873, + "acc_eval": 0.087890625, + "loss_eval": 12.452173233032227, + "epoch": 99 + }, + { + "hidden_norms": [ + 78784.0078125, + 295502688.0, + 254310576.0, + 193029360.0, + 31513636.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.96192702271037e-08, + 2.9509686361173237e-10, + 2.940537813245214e-10, + 2.9426569514434675e-10, + 2.941938359590779e-10 + ], + "bp_grad_norms_F": [ + 1.5747655197628774e-05, + 1.8284845637595026e-08, + 1.7175850075545895e-08, + 1.7026476228920728e-08, + 1.7009122998956627e-08 + ], + "gamma_dfa": -0.05121716100984486, + "acc_eval": 0.087890625, + "loss_eval": 12.452241897583008, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/h2_no_residual_full_s42.log b/results/h2_no_residual_full_s42.log new file mode 100644 index 0000000..aa55d2f --- /dev/null +++ b/results/h2_no_residual_full_s42.log @@ -0,0 +1,210 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=42 +eval buffer: torch.Size([1024, 3072]) + +=== BP training === + [BP] Ep 0: ||h||_med=[8.718070030212402, 42.802223205566406, 44.22697067260742, 46.05121994018555, 46.896766662597656] ||g||_med=[0.0010791289387270808, 0.0002035950165009126, 0.00014324457151815295, 0.00011542177526280284, 9.846547618508339e-05] acc=0.0801 + [BP] Ep 1: ||h_L||=1.553e+02 ||g_2||=4.255e-05 acc=0.1436 + [BP] Ep 2: ||h_L||=1.931e+02 ||g_2||=3.570e-05 acc=0.1729 + [BP] Ep 3: ||h_L||=2.162e+02 ||g_2||=3.247e-05 acc=0.1777 + [BP] Ep 4: ||h_L||=2.442e+02 ||g_2||=3.064e-05 acc=0.2012 + [BP] Ep 5: ||h_L||=2.665e+02 ||g_2||=2.965e-05 acc=0.2051 + [BP] Ep 6: ||h_L||=2.731e+02 ||g_2||=2.925e-05 acc=0.2012 + [BP] Ep 7: ||h_L||=2.942e+02 ||g_2||=2.887e-05 acc=0.1895 + [BP] Ep 8: ||h_L||=3.166e+02 ||g_2||=2.825e-05 acc=0.2031 + [BP] Ep 9: ||h_L||=3.356e+02 ||g_2||=2.795e-05 acc=0.1895 + [BP] Ep 10: ||h_L||=3.641e+02 ||g_2||=2.808e-05 acc=0.1885 + [BP] Ep 11: ||h_L||=3.736e+02 ||g_2||=2.828e-05 acc=0.1836 + [BP] Ep 12: ||h_L||=3.991e+02 ||g_2||=2.830e-05 acc=0.1973 + [BP] Ep 13: ||h_L||=4.056e+02 ||g_2||=2.779e-05 acc=0.1865 + [BP] Ep 14: ||h_L||=4.022e+02 ||g_2||=2.821e-05 acc=0.1777 + [BP] Ep 15: ||h_L||=4.162e+02 ||g_2||=2.889e-05 acc=0.1650 + [BP] Ep 16: ||h_L||=4.264e+02 ||g_2||=2.814e-05 acc=0.1748 + [BP] Ep 17: ||h_L||=4.399e+02 ||g_2||=2.813e-05 acc=0.1758 + [BP] Ep 18: ||h_L||=4.389e+02 ||g_2||=2.840e-05 acc=0.1748 + [BP] Ep 19: ||h_L||=4.464e+02 ||g_2||=2.867e-05 acc=0.1729 + [BP] Ep 20: ||h_L||=4.644e+02 ||g_2||=2.883e-05 acc=0.1670 + [BP] Ep 21: ||h_L||=4.655e+02 ||g_2||=2.849e-05 acc=0.1719 + [BP] Ep 22: ||h_L||=4.816e+02 ||g_2||=2.889e-05 acc=0.1592 + [BP] Ep 23: ||h_L||=4.586e+02 ||g_2||=2.932e-05 acc=0.1436 + [BP] Ep 24: ||h_L||=4.573e+02 ||g_2||=2.953e-05 acc=0.1611 + [BP] Ep 25: ||h_L||=4.734e+02 ||g_2||=3.039e-05 acc=0.1455 + [BP] Ep 26: ||h_L||=4.788e+02 ||g_2||=2.986e-05 acc=0.1406 + [BP] Ep 27: ||h_L||=4.735e+02 ||g_2||=3.057e-05 acc=0.1387 + [BP] Ep 28: ||h_L||=4.861e+02 ||g_2||=3.073e-05 acc=0.1299 + [BP] Ep 29: ||h_L||=4.687e+02 ||g_2||=3.094e-05 acc=0.1230 + [BP] Ep 30: ||h_L||=4.786e+02 ||g_2||=3.044e-05 acc=0.1318 + [BP] Ep 31: ||h_L||=4.494e+02 ||g_2||=3.108e-05 acc=0.1309 + [BP] Ep 32: ||h_L||=4.589e+02 ||g_2||=3.128e-05 acc=0.1377 + [BP] Ep 33: ||h_L||=4.573e+02 ||g_2||=3.159e-05 acc=0.1289 + [BP] Ep 34: ||h_L||=4.612e+02 ||g_2||=3.172e-05 acc=0.1279 + [BP] Ep 35: ||h_L||=4.643e+02 ||g_2||=3.162e-05 acc=0.1230 + [BP] Ep 36: ||h_L||=4.563e+02 ||g_2||=3.195e-05 acc=0.1338 + [BP] Ep 37: ||h_L||=4.468e+02 ||g_2||=3.219e-05 acc=0.1279 + [BP] Ep 38: ||h_L||=4.199e+02 ||g_2||=3.231e-05 acc=0.1348 + [BP] Ep 39: ||h_L||=4.249e+02 ||g_2||=3.235e-05 acc=0.1123 + [BP] Ep 40: ||h_L||=4.160e+02 ||g_2||=3.311e-05 acc=0.1172 + [BP] Ep 41: ||h_L||=4.131e+02 ||g_2||=3.336e-05 acc=0.1191 + [BP] Ep 42: ||h_L||=4.131e+02 ||g_2||=3.329e-05 acc=0.1084 + [BP] Ep 43: ||h_L||=3.986e+02 ||g_2||=3.373e-05 acc=0.1074 + [BP] Ep 44: ||h_L||=3.907e+02 ||g_2||=3.344e-05 acc=0.1240 + [BP] Ep 45: ||h_L||=3.760e+02 ||g_2||=3.396e-05 acc=0.1152 + [BP] Ep 46: ||h_L||=3.736e+02 ||g_2||=3.432e-05 acc=0.1123 + [BP] Ep 47: ||h_L||=3.586e+02 ||g_2||=3.479e-05 acc=0.1133 + [BP] Ep 48: ||h_L||=3.632e+02 ||g_2||=3.458e-05 acc=0.1084 + [BP] Ep 49: ||h_L||=3.485e+02 ||g_2||=3.495e-05 acc=0.1055 + [BP] Ep 50: ||h_L||=3.437e+02 ||g_2||=3.525e-05 acc=0.0957 + [BP] Ep 51: ||h_L||=3.300e+02 ||g_2||=3.516e-05 acc=0.1055 + [BP] Ep 52: ||h_L||=3.224e+02 ||g_2||=3.584e-05 acc=0.0996 + [BP] Ep 53: ||h_L||=2.983e+02 ||g_2||=3.604e-05 acc=0.1025 + [BP] Ep 54: ||h_L||=2.993e+02 ||g_2||=3.617e-05 acc=0.0898 + [BP] Ep 55: ||h_L||=2.992e+02 ||g_2||=3.674e-05 acc=0.0889 + [BP] Ep 56: ||h_L||=2.884e+02 ||g_2||=3.681e-05 acc=0.0908 + [BP] Ep 57: ||h_L||=2.793e+02 ||g_2||=3.732e-05 acc=0.0977 + [BP] Ep 58: ||h_L||=2.685e+02 ||g_2||=3.709e-05 acc=0.0938 + [BP] Ep 59: ||h_L||=2.631e+02 ||g_2||=3.763e-05 acc=0.0938 + [BP] Ep 60: ||h_L||=2.557e+02 ||g_2||=3.750e-05 acc=0.1035 + [BP] Ep 61: ||h_L||=2.525e+02 ||g_2||=3.791e-05 acc=0.0947 + [BP] Ep 62: ||h_L||=2.432e+02 ||g_2||=3.832e-05 acc=0.0996 + [BP] Ep 63: ||h_L||=2.397e+02 ||g_2||=3.882e-05 acc=0.0938 + [BP] Ep 64: ||h_L||=2.338e+02 ||g_2||=3.874e-05 acc=0.0957 + [BP] Ep 65: ||h_L||=2.265e+02 ||g_2||=3.944e-05 acc=0.0957 + [BP] Ep 66: ||h_L||=2.175e+02 ||g_2||=3.973e-05 acc=0.0869 + [BP] Ep 67: ||h_L||=2.158e+02 ||g_2||=3.975e-05 acc=0.0928 + [BP] Ep 68: ||h_L||=2.117e+02 ||g_2||=4.036e-05 acc=0.0898 + [BP] Ep 69: ||h_L||=2.119e+02 ||g_2||=4.041e-05 acc=0.0879 + [BP] Ep 70: ||h_L||=2.023e+02 ||g_2||=4.075e-05 acc=0.0869 + [BP] Ep 71: ||h_L||=1.978e+02 ||g_2||=4.113e-05 acc=0.0918 + [BP] Ep 72: ||h_L||=1.925e+02 ||g_2||=4.125e-05 acc=0.0928 + [BP] Ep 73: ||h_L||=1.900e+02 ||g_2||=4.188e-05 acc=0.0869 + [BP] Ep 74: ||h_L||=1.880e+02 ||g_2||=4.231e-05 acc=0.0908 + [BP] Ep 75: ||h_L||=1.866e+02 ||g_2||=4.237e-05 acc=0.0928 + [BP] Ep 76: ||h_L||=1.818e+02 ||g_2||=4.254e-05 acc=0.0928 + [BP] Ep 77: ||h_L||=1.795e+02 ||g_2||=4.277e-05 acc=0.0977 + [BP] Ep 78: ||h_L||=1.770e+02 ||g_2||=4.308e-05 acc=0.0947 + [BP] Ep 79: ||h_L||=1.763e+02 ||g_2||=4.322e-05 acc=0.0889 + [BP] Ep 80: ||h_L||=1.734e+02 ||g_2||=4.371e-05 acc=0.0928 + [BP] Ep 81: ||h_L||=1.711e+02 ||g_2||=4.385e-05 acc=0.0928 + [BP] Ep 82: ||h_L||=1.689e+02 ||g_2||=4.418e-05 acc=0.0947 + [BP] Ep 83: ||h_L||=1.685e+02 ||g_2||=4.438e-05 acc=0.0938 + [BP] Ep 84: ||h_L||=1.666e+02 ||g_2||=4.441e-05 acc=0.0957 + [BP] Ep 85: ||h_L||=1.660e+02 ||g_2||=4.454e-05 acc=0.0879 + [BP] Ep 86: ||h_L||=1.635e+02 ||g_2||=4.459e-05 acc=0.0938 + [BP] Ep 87: ||h_L||=1.640e+02 ||g_2||=4.475e-05 acc=0.0928 + [BP] Ep 88: ||h_L||=1.624e+02 ||g_2||=4.495e-05 acc=0.0938 + [BP] Ep 89: ||h_L||=1.618e+02 ||g_2||=4.503e-05 acc=0.0918 + [BP] Ep 90: ||h_L||=1.619e+02 ||g_2||=4.513e-05 acc=0.0938 + [BP] Ep 91: ||h_L||=1.609e+02 ||g_2||=4.518e-05 acc=0.0928 + [BP] Ep 92: ||h_L||=1.609e+02 ||g_2||=4.525e-05 acc=0.0908 + [BP] Ep 93: ||h_L||=1.601e+02 ||g_2||=4.532e-05 acc=0.0918 + [BP] Ep 94: ||h_L||=1.597e+02 ||g_2||=4.533e-05 acc=0.0928 + [BP] Ep 95: ||h_L||=1.596e+02 ||g_2||=4.529e-05 acc=0.0908 + [BP] Ep 96: ||h_L||=1.593e+02 ||g_2||=4.540e-05 acc=0.0908 + [BP] Ep 97: ||h_L||=1.593e+02 ||g_2||=4.545e-05 acc=0.0918 + [BP] Ep 98: ||h_L||=1.593e+02 ||g_2||=4.546e-05 acc=0.0918 + [BP] Ep 99: ||h_L||=1.593e+02 ||g_2||=4.546e-05 acc=0.0918 + [BP] Ep 100: ||h_L||=1.593e+02 ||g_2||=4.546e-05 acc=0.0918 + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.718070030212402, 42.802223205566406, 44.22697067260742, 46.05121994018555, 46.896766662597656] ||g||_med=[0.0010791289387270808, 0.0002035950165009126, 0.00014324457151815295, 0.00011542177526280284, 9.846547618508339e-05] acc=0.0801 + [DFA] Ep 1: ||h_L||=5.295e+03 ||g_2||=8.588e-07 acc=0.1562 gamma_dfa=0.0467 + [DFA] Ep 2: ||h_L||=2.157e+04 ||g_2||=1.623e-07 acc=0.1465 gamma_dfa=0.0354 + [DFA] Ep 3: ||h_L||=4.868e+04 ||g_2||=6.499e-08 acc=0.1504 gamma_dfa=0.0336 + [DFA] Ep 4: ||h_L||=8.880e+04 ||g_2||=3.371e-08 acc=0.1494 gamma_dfa=0.0280 + [DFA] Ep 5: ||h_L||=1.410e+05 ||g_2||=2.114e-08 acc=0.1436 gamma_dfa=0.0275 + [DFA] Ep 6: ||h_L||=2.259e+05 ||g_2||=1.408e-08 acc=0.1416 gamma_dfa=0.0224 + [DFA] Ep 7: ||h_L||=3.300e+05 ||g_2||=1.018e-08 acc=0.1338 gamma_dfa=0.0140 + [DFA] Ep 8: ||h_L||=4.608e+05 ||g_2||=7.597e-09 acc=0.1328 gamma_dfa=0.0117 + [DFA] Ep 9: ||h_L||=6.299e+05 ||g_2||=6.086e-09 acc=0.1299 gamma_dfa=0.0090 + [DFA] Ep 10: ||h_L||=8.288e+05 ||g_2||=5.069e-09 acc=0.1250 gamma_dfa=0.0051 + [DFA] Ep 11: ||h_L||=1.047e+06 ||g_2||=4.261e-09 acc=0.1250 gamma_dfa=0.0026 + [DFA] Ep 12: ||h_L||=1.298e+06 ||g_2||=3.751e-09 acc=0.1162 gamma_dfa=-0.0011 + [DFA] Ep 13: ||h_L||=1.633e+06 ||g_2||=3.241e-09 acc=0.1133 gamma_dfa=-0.0034 + [DFA] Ep 14: ||h_L||=2.018e+06 ||g_2||=2.862e-09 acc=0.1104 gamma_dfa=-0.0044 + [DFA] Ep 15: ||h_L||=2.470e+06 ||g_2||=2.457e-09 acc=0.1133 gamma_dfa=-0.0055 + [DFA] Ep 16: ||h_L||=2.981e+06 ||g_2||=2.181e-09 acc=0.1104 gamma_dfa=-0.0057 + [DFA] Ep 17: ||h_L||=3.521e+06 ||g_2||=1.952e-09 acc=0.1123 gamma_dfa=-0.0064 + [DFA] Ep 18: ||h_L||=4.172e+06 ||g_2||=1.740e-09 acc=0.1143 gamma_dfa=-0.0064 + [DFA] Ep 19: ||h_L||=4.909e+06 ||g_2||=1.562e-09 acc=0.1172 gamma_dfa=-0.0077 + [DFA] Ep 20: ||h_L||=5.633e+06 ||g_2||=1.385e-09 acc=0.1113 gamma_dfa=-0.0068 + [DFA] Ep 21: ||h_L||=6.425e+06 ||g_2||=1.257e-09 acc=0.1162 gamma_dfa=-0.0086 + [DFA] Ep 22: ||h_L||=7.322e+06 ||g_2||=1.121e-09 acc=0.1113 gamma_dfa=-0.0074 + [DFA] Ep 23: ||h_L||=8.329e+06 ||g_2||=1.006e-09 acc=0.1123 gamma_dfa=-0.0067 + [DFA] Ep 24: ||h_L||=9.444e+06 ||g_2||=9.108e-10 acc=0.1143 gamma_dfa=-0.0056 + [DFA] Ep 25: ||h_L||=1.064e+07 ||g_2||=8.279e-10 acc=0.1152 gamma_dfa=-0.0044 + [DFA] Ep 26: ||h_L||=1.185e+07 ||g_2||=7.524e-10 acc=0.1123 gamma_dfa=-0.0030 + [DFA] Ep 27: ||h_L||=1.317e+07 ||g_2||=6.949e-10 acc=0.1104 gamma_dfa=-0.0022 + [DFA] Ep 28: ||h_L||=1.456e+07 ||g_2||=6.403e-10 acc=0.1133 gamma_dfa=0.0003 + [DFA] Ep 29: ||h_L||=1.608e+07 ||g_2||=5.905e-10 acc=0.1143 gamma_dfa=0.0035 + [DFA] Ep 30: ||h_L||=1.766e+07 ||g_2||=5.454e-10 acc=0.1152 gamma_dfa=0.0040 + [DFA] Ep 31: ||h_L||=1.913e+07 ||g_2||=5.052e-10 acc=0.1162 gamma_dfa=0.0066 + [DFA] Ep 32: ||h_L||=2.086e+07 ||g_2||=4.702e-10 acc=0.1162 gamma_dfa=0.0085 + [DFA] Ep 33: ||h_L||=2.252e+07 ||g_2||=4.386e-10 acc=0.1143 gamma_dfa=0.0103 + [DFA] Ep 34: ||h_L||=2.431e+07 ||g_2||=4.123e-10 acc=0.1133 gamma_dfa=0.0126 + [DFA] Ep 35: ||h_L||=2.629e+07 ||g_2||=3.859e-10 acc=0.1182 gamma_dfa=0.0154 + [DFA] Ep 36: ||h_L||=2.809e+07 ||g_2||=3.577e-10 acc=0.1162 gamma_dfa=0.0166 + [DFA] Ep 37: ||h_L||=3.012e+07 ||g_2||=3.363e-10 acc=0.1162 gamma_dfa=0.0184 + [DFA] Ep 38: ||h_L||=3.201e+07 ||g_2||=3.192e-10 acc=0.1143 gamma_dfa=0.0196 + [DFA] Ep 39: ||h_L||=3.397e+07 ||g_2||=3.025e-10 acc=0.1143 gamma_dfa=0.0222 + [DFA] Ep 40: ||h_L||=3.603e+07 ||g_2||=2.856e-10 acc=0.1191 gamma_dfa=0.0233 + [DFA] Ep 41: ||h_L||=3.818e+07 ||g_2||=2.714e-10 acc=0.1191 gamma_dfa=0.0246 + [DFA] Ep 42: ||h_L||=4.000e+07 ||g_2||=2.587e-10 acc=0.1201 gamma_dfa=0.0262 + [DFA] Ep 43: ||h_L||=4.217e+07 ||g_2||=2.469e-10 acc=0.1211 gamma_dfa=0.0270 + [DFA] Ep 44: ||h_L||=4.445e+07 ||g_2||=2.350e-10 acc=0.1182 gamma_dfa=0.0282 + [DFA] Ep 45: ||h_L||=4.640e+07 ||g_2||=2.246e-10 acc=0.1221 gamma_dfa=0.0300 + [DFA] Ep 46: ||h_L||=4.865e+07 ||g_2||=2.160e-10 acc=0.1221 gamma_dfa=0.0309 + [DFA] Ep 47: ||h_L||=5.074e+07 ||g_2||=2.057e-10 acc=0.1191 gamma_dfa=0.0319 + [DFA] Ep 48: ||h_L||=5.294e+07 ||g_2||=1.989e-10 acc=0.1221 gamma_dfa=0.0334 + [DFA] Ep 49: ||h_L||=5.507e+07 ||g_2||=1.927e-10 acc=0.1201 gamma_dfa=0.0341 + [DFA] Ep 50: ||h_L||=5.747e+07 ||g_2||=1.853e-10 acc=0.1201 gamma_dfa=0.0345 + [DFA] Ep 51: ||h_L||=5.964e+07 ||g_2||=1.792e-10 acc=0.1211 gamma_dfa=0.0351 + [DFA] Ep 52: ||h_L||=6.183e+07 ||g_2||=1.742e-10 acc=0.1211 gamma_dfa=0.0353 + [DFA] Ep 53: ||h_L||=6.382e+07 ||g_2||=1.697e-10 acc=0.1211 gamma_dfa=0.0356 + [DFA] Ep 54: ||h_L||=6.598e+07 ||g_2||=1.636e-10 acc=0.1211 gamma_dfa=0.0363 + [DFA] Ep 55: ||h_L||=6.804e+07 ||g_2||=1.612e-10 acc=0.1221 gamma_dfa=0.0372 + [DFA] Ep 56: ||h_L||=7.015e+07 ||g_2||=1.567e-10 acc=0.1201 gamma_dfa=0.0373 + [DFA] Ep 57: ||h_L||=7.211e+07 ||g_2||=1.531e-10 acc=0.1201 gamma_dfa=0.0378 + [DFA] Ep 58: ||h_L||=7.388e+07 ||g_2||=1.500e-10 acc=0.1211 gamma_dfa=0.0386 + [DFA] Ep 59: ||h_L||=7.572e+07 ||g_2||=1.468e-10 acc=0.1201 gamma_dfa=0.0388 + [DFA] Ep 60: ||h_L||=7.753e+07 ||g_2||=1.434e-10 acc=0.1191 gamma_dfa=0.0391 + [DFA] Ep 61: ||h_L||=7.944e+07 ||g_2||=1.411e-10 acc=0.1191 gamma_dfa=0.0395 + [DFA] Ep 62: ||h_L||=8.113e+07 ||g_2||=1.380e-10 acc=0.1201 gamma_dfa=0.0395 + [DFA] Ep 63: ||h_L||=8.283e+07 ||g_2||=1.356e-10 acc=0.1182 gamma_dfa=0.0395 + [DFA] Ep 64: ||h_L||=8.423e+07 ||g_2||=1.331e-10 acc=0.1211 gamma_dfa=0.0402 + [DFA] Ep 65: ||h_L||=8.572e+07 ||g_2||=1.311e-10 acc=0.1182 gamma_dfa=0.0406 + [DFA] Ep 66: ||h_L||=8.715e+07 ||g_2||=1.290e-10 acc=0.1191 gamma_dfa=0.0409 + [DFA] Ep 67: ||h_L||=8.854e+07 ||g_2||=1.268e-10 acc=0.1201 gamma_dfa=0.0409 + [DFA] Ep 68: ||h_L||=8.993e+07 ||g_2||=1.251e-10 acc=0.1201 gamma_dfa=0.0407 + [DFA] Ep 69: ||h_L||=9.145e+07 ||g_2||=1.233e-10 acc=0.1201 gamma_dfa=0.0407 + [DFA] Ep 70: ||h_L||=9.264e+07 ||g_2||=1.220e-10 acc=0.1201 gamma_dfa=0.0413 + [DFA] Ep 71: ||h_L||=9.376e+07 ||g_2||=1.204e-10 acc=0.1191 gamma_dfa=0.0415 + [DFA] Ep 72: ||h_L||=9.485e+07 ||g_2||=1.194e-10 acc=0.1191 gamma_dfa=0.0417 + [DFA] Ep 73: ||h_L||=9.596e+07 ||g_2||=1.179e-10 acc=0.1172 gamma_dfa=0.0414 + [DFA] Ep 74: ||h_L||=9.695e+07 ||g_2||=1.171e-10 acc=0.1201 gamma_dfa=0.0416 + [DFA] Ep 75: ||h_L||=9.787e+07 ||g_2||=1.160e-10 acc=0.1182 gamma_dfa=0.0416 + [DFA] Ep 76: ||h_L||=9.874e+07 ||g_2||=1.155e-10 acc=0.1172 gamma_dfa=0.0418 + [DFA] Ep 77: ||h_L||=9.959e+07 ||g_2||=1.146e-10 acc=0.1182 gamma_dfa=0.0418 + [DFA] Ep 78: ||h_L||=1.004e+08 ||g_2||=1.136e-10 acc=0.1172 gamma_dfa=0.0419 + [DFA] Ep 79: ||h_L||=1.011e+08 ||g_2||=1.131e-10 acc=0.1201 gamma_dfa=0.0419 + [DFA] Ep 80: ||h_L||=1.017e+08 ||g_2||=1.126e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 81: ||h_L||=1.023e+08 ||g_2||=1.120e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 82: ||h_L||=1.029e+08 ||g_2||=1.115e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 83: ||h_L||=1.033e+08 ||g_2||=1.111e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 84: ||h_L||=1.037e+08 ||g_2||=1.107e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 85: ||h_L||=1.041e+08 ||g_2||=1.102e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 86: ||h_L||=1.045e+08 ||g_2||=1.099e-10 acc=0.1191 gamma_dfa=0.0422 + [DFA] Ep 87: ||h_L||=1.048e+08 ||g_2||=1.097e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 88: ||h_L||=1.050e+08 ||g_2||=1.094e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 89: ||h_L||=1.052e+08 ||g_2||=1.092e-10 acc=0.1191 gamma_dfa=0.0422 + [DFA] Ep 90: ||h_L||=1.054e+08 ||g_2||=1.091e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 91: ||h_L||=1.056e+08 ||g_2||=1.090e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 92: ||h_L||=1.057e+08 ||g_2||=1.089e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 93: ||h_L||=1.058e+08 ||g_2||=1.088e-10 acc=0.1201 gamma_dfa=0.0421 + [DFA] Ep 94: ||h_L||=1.059e+08 ||g_2||=1.087e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 95: ||h_L||=1.059e+08 ||g_2||=1.087e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 96: ||h_L||=1.060e+08 ||g_2||=1.086e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 97: ||h_L||=1.060e+08 ||g_2||=1.086e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 98: ||h_L||=1.060e+08 ||g_2||=1.086e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 99: ||h_L||=1.060e+08 ||g_2||=1.086e-10 acc=0.1201 gamma_dfa=0.0422 + [DFA] Ep 100: ||h_L||=1.060e+08 ||g_2||=1.086e-10 acc=0.1201 gamma_dfa=0.0422 + +Saved results/h2_no_residual_full_s42/snapshot_evolution_s42.json diff --git a/results/h2_no_residual_full_s42/snapshot_evolution_s42.json b/results/h2_no_residual_full_s42/snapshot_evolution_s42.json new file mode 100644 index 0000000..5a96cce --- /dev/null +++ b/results/h2_no_residual_full_s42/snapshot_evolution_s42.json @@ -0,0 +1,5475 @@ +{ + "config": { + "output_dir": "results/h2_no_residual_full_s42", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 42.802223205566406, + 44.22697067260742, + 46.05121994018555, + 46.896766662597656 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010791289387270808, + 0.0002035950165009126, + 0.00014324457151815295, + 0.00011542177526280284, + 9.846547618508339e-05 + ], + "bp_grad_norms_F": [ + 0.0380445197224617, + 0.00666962843388319, + 0.0046500470489263535, + 0.003719294909387827, + 0.003155440790578723 + ], + "gamma_dfa": NaN, + "acc_eval": 0.080078125, + "loss_eval": 2.446239709854126, + "epoch": 0 + }, + { + "hidden_norms": [ + 86.00836944580078, + 130.30899047851562, + 107.6886215209961, + 127.31951141357422, + 155.31224060058594 + ], + "bp_grad_norms_per_sample_med": [ + 5.636421337840147e-05, + 4.504464232013561e-05, + 4.254864325048402e-05, + 4.0549883124185726e-05, + 3.8371628761524335e-05 + ], + "bp_grad_norms_F": [ + 0.0019479888724163175, + 0.0014867106219753623, + 0.0013919975608587265, + 0.001322419848293066, + 0.0012390650808811188 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1435546875, + "loss_eval": 2.293787717819214, + "epoch": 1 + }, + { + "hidden_norms": [ + 114.72047424316406, + 154.09420776367188, + 128.2491455078125, + 160.83230590820312, + 193.06747436523438 + ], + "bp_grad_norms_per_sample_med": [ + 4.478770642890595e-05, + 3.7948859244352207e-05, + 3.570393528207205e-05, + 3.381549322512001e-05, + 3.158334220643155e-05 + ], + "bp_grad_norms_F": [ + 0.0015459235291928053, + 0.0012464966857805848, + 0.0011667043436318636, + 0.0010993058094754815, + 0.0010170178720727563 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1728515625, + "loss_eval": 2.2832698822021484, + "epoch": 2 + }, + { + "hidden_norms": [ + 129.28399658203125, + 169.31143188476562, + 136.48431396484375, + 176.9506378173828, + 216.20181274414062 + ], + "bp_grad_norms_per_sample_med": [ + 4.090799848199822e-05, + 3.4604578104335815e-05, + 3.2474679755978286e-05, + 3.0787930882070214e-05, + 2.844005575752817e-05 + ], + "bp_grad_norms_F": [ + 0.0014615722466260195, + 0.0011723904171958566, + 0.0010821294272318482, + 0.001009885803796351, + 0.000921491184271872 + ], + "gamma_dfa": NaN, + "acc_eval": 0.177734375, + "loss_eval": 2.248687267303467, + "epoch": 3 + }, + { + "hidden_norms": [ + 146.55203247070312, + 179.31271362304688, + 144.7793426513672, + 195.2471923828125, + 244.1785888671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.7983172660460696e-05, + 3.2681429729564115e-05, + 3.063849362661131e-05, + 2.877583210647572e-05, + 2.62654539255891e-05 + ], + "bp_grad_norms_F": [ + 0.0013270865892991424, + 0.0011031923349946737, + 0.0010214283829554915, + 0.0009468899224884808, + 0.0008542603463865817 + ], + "gamma_dfa": NaN, + "acc_eval": 0.201171875, + "loss_eval": 2.1866140365600586, + "epoch": 4 + }, + { + "hidden_norms": [ + 163.96316528320312, + 186.10421752929688, + 151.66432189941406, + 204.73275756835938, + 266.4998474121094 + ], + "bp_grad_norms_per_sample_med": [ + 3.63540711987298e-05, + 3.1559447961626574e-05, + 2.965202475024853e-05, + 2.767328805930447e-05, + 2.4988346922327764e-05 + ], + "bp_grad_norms_F": [ + 0.0012765713036060333, + 0.0010719435522332788, + 0.0009894924005493522, + 0.0009105658973567188, + 0.0008120943675749004 + ], + "gamma_dfa": NaN, + "acc_eval": 0.205078125, + "loss_eval": 2.213620185852051, + "epoch": 5 + }, + { + "hidden_norms": [ + 173.03375244140625, + 192.33702087402344, + 151.7676544189453, + 211.76028442382812, + 273.14984130859375 + ], + "bp_grad_norms_per_sample_med": [ + 3.612042564782314e-05, + 3.138732790830545e-05, + 2.92498261842411e-05, + 2.741635762504302e-05, + 2.4648286853334866e-05 + ], + "bp_grad_norms_F": [ + 0.0012719081714749336, + 0.0010634849313646555, + 0.0009788337629288435, + 0.0008956211968325078, + 0.0007930789142847061 + ], + "gamma_dfa": NaN, + "acc_eval": 0.201171875, + "loss_eval": 2.20696759223938, + "epoch": 6 + }, + { + "hidden_norms": [ + 184.99200439453125, + 200.6100311279297, + 154.7901611328125, + 216.4141387939453, + 294.1932067871094 + ], + "bp_grad_norms_per_sample_med": [ + 3.5208213375881314e-05, + 3.101788752246648e-05, + 2.887230584747158e-05, + 2.6716055799624883e-05, + 2.381021658948157e-05 + ], + "bp_grad_norms_F": [ + 0.0012596799060702324, + 0.0010643631685525179, + 0.0009746645228005946, + 0.0008811713196337223, + 0.0007715557585470378 + ], + "gamma_dfa": NaN, + "acc_eval": 0.189453125, + "loss_eval": 2.26588773727417, + "epoch": 7 + }, + { + "hidden_norms": [ + 199.71249389648438, + 206.28636169433594, + 159.15716552734375, + 225.3829803466797, + 316.6280517578125 + ], + "bp_grad_norms_per_sample_med": [ + 3.397777982172556e-05, + 3.0055914976401255e-05, + 2.8245711291674525e-05, + 2.577536906755995e-05, + 2.2829581212135963e-05 + ], + "bp_grad_norms_F": [ + 0.0012129175011068583, + 0.0010332722449675202, + 0.0009465343900956213, + 0.0008514428627677262, + 0.0007388851954601705 + ], + "gamma_dfa": NaN, + "acc_eval": 0.203125, + "loss_eval": 2.232454776763916, + "epoch": 8 + }, + { + "hidden_norms": [ + 209.29306030273438, + 211.71087646484375, + 155.6585235595703, + 229.6345672607422, + 335.6332092285156 + ], + "bp_grad_norms_per_sample_med": [ + 3.381286660442129e-05, + 3.0025108571862802e-05, + 2.795294494717382e-05, + 2.5483084755251184e-05, + 2.2450465621659532e-05 + ], + "bp_grad_norms_F": [ + 0.001203069812618196, + 0.0010322949383407831, + 0.0009428044431842864, + 0.0008445970015600324, + 0.0007283088052645326 + ], + "gamma_dfa": NaN, + "acc_eval": 0.189453125, + "loss_eval": 2.2567524909973145, + "epoch": 9 + }, + { + "hidden_norms": [ + 219.5225067138672, + 215.77891540527344, + 158.00711059570312, + 239.82870483398438, + 364.106689453125 + ], + "bp_grad_norms_per_sample_med": [ + 3.357209061505273e-05, + 3.0128332582535222e-05, + 2.8080758056603372e-05, + 2.5434510462218896e-05, + 2.2072978026699275e-05 + ], + "bp_grad_norms_F": [ + 0.001222757389768958, + 0.0010488828411325812, + 0.0009540626197122037, + 0.000844798400066793, + 0.0007152045727707446 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1884765625, + "loss_eval": 2.298661708831787, + "epoch": 10 + }, + { + "hidden_norms": [ + 228.8721160888672, + 219.33489990234375, + 159.22947692871094, + 242.5733642578125, + 373.5672607421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.361105336807668e-05, + 3.0123681426630355e-05, + 2.82819164567627e-05, + 2.5511151761747897e-05, + 2.200892413384281e-05 + ], + "bp_grad_norms_F": [ + 0.0012033756356686354, + 0.0010383055778220296, + 0.0009499595616944134, + 0.0008407059940509498, + 0.000707409402821213 + ], + "gamma_dfa": NaN, + "acc_eval": 0.18359375, + "loss_eval": 2.3219099044799805, + "epoch": 11 + }, + { + "hidden_norms": [ + 238.0825958251953, + 220.4098663330078, + 157.96127319335938, + 246.49105834960938, + 399.103515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.3689280826365575e-05, + 3.044224104087334e-05, + 2.8301144993747585e-05, + 2.544306880736258e-05, + 2.16337175515946e-05 + ], + "bp_grad_norms_F": [ + 0.0012109626550227404, + 0.0010498397750779986, + 0.0009549973183311522, + 0.0008336003520525992, + 0.0006956221768632531 + ], + "gamma_dfa": NaN, + "acc_eval": 0.197265625, + "loss_eval": 2.292271614074707, + "epoch": 12 + }, + { + "hidden_norms": [ + 245.9247589111328, + 225.1177520751953, + 161.000244140625, + 247.5177001953125, + 405.64068603515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.318578455946408e-05, + 2.9796459784847684e-05, + 2.778910129563883e-05, + 2.4826545995892957e-05, + 2.1260259018163197e-05 + ], + "bp_grad_norms_F": [ + 0.0012085892958566546, + 0.0010467838728800416, + 0.0009537216974422336, + 0.0008304294897243381, + 0.0006893921527080238 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1865234375, + "loss_eval": 2.309349536895752, + "epoch": 13 + }, + { + "hidden_norms": [ + 254.78964233398438, + 226.26568603515625, + 158.11354064941406, + 246.54937744140625, + 402.22564697265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.351089617353864e-05, + 3.0367529689101502e-05, + 2.8210330128786154e-05, + 2.5112614821409807e-05, + 2.127070547430776e-05 + ], + "bp_grad_norms_F": [ + 0.0012080274755135179, + 0.0010523217497393489, + 0.0009614708251319826, + 0.0008391732117161155, + 0.0006922443280927837 + ], + "gamma_dfa": NaN, + "acc_eval": 0.177734375, + "loss_eval": 2.3668038845062256, + "epoch": 14 + }, + { + "hidden_norms": [ + 262.1316833496094, + 226.88943481445312, + 157.7928009033203, + 248.3592529296875, + 416.15966796875 + ], + "bp_grad_norms_per_sample_med": [ + 3.413746162550524e-05, + 3.107329393969849e-05, + 2.889345705625601e-05, + 2.570425385783892e-05, + 2.1452229702845216e-05 + ], + "bp_grad_norms_F": [ + 0.0012374932412058115, + 0.001085828524082899, + 0.0009924235055223107, + 0.0008545225136913359, + 0.0006974710267968476 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1650390625, + "loss_eval": 2.3762776851654053, + "epoch": 15 + }, + { + "hidden_norms": [ + 270.8565979003906, + 227.8741455078125, + 160.908935546875, + 249.23391723632812, + 426.4018859863281 + ], + "bp_grad_norms_per_sample_med": [ + 3.346315133967437e-05, + 3.0396649890462868e-05, + 2.8140580980107188e-05, + 2.509099431335926e-05, + 2.0963307179044932e-05 + ], + "bp_grad_norms_F": [ + 0.0012071001110598445, + 0.0010572251630946994, + 0.0009650305728428066, + 0.0008328591356985271, + 0.0006829687627032399 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1748046875, + "loss_eval": 2.3659489154815674, + "epoch": 16 + }, + { + "hidden_norms": [ + 277.88897705078125, + 229.93283081054688, + 160.6474151611328, + 249.1276092529297, + 439.88336181640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.291336179245263e-05, + 3.02154276141664e-05, + 2.813426181091927e-05, + 2.503528776287567e-05, + 2.0815306925214827e-05 + ], + "bp_grad_norms_F": [ + 0.0011904252460226417, + 0.0010531789157539606, + 0.000964420149102807, + 0.0008325970848090947, + 0.0006798306130804121 + ], + "gamma_dfa": NaN, + "acc_eval": 0.17578125, + "loss_eval": 2.3654253482818604, + "epoch": 17 + }, + { + "hidden_norms": [ + 286.05938720703125, + 230.5788116455078, + 160.4178009033203, + 247.1944122314453, + 438.8507995605469 + ], + "bp_grad_norms_per_sample_med": [ + 3.318934977869503e-05, + 3.0551069357898086e-05, + 2.8402588213793933e-05, + 2.525982381484937e-05, + 2.0943261915817857e-05 + ], + "bp_grad_norms_F": [ + 0.0012075696140527725, + 0.001069555408321321, + 0.0009757071966305375, + 0.0008412246825173497, + 0.0006814986118115485 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1748046875, + "loss_eval": 2.3814916610717773, + "epoch": 18 + }, + { + "hidden_norms": [ + 291.21563720703125, + 232.70465087890625, + 157.34620666503906, + 246.0981903076172, + 446.42889404296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.315764479339123e-05, + 3.062548057641834e-05, + 2.8670148822129704e-05, + 2.5318840926047415e-05, + 2.096824573527556e-05 + ], + "bp_grad_norms_F": [ + 0.0012071789242327213, + 0.0010707362089306116, + 0.0009821956045925617, + 0.0008455720380879939, + 0.0006821187562309206 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1728515625, + "loss_eval": 2.4200758934020996, + "epoch": 19 + }, + { + "hidden_norms": [ + 296.9744873046875, + 232.92347717285156, + 155.9208221435547, + 242.89227294921875, + 464.36663818359375 + ], + "bp_grad_norms_per_sample_med": [ + 3.340119292261079e-05, + 3.0905790481483564e-05, + 2.8828215363319032e-05, + 2.5400462618563324e-05, + 2.0934525309712626e-05 + ], + "bp_grad_norms_F": [ + 0.001213042763993144, + 0.001074956264346838, + 0.000986237544566393, + 0.0008489739266224205, + 0.0006839185953140259 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1669921875, + "loss_eval": 2.4464807510375977, + "epoch": 20 + }, + { + "hidden_norms": [ + 302.8837890625, + 232.27020263671875, + 156.21949768066406, + 240.65646362304688, + 465.4597473144531 + ], + "bp_grad_norms_per_sample_med": [ + 3.269123408244923e-05, + 3.057413414353505e-05, + 2.8494312573457137e-05, + 2.536452484491747e-05, + 2.0975066945538856e-05 + ], + "bp_grad_norms_F": [ + 0.0011949212057515979, + 0.0010672758799046278, + 0.0009809982730075717, + 0.0008468242012895644, + 0.0006826177705079317 + ], + "gamma_dfa": NaN, + "acc_eval": 0.171875, + "loss_eval": 2.4423742294311523, + "epoch": 21 + }, + { + "hidden_norms": [ + 309.28985595703125, + 234.24151611328125, + 157.79649353027344, + 237.83340454101562, + 481.6331787109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.304004712845199e-05, + 3.070462844334543e-05, + 2.8894632123410702e-05, + 2.556288927735295e-05, + 2.0964585928595625e-05 + ], + "bp_grad_norms_F": [ + 0.00119681132491678, + 0.001071512931957841, + 0.0009897719137370586, + 0.0008524276199750602, + 0.0006829827907495201 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1591796875, + "loss_eval": 2.4570655822753906, + "epoch": 22 + }, + { + "hidden_norms": [ + 313.0410461425781, + 231.53106689453125, + 157.91920471191406, + 237.67922973632812, + 458.6028137207031 + ], + "bp_grad_norms_per_sample_med": [ + 3.3489413908682764e-05, + 3.1275969377020374e-05, + 2.9323471608222462e-05, + 2.5867013391689397e-05, + 2.119375130860135e-05 + ], + "bp_grad_norms_F": [ + 0.001231541857123375, + 0.0011033288901671767, + 0.001017258851788938, + 0.0008692976552993059, + 0.0006914011319167912 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1435546875, + "loss_eval": 2.4768424034118652, + "epoch": 23 + }, + { + "hidden_norms": [ + 317.760986328125, + 230.58580017089844, + 159.59475708007812, + 231.33895874023438, + 457.3432922363281 + ], + "bp_grad_norms_per_sample_med": [ + 3.3722881198627874e-05, + 3.157257742714137e-05, + 2.952909198938869e-05, + 2.6216532205580734e-05, + 2.1260124412947334e-05 + ], + "bp_grad_norms_F": [ + 0.0012356883380562067, + 0.001110993092879653, + 0.001023975433781743, + 0.0008810298750177026, + 0.0006986238295212388 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1611328125, + "loss_eval": 2.49592661857605, + "epoch": 24 + }, + { + "hidden_norms": [ + 322.651123046875, + 232.43505859375, + 152.87049865722656, + 231.94496154785156, + 473.4416198730469 + ], + "bp_grad_norms_per_sample_med": [ + 3.427052797633223e-05, + 3.222951272618957e-05, + 3.0394427085411735e-05, + 2.6714942578109913e-05, + 2.156150912924204e-05 + ], + "bp_grad_norms_F": [ + 0.0012650383869186044, + 0.001135875703766942, + 0.0010507238330319524, + 0.0008947087335400283, + 0.0007038050098344684 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1455078125, + "loss_eval": 2.5300588607788086, + "epoch": 25 + }, + { + "hidden_norms": [ + 330.46783447265625, + 230.2061004638672, + 152.9967498779297, + 227.8012237548828, + 478.8476867675781 + ], + "bp_grad_norms_per_sample_med": [ + 3.374157677171752e-05, + 3.1537194445263594e-05, + 2.9856541004846804e-05, + 2.6372779757366516e-05, + 2.1366411601775326e-05 + ], + "bp_grad_norms_F": [ + 0.0012416786048561335, + 0.001122219255194068, + 0.0010412678821012378, + 0.0008921810076572001, + 0.0006990613183006644 + ], + "gamma_dfa": NaN, + "acc_eval": 0.140625, + "loss_eval": 2.537388801574707, + "epoch": 26 + }, + { + "hidden_norms": [ + 334.9617919921875, + 229.8689727783203, + 156.80023193359375, + 226.36166381835938, + 473.52545166015625 + ], + "bp_grad_norms_per_sample_med": [ + 3.429998105275445e-05, + 3.2245541660813615e-05, + 3.0571496608899906e-05, + 2.689965367608238e-05, + 2.1567262592725456e-05 + ], + "bp_grad_norms_F": [ + 0.001256743329577148, + 0.0011394708417356014, + 0.0010550402803346515, + 0.0009035509428940713, + 0.0007058348273858428 + ], + "gamma_dfa": NaN, + "acc_eval": 0.138671875, + "loss_eval": 2.5099682807922363, + "epoch": 27 + }, + { + "hidden_norms": [ + 338.32244873046875, + 230.9785614013672, + 152.46780395507812, + 224.96499633789062, + 486.111083984375 + ], + "bp_grad_norms_per_sample_med": [ + 3.443951572990045e-05, + 3.224790998501703e-05, + 3.0727285775355995e-05, + 2.7226298698224127e-05, + 2.1652953364537098e-05 + ], + "bp_grad_norms_F": [ + 0.0012660843785852194, + 0.0011493951315060258, + 0.0010706180473789573, + 0.0009175407467409968, + 0.0007115012849681079 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1298828125, + "loss_eval": 2.5662076473236084, + "epoch": 28 + }, + { + "hidden_norms": [ + 342.5646057128906, + 229.08815002441406, + 153.96673583984375, + 216.54530334472656, + 468.6747131347656 + ], + "bp_grad_norms_per_sample_med": [ + 3.46860324498266e-05, + 3.2538478990318254e-05, + 3.093785562668927e-05, + 2.7406946173869073e-05, + 2.1759695300715975e-05 + ], + "bp_grad_norms_F": [ + 0.0012609382392838597, + 0.001147899660281837, + 0.0010664825094863772, + 0.0009160453919321299, + 0.0007114250329323113 + ], + "gamma_dfa": NaN, + "acc_eval": 0.123046875, + "loss_eval": 2.586763381958008, + "epoch": 29 + }, + { + "hidden_norms": [ + 348.8407287597656, + 229.21829223632812, + 152.20892333984375, + 214.9100799560547, + 478.5781555175781 + ], + "bp_grad_norms_per_sample_med": [ + 3.3881755371112376e-05, + 3.1849580409470946e-05, + 3.0435230655712076e-05, + 2.698182470339816e-05, + 2.157314338546712e-05 + ], + "bp_grad_norms_F": [ + 0.0012431713985279202, + 0.0011320828925818205, + 0.0010550167644396424, + 0.0009089091327041388, + 0.000706658698618412 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1318359375, + "loss_eval": 2.5531229972839355, + "epoch": 30 + }, + { + "hidden_norms": [ + 351.8199768066406, + 225.8287811279297, + 153.97621154785156, + 207.98619079589844, + 449.3790588378906 + ], + "bp_grad_norms_per_sample_med": [ + 3.457794082351029e-05, + 3.269680746598169e-05, + 3.108347300440073e-05, + 2.75895836239215e-05, + 2.188902180932928e-05 + ], + "bp_grad_norms_F": [ + 0.0012726614950224757, + 0.0011605133768171072, + 0.0010800294112414122, + 0.0009289697627536952, + 0.0007184858550317585 + ], + "gamma_dfa": NaN, + "acc_eval": 0.130859375, + "loss_eval": 2.5874619483947754, + "epoch": 31 + }, + { + "hidden_norms": [ + 353.6206359863281, + 225.6538543701172, + 151.9993896484375, + 207.81591796875, + 458.920166015625 + ], + "bp_grad_norms_per_sample_med": [ + 3.461301821516827e-05, + 3.2766867661848664e-05, + 3.128241587546654e-05, + 2.7638012397801504e-05, + 2.198204310843721e-05 + ], + "bp_grad_norms_F": [ + 0.001283104415051639, + 0.0011686854995787144, + 0.0010903337970376015, + 0.0009369406034238636, + 0.000721081392839551 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1376953125, + "loss_eval": 2.583052635192871, + "epoch": 32 + }, + { + "hidden_norms": [ + 355.174560546875, + 226.53065490722656, + 150.45091247558594, + 200.73980712890625, + 457.2731018066406 + ], + "bp_grad_norms_per_sample_med": [ + 3.5071778256678954e-05, + 3.3138821891043335e-05, + 3.159284096909687e-05, + 2.8334745366009884e-05, + 2.23859660763992e-05 + ], + "bp_grad_norms_F": [ + 0.0012956986902281642, + 0.0011821272782981396, + 0.001104547642171383, + 0.0009524936904199421, + 0.0007312360685318708 + ], + "gamma_dfa": NaN, + "acc_eval": 0.12890625, + "loss_eval": 2.605353832244873, + "epoch": 33 + }, + { + "hidden_norms": [ + 360.4849853515625, + 223.40980529785156, + 148.3797607421875, + 195.64169311523438, + 461.1542663574219 + ], + "bp_grad_norms_per_sample_med": [ + 3.4972203138750046e-05, + 3.31850751535967e-05, + 3.171996650053188e-05, + 2.820813824655488e-05, + 2.2246067601372488e-05 + ], + "bp_grad_norms_F": [ + 0.0012813522480428219, + 0.0011739785550162196, + 0.00110049347858876, + 0.0009508885559625924, + 0.0007318558637052774 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1279296875, + "loss_eval": 2.609264373779297, + "epoch": 34 + }, + { + "hidden_norms": [ + 365.4316711425781, + 222.55001831054688, + 148.93753051757812, + 196.41476440429688, + 464.26507568359375 + ], + "bp_grad_norms_per_sample_med": [ + 3.474177356110886e-05, + 3.299827585578896e-05, + 3.161515633109957e-05, + 2.8241847758181393e-05, + 2.233032682852354e-05 + ], + "bp_grad_norms_F": [ + 0.001280988217331469, + 0.0011732708662748337, + 0.0010997118661180139, + 0.0009513412951491773, + 0.0007320611621253192 + ], + "gamma_dfa": NaN, + "acc_eval": 0.123046875, + "loss_eval": 2.6414568424224854, + "epoch": 35 + }, + { + "hidden_norms": [ + 365.99407958984375, + 220.5921173095703, + 147.05055236816406, + 194.5092315673828, + 456.3348083496094 + ], + "bp_grad_norms_per_sample_med": [ + 3.5159438994014636e-05, + 3.344163633300923e-05, + 3.1946114177117124e-05, + 2.86933845927706e-05, + 2.2498443286167458e-05 + ], + "bp_grad_norms_F": [ + 0.0013043885119259357, + 0.0011966620804741979, + 0.0011218151776120067, + 0.0009711913880892098, + 0.0007424909272231162 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1337890625, + "loss_eval": 2.6415724754333496, + "epoch": 36 + }, + { + "hidden_norms": [ + 370.3197326660156, + 220.85414123535156, + 148.2594451904297, + 188.3152313232422, + 446.8343505859375 + ], + "bp_grad_norms_per_sample_med": [ + 3.53947798430454e-05, + 3.362595452927053e-05, + 3.218940764782019e-05, + 2.885511094063986e-05, + 2.269916149089113e-05 + ], + "bp_grad_norms_F": [ + 0.001304175122641027, + 0.001198453363031149, + 0.0011262644547969103, + 0.0009740483365021646, + 0.0007447644020430744 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1279296875, + "loss_eval": 2.6847548484802246, + "epoch": 37 + }, + { + "hidden_norms": [ + 372.6519775390625, + 219.43032836914062, + 146.2524871826172, + 186.9598388671875, + 419.9220275878906 + ], + "bp_grad_norms_per_sample_med": [ + 3.5350865800864995e-05, + 3.369166006450541e-05, + 3.231317532481626e-05, + 2.9215334507171065e-05, + 2.2943044314160943e-05 + ], + "bp_grad_norms_F": [ + 0.0013154788175597787, + 0.0012110902462154627, + 0.00113767315633595, + 0.000987510895356536, + 0.0007552221650257707 + ], + "gamma_dfa": NaN, + "acc_eval": 0.134765625, + "loss_eval": 2.663112163543701, + "epoch": 38 + }, + { + "hidden_norms": [ + 377.5515441894531, + 217.7505340576172, + 144.7539520263672, + 182.63914489746094, + 424.8920593261719 + ], + "bp_grad_norms_per_sample_med": [ + 3.550875771907158e-05, + 3.3909564081113786e-05, + 3.234989708289504e-05, + 2.9385402740444988e-05, + 2.3012338715489022e-05 + ], + "bp_grad_norms_F": [ + 0.0013136330526322126, + 0.0012126904912292957, + 0.001143725821748376, + 0.0009956557769328356, + 0.000757638190407306 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1123046875, + "loss_eval": 2.6713695526123047, + "epoch": 39 + }, + { + "hidden_norms": [ + 375.5976867675781, + 217.32119750976562, + 143.29833984375, + 178.9922332763672, + 416.0475769042969 + ], + "bp_grad_norms_per_sample_med": [ + 3.6261131754145026e-05, + 3.459263825789094e-05, + 3.311317050247453e-05, + 3.0077193514443934e-05, + 2.332564690732397e-05 + ], + "bp_grad_norms_F": [ + 0.0013422674965113401, + 0.0012380937114357948, + 0.0011671145912259817, + 0.0010137255303561687, + 0.0007670389022678137 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1171875, + "loss_eval": 2.6898365020751953, + "epoch": 40 + }, + { + "hidden_norms": [ + 375.6454772949219, + 215.73880004882812, + 143.0796356201172, + 173.5657958984375, + 413.10693359375 + ], + "bp_grad_norms_per_sample_med": [ + 3.5994391510030255e-05, + 3.4521792258601636e-05, + 3.3360858651576564e-05, + 3.016969822056126e-05, + 2.3851269361330196e-05 + ], + "bp_grad_norms_F": [ + 0.0013558906503021717, + 0.0012535321293398738, + 0.0011830577859655023, + 0.0010295362444594502, + 0.0007781152380630374 + ], + "gamma_dfa": NaN, + "acc_eval": 0.119140625, + "loss_eval": 2.6808576583862305, + "epoch": 41 + }, + { + "hidden_norms": [ + 381.1890869140625, + 214.87374877929688, + 142.17715454101562, + 172.16009521484375, + 413.11871337890625 + ], + "bp_grad_norms_per_sample_med": [ + 3.590781852835789e-05, + 3.450449730735272e-05, + 3.32859308400657e-05, + 3.011901571881026e-05, + 2.3740196411381476e-05 + ], + "bp_grad_norms_F": [ + 0.0013439194299280643, + 0.0012433268129825592, + 0.0011747550452128053, + 0.0010278060799464583, + 0.0007790841045789421 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1083984375, + "loss_eval": 2.7061455249786377, + "epoch": 42 + }, + { + "hidden_norms": [ + 382.1147766113281, + 212.32655334472656, + 142.33558654785156, + 169.52694702148438, + 398.5701904296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.659713547676802e-05, + 3.507183282636106e-05, + 3.372716673766263e-05, + 3.064091288251802e-05, + 2.416563620499801e-05 + ], + "bp_grad_norms_F": [ + 0.0013747483026236296, + 0.0012707116547971964, + 0.0012008449994027615, + 0.0010481667704880238, + 0.0007909793639555573 + ], + "gamma_dfa": NaN, + "acc_eval": 0.107421875, + "loss_eval": 2.7121200561523438, + "epoch": 43 + }, + { + "hidden_norms": [ + 388.24554443359375, + 211.70144653320312, + 141.58709716796875, + 166.8690643310547, + 390.73895263671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.605844176490791e-05, + 3.457901402725838e-05, + 3.344014839967713e-05, + 3.0472821890725754e-05, + 2.386603955528699e-05 + ], + "bp_grad_norms_F": [ + 0.0013416680740192533, + 0.0012422216823324561, + 0.0011764775263145566, + 0.0010343515314161777, + 0.0007849647663533688 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1240234375, + "loss_eval": 2.6901586055755615, + "epoch": 44 + }, + { + "hidden_norms": [ + 387.182861328125, + 211.15060424804688, + 141.0326385498047, + 165.57235717773438, + 375.9649963378906 + ], + "bp_grad_norms_per_sample_med": [ + 3.6760768125532195e-05, + 3.520414247759618e-05, + 3.39620492013637e-05, + 3.100339381489903e-05, + 2.4274080715258606e-05 + ], + "bp_grad_norms_F": [ + 0.0013679155381396413, + 0.0012680977815762162, + 0.001201036386191845, + 0.0010586031712591648, + 0.0007975373882800341 + ], + "gamma_dfa": NaN, + "acc_eval": 0.115234375, + "loss_eval": 2.7196202278137207, + "epoch": 45 + }, + { + "hidden_norms": [ + 389.78302001953125, + 209.2168426513672, + 140.19239807128906, + 162.1501007080078, + 373.6092529296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.6972556699765846e-05, + 3.547927553881891e-05, + 3.4321546991122887e-05, + 3.136819213978015e-05, + 2.4795872377580963e-05 + ], + "bp_grad_norms_F": [ + 0.001378108048811555, + 0.0012792085763067007, + 0.0012131200637668371, + 0.0010711504146456718, + 0.0008094239747151732 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1123046875, + "loss_eval": 2.732020854949951, + "epoch": 46 + }, + { + "hidden_norms": [ + 390.8168640136719, + 207.98391723632812, + 140.21983337402344, + 161.1061248779297, + 358.555419921875 + ], + "bp_grad_norms_per_sample_med": [ + 3.740100146387704e-05, + 3.60443300451152e-05, + 3.478667713352479e-05, + 3.1701372790848836e-05, + 2.49275763053447e-05 + ], + "bp_grad_norms_F": [ + 0.0013912947615608573, + 0.0012947055511176586, + 0.0012257345952093601, + 0.00108279287815094, + 0.000817548600025475 + ], + "gamma_dfa": NaN, + "acc_eval": 0.11328125, + "loss_eval": 2.734851598739624, + "epoch": 47 + }, + { + "hidden_norms": [ + 392.3091735839844, + 206.94676208496094, + 137.84091186523438, + 156.7150115966797, + 363.1738586425781 + ], + "bp_grad_norms_per_sample_med": [ + 3.7181769585004076e-05, + 3.575249866116792e-05, + 3.458252103882842e-05, + 3.156786260660738e-05, + 2.489473990863189e-05 + ], + "bp_grad_norms_F": [ + 0.0013799670850858092, + 0.0012849466875195503, + 0.0012195904273539782, + 0.0010820929892361164, + 0.0008166414918377995 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1083984375, + "loss_eval": 2.730489492416382, + "epoch": 48 + }, + { + "hidden_norms": [ + 392.93621826171875, + 206.63357543945312, + 137.95150756835938, + 156.19265747070312, + 348.4825744628906 + ], + "bp_grad_norms_per_sample_med": [ + 3.750698306248523e-05, + 3.625384488259442e-05, + 3.4952467103721574e-05, + 3.2122828997671604e-05, + 2.5343802917632274e-05 + ], + "bp_grad_norms_F": [ + 0.0014074875507503748, + 0.0013119739014655352, + 0.0012457441771402955, + 0.0011056199437007308, + 0.0008317606407217681 + ], + "gamma_dfa": NaN, + "acc_eval": 0.10546875, + "loss_eval": 2.7619447708129883, + "epoch": 49 + }, + { + "hidden_norms": [ + 394.5487976074219, + 204.12411499023438, + 137.66342163085938, + 151.4534454345703, + 343.6612854003906 + ], + "bp_grad_norms_per_sample_med": [ + 3.779921098612249e-05, + 3.6266086681280285e-05, + 3.5253593523520976e-05, + 3.246645428589545e-05, + 2.558354208304081e-05 + ], + "bp_grad_norms_F": [ + 0.0014083774294704199, + 0.0013136735651642084, + 0.0012480755103752017, + 0.0011111509520560503, + 0.0008380677900277078 + ], + "gamma_dfa": NaN, + "acc_eval": 0.095703125, + "loss_eval": 2.7554924488067627, + "epoch": 50 + }, + { + "hidden_norms": [ + 397.6114196777344, + 202.55885314941406, + 136.6888427734375, + 150.49545288085938, + 329.96112060546875 + ], + "bp_grad_norms_per_sample_med": [ + 3.777034726226702e-05, + 3.6449018807616085e-05, + 3.515862044878304e-05, + 3.240678779548034e-05, + 2.560876600909978e-05 + ], + "bp_grad_norms_F": [ + 0.001405128394253552, + 0.001311970641836524, + 0.001248166779987514, + 0.0011124340817332268, + 0.0008421412203460932 + ], + "gamma_dfa": NaN, + "acc_eval": 0.10546875, + "loss_eval": 2.7597320079803467, + "epoch": 51 + }, + { + "hidden_norms": [ + 397.78509521484375, + 202.12451171875, + 135.5238800048828, + 148.92816162109375, + 322.4108581542969 + ], + "bp_grad_norms_per_sample_med": [ + 3.840518184006214e-05, + 3.6834608181379735e-05, + 3.5840494092553854e-05, + 3.275332346674986e-05, + 2.6062174583785236e-05 + ], + "bp_grad_norms_F": [ + 0.001429337658919394, + 0.00133553147315979, + 0.0012706448324024677, + 0.001131666824221611, + 0.0008531482890248299 + ], + "gamma_dfa": NaN, + "acc_eval": 0.099609375, + "loss_eval": 2.7737417221069336, + "epoch": 52 + }, + { + "hidden_norms": [ + 397.3096618652344, + 199.6620635986328, + 134.52984619140625, + 145.349853515625, + 298.2867431640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.877158087561838e-05, + 3.721338725881651e-05, + 3.603506775107235e-05, + 3.3124437322840095e-05, + 2.6345343940192834e-05 + ], + "bp_grad_norms_F": [ + 0.0014398579951375723, + 0.001346803386695683, + 0.0012816074304282665, + 0.001146289287135005, + 0.0008667311049066484 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1025390625, + "loss_eval": 2.799215316772461, + "epoch": 53 + }, + { + "hidden_norms": [ + 400.7160949707031, + 198.93077087402344, + 134.9965057373047, + 147.8721923828125, + 299.2564392089844 + ], + "bp_grad_norms_per_sample_med": [ + 3.8850699638715014e-05, + 3.7408095522550866e-05, + 3.61659076588694e-05, + 3.348653990542516e-05, + 2.6619676646078005e-05 + ], + "bp_grad_norms_F": [ + 0.0014573318185284734, + 0.0013647449668496847, + 0.001298584509640932, + 0.001162077416665852, + 0.0008761510835029185 + ], + "gamma_dfa": NaN, + "acc_eval": 0.08984375, + "loss_eval": 2.8113207817077637, + "epoch": 54 + }, + { + "hidden_norms": [ + 399.78253173828125, + 198.36306762695312, + 132.11000061035156, + 142.8116912841797, + 299.17218017578125 + ], + "bp_grad_norms_per_sample_med": [ + 3.933380503440276e-05, + 3.791782364714891e-05, + 3.674212348414585e-05, + 3.40558253810741e-05, + 2.7044263333664276e-05 + ], + "bp_grad_norms_F": [ + 0.001484063221141696, + 0.0013903625076636672, + 0.0013244440779089928, + 0.0011864654952660203, + 0.0008941980777308345 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0888671875, + "loss_eval": 2.847215175628662, + "epoch": 55 + }, + { + "hidden_norms": [ + 401.17156982421875, + 196.801025390625, + 134.57815551757812, + 139.7723388671875, + 288.41851806640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.922020914615132e-05, + 3.7812937080161646e-05, + 3.68127366527915e-05, + 3.415128594497219e-05, + 2.7148824301548302e-05 + ], + "bp_grad_norms_F": [ + 0.0014704873319715261, + 0.001381139038130641, + 0.0013163810363039374, + 0.001184670371003449, + 0.0008946889429353178 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0908203125, + "loss_eval": 2.816185712814331, + "epoch": 56 + }, + { + "hidden_norms": [ + 400.9927978515625, + 196.3038330078125, + 132.07135009765625, + 139.7966766357422, + 279.3277587890625 + ], + "bp_grad_norms_per_sample_med": [ + 3.982979615102522e-05, + 3.841472425847314e-05, + 3.7321347917895764e-05, + 3.467328497208655e-05, + 2.7518768547452055e-05 + ], + "bp_grad_norms_F": [ + 0.0014958448009565473, + 0.001403261674568057, + 0.0013373151887208223, + 0.0012032209197059274, + 0.0009093029075302184 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09765625, + "loss_eval": 2.8296005725860596, + "epoch": 57 + }, + { + "hidden_norms": [ + 401.6940612792969, + 195.37176513671875, + 131.6783447265625, + 139.06954956054688, + 268.53350830078125 + ], + "bp_grad_norms_per_sample_med": [ + 3.964872666983865e-05, + 3.833413211395964e-05, + 3.708717122208327e-05, + 3.448158531682566e-05, + 2.7542468160390854e-05 + ], + "bp_grad_norms_F": [ + 0.0014878648798912764, + 0.0013977688504382968, + 0.00133328081574291, + 0.0012016715481877327, + 0.0009097974398173392 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.80366849899292, + "epoch": 58 + }, + { + "hidden_norms": [ + 402.2669372558594, + 195.07772827148438, + 130.2777099609375, + 136.1566925048828, + 263.0674133300781 + ], + "bp_grad_norms_per_sample_med": [ + 4.008352698292583e-05, + 3.8822814531158656e-05, + 3.763332642847672e-05, + 3.510116948746145e-05, + 2.7965274057351053e-05 + ], + "bp_grad_norms_F": [ + 0.0015098530566319823, + 0.0014185438631102443, + 0.001352492137812078, + 0.0012215198948979378, + 0.0009253643220290542 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.833949089050293, + "epoch": 59 + }, + { + "hidden_norms": [ + 404.5005798339844, + 192.42762756347656, + 130.96656799316406, + 135.46536254882812, + 255.70611572265625 + ], + "bp_grad_norms_per_sample_med": [ + 4.0377384721068665e-05, + 3.883212775690481e-05, + 3.7497047742363065e-05, + 3.505245331325568e-05, + 2.8039796234224923e-05 + ], + "bp_grad_norms_F": [ + 0.0015065876068547368, + 0.0014162716688588262, + 0.0013495896710082889, + 0.0012195424642413855, + 0.0009257213678210974 + ], + "gamma_dfa": NaN, + "acc_eval": 0.103515625, + "loss_eval": 2.8347878456115723, + "epoch": 60 + }, + { + "hidden_norms": [ + 405.3465270996094, + 191.92613220214844, + 129.0675048828125, + 135.35177612304688, + 252.48280334472656 + ], + "bp_grad_norms_per_sample_med": [ + 4.047132460982539e-05, + 3.890526568284258e-05, + 3.791163908317685e-05, + 3.532003393047489e-05, + 2.8360002033878118e-05 + ], + "bp_grad_norms_F": [ + 0.001506851869635284, + 0.0014191134832799435, + 0.0013552922755479813, + 0.0012275888584554195, + 0.0009371190681122243 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0947265625, + "loss_eval": 2.8487884998321533, + "epoch": 61 + }, + { + "hidden_norms": [ + 405.92303466796875, + 191.02706909179688, + 130.1326904296875, + 131.96170043945312, + 243.21319580078125 + ], + "bp_grad_norms_per_sample_med": [ + 4.0983595681609586e-05, + 3.9633086998946965e-05, + 3.8324356864904985e-05, + 3.588865001802333e-05, + 2.8768741685780697e-05 + ], + "bp_grad_norms_F": [ + 0.001533527858555317, + 0.0014434503391385078, + 0.0013784898910671473, + 0.001250342931598425, + 0.0009516954887658358 + ], + "gamma_dfa": NaN, + "acc_eval": 0.099609375, + "loss_eval": 2.853466749191284, + "epoch": 62 + }, + { + "hidden_norms": [ + 404.5056457519531, + 189.7686004638672, + 128.53379821777344, + 131.6268768310547, + 239.69944763183594 + ], + "bp_grad_norms_per_sample_med": [ + 4.129076478420757e-05, + 3.997457315563224e-05, + 3.881670272676274e-05, + 3.6345707485452294e-05, + 2.9240014555398375e-05 + ], + "bp_grad_norms_F": [ + 0.0015445395838469267, + 0.001454798853956163, + 0.0013908768305554986, + 0.0012628707336261868, + 0.000962753314524889 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.864095687866211, + "epoch": 63 + }, + { + "hidden_norms": [ + 406.03680419921875, + 189.29116821289062, + 127.50506591796875, + 131.68568420410156, + 233.78379821777344 + ], + "bp_grad_norms_per_sample_med": [ + 4.1155919461743906e-05, + 4.004100264864974e-05, + 3.874011599691585e-05, + 3.628453123383224e-05, + 2.934946860477794e-05 + ], + "bp_grad_norms_F": [ + 0.0015430431813001633, + 0.0014545356389135122, + 0.0013910855632275343, + 0.0012647509574890137, + 0.0009666763944551349 + ], + "gamma_dfa": NaN, + "acc_eval": 0.095703125, + "loss_eval": 2.8635716438293457, + "epoch": 64 + }, + { + "hidden_norms": [ + 406.0451354980469, + 188.50218200683594, + 126.54427337646484, + 131.3389129638672, + 226.51025390625 + ], + "bp_grad_norms_per_sample_med": [ + 4.183232886134647e-05, + 4.0587648982182145e-05, + 3.94381677324418e-05, + 3.678469511214644e-05, + 2.9675620680791326e-05 + ], + "bp_grad_norms_F": [ + 0.001558265183120966, + 0.0014702302869409323, + 0.0014062377158552408, + 0.0012798203388229012, + 0.0009780466789379716 + ], + "gamma_dfa": NaN, + "acc_eval": 0.095703125, + "loss_eval": 2.8676958084106445, + "epoch": 65 + }, + { + "hidden_norms": [ + 408.6777038574219, + 187.3246307373047, + 127.4869155883789, + 129.45443725585938, + 217.5286102294922 + ], + "bp_grad_norms_per_sample_med": [ + 4.219069887767546e-05, + 4.0918450395110995e-05, + 3.9726855902699754e-05, + 3.7175828765612096e-05, + 2.9963695851620287e-05 + ], + "bp_grad_norms_F": [ + 0.0015777976950630546, + 0.001490283408202231, + 0.0014262630138546228, + 0.001298666698858142, + 0.0009915514383465052 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0869140625, + "loss_eval": 2.8961129188537598, + "epoch": 66 + }, + { + "hidden_norms": [ + 407.8295593261719, + 186.51223754882812, + 126.99847412109375, + 128.33078002929688, + 215.7896270751953 + ], + "bp_grad_norms_per_sample_med": [ + 4.240999624016695e-05, + 4.097919736523181e-05, + 3.9745518733980134e-05, + 3.734237179742195e-05, + 3.010852560692001e-05 + ], + "bp_grad_norms_F": [ + 0.0015762250404804945, + 0.00148971623275429, + 0.0014267999213188887, + 0.0013026067754253745, + 0.0009967804653570056 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.8922109603881836, + "epoch": 67 + }, + { + "hidden_norms": [ + 408.5052490234375, + 185.35150146484375, + 126.04090881347656, + 127.63972473144531, + 211.70339965820312 + ], + "bp_grad_norms_per_sample_med": [ + 4.2915176891256124e-05, + 4.142584293731488e-05, + 4.0363862353842705e-05, + 3.7879472074564546e-05, + 3.063846452278085e-05 + ], + "bp_grad_norms_F": [ + 0.0015976275317370892, + 0.001511436770670116, + 0.0014480556128546596, + 0.001321145216934383, + 0.001012138556689024 + ], + "gamma_dfa": NaN, + "acc_eval": 0.08984375, + "loss_eval": 2.9307312965393066, + "epoch": 68 + }, + { + "hidden_norms": [ + 408.47100830078125, + 185.3424835205078, + 126.64398956298828, + 127.55502319335938, + 211.88119506835938 + ], + "bp_grad_norms_per_sample_med": [ + 4.3488638766575605e-05, + 4.180728137725964e-05, + 4.041391730424948e-05, + 3.8047244743211195e-05, + 3.0868024623487145e-05 + ], + "bp_grad_norms_F": [ + 0.00161185662727803, + 0.0015253758756443858, + 0.0014606004115194082, + 0.0013330455403774977, + 0.0010200685355812311 + ], + "gamma_dfa": NaN, + "acc_eval": 0.087890625, + "loss_eval": 2.932239532470703, + "epoch": 69 + }, + { + "hidden_norms": [ + 408.52923583984375, + 184.1455535888672, + 125.52372741699219, + 125.75703430175781, + 202.25552368164062 + ], + "bp_grad_norms_per_sample_med": [ + 4.348695438238792e-05, + 4.2108520574402064e-05, + 4.075234028277919e-05, + 3.836580435745418e-05, + 3.1048515666043386e-05 + ], + "bp_grad_norms_F": [ + 0.0016183900879696012, + 0.0015315954806283116, + 0.0014678208390250802, + 0.001341602997854352, + 0.0010267652105540037 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0869140625, + "loss_eval": 2.9302639961242676, + "epoch": 70 + }, + { + "hidden_norms": [ + 408.8894958496094, + 183.35772705078125, + 125.07991027832031, + 125.64179229736328, + 197.8079376220703 + ], + "bp_grad_norms_per_sample_med": [ + 4.373578849481419e-05, + 4.239315967424773e-05, + 4.112703027203679e-05, + 3.845592436846346e-05, + 3.1269701139535755e-05 + ], + "bp_grad_norms_F": [ + 0.0016269702464342117, + 0.0015422124415636063, + 0.0014783325605094433, + 0.001352085149846971, + 0.0010349294170737267 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 2.9367189407348633, + "epoch": 71 + }, + { + "hidden_norms": [ + 408.4325256347656, + 182.9261932373047, + 124.68492126464844, + 124.7309341430664, + 192.49610900878906 + ], + "bp_grad_norms_per_sample_med": [ + 4.388380693853833e-05, + 4.263465234544128e-05, + 4.1247698391089216e-05, + 3.877044946420938e-05, + 3.1494288123212755e-05 + ], + "bp_grad_norms_F": [ + 0.0016377014108002186, + 0.0015517075080424547, + 0.0014868414727970958, + 0.001360182068310678, + 0.0010441095801070333 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.930757999420166, + "epoch": 72 + }, + { + "hidden_norms": [ + 408.14178466796875, + 182.40310668945312, + 124.50841522216797, + 123.8620834350586, + 190.0107879638672 + ], + "bp_grad_norms_per_sample_med": [ + 4.45740224677138e-05, + 4.323892426327802e-05, + 4.188392267678864e-05, + 3.935809581889771e-05, + 3.189874405506998e-05 + ], + "bp_grad_norms_F": [ + 0.0016554963076487184, + 0.00156887574121356, + 0.0015039717545732856, + 0.0013761234004050493, + 0.0010567718418315053 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0869140625, + "loss_eval": 2.9669477939605713, + "epoch": 73 + }, + { + "hidden_norms": [ + 408.57916259765625, + 181.7321014404297, + 124.03689575195312, + 122.9704818725586, + 187.95928955078125 + ], + "bp_grad_norms_per_sample_med": [ + 4.501524745137431e-05, + 4.3535896111279726e-05, + 4.2307488911319524e-05, + 3.976419611717574e-05, + 3.218180063413456e-05 + ], + "bp_grad_norms_F": [ + 0.0016716192476451397, + 0.001584019628353417, + 0.0015181623166427016, + 0.0013901714701205492, + 0.0010662488639354706 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0908203125, + "loss_eval": 2.9710330963134766, + "epoch": 74 + }, + { + "hidden_norms": [ + 408.1520690917969, + 180.9037322998047, + 124.13348388671875, + 123.0340576171875, + 186.64889526367188 + ], + "bp_grad_norms_per_sample_med": [ + 4.489531056606211e-05, + 4.363941479823552e-05, + 4.237061511958018e-05, + 3.981809277320281e-05, + 3.235776239307597e-05 + ], + "bp_grad_norms_F": [ + 0.0016766563057899475, + 0.0015889391070231795, + 0.0015231993747875094, + 0.0013958020135760307, + 0.0010720851132646203 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.959228515625, + "epoch": 75 + }, + { + "hidden_norms": [ + 409.3914794921875, + 180.49095153808594, + 123.59921264648438, + 122.37818145751953, + 181.8359375 + ], + "bp_grad_norms_per_sample_med": [ + 4.522506060311571e-05, + 4.3832860683323815e-05, + 4.2538729758234695e-05, + 3.9995622501010075e-05, + 3.253304384998046e-05 + ], + "bp_grad_norms_F": [ + 0.0016819218872115016, + 0.001593844499439001, + 0.0015282074455171824, + 0.0014012405881658196, + 0.0010784030891954899 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.961671829223633, + "epoch": 76 + }, + { + "hidden_norms": [ + 407.241455078125, + 180.02792358398438, + 123.85694885253906, + 122.00341033935547, + 179.4743194580078 + ], + "bp_grad_norms_per_sample_med": [ + 4.5559816499007866e-05, + 4.4125670683570206e-05, + 4.277457628631964e-05, + 4.0345701563637704e-05, + 3.2811487471917644e-05 + ], + "bp_grad_norms_F": [ + 0.0016946949763223529, + 0.0016066118841990829, + 0.0015405946178361773, + 0.0014128233306109905, + 0.0010864713694900274 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09765625, + "loss_eval": 2.971811294555664, + "epoch": 77 + }, + { + "hidden_norms": [ + 408.3240661621094, + 179.1845245361328, + 123.02991485595703, + 121.22331237792969, + 176.96409606933594 + ], + "bp_grad_norms_per_sample_med": [ + 4.576908759190701e-05, + 4.430625631357543e-05, + 4.3082043703179806e-05, + 4.0411658119410276e-05, + 3.2916912459768355e-05 + ], + "bp_grad_norms_F": [ + 0.0016961582005023956, + 0.0016096236649900675, + 0.0015443011652678251, + 0.0014174508396536112, + 0.0010930649004876614 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0947265625, + "loss_eval": 2.974250316619873, + "epoch": 78 + }, + { + "hidden_norms": [ + 409.5758972167969, + 178.83154296875, + 122.89900207519531, + 120.96637725830078, + 176.27029418945312 + ], + "bp_grad_norms_per_sample_med": [ + 4.575210914481431e-05, + 4.45544756075833e-05, + 4.321682718000375e-05, + 4.0704584534978494e-05, + 3.307598308310844e-05 + ], + "bp_grad_norms_F": [ + 0.0017041281098499894, + 0.001617106725461781, + 0.0015517985448241234, + 0.0014248047955334187, + 0.0010987903224304318 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0888671875, + "loss_eval": 2.9865829944610596, + "epoch": 79 + }, + { + "hidden_norms": [ + 408.8537902832031, + 178.98573303222656, + 122.46696472167969, + 121.31299591064453, + 173.41905212402344 + ], + "bp_grad_norms_per_sample_med": [ + 4.6213288442231715e-05, + 4.482917211134918e-05, + 4.371384784462862e-05, + 4.093564712093212e-05, + 3.334296343382448e-05 + ], + "bp_grad_norms_F": [ + 0.00171999994199723, + 0.001632340019568801, + 0.001565982005558908, + 0.0014375611208379269, + 0.0011084020370617509 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.993680953979492, + "epoch": 80 + }, + { + "hidden_norms": [ + 408.5456848144531, + 178.0683135986328, + 122.94597625732422, + 119.80611419677734, + 171.1206817626953 + ], + "bp_grad_norms_per_sample_med": [ + 4.6296096115838736e-05, + 4.503710806602612e-05, + 4.384905696497299e-05, + 4.111307498533279e-05, + 3.349714825162664e-05 + ], + "bp_grad_norms_F": [ + 0.0017213152023032308, + 0.0016335739055648446, + 0.0015675420872867107, + 0.001440141350030899, + 0.001112470985390246 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.994321346282959, + "epoch": 81 + }, + { + "hidden_norms": [ + 409.3093566894531, + 177.68714904785156, + 122.89625549316406, + 119.95466613769531, + 168.89804077148438 + ], + "bp_grad_norms_per_sample_med": [ + 4.6671568270539865e-05, + 4.528012505033985e-05, + 4.418051685206592e-05, + 4.1504132241243497e-05, + 3.381213900865987e-05 + ], + "bp_grad_norms_F": [ + 0.001732644159346819, + 0.0016448728274554014, + 0.0015783295966684818, + 0.001450547482818365, + 0.0011199831496924162 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0947265625, + "loss_eval": 3.004246950149536, + "epoch": 82 + }, + { + "hidden_norms": [ + 408.72955322265625, + 177.53179931640625, + 121.72450256347656, + 119.71387481689453, + 168.49583435058594 + ], + "bp_grad_norms_per_sample_med": [ + 4.686604006565176e-05, + 4.567100768326782e-05, + 4.437788811628707e-05, + 4.169986641500145e-05, + 3.4023832995444536e-05 + ], + "bp_grad_norms_F": [ + 0.0017455043271183968, + 0.0016571393935009837, + 0.0015903809107840061, + 0.0014616175321862102, + 0.001127574942074716 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 3.015833854675293, + "epoch": 83 + }, + { + "hidden_norms": [ + 409.93121337890625, + 177.41183471679688, + 121.63835144042969, + 119.78266906738281, + 166.5583953857422 + ], + "bp_grad_norms_per_sample_med": [ + 4.7002995415823534e-05, + 4.566587813314982e-05, + 4.4412678107619286e-05, + 4.1799670725595206e-05, + 3.404032759135589e-05 + ], + "bp_grad_norms_F": [ + 0.0017475533531978726, + 0.0016598458169028163, + 0.0015934593975543976, + 0.0014648212818428874, + 0.0011309005785733461 + ], + "gamma_dfa": NaN, + "acc_eval": 0.095703125, + "loss_eval": 3.014139413833618, + "epoch": 84 + }, + { + "hidden_norms": [ + 409.67083740234375, + 177.14193725585938, + 121.51908111572266, + 119.6811294555664, + 166.031982421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.713247108156793e-05, + 4.586786963045597e-05, + 4.4539196096593514e-05, + 4.203089338261634e-05, + 3.428043783060275e-05 + ], + "bp_grad_norms_F": [ + 0.0017551736673340201, + 0.001667042262852192, + 0.0016005010111257434, + 0.0014717906014993787, + 0.0011371106375008821 + ], + "gamma_dfa": NaN, + "acc_eval": 0.087890625, + "loss_eval": 3.0291876792907715, + "epoch": 85 + }, + { + "hidden_norms": [ + 410.37042236328125, + 176.73268127441406, + 121.4700698852539, + 119.30713653564453, + 163.45822143554688 + ], + "bp_grad_norms_per_sample_med": [ + 4.7194233047775924e-05, + 4.609613824868575e-05, + 4.4591557525563985e-05, + 4.207295205560513e-05, + 3.430316428421065e-05 + ], + "bp_grad_norms_F": [ + 0.001759424339979887, + 0.0016711216885596514, + 0.0016040647169575095, + 0.0014759227633476257, + 0.001140325446613133 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 3.0314245223999023, + "epoch": 86 + }, + { + "hidden_norms": [ + 409.8002624511719, + 176.60916137695312, + 121.219970703125, + 118.81930541992188, + 164.01478576660156 + ], + "bp_grad_norms_per_sample_med": [ + 4.7294168325606734e-05, + 4.6120272600091994e-05, + 4.4749522203346714e-05, + 4.225381417199969e-05, + 3.438722342252731e-05 + ], + "bp_grad_norms_F": [ + 0.0017650157678872347, + 0.0016766699263826013, + 0.0016095110913738608, + 0.0014808655250817537, + 0.0011436669155955315 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 3.030081272125244, + "epoch": 87 + }, + { + "hidden_norms": [ + 409.7901306152344, + 176.61012268066406, + 121.13548278808594, + 118.5867919921875, + 162.41827392578125 + ], + "bp_grad_norms_per_sample_med": [ + 4.7548022848786786e-05, + 4.6351164201041684e-05, + 4.494565655477345e-05, + 4.2309966374887154e-05, + 3.455657861195505e-05 + ], + "bp_grad_norms_F": [ + 0.0017697742441669106, + 0.001681560999713838, + 0.00161420414224267, + 0.0014853639295324683, + 0.0011477968655526638 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 3.0332422256469727, + "epoch": 88 + }, + { + "hidden_norms": [ + 409.9271240234375, + 176.3477783203125, + 120.93573760986328, + 118.68280029296875, + 161.79257202148438 + ], + "bp_grad_norms_per_sample_med": [ + 4.757043279823847e-05, + 4.634608922060579e-05, + 4.5027496526017785e-05, + 4.236193490214646e-05, + 3.461442975094542e-05 + ], + "bp_grad_norms_F": [ + 0.0017714434070512652, + 0.0016832581022754312, + 0.0016157239442691207, + 0.0014867670834064484, + 0.0011494142236188054 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 3.0295891761779785, + "epoch": 89 + }, + { + "hidden_norms": [ + 409.3666076660156, + 176.4572296142578, + 121.02136993408203, + 118.42733001708984, + 161.92198181152344 + ], + "bp_grad_norms_per_sample_med": [ + 4.7602890845155343e-05, + 4.65112243546173e-05, + 4.5134373067412525e-05, + 4.2457497329451144e-05, + 3.4702385164564475e-05 + ], + "bp_grad_norms_F": [ + 0.0017726266523823142, + 0.0016847110819071531, + 0.0016171842580661178, + 0.0014885812997817993, + 0.001151244156062603 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 3.0332508087158203, + "epoch": 90 + }, + { + "hidden_norms": [ + 408.93438720703125, + 176.05850219726562, + 121.09625244140625, + 118.71532440185547, + 160.93397521972656 + ], + "bp_grad_norms_per_sample_med": [ + 4.767462087329477e-05, + 4.656092278310098e-05, + 4.517777415458113e-05, + 4.260002606315538e-05, + 3.481149542494677e-05 + ], + "bp_grad_norms_F": [ + 0.0017778765177354217, + 0.0016896515153348446, + 0.0016218661330640316, + 0.0014927292941138148, + 0.0011542538413777947 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 3.0385818481445312, + "epoch": 91 + }, + { + "hidden_norms": [ + 408.2444763183594, + 176.17698669433594, + 120.81340789794922, + 118.79690551757812, + 160.8688507080078 + ], + "bp_grad_norms_per_sample_med": [ + 4.765141420648433e-05, + 4.667821849579923e-05, + 4.5252400013851e-05, + 4.269158671377227e-05, + 3.480418672552332e-05 + ], + "bp_grad_norms_F": [ + 0.0017795232124626637, + 0.0016910110134631395, + 0.0016234440263360739, + 0.0014941159170120955, + 0.0011556288227438927 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0908203125, + "loss_eval": 3.0389466285705566, + "epoch": 92 + }, + { + "hidden_norms": [ + 408.58831787109375, + 176.04327392578125, + 120.86355590820312, + 118.54495239257812, + 160.07017517089844 + ], + "bp_grad_norms_per_sample_med": [ + 4.780395101988688e-05, + 4.6777106035733595e-05, + 4.532063030637801e-05, + 4.271055877325125e-05, + 3.487269350443967e-05 + ], + "bp_grad_norms_F": [ + 0.001782167237251997, + 0.0016936222091317177, + 0.0016259904950857162, + 0.0014966638991609216, + 0.0011574920499697328 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 3.0411715507507324, + "epoch": 93 + }, + { + "hidden_norms": [ + 408.69635009765625, + 175.86227416992188, + 120.84530639648438, + 118.5611572265625, + 159.65382385253906 + ], + "bp_grad_norms_per_sample_med": [ + 4.7862777137197554e-05, + 4.672469003708102e-05, + 4.5333617890719324e-05, + 4.2781779484357685e-05, + 3.488900983938947e-05 + ], + "bp_grad_norms_F": [ + 0.001782999956049025, + 0.0016942995134741068, + 0.0016265579033643007, + 0.001497312681749463, + 0.001158081111498177 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 3.0412378311157227, + "epoch": 94 + }, + { + "hidden_norms": [ + 408.5793151855469, + 175.8729705810547, + 120.83885192871094, + 118.5599365234375, + 159.589111328125 + ], + "bp_grad_norms_per_sample_med": [ + 4.793615153175779e-05, + 4.6734887291677296e-05, + 4.529079524218105e-05, + 4.2848438170040026e-05, + 3.4947173844557256e-05 + ], + "bp_grad_norms_F": [ + 0.0017846085829660296, + 0.0016958917258307338, + 0.001628118334338069, + 0.0014987689210101962, + 0.0011592835653573275 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0908203125, + "loss_eval": 3.043121576309204, + "epoch": 95 + }, + { + "hidden_norms": [ + 408.6483459472656, + 175.8555908203125, + 120.81853485107422, + 118.52471160888672, + 159.30239868164062 + ], + "bp_grad_norms_per_sample_med": [ + 4.796134089701809e-05, + 4.68125035695266e-05, + 4.539822111837566e-05, + 4.2882278648903593e-05, + 3.495233249850571e-05 + ], + "bp_grad_norms_F": [ + 0.0017852310556918383, + 0.0016965895192697644, + 0.001628802390769124, + 0.0014994175871834159, + 0.0011597864795476198 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0908203125, + "loss_eval": 3.0433754920959473, + "epoch": 96 + }, + { + "hidden_norms": [ + 408.78167724609375, + 175.81280517578125, + 120.72789001464844, + 118.362060546875, + 159.2758026123047 + ], + "bp_grad_norms_per_sample_med": [ + 4.7979057853808627e-05, + 4.6818935516057536e-05, + 4.545195770333521e-05, + 4.2866002331720665e-05, + 3.4974782465724275e-05 + ], + "bp_grad_norms_F": [ + 0.0017855397891253233, + 0.0016968693817034364, + 0.0016290779458358884, + 0.001499759964644909, + 0.001160072861239314 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 3.0432236194610596, + "epoch": 97 + }, + { + "hidden_norms": [ + 408.695068359375, + 175.82485961914062, + 120.68985748291016, + 118.31425476074219, + 159.31414794921875 + ], + "bp_grad_norms_per_sample_med": [ + 4.796995563083328e-05, + 4.685561725636944e-05, + 4.54587752756197e-05, + 4.2861738620558754e-05, + 3.4979620977537706e-05 + ], + "bp_grad_norms_F": [ + 0.0017854906618595123, + 0.0016968429554253817, + 0.001629071426577866, + 0.0014998035039752722, + 0.0011602065060287714 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 3.0435032844543457, + "epoch": 98 + }, + { + "hidden_norms": [ + 408.69329833984375, + 175.80587768554688, + 120.6858901977539, + 118.34341430664062, + 159.32943725585938 + ], + "bp_grad_norms_per_sample_med": [ + 4.796809298568405e-05, + 4.686374086304568e-05, + 4.545971387415193e-05, + 4.28554521931801e-05, + 3.4983324439963326e-05 + ], + "bp_grad_norms_F": [ + 0.0017855679616332054, + 0.0016969236312434077, + 0.001629148842766881, + 0.0014998704427853227, + 0.0011602530721575022 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 3.043445348739624, + "epoch": 99 + }, + { + "hidden_norms": [ + 408.6950378417969, + 175.79644775390625, + 120.68733978271484, + 118.34892272949219, + 159.32240295410156 + ], + "bp_grad_norms_per_sample_med": [ + 4.7968002036213875e-05, + 4.6864570322213694e-05, + 4.546308991848491e-05, + 4.2857409425778314e-05, + 3.498443402349949e-05 + ], + "bp_grad_norms_F": [ + 0.0017855766927823424, + 0.0016969360876828432, + 0.0016291660722345114, + 0.0014998912811279297, + 0.0011602782178670168 + ], + "gamma_dfa": NaN, + "acc_eval": 0.091796875, + "loss_eval": 3.0435147285461426, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 42.802223205566406, + 44.22697067260742, + 46.05121994018555, + 46.896766662597656 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010791289387270808, + 0.0002035950165009126, + 0.00014324457151815295, + 0.00011542177526280284, + 9.846547618508339e-05 + ], + "bp_grad_norms_F": [ + 0.0380445197224617, + 0.00666962843388319, + 0.0046500470489263535, + 0.003719294909387827, + 0.003155440790578723 + ], + "gamma_dfa": 0.004864378133788705, + "acc_eval": 0.080078125, + "loss_eval": 2.446239709854126, + "epoch": 0 + }, + { + "hidden_norms": [ + 1180.2318115234375, + 5768.2900390625, + 5472.90234375, + 6369.3427734375, + 5295.2470703125 + ], + "bp_grad_norms_per_sample_med": [ + 1.2146981589467032e-06, + 8.634061714474228e-07, + 8.587696811446222e-07, + 8.589160529481887e-07, + 8.53334995554178e-07 + ], + "bp_grad_norms_F": [ + 6.592504360014573e-05, + 4.607137088896707e-05, + 4.4360855099512264e-05, + 4.341698149801232e-05, + 4.290258584660478e-05 + ], + "gamma_dfa": 0.0467059058137238, + "acc_eval": 0.15625, + "loss_eval": 2.2713985443115234, + "epoch": 1 + }, + { + "hidden_norms": [ + 2712.02197265625, + 35799.15625, + 30196.22265625, + 31429.328125, + 21571.224609375 + ], + "bp_grad_norms_per_sample_med": [ + 3.2316361853190756e-07, + 1.6252558054929978e-07, + 1.6230175958753534e-07, + 1.6301386551731412e-07, + 1.6222111298702657e-07 + ], + "bp_grad_norms_F": [ + 2.881550244637765e-05, + 1.2372604032862e-05, + 1.1472440746729262e-05, + 1.1236465070396662e-05, + 1.1124561751785222e-05 + ], + "gamma_dfa": 0.035421818611212075, + "acc_eval": 0.146484375, + "loss_eval": 2.335322856903076, + "epoch": 2 + }, + { + "hidden_norms": [ + 4310.83203125, + 104622.7734375, + 77630.2421875, + 78666.21875, + 48679.88671875 + ], + "bp_grad_norms_per_sample_med": [ + 1.8400233159354684e-07, + 6.495802296058173e-08, + 6.498943605492968e-08, + 6.491647042139448e-08, + 6.464611601586512e-08 + ], + "bp_grad_norms_F": [ + 1.769972368492745e-05, + 5.158871317689773e-06, + 4.676893240684876e-06, + 4.603746219800087e-06, + 4.549533514364157e-06 + ], + "gamma_dfa": 0.03363112888473552, + "acc_eval": 0.150390625, + "loss_eval": 2.4106125831604004, + "epoch": 3 + }, + { + "hidden_norms": [ + 5880.8115234375, + 227753.375, + 152491.703125, + 155418.390625, + 88801.296875 + ], + "bp_grad_norms_per_sample_med": [ + 1.2607929988917022e-07, + 3.377261137416099e-08, + 3.3712492353288326e-08, + 3.3661436305010284e-08, + 3.362825395925029e-08 + ], + "bp_grad_norms_F": [ + 1.548601358081214e-05, + 2.78187621916004e-06, + 2.4831683731463272e-06, + 2.456902620906476e-06, + 2.4304001726704882e-06 + ], + "gamma_dfa": 0.027950844378210604, + "acc_eval": 0.1494140625, + "loss_eval": 2.473954677581787, + "epoch": 4 + }, + { + "hidden_norms": [ + 7446.83203125, + 415853.34375, + 244149.921875, + 253104.71875, + 141041.109375 + ], + "bp_grad_norms_per_sample_med": [ + 1.0277101125666377e-07, + 2.1167430475088622e-08, + 2.113832486827505e-08, + 2.1176427722480184e-08, + 2.102850160667913e-08 + ], + "bp_grad_norms_F": [ + 1.4487833141174633e-05, + 2.0795134787476854e-06, + 1.5597894389429712e-06, + 1.522601451142691e-06, + 1.5034931948321173e-06 + ], + "gamma_dfa": 0.02746052150905598, + "acc_eval": 0.1435546875, + "loss_eval": 2.5455238819122314, + "epoch": 5 + }, + { + "hidden_norms": [ + 8986.072265625, + 683627.0, + 382622.5625, + 394341.96875, + 225869.703125 + ], + "bp_grad_norms_per_sample_med": [ + 8.362774650549909e-08, + 1.4089099664715832e-08, + 1.4079772014952141e-08, + 1.4096787737116756e-08, + 1.4042676355074946e-08 + ], + "bp_grad_norms_F": [ + 1.094696290238062e-05, + 1.43898739679571e-06, + 1.0249204933643341e-06, + 1.0037305173682398e-06, + 9.89082195701485e-07 + ], + "gamma_dfa": 0.022385360905900598, + "acc_eval": 0.1416015625, + "loss_eval": 2.617079973220825, + "epoch": 6 + }, + { + "hidden_norms": [ + 10599.609375, + 1064012.5, + 545495.875, + 573164.9375, + 330028.71875 + ], + "bp_grad_norms_per_sample_med": [ + 7.213265718064577e-08, + 1.0183534016050544e-08, + 1.0178969667151705e-08, + 1.0194342259239875e-08, + 1.0160833951999848e-08 + ], + "bp_grad_norms_F": [ + 1.0159021258004941e-05, + 8.805947686596483e-07, + 7.233961696329061e-07, + 7.142662639125774e-07, + 7.038501053102664e-07 + ], + "gamma_dfa": 0.014009941252879798, + "acc_eval": 0.1337890625, + "loss_eval": 2.7312068939208984, + "epoch": 7 + }, + { + "hidden_norms": [ + 12143.3994140625, + 1557775.25, + 759262.3125, + 792826.0, + 460775.59375 + ], + "bp_grad_norms_per_sample_med": [ + 6.697734988847515e-08, + 7.604014307105444e-09, + 7.596973716772482e-09, + 7.606048235686558e-09, + 7.604833207608408e-09 + ], + "bp_grad_norms_F": [ + 9.400837370776571e-06, + 6.404222290257167e-07, + 5.235326625552261e-07, + 5.169007977201545e-07, + 5.090913077765435e-07 + ], + "gamma_dfa": 0.011664194520562887, + "acc_eval": 0.1328125, + "loss_eval": 2.825345516204834, + "epoch": 8 + }, + { + "hidden_norms": [ + 13694.29296875, + 2172737.5, + 997486.0625, + 1070732.625, + 629918.4375 + ], + "bp_grad_norms_per_sample_med": [ + 6.409224795334012e-08, + 6.097121918458015e-09, + 6.086279480399526e-09, + 6.08825212466968e-09, + 6.0656004663428575e-09 + ], + "bp_grad_norms_F": [ + 9.614421287551522e-06, + 5.113795964462042e-07, + 4.071621901857725e-07, + 4.02141125732669e-07, + 3.9655543560002116e-07 + ], + "gamma_dfa": 0.008997007156722248, + "acc_eval": 0.1298828125, + "loss_eval": 2.988190174102783, + "epoch": 9 + }, + { + "hidden_norms": [ + 15223.474609375, + 2927110.5, + 1275342.625, + 1378191.375, + 828821.8125 + ], + "bp_grad_norms_per_sample_med": [ + 6.029451782296746e-08, + 5.071707498416345e-09, + 5.069247244193775e-09, + 5.075359243988942e-09, + 5.0706532306321606e-09 + ], + "bp_grad_norms_F": [ + 9.640240023145452e-06, + 4.242011186761374e-07, + 3.2627585255795566e-07, + 3.2204775379796047e-07, + 3.1740532335788885e-07 + ], + "gamma_dfa": 0.0051322957733646035, + "acc_eval": 0.125, + "loss_eval": 3.152592658996582, + "epoch": 10 + }, + { + "hidden_norms": [ + 16733.46484375, + 3849004.0, + 1605019.5, + 1758574.0, + 1046866.9375 + ], + "bp_grad_norms_per_sample_med": [ + 5.804990976798763e-08, + 4.271067943761864e-09, + 4.260845898329535e-09, + 4.262723063419571e-09, + 4.251643481723022e-09 + ], + "bp_grad_norms_F": [ + 9.824444532569032e-06, + 3.8355952369784063e-07, + 2.739863020906341e-07, + 2.699064225453185e-07, + 2.6583589374240546e-07 + ], + "gamma_dfa": 0.002556616673246026, + "acc_eval": 0.125, + "loss_eval": 3.3216772079467773, + "epoch": 11 + }, + { + "hidden_norms": [ + 18226.0703125, + 4895676.0, + 1964835.75, + 2174918.0, + 1297900.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.8149943527041614e-08, + 3.753563682096228e-09, + 3.750809440816738e-09, + 3.756827737788626e-09, + 3.745073584582315e-09 + ], + "bp_grad_norms_F": [ + 1.0199929420195986e-05, + 3.2010626682676957e-07, + 2.3428944473380398e-07, + 2.3066610310706892e-07, + 2.272569474826014e-07 + ], + "gamma_dfa": -0.001056009205058217, + "acc_eval": 0.1162109375, + "loss_eval": 3.5638060569763184, + "epoch": 12 + }, + { + "hidden_norms": [ + 19695.107421875, + 6176501.5, + 2397138.0, + 2692062.25, + 1632551.125 + ], + "bp_grad_norms_per_sample_med": [ + 5.818218085096305e-08, + 3.2458047360961473e-09, + 3.240681722971317e-09, + 3.251705793516635e-09, + 3.2418265849543104e-09 + ], + "bp_grad_norms_F": [ + 1.0194554306508508e-05, + 2.884790433199669e-07, + 2.0161056113465747e-07, + 1.9845649035232782e-07, + 1.9566277842386626e-07 + ], + "gamma_dfa": -0.003356708213686943, + "acc_eval": 0.11328125, + "loss_eval": 3.7695584297180176, + "epoch": 13 + }, + { + "hidden_norms": [ + 21182.841796875, + 7649758.0, + 2859185.75, + 3238327.25, + 2017791.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.6009717752658617e-08, + 2.8617739289416022e-09, + 2.86194334897516e-09, + 2.864514181410982e-09, + 2.8607307633876644e-09 + ], + "bp_grad_norms_F": [ + 9.991773367801215e-06, + 2.805488747981144e-07, + 1.7382579642344353e-07, + 1.7105583083321108e-07, + 1.6860903429005702e-07 + ], + "gamma_dfa": -0.004406693275086582, + "acc_eval": 0.1103515625, + "loss_eval": 3.9298348426818848, + "epoch": 14 + }, + { + "hidden_norms": [ + 22575.759765625, + 9260891.0, + 3426286.0, + 3904244.75, + 2469897.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.523341073399024e-08, + 2.458340642164103e-09, + 2.4571535917061738e-09, + 2.4605368853514165e-09, + 2.455863956640769e-09 + ], + "bp_grad_norms_F": [ + 9.669157407188322e-06, + 2.321831686913356e-07, + 1.4871888254219812e-07, + 1.466667072236305e-07, + 1.44689224157446e-07 + ], + "gamma_dfa": -0.005493569537065923, + "acc_eval": 0.11328125, + "loss_eval": 4.065067291259766, + "epoch": 15 + }, + { + "hidden_norms": [ + 23971.93359375, + 11148851.0, + 3986279.5, + 4682323.5, + 2980997.5 + ], + "bp_grad_norms_per_sample_med": [ + 5.2560817920266345e-08, + 2.1839356989517e-09, + 2.1809569705766307e-09, + 2.1860839805043497e-09, + 2.177982905138265e-09 + ], + "bp_grad_norms_F": [ + 9.612061148800422e-06, + 2.2171894897837774e-07, + 1.2985647401819733e-07, + 1.2793493908702658e-07, + 1.2610371413757093e-07 + ], + "gamma_dfa": -0.0057282960042357445, + "acc_eval": 0.1103515625, + "loss_eval": 4.23506498336792, + "epoch": 16 + }, + { + "hidden_norms": [ + 25387.59765625, + 13199074.0, + 4584581.0, + 5421912.0, + 3520717.25 + ], + "bp_grad_norms_per_sample_med": [ + 5.063454011633439e-08, + 1.9527632844074105e-09, + 1.9520551841623046e-09, + 1.956988127105319e-09, + 1.9527153227727467e-09 + ], + "bp_grad_norms_F": [ + 9.531939213047735e-06, + 1.855236746450828e-07, + 1.1443902536711903e-07, + 1.1294694246544168e-07, + 1.1146746459189671e-07 + ], + "gamma_dfa": -0.00637711986200884, + "acc_eval": 0.1123046875, + "loss_eval": 4.372166633605957, + "epoch": 17 + }, + { + "hidden_norms": [ + 26803.72265625, + 15607512.0, + 5231978.5, + 6327852.0, + 4171921.5 + ], + "bp_grad_norms_per_sample_med": [ + 5.073666287103151e-08, + 1.7431257548494727e-09, + 1.7403234409130164e-09, + 1.7429053755790846e-09, + 1.737441190918787e-09 + ], + "bp_grad_norms_F": [ + 9.275222510041203e-06, + 1.6788693812941347e-07, + 1.0197032906944514e-07, + 1.0054727539454689e-07, + 9.927033062240298e-08 + ], + "gamma_dfa": -0.006377041107043624, + "acc_eval": 0.1142578125, + "loss_eval": 4.511043071746826, + "epoch": 18 + }, + { + "hidden_norms": [ + 28166.5859375, + 18256806.0, + 6062269.0, + 7361214.0, + 4908964.5 + ], + "bp_grad_norms_per_sample_med": [ + 4.8937458529962896e-08, + 1.5624438409744812e-09, + 1.5615452264583496e-09, + 1.5637011685498692e-09, + 1.559517959215384e-09 + ], + "bp_grad_norms_F": [ + 9.249049981008284e-06, + 1.5261937846844376e-07, + 9.117609778286351e-08, + 8.977448828773049e-08, + 8.863072764597746e-08 + ], + "gamma_dfa": -0.007660938150365837, + "acc_eval": 0.1171875, + "loss_eval": 4.64661979675293, + "epoch": 19 + }, + { + "hidden_norms": [ + 29548.751953125, + 21145650.0, + 6936910.0, + 8491332.0, + 5632708.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.774140904828528e-08, + 1.397353122101208e-09, + 1.3845558033409588e-09, + 1.3843480806130515e-09, + 1.3776775276141962e-09 + ], + "bp_grad_norms_F": [ + 9.035198672791012e-06, + 1.426667637360879e-07, + 8.229534387282911e-08, + 8.094935566305139e-08, + 7.995085837819715e-08 + ], + "gamma_dfa": -0.00677196380274836, + "acc_eval": 0.111328125, + "loss_eval": 4.76383113861084, + "epoch": 20 + }, + { + "hidden_norms": [ + 30869.275390625, + 24201464.0, + 7880455.0, + 9702563.0, + 6424945.5 + ], + "bp_grad_norms_per_sample_med": [ + 4.703911571368735e-08, + 1.2679121086378586e-09, + 1.2570423590929636e-09, + 1.2592289433399628e-09, + 1.2545631200566731e-09 + ], + "bp_grad_norms_F": [ + 8.886428986443207e-06, + 1.178441522142748e-07, + 7.369149557234778e-08, + 7.258120149344904e-08, + 7.175417238158843e-08 + ], + "gamma_dfa": -0.008610141419922002, + "acc_eval": 0.1162109375, + "loss_eval": 4.926914691925049, + "epoch": 21 + }, + { + "hidden_norms": [ + 32181.666015625, + 27506424.0, + 8773789.0, + 11014517.0, + 7322481.5 + ], + "bp_grad_norms_per_sample_med": [ + 4.4904634677322974e-08, + 1.1420530077188573e-09, + 1.121353787603141e-09, + 1.124021098419803e-09, + 1.120450510150306e-09 + ], + "bp_grad_norms_F": [ + 8.90475439518923e-06, + 1.1447492909155699e-07, + 6.648813410947696e-08, + 6.533218765980564e-08, + 6.45067217419637e-08 + ], + "gamma_dfa": -0.007374132976110559, + "acc_eval": 0.111328125, + "loss_eval": 5.004192352294922, + "epoch": 22 + }, + { + "hidden_norms": [ + 33471.7265625, + 31266642.0, + 9769161.0, + 12538190.0, + 8328704.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.517446683394155e-08, + 1.0276371975592724e-09, + 1.005762251260478e-09, + 1.0072189748910887e-09, + 1.0049648890841922e-09 + ], + "bp_grad_norms_F": [ + 8.657435500936117e-06, + 1.0238768766157591e-07, + 6.021300436032107e-08, + 5.9172805322305067e-08, + 5.8442100936417773e-08 + ], + "gamma_dfa": -0.006727739999405458, + "acc_eval": 0.1123046875, + "loss_eval": 5.116036415100098, + "epoch": 23 + }, + { + "hidden_norms": [ + 34792.7890625, + 35134068.0, + 11038143.0, + 14059113.0, + 9444097.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.4753964090205045e-08, + 9.320837435211615e-10, + 9.107828935484008e-10, + 9.128516276213361e-10, + 9.105118325969386e-10 + ], + "bp_grad_norms_F": [ + 8.577152584621217e-06, + 9.559200009334745e-08, + 5.512932332862874e-08, + 5.411101611230151e-08, + 5.343352782460897e-08 + ], + "gamma_dfa": -0.00556181388310506, + "acc_eval": 0.1142578125, + "loss_eval": 5.2026848793029785, + "epoch": 24 + }, + { + "hidden_norms": [ + 36056.9921875, + 39258876.0, + 12277943.0, + 15686179.0, + 10635754.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.2437520164639864e-08, + 8.431049747237296e-10, + 8.279052998716452e-10, + 8.256172967513464e-10, + 8.249605998322806e-10 + ], + "bp_grad_norms_F": [ + 8.401701961702202e-06, + 9.383651189409647e-08, + 5.072890729707069e-08, + 4.9743736241225633e-08, + 4.90946696629635e-08 + ], + "gamma_dfa": -0.004373190506157698, + "acc_eval": 0.115234375, + "loss_eval": 5.283636569976807, + "epoch": 25 + }, + { + "hidden_norms": [ + 37332.3203125, + 43838448.0, + 13573116.0, + 17373072.0, + 11853122.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.96461210527832e-08, + 7.721222550216567e-10, + 7.523985323665272e-10, + 7.522342748700339e-10, + 7.507660604311184e-10 + ], + "bp_grad_norms_F": [ + 8.241736395575572e-06, + 8.553880093131738e-08, + 4.659301566789509e-08, + 4.568136446891913e-08, + 4.507716511170656e-08 + ], + "gamma_dfa": -0.003043898326723138, + "acc_eval": 0.1123046875, + "loss_eval": 5.340336322784424, + "epoch": 26 + }, + { + "hidden_norms": [ + 38604.234375, + 48637388.0, + 14943648.0, + 19237954.0, + 13168041.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.845103080379886e-08, + 7.063521434425013e-10, + 6.949120723298563e-10, + 6.971247468179342e-10, + 6.954581355245182e-10 + ], + "bp_grad_norms_F": [ + 8.12488178780768e-06, + 8.518332350604396e-08, + 4.348786220020884e-08, + 4.2559751278758995e-08, + 4.1998429622935873e-08 + ], + "gamma_dfa": -0.0021704566534026526, + "acc_eval": 0.1103515625, + "loss_eval": 5.403829574584961, + "epoch": 27 + }, + { + "hidden_norms": [ + 39856.5078125, + 53569880.0, + 16230254.0, + 21087022.0, + 14556169.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.739526022172868e-08, + 6.497330451438188e-10, + 6.402843810704439e-10, + 6.384167083872683e-10, + 6.366632776533265e-10 + ], + "bp_grad_norms_F": [ + 8.042790796025656e-06, + 7.930053413929272e-08, + 4.0553047142566356e-08, + 3.9663138551304655e-08, + 3.909939749746627e-08 + ], + "gamma_dfa": 0.00027063591551268473, + "acc_eval": 0.11328125, + "loss_eval": 5.486921310424805, + "epoch": 28 + }, + { + "hidden_norms": [ + 41114.66015625, + 59315272.0, + 17822804.0, + 22986032.0, + 16084622.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.655359392951141e-08, + 6.013742281929524e-10, + 5.905386180060646e-10, + 5.911486300469448e-10, + 5.910953393417628e-10 + ], + "bp_grad_norms_F": [ + 7.960659786476754e-06, + 8.031720000190035e-08, + 3.805743276075191e-08, + 3.7164745947393385e-08, + 3.6596219388229656e-08 + ], + "gamma_dfa": 0.0034554791564005427, + "acc_eval": 0.1142578125, + "loss_eval": 5.604689598083496, + "epoch": 29 + }, + { + "hidden_norms": [ + 42325.58984375, + 64740044.0, + 19249378.0, + 25010146.0, + 17657480.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.541291704323157e-08, + 5.539400049769938e-10, + 5.454215967759524e-10, + 5.459841467825299e-10, + 5.440591865912836e-10 + ], + "bp_grad_norms_F": [ + 7.836213626433164e-06, + 7.777267541086985e-08, + 3.578357521405451e-08, + 3.4922344127608085e-08, + 3.437838813624694e-08 + ], + "gamma_dfa": 0.003963275059504667, + "acc_eval": 0.115234375, + "loss_eval": 5.663756370544434, + "epoch": 30 + }, + { + "hidden_norms": [ + 43534.375, + 70424152.0, + 20966526.0, + 27032410.0, + 19126838.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.4974387830288833e-08, + 5.135932235056373e-10, + 5.051635221242634e-10, + 5.056056129326691e-10, + 5.03480979130444e-10 + ], + "bp_grad_norms_F": [ + 7.886262210377026e-06, + 8.217509162022907e-08, + 3.401517645329477e-08, + 3.309881080326704e-08, + 3.255568614690674e-08 + ], + "gamma_dfa": 0.006612789164137212, + "acc_eval": 0.1162109375, + "loss_eval": 5.706640243530273, + "epoch": 31 + }, + { + "hidden_norms": [ + 44720.9453125, + 76344112.0, + 22771320.0, + 29203482.0, + 20864830.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.4229628909088206e-08, + 4.800634334500842e-10, + 4.701866673784139e-10, + 4.693791466614528e-10, + 4.668225250803459e-10 + ], + "bp_grad_norms_F": [ + 7.781368367432151e-06, + 7.414258362814508e-08, + 3.207212984079888e-08, + 3.1193785332561674e-08, + 3.0666903683140845e-08 + ], + "gamma_dfa": 0.008515000299667008, + "acc_eval": 0.1162109375, + "loss_eval": 5.720961093902588, + "epoch": 32 + }, + { + "hidden_norms": [ + 45875.8046875, + 82383720.0, + 24638848.0, + 31558806.0, + 22520176.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.390868030805905e-08, + 4.458567681719927e-10, + 4.385545260277013e-10, + 4.3886239087242984e-10, + 4.3707018559935307e-10 + ], + "bp_grad_norms_F": [ + 7.905513484729454e-06, + 7.275451707755565e-08, + 3.047262708832932e-08, + 2.960254974482268e-08, + 2.9090815090171418e-08 + ], + "gamma_dfa": 0.01025733859205502, + "acc_eval": 0.1142578125, + "loss_eval": 5.7539262771606445, + "epoch": 33 + }, + { + "hidden_norms": [ + 47003.1328125, + 89200944.0, + 26495704.0, + 33934388.0, + 24310298.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.3027241386207606e-08, + 4.1779490977944533e-10, + 4.123023311652929e-10, + 4.1292305685836084e-10, + 4.1066355871421933e-10 + ], + "bp_grad_norms_F": [ + 8.257205990958028e-06, + 7.720848316239426e-08, + 2.8986395506080953e-08, + 2.8067159263400754e-08, + 2.7556911419424068e-08 + ], + "gamma_dfa": 0.012584943462570664, + "acc_eval": 0.11328125, + "loss_eval": 5.796531677246094, + "epoch": 34 + }, + { + "hidden_norms": [ + 48090.08984375, + 95793720.0, + 28464040.0, + 36264388.0, + 26293806.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.217191490989535e-08, + 3.894292666117849e-10, + 3.8594555329396485e-10, + 3.8626962739485293e-10, + 3.8498901289152343e-10 + ], + "bp_grad_norms_F": [ + 8.125247404677793e-06, + 7.330743301281473e-08, + 2.7641750222073824e-08, + 2.6769551908500944e-08, + 2.6268399011541987e-08 + ], + "gamma_dfa": 0.015375214185041841, + "acc_eval": 0.1181640625, + "loss_eval": 5.804059982299805, + "epoch": 35 + }, + { + "hidden_norms": [ + 49138.04296875, + 102879768.0, + 30344818.0, + 38660032.0, + 28092164.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.081565580487222e-08, + 3.644603230323895e-10, + 3.576897944501667e-10, + 3.568374207230107e-10, + 3.5416741761551407e-10 + ], + "bp_grad_norms_F": [ + 8.033912308746949e-06, + 7.398465839969504e-08, + 2.61401691403762e-08, + 2.530256892896432e-08, + 2.481599992165684e-08 + ], + "gamma_dfa": 0.01655786213814281, + "acc_eval": 0.1162109375, + "loss_eval": 5.779043197631836, + "epoch": 36 + }, + { + "hidden_norms": [ + 50205.23828125, + 109785504.0, + 32500932.0, + 40993492.0, + 30124936.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.087046351879508e-08, + 3.450236207847013e-10, + 3.3626229578587186e-10, + 3.3652211572920976e-10, + 3.357169819917516e-10 + ], + "bp_grad_norms_F": [ + 8.317977517435793e-06, + 6.930265783466893e-08, + 2.4881831706125013e-08, + 2.413608513052168e-08, + 2.36848762824593e-08 + ], + "gamma_dfa": 0.01839016478334088, + "acc_eval": 0.1162109375, + "loss_eval": 5.815016746520996, + "epoch": 37 + }, + { + "hidden_norms": [ + 51234.28125, + 116882832.0, + 34622344.0, + 43672052.0, + 32010828.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.011625793192252e-08, + 3.242739410325157e-10, + 3.1924299315200244e-10, + 3.1952127055312474e-10, + 3.181244712102682e-10 + ], + "bp_grad_norms_F": [ + 8.41012479213532e-06, + 7.246134714478103e-08, + 2.3759820777513596e-08, + 2.3049024022725462e-08, + 2.2618014128283903e-08 + ], + "gamma_dfa": 0.019554060958398622, + "acc_eval": 0.1142578125, + "loss_eval": 5.829615116119385, + "epoch": 38 + }, + { + "hidden_norms": [ + 52247.84375, + 124228312.0, + 36552372.0, + 46094684.0, + 33968656.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.024800321327348e-08, + 3.052329222708039e-10, + 3.0248267779420246e-10, + 3.022799510699059e-10, + 3.012357030485191e-10 + ], + "bp_grad_norms_F": [ + 7.947497579152696e-06, + 6.409469932577849e-08, + 2.2781945219207955e-08, + 2.209960925370069e-08, + 2.1678969730487552e-08 + ], + "gamma_dfa": 0.022201491628948133, + "acc_eval": 0.1142578125, + "loss_eval": 5.778614044189453, + "epoch": 39 + }, + { + "hidden_norms": [ + 53254.6640625, + 131932448.0, + 38786720.0, + 48743312.0, + 36026440.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9781913823967443e-08, + 2.8849589384094543e-10, + 2.856256064998064e-10, + 2.8570401600092055e-10, + 2.844837143634038e-10 + ], + "bp_grad_norms_F": [ + 7.602731329825474e-06, + 6.632863147615353e-08, + 2.174161650714268e-08, + 2.107603691570148e-08, + 2.067151072537854e-08 + ], + "gamma_dfa": 0.02325869471678743, + "acc_eval": 0.119140625, + "loss_eval": 5.798803329467773, + "epoch": 40 + }, + { + "hidden_norms": [ + 54228.43359375, + 139390368.0, + 41071128.0, + 51348924.0, + 38183484.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9682835744893055e-08, + 2.752674477246586e-10, + 2.7137878055860654e-10, + 2.716726288376492e-10, + 2.71538042051489e-10 + ], + "bp_grad_norms_F": [ + 7.424123396049254e-06, + 6.37739248077196e-08, + 2.099002749389456e-08, + 2.0336601735948534e-08, + 1.9947020035715468e-08 + ], + "gamma_dfa": 0.024572641068516532, + "acc_eval": 0.119140625, + "loss_eval": 5.8440093994140625, + "epoch": 41 + }, + { + "hidden_norms": [ + 55136.65625, + 147294320.0, + 43301224.0, + 54132172.0, + 40002916.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.0416718033166035e-08, + 2.623444794735974e-10, + 2.586598435438958e-10, + 2.587878522586351e-10, + 2.5755084176459775e-10 + ], + "bp_grad_norms_F": [ + 7.195616944954963e-06, + 5.543640568816954e-08, + 2.0126753597082825e-08, + 1.9496084746606357e-08, + 1.9124053451946565e-08 + ], + "gamma_dfa": 0.026229552553559188, + "acc_eval": 0.1201171875, + "loss_eval": 5.841940879821777, + "epoch": 42 + }, + { + "hidden_norms": [ + 56057.48828125, + 155058496.0, + 45581136.0, + 56721952.0, + 42172944.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9346542973485157e-08, + 2.4918875296542353e-10, + 2.4687848987348104e-10, + 2.470146309718757e-10, + 2.4589502656269246e-10 + ], + "bp_grad_norms_F": [ + 7.236937562993262e-06, + 4.957384902581907e-08, + 1.9364815528888357e-08, + 1.8756255215635065e-08, + 1.840485097659439e-08 + ], + "gamma_dfa": 0.027025546743971063, + "acc_eval": 0.12109375, + "loss_eval": 5.79724645614624, + "epoch": 43 + }, + { + "hidden_norms": [ + 56951.0546875, + 163286592.0, + 47715684.0, + 59381272.0, + 44453996.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9479124918907473e-08, + 2.39016806347081e-10, + 2.3503707313743405e-10, + 2.33648544956111e-10, + 2.335798499064623e-10 + ], + "bp_grad_norms_F": [ + 7.3719347710721195e-06, + 5.521000900898798e-08, + 1.8681236113593513e-08, + 1.8048309513574168e-08, + 1.7682033615074033e-08 + ], + "gamma_dfa": 0.02818910058704205, + "acc_eval": 0.1181640625, + "loss_eval": 5.779097080230713, + "epoch": 44 + }, + { + "hidden_norms": [ + 57889.91015625, + 171572336.0, + 49962976.0, + 62099764.0, + 46403104.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.00151405951965e-08, + 2.294373580014053e-10, + 2.2455036441382248e-10, + 2.2508651886798958e-10, + 2.2402991961545382e-10 + ], + "bp_grad_norms_F": [ + 7.484923116862774e-06, + 5.0286196540128e-08, + 1.8117480848900414e-08, + 1.7483015923858147e-08, + 1.7114837547183015e-08 + ], + "gamma_dfa": 0.029963871067593573, + "acc_eval": 0.1220703125, + "loss_eval": 5.8359575271606445, + "epoch": 45 + }, + { + "hidden_norms": [ + 58731.421875, + 180056896.0, + 52137220.0, + 64717056.0, + 48647116.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.929727926925807e-08, + 2.1976008512947232e-10, + 2.159663420320257e-10, + 2.163312862180078e-10, + 2.1587925891353166e-10 + ], + "bp_grad_norms_F": [ + 7.681007446080912e-06, + 5.031828109736125e-08, + 1.7532725493651924e-08, + 1.6936246183263393e-08, + 1.659478598980968e-08 + ], + "gamma_dfa": 0.03088831547938753, + "acc_eval": 0.1220703125, + "loss_eval": 5.786240100860596, + "epoch": 46 + }, + { + "hidden_norms": [ + 59567.96875, + 187949040.0, + 54233264.0, + 67384816.0, + 50735356.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.870891080419824e-08, + 2.1069677946794485e-10, + 2.057157916235397e-10, + 2.0573617809382938e-10, + 2.051469827346608e-10 + ], + "bp_grad_norms_F": [ + 7.31024283595616e-06, + 4.820083177037304e-08, + 1.691453910268592e-08, + 1.6327849294839325e-08, + 1.5993451896179067e-08 + ], + "gamma_dfa": 0.03192764806590276, + "acc_eval": 0.119140625, + "loss_eval": 5.707631587982178, + "epoch": 47 + }, + { + "hidden_norms": [ + 60402.91796875, + 196285488.0, + 56440304.0, + 70085304.0, + 52941472.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8424729237030988e-08, + 2.033633955678127e-10, + 1.9889993818633656e-10, + 1.9922237470826332e-10, + 1.9868894030050654e-10 + ], + "bp_grad_norms_F": [ + 7.644263860129286e-06, + 4.852574519986774e-08, + 1.6383141954179337e-08, + 1.581754283108694e-08, + 1.548989914113008e-08 + ], + "gamma_dfa": 0.033413520381145645, + "acc_eval": 0.1220703125, + "loss_eval": 5.704823017120361, + "epoch": 48 + }, + { + "hidden_norms": [ + 61196.53515625, + 204414672.0, + 58842936.0, + 72912304.0, + 55068312.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.859230185947581e-08, + 1.9821513874695995e-10, + 1.9266777062654228e-10, + 1.9288849684162557e-10, + 1.9265547490654455e-10 + ], + "bp_grad_norms_F": [ + 7.879517397668678e-06, + 4.184777324667266e-08, + 1.6105406785982268e-08, + 1.550557016116727e-08, + 1.5175970702330233e-08 + ], + "gamma_dfa": 0.034091180186806014, + "acc_eval": 0.1201171875, + "loss_eval": 5.725862979888916, + "epoch": 49 + }, + { + "hidden_norms": [ + 61914.14453125, + 212112608.0, + 61176224.0, + 75542504.0, + 57474876.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8669807861092522e-08, + 1.8937640344773854e-10, + 1.8534798695846177e-10, + 1.855716413867725e-10, + 1.852704378801917e-10 + ], + "bp_grad_norms_F": [ + 8.087788955890574e-06, + 4.2019124180114886e-08, + 1.5675068354426003e-08, + 1.5084628657291432e-08, + 1.4754542476680399e-08 + ], + "gamma_dfa": 0.034466555964172585, + "acc_eval": 0.1201171875, + "loss_eval": 5.820840358734131, + "epoch": 50 + }, + { + "hidden_norms": [ + 62603.82421875, + 219453520.0, + 63197896.0, + 78229512.0, + 59644488.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9210220020559063e-08, + 1.8399998191753753e-10, + 1.7923225403837506e-10, + 1.792543474765651e-10, + 1.785920855645884e-10 + ], + "bp_grad_norms_F": [ + 8.000329216883983e-06, + 4.107307916001446e-08, + 1.5165383615567407e-08, + 1.4602372644390016e-08, + 1.4272954373950597e-08 + ], + "gamma_dfa": 0.035090556057184585, + "acc_eval": 0.12109375, + "loss_eval": 5.784890174865723, + "epoch": 51 + }, + { + "hidden_norms": [ + 63365.48828125, + 227326704.0, + 65434160.0, + 80771200.0, + 61832948.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9006677948473225e-08, + 1.7990454959093682e-10, + 1.7418685938075384e-10, + 1.7404670760168273e-10, + 1.7386522777051994e-10 + ], + "bp_grad_norms_F": [ + 8.04007868282497e-06, + 3.7175201583750095e-08, + 1.4899267597456856e-08, + 1.4325389763314433e-08, + 1.4007627946455159e-08 + ], + "gamma_dfa": 0.035336821872988367, + "acc_eval": 0.12109375, + "loss_eval": 5.837845802307129, + "epoch": 52 + }, + { + "hidden_norms": [ + 64122.77734375, + 235505280.0, + 67571832.0, + 83154408.0, + 63815212.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8882961800036355e-08, + 1.752420292211454e-10, + 1.6966168747689636e-10, + 1.6997936391760504e-10, + 1.6931231416883463e-10 + ], + "bp_grad_norms_F": [ + 7.732651283731684e-06, + 3.6642365586203596e-08, + 1.4491905453439813e-08, + 1.39411024946412e-08, + 1.3628048911584756e-08 + ], + "gamma_dfa": 0.035559086416469654, + "acc_eval": 0.12109375, + "loss_eval": 5.813376426696777, + "epoch": 53 + }, + { + "hidden_norms": [ + 64808.83203125, + 243721104.0, + 69766352.0, + 85766896.0, + 65980356.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8568885923618836e-08, + 1.6757319143412275e-10, + 1.6364704036320177e-10, + 1.6374304689925623e-10, + 1.6309503747535814e-10 + ], + "bp_grad_norms_F": [ + 7.502960215788335e-06, + 3.409801507814336e-08, + 1.4090593580817767e-08, + 1.3566921808205734e-08, + 1.3258036446472943e-08 + ], + "gamma_dfa": 0.03633021883433685, + "acc_eval": 0.12109375, + "loss_eval": 5.748073101043701, + "epoch": 54 + }, + { + "hidden_norms": [ + 65405.05078125, + 251434864.0, + 71765544.0, + 88222840.0, + 68040816.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8620791070466112e-08, + 1.6591342189009595e-10, + 1.611620559227589e-10, + 1.6055762275257734e-10, + 1.6039196359951546e-10 + ], + "bp_grad_norms_F": [ + 7.535967142757727e-06, + 3.341937571121889e-08, + 1.3891366279494832e-08, + 1.3369996665346662e-08, + 1.3064806125839823e-08 + ], + "gamma_dfa": 0.037189101487456355, + "acc_eval": 0.1220703125, + "loss_eval": 5.769567966461182, + "epoch": 55 + }, + { + "hidden_norms": [ + 65975.4296875, + 259364544.0, + 73868528.0, + 90804584.0, + 70148048.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8815582808761064e-08, + 1.6121720625150715e-10, + 1.5669744668489471e-10, + 1.568625784820199e-10, + 1.56342438994983e-10 + ], + "bp_grad_norms_F": [ + 7.530327820859384e-06, + 2.989135694519973e-08, + 1.3588412173248798e-08, + 1.308291253110383e-08, + 1.2791012693469384e-08 + ], + "gamma_dfa": 0.037349180958699435, + "acc_eval": 0.1201171875, + "loss_eval": 5.802239418029785, + "epoch": 56 + }, + { + "hidden_norms": [ + 66535.546875, + 267235600.0, + 75921592.0, + 93206176.0, + 72113992.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8679746577608967e-08, + 1.5684299692342307e-10, + 1.530628263024525e-10, + 1.5322397517447683e-10, + 1.5271124642612932e-10 + ], + "bp_grad_norms_F": [ + 7.578343684144784e-06, + 2.8776035776445497e-08, + 1.3372356555407805e-08, + 1.2855631226216246e-08, + 1.2555028128247159e-08 + ], + "gamma_dfa": 0.03780493976228172, + "acc_eval": 0.1201171875, + "loss_eval": 5.850732803344727, + "epoch": 57 + }, + { + "hidden_norms": [ + 67107.3125, + 274158304.0, + 77594136.0, + 95315520.0, + 73880288.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9038343285492374e-08, + 1.5442255807407435e-10, + 1.5004263109741345e-10, + 1.5028490951696227e-10, + 1.4968959405337046e-10 + ], + "bp_grad_norms_F": [ + 7.555737283837516e-06, + 3.160908335075874e-08, + 1.3153115929753767e-08, + 1.2644002289619038e-08, + 1.2345022781801163e-08 + ], + "gamma_dfa": 0.03859367490440491, + "acc_eval": 0.12109375, + "loss_eval": 5.83157205581665, + "epoch": 58 + }, + { + "hidden_norms": [ + 67633.5703125, + 281346784.0, + 79395712.0, + 97521760.0, + 75716480.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8924493022941533e-08, + 1.5015137744267548e-10, + 1.4681762749990668e-10, + 1.469668414744163e-10, + 1.4640397227871915e-10 + ], + "bp_grad_norms_F": [ + 7.076869223965332e-06, + 3.03394500633658e-08, + 1.2924256331814377e-08, + 1.2421836004250508e-08, + 1.2128483106721433e-08 + ], + "gamma_dfa": 0.03882967439312779, + "acc_eval": 0.1201171875, + "loss_eval": 5.850924491882324, + "epoch": 59 + }, + { + "hidden_norms": [ + 68127.2578125, + 288068512.0, + 81019736.0, + 99671120.0, + 77532304.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.900766915558961e-08, + 1.4631622302641034e-10, + 1.434221075236053e-10, + 1.4353812582967862e-10, + 1.428595158836643e-10 + ], + "bp_grad_norms_F": [ + 7.026245839369949e-06, + 3.037761331370348e-08, + 1.2673269544904997e-08, + 1.216829925709817e-08, + 1.1867063776094255e-08 + ], + "gamma_dfa": 0.039077571367670316, + "acc_eval": 0.119140625, + "loss_eval": 5.843035697937012, + "epoch": 60 + }, + { + "hidden_norms": [ + 68607.2890625, + 295220896.0, + 83038584.0, + 101714504.0, + 79438864.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.889952988027744e-08, + 1.4436063455747217e-10, + 1.410637162635453e-10, + 1.4117192137508283e-10, + 1.405108668306454e-10 + ], + "bp_grad_norms_F": [ + 6.8223289417801425e-06, + 2.9571756599011678e-08, + 1.237319757763089e-08, + 1.1902468344260342e-08, + 1.1619527562345411e-08 + ], + "gamma_dfa": 0.0394883609842509, + "acc_eval": 0.119140625, + "loss_eval": 5.8329925537109375, + "epoch": 61 + }, + { + "hidden_norms": [ + 69038.0703125, + 302174528.0, + 84795640.0, + 103621440.0, + 81134560.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8758867287592693e-08, + 1.4096314393530207e-10, + 1.380290187702471e-10, + 1.3813312993438132e-10, + 1.3748156779680443e-10 + ], + "bp_grad_norms_F": [ + 6.821945589763345e-06, + 2.9822015079616904e-08, + 1.2211526900784975e-08, + 1.1739270888710962e-08, + 1.1454956982959175e-08 + ], + "gamma_dfa": 0.03950453496872797, + "acc_eval": 0.1201171875, + "loss_eval": 5.862898826599121, + "epoch": 62 + }, + { + "hidden_norms": [ + 69486.8671875, + 308758272.0, + 86559352.0, + 105690288.0, + 82830320.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.880081950706881e-08, + 1.381648684350978e-10, + 1.3562810596834396e-10, + 1.3572509782733277e-10, + 1.3508719143295878e-10 + ], + "bp_grad_norms_F": [ + 6.841747108410345e-06, + 3.094388745239485e-08, + 1.2084786504829026e-08, + 1.1623659368353856e-08, + 1.1344519990075241e-08 + ], + "gamma_dfa": 0.03953796969653922, + "acc_eval": 0.1181640625, + "loss_eval": 5.886589527130127, + "epoch": 63 + }, + { + "hidden_norms": [ + 69910.8515625, + 314931680.0, + 87987448.0, + 107443096.0, + 84227784.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8549854036441502e-08, + 1.3562842515746354e-10, + 1.3309958690754797e-10, + 1.3318925129457426e-10, + 1.32547681164219e-10 + ], + "bp_grad_norms_F": [ + 6.486627626145491e-06, + 3.26463052147119e-08, + 1.1863860116534397e-08, + 1.1407089495207856e-08, + 1.112555558790973e-08 + ], + "gamma_dfa": 0.040154138219804736, + "acc_eval": 0.12109375, + "loss_eval": 5.841930389404297, + "epoch": 64 + }, + { + "hidden_norms": [ + 70309.921875, + 320869664.0, + 89479256.0, + 109445496.0, + 85720672.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8119913508817262e-08, + 1.333930049751686e-10, + 1.311449004948173e-10, + 1.3122899988893266e-10, + 1.306234981290899e-10 + ], + "bp_grad_norms_F": [ + 6.1845657910453156e-06, + 3.1657755528158305e-08, + 1.1685694190077811e-08, + 1.1245842479468138e-08, + 1.0970555130995763e-08 + ], + "gamma_dfa": 0.04057217295485316, + "acc_eval": 0.1181640625, + "loss_eval": 5.787144184112549, + "epoch": 65 + }, + { + "hidden_norms": [ + 70717.453125, + 326733312.0, + 90990512.0, + 111385000.0, + 87145456.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.868856441295975e-08, + 1.3173599711091555e-10, + 1.290058199154842e-10, + 1.2908775437470155e-10, + 1.284874151519233e-10 + ], + "bp_grad_norms_F": [ + 6.056342499505263e-06, + 3.0463933597957293e-08, + 1.1565422397552538e-08, + 1.1122933685214775e-08, + 1.0847451825668486e-08 + ], + "gamma_dfa": 0.040889364270697115, + "acc_eval": 0.119140625, + "loss_eval": 5.847908020019531, + "epoch": 66 + }, + { + "hidden_norms": [ + 71084.71875, + 332338880.0, + 92455056.0, + 113026960.0, + 88541256.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7999890406249506e-08, + 1.2975863439290691e-10, + 1.2677238425684578e-10, + 1.268507521245965e-10, + 1.2626712175833887e-10 + ], + "bp_grad_norms_F": [ + 5.962062004982727e-06, + 2.9298774961716845e-08, + 1.14416129903816e-08, + 1.1010567568803253e-08, + 1.0736493472052189e-08 + ], + "gamma_dfa": 0.040890415915782796, + "acc_eval": 0.1201171875, + "loss_eval": 5.816187381744385, + "epoch": 67 + }, + { + "hidden_norms": [ + 71436.84375, + 337832864.0, + 93879264.0, + 114665400.0, + 89926616.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7683153547286565e-08, + 1.2797991832957933e-10, + 1.2511817970572991e-10, + 1.2518648617731998e-10, + 1.246210634686662e-10 + ], + "bp_grad_norms_F": [ + 5.7771489991864655e-06, + 2.8285153774731953e-08, + 1.1245044895247247e-08, + 1.0827025498372223e-08, + 1.0562406060898866e-08 + ], + "gamma_dfa": 0.04072478835223592, + "acc_eval": 0.1201171875, + "loss_eval": 5.783463478088379, + "epoch": 68 + }, + { + "hidden_norms": [ + 71769.5546875, + 342918304.0, + 95263584.0, + 116254568.0, + 91446520.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.775840357571724e-08, + 1.2646382552272684e-10, + 1.2334086529897093e-10, + 1.2337944554907665e-10, + 1.2288142725580542e-10 + ], + "bp_grad_norms_F": [ + 5.667419827659614e-06, + 2.6888709925287912e-08, + 1.1133559851828068e-08, + 1.0716635578944533e-08, + 1.0457153365450722e-08 + ], + "gamma_dfa": 0.040744281255683745, + "acc_eval": 0.1201171875, + "loss_eval": 5.804702281951904, + "epoch": 69 + }, + { + "hidden_norms": [ + 72080.078125, + 347772576.0, + 96482160.0, + 117685240.0, + 92638296.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8613341029881667e-08, + 1.2489977108121053e-10, + 1.2201274712797527e-10, + 1.220573642157774e-10, + 1.2148008987633574e-10 + ], + "bp_grad_norms_F": [ + 5.642392352456227e-06, + 2.7134319680044428e-08, + 1.1023663759601732e-08, + 1.0605543110386861e-08, + 1.034114660569685e-08 + ], + "gamma_dfa": 0.04128229359048419, + "acc_eval": 0.1201171875, + "loss_eval": 5.805394172668457, + "epoch": 70 + }, + { + "hidden_norms": [ + 72369.9921875, + 352377056.0, + 97691240.0, + 119151816.0, + 93761800.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8514245187238885e-08, + 1.2353804090814435e-10, + 1.2041069530344117e-10, + 1.2046977304613904e-10, + 1.1990240744719216e-10 + ], + "bp_grad_norms_F": [ + 5.6565527302154806e-06, + 2.8678897479039733e-08, + 1.0947891482260275e-08, + 1.0533200978102286e-08, + 1.0270048811378274e-08 + ], + "gamma_dfa": 0.04154024633317022, + "acc_eval": 0.119140625, + "loss_eval": 5.7999067306518555, + "epoch": 71 + }, + { + "hidden_norms": [ + 72651.671875, + 356846048.0, + 98782024.0, + 120475080.0, + 94848032.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8226885717685946e-08, + 1.221410056428951e-10, + 1.1935313848354667e-10, + 1.193777160457543e-10, + 1.1868718508001308e-10 + ], + "bp_grad_norms_F": [ + 5.597235940513201e-06, + 2.7164126947809564e-08, + 1.078571720825039e-08, + 1.038548358422986e-08, + 1.0128220928606879e-08 + ], + "gamma_dfa": 0.041652156607597135, + "acc_eval": 0.119140625, + "loss_eval": 5.782708168029785, + "epoch": 72 + }, + { + "hidden_norms": [ + 72915.9765625, + 361214752.0, + 99899064.0, + 121794264.0, + 95956256.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8156543763202535e-08, + 1.208296795951469e-10, + 1.1789087761560069e-10, + 1.1794409893184366e-10, + 1.1745009131924888e-10 + ], + "bp_grad_norms_F": [ + 5.609212166746147e-06, + 2.767807316672588e-08, + 1.074356958952194e-08, + 1.0335670985739398e-08, + 1.007653693818611e-08 + ], + "gamma_dfa": 0.041388919182281825, + "acc_eval": 0.1171875, + "loss_eval": 5.816926956176758, + "epoch": 73 + }, + { + "hidden_norms": [ + 73160.8984375, + 365176576.0, + 100896352.0, + 123055840.0, + 96952304.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8052935974187676e-08, + 1.2002213112261018e-10, + 1.1708690961231838e-10, + 1.1711043246265262e-10, + 1.1664859356219637e-10 + ], + "bp_grad_norms_F": [ + 5.528850579139544e-06, + 2.6534554109503006e-08, + 1.062906651583262e-08, + 1.0228863978056779e-08, + 9.976772297193293e-09 + ], + "gamma_dfa": 0.04158145491965115, + "acc_eval": 0.1201171875, + "loss_eval": 5.83203125, + "epoch": 74 + }, + { + "hidden_norms": [ + 73388.9921875, + 369039872.0, + 101870976.0, + 124229664.0, + 97872176.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.811547972214612e-08, + 1.1867723470615488e-10, + 1.160038107239636e-10, + 1.1605346544873996e-10, + 1.1549688982981365e-10 + ], + "bp_grad_norms_F": [ + 5.516625151358312e-06, + 2.6522718243882082e-08, + 1.0559543461852172e-08, + 1.0160210450749219e-08, + 9.905477327265544e-09 + ], + "gamma_dfa": 0.04162494709453313, + "acc_eval": 0.1181640625, + "loss_eval": 5.825821876525879, + "epoch": 75 + }, + { + "hidden_norms": [ + 73607.875, + 372436096.0, + 102747608.0, + 125356400.0, + 98735744.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8296041065800637e-08, + 1.1797214594100325e-10, + 1.1553259737784316e-10, + 1.1555564144449804e-10, + 1.148080935875484e-10 + ], + "bp_grad_norms_F": [ + 5.4743991313443985e-06, + 2.5615005228019072e-08, + 1.0501097769122225e-08, + 1.0109610926178902e-08, + 9.859975946824306e-09 + ], + "gamma_dfa": 0.04183118613582337, + "acc_eval": 0.1171875, + "loss_eval": 5.838399887084961, + "epoch": 76 + }, + { + "hidden_norms": [ + 73806.21875, + 375504928.0, + 103559744.0, + 126298048.0, + 99592752.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8072012270285995e-08, + 1.16896228807839e-10, + 1.1455134063531602e-10, + 1.1459744958530749e-10, + 1.1405828365118609e-10 + ], + "bp_grad_norms_F": [ + 5.35501703780028e-06, + 2.4375134799470288e-08, + 1.0415713624922773e-08, + 1.0033582853452572e-08, + 9.78571357279634e-09 + ], + "gamma_dfa": 0.04175542373559438, + "acc_eval": 0.1181640625, + "loss_eval": 5.806183815002441, + "epoch": 77 + }, + { + "hidden_norms": [ + 73982.1328125, + 378528768.0, + 104296416.0, + 127198352.0, + 100364600.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.802979714999765e-08, + 1.1618311174244056e-10, + 1.1359845702996196e-10, + 1.1364404556291063e-10, + 1.1310929276531212e-10 + ], + "bp_grad_norms_F": [ + 5.359067017707275e-06, + 2.4563517442288685e-08, + 1.0355730495348325e-08, + 9.969440384338668e-09, + 9.722052496385913e-09 + ], + "gamma_dfa": 0.041852476922940696, + "acc_eval": 0.1171875, + "loss_eval": 5.812763690948486, + "epoch": 78 + }, + { + "hidden_norms": [ + 74143.3515625, + 381338400.0, + 104995776.0, + 128103664.0, + 101143248.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.803018084307496e-08, + 1.1504715929921971e-10, + 1.1309976566398205e-10, + 1.1314182923882754e-10, + 1.1259981835820554e-10 + ], + "bp_grad_norms_F": [ + 5.305423201207304e-06, + 2.479905347740896e-08, + 1.0304642472647174e-08, + 9.922130672634921e-09, + 9.675199308389892e-09 + ], + "gamma_dfa": 0.04194222000660375, + "acc_eval": 0.1201171875, + "loss_eval": 5.790335655212402, + "epoch": 79 + }, + { + "hidden_norms": [ + 74296.140625, + 383779872.0, + 105624680.0, + 128832568.0, + 101739872.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8086292402917934e-08, + 1.1405020677868194e-10, + 1.1259575216637785e-10, + 1.126363308179279e-10, + 1.121035694828798e-10 + ], + "bp_grad_norms_F": [ + 5.285005499899853e-06, + 2.497140805246545e-08, + 1.0247953596831394e-08, + 9.865908978667903e-09, + 9.618767116137406e-09 + ], + "gamma_dfa": 0.042092169023817405, + "acc_eval": 0.1201171875, + "loss_eval": 5.78256893157959, + "epoch": 80 + }, + { + "hidden_norms": [ + 74432.171875, + 386197824.0, + 106270032.0, + 129540264.0, + 102336408.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8129701235002358e-08, + 1.1369888364143321e-10, + 1.1195557675369727e-10, + 1.1199620397750465e-10, + 1.1146324141453334e-10 + ], + "bp_grad_norms_F": [ + 5.2314603635750245e-06, + 2.418116018532146e-08, + 1.0211192780218425e-08, + 9.833079239740528e-09, + 9.588974059226985e-09 + ], + "gamma_dfa": 0.0422149248624919, + "acc_eval": 0.1201171875, + "loss_eval": 5.794626235961914, + "epoch": 81 + }, + { + "hidden_norms": [ + 74557.1328125, + 388309664.0, + 106804240.0, + 130160096.0, + 102871888.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8006962082827158e-08, + 1.1333335658836319e-10, + 1.1151064099879093e-10, + 1.1155010942731636e-10, + 1.1102004732199688e-10 + ], + "bp_grad_norms_F": [ + 5.231111572356895e-06, + 2.3960881279094792e-08, + 1.0185694065967255e-08, + 9.808036161018663e-09, + 9.561717639883227e-09 + ], + "gamma_dfa": 0.042091405965038575, + "acc_eval": 0.1201171875, + "loss_eval": 5.809223175048828, + "epoch": 82 + }, + { + "hidden_norms": [ + 74670.6484375, + 390046144.0, + 107241528.0, + 130709072.0, + 103311792.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.80954566278524e-08, + 1.1238011909942003e-10, + 1.1107993691528151e-10, + 1.1111822573184327e-10, + 1.1058326476742764e-10 + ], + "bp_grad_norms_F": [ + 5.195881840336369e-06, + 2.3944403793052516e-08, + 1.0142765738407888e-08, + 9.765725117460988e-09, + 9.519601995577887e-09 + ], + "gamma_dfa": 0.042151874920818955, + "acc_eval": 0.1201171875, + "loss_eval": 5.789272785186768, + "epoch": 83 + }, + { + "hidden_norms": [ + 74771.78125, + 391740192.0, + 107714400.0, + 131203208.0, + 103730008.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8205375812717648e-08, + 1.1187289983283222e-10, + 1.1065893340544974e-10, + 1.106964936381516e-10, + 1.1018032319842774e-10 + ], + "bp_grad_norms_F": [ + 5.16868840350071e-06, + 2.363896278723132e-08, + 1.0106472991822102e-08, + 9.731052408312735e-09, + 9.487330032698083e-09 + ], + "gamma_dfa": 0.042111018407013034, + "acc_eval": 0.1201171875, + "loss_eval": 5.778679847717285, + "epoch": 84 + }, + { + "hidden_norms": [ + 74860.828125, + 393210464.0, + 108154200.0, + 131674336.0, + 104148832.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8289822040505896e-08, + 1.1139363043088935e-10, + 1.1020819673523974e-10, + 1.1024554186223057e-10, + 1.0972771996575759e-10 + ], + "bp_grad_norms_F": [ + 5.15709007231635e-06, + 2.3636799184600932e-08, + 1.008097960664145e-08, + 9.703811088002112e-09, + 9.460902283819905e-09 + ], + "gamma_dfa": 0.04205825741155422, + "acc_eval": 0.1201171875, + "loss_eval": 5.787901878356934, + "epoch": 85 + }, + { + "hidden_norms": [ + 74942.4453125, + 394569024.0, + 108544648.0, + 132082208.0, + 104483976.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8258760664812144e-08, + 1.1120066673031559e-10, + 1.0991466070642275e-10, + 1.0995130500512929e-10, + 1.0943435047039429e-10 + ], + "bp_grad_norms_F": [ + 5.150290235178545e-06, + 2.3486826705720887e-08, + 1.0058711197302728e-08, + 9.684677060306512e-09, + 9.442134185633222e-09 + ], + "gamma_dfa": 0.042173042878857814, + "acc_eval": 0.119140625, + "loss_eval": 5.789056301116943, + "epoch": 86 + }, + { + "hidden_norms": [ + 75009.5703125, + 395748704.0, + 108812392.0, + 132420432.0, + 104755352.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.825358436098213e-08, + 1.1081059680950744e-10, + 1.0968410901757153e-10, + 1.0972003861020596e-10, + 1.0920536697156535e-10 + ], + "bp_grad_norms_F": [ + 5.127661552251084e-06, + 2.3339271848499266e-08, + 1.002943950112467e-08, + 9.659677502327213e-09, + 9.417544966083824e-09 + ], + "gamma_dfa": 0.04217808429893921, + "acc_eval": 0.1201171875, + "loss_eval": 5.776318550109863, + "epoch": 87 + }, + { + "hidden_norms": [ + 75066.4921875, + 396774016.0, + 109070288.0, + 132708432.0, + 105002960.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.824552858271545e-08, + 1.1050411280466577e-10, + 1.0939484040850544e-10, + 1.0943065897883741e-10, + 1.0891805513058017e-10 + ], + "bp_grad_norms_F": [ + 5.1081005949527025e-06, + 2.2895029871961015e-08, + 1.0016128371148625e-08, + 9.644456788748812e-09, + 9.40405175953174e-09 + ], + "gamma_dfa": 0.04221886159211863, + "acc_eval": 0.1201171875, + "loss_eval": 5.782362937927246, + "epoch": 88 + }, + { + "hidden_norms": [ + 75117.3984375, + 397629600.0, + 109292216.0, + 132974672.0, + 105237816.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8004475183251998e-08, + 1.1032175173397718e-10, + 1.092313739459172e-10, + 1.092670676161589e-10, + 1.0875097350426799e-10 + ], + "bp_grad_norms_F": [ + 5.101501756143989e-06, + 2.2761090789913396e-08, + 9.993788907536327e-09, + 9.627679986579096e-09, + 9.387123967030675e-09 + ], + "gamma_dfa": 0.04218835258870968, + "acc_eval": 0.119140625, + "loss_eval": 5.786335468292236, + "epoch": 89 + }, + { + "hidden_norms": [ + 75159.3515625, + 398356864.0, + 109470496.0, + 133184088.0, + 105416456.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.806424248547046e-08, + 1.1018109341565108e-10, + 1.0910816694575942e-10, + 1.0914344428236689e-10, + 1.0862655219767703e-10 + ], + "bp_grad_norms_F": [ + 5.100384441902861e-06, + 2.2749302885927136e-08, + 9.977647152936697e-09, + 9.612988627338837e-09, + 9.37321864569185e-09 + ], + "gamma_dfa": 0.04216382784579764, + "acc_eval": 0.1201171875, + "loss_eval": 5.787578582763672, + "epoch": 90 + }, + { + "hidden_norms": [ + 75196.53125, + 398958272.0, + 109628448.0, + 133366784.0, + 105577720.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8093891657476888e-08, + 1.0998777583148822e-10, + 1.0895360308404989e-10, + 1.0898840857587189e-10, + 1.084766096393075e-10 + ], + "bp_grad_norms_F": [ + 5.099497684568632e-06, + 2.276015820257271e-08, + 9.975322790012342e-09, + 9.609090412254773e-09, + 9.369199638342707e-09 + ], + "gamma_dfa": 0.0421357955710846, + "acc_eval": 0.1201171875, + "loss_eval": 5.788777828216553, + "epoch": 91 + }, + { + "hidden_norms": [ + 75225.75, + 399436800.0, + 109753008.0, + 133503392.0, + 105709880.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7958691362073296e-08, + 1.098953844591577e-10, + 1.0885654877501594e-10, + 1.0889117385559643e-10, + 1.0837702263399862e-10 + ], + "bp_grad_norms_F": [ + 5.099244390294189e-06, + 2.2776946551061883e-08, + 9.965032354841696e-09, + 9.599201433729831e-09, + 9.359114372387012e-09 + ], + "gamma_dfa": 0.04213721772248391, + "acc_eval": 0.1201171875, + "loss_eval": 5.787423133850098, + "epoch": 92 + }, + { + "hidden_norms": [ + 75247.3671875, + 399815808.0, + 109848648.0, + 133619136.0, + 105800656.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.813173693994031e-08, + 1.0978142006567992e-10, + 1.0878217771015386e-10, + 1.0881660156281114e-10, + 1.0830317198617934e-10 + ], + "bp_grad_norms_F": [ + 5.097780103824334e-06, + 2.278613919770578e-08, + 9.958157853873217e-09, + 9.592699079519207e-09, + 9.35304633742362e-09 + ], + "gamma_dfa": 0.042139860528550344, + "acc_eval": 0.1201171875, + "loss_eval": 5.78769588470459, + "epoch": 93 + }, + { + "hidden_norms": [ + 75264.9921875, + 400121888.0, + 109927240.0, + 133712496.0, + 105877656.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8044253141956688e-08, + 1.0970312158686824e-10, + 1.0871267774881233e-10, + 1.0874703221253057e-10, + 1.0823512919255762e-10 + ], + "bp_grad_norms_F": [ + 5.0932972044392955e-06, + 2.2714601755069452e-08, + 9.954023383329513e-09, + 9.589306237955952e-09, + 9.350141105812781e-09 + ], + "gamma_dfa": 0.04215262952493504, + "acc_eval": 0.1201171875, + "loss_eval": 5.787428379058838, + "epoch": 94 + }, + { + "hidden_norms": [ + 75277.7421875, + 400340192.0, + 109981456.0, + 133783368.0, + 105935424.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8024039977481152e-08, + 1.0965856001021734e-10, + 1.0866757493843693e-10, + 1.0870188776879175e-10, + 1.0818954065960895e-10 + ], + "bp_grad_norms_F": [ + 5.093556865176652e-06, + 2.269677956689975e-08, + 9.948016632677081e-09, + 9.583557947223653e-09, + 9.344440776715146e-09 + ], + "gamma_dfa": 0.04216338234982686, + "acc_eval": 0.1201171875, + "loss_eval": 5.787187099456787, + "epoch": 95 + }, + { + "hidden_norms": [ + 75285.703125, + 400477120.0, + 110015360.0, + 133823992.0, + 105968568.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7959323745108122e-08, + 1.096286394997037e-10, + 1.0863549643191917e-10, + 1.0866971211775933e-10, + 1.0815728868074359e-10 + ], + "bp_grad_norms_F": [ + 5.094433618069161e-06, + 2.2707608238192734e-08, + 9.945019030510593e-09, + 9.580433335543148e-09, + 9.341129647566504e-09 + ], + "gamma_dfa": 0.04217854590388015, + "acc_eval": 0.1201171875, + "loss_eval": 5.785982608795166, + "epoch": 96 + }, + { + "hidden_norms": [ + 75289.953125, + 400549248.0, + 110035048.0, + 133846800.0, + 105987544.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7980583183762064e-08, + 1.0960886365207756e-10, + 1.0861883614765588e-10, + 1.0865301020013263e-10, + 1.0814063533537421e-10 + ], + "bp_grad_norms_F": [ + 5.094651896797586e-06, + 2.2699452983943047e-08, + 9.943881273954958e-09, + 9.579290249916994e-09, + 9.340033635396594e-09 + ], + "gamma_dfa": 0.04217962139227893, + "acc_eval": 0.1201171875, + "loss_eval": 5.78618860244751, + "epoch": 97 + }, + { + "hidden_norms": [ + 75293.8203125, + 400615232.0, + 110052384.0, + 133866488.0, + 106003008.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.800710419137431e-08, + 1.0960048146824164e-10, + 1.0860957966318807e-10, + 1.0864373983787701e-10, + 1.0813145517873934e-10 + ], + "bp_grad_norms_F": [ + 5.094465905131074e-06, + 2.2699449431229368e-08, + 9.942947798435853e-09, + 9.578524640119213e-09, + 9.339320428125575e-09 + ], + "gamma_dfa": 0.04218013053832692, + "acc_eval": 0.1201171875, + "loss_eval": 5.786159515380859, + "epoch": 98 + }, + { + "hidden_norms": [ + 75295.7109375, + 400646048.0, + 110060248.0, + 133875320.0, + 106009248.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8009079500179723e-08, + 1.0959386176345731e-10, + 1.0860166238524371e-10, + 1.0863580868214484e-10, + 1.0812370443424868e-10 + ], + "bp_grad_norms_F": [ + 5.094112111692084e-06, + 2.26939054215336e-08, + 9.942577428034838e-09, + 9.578169368751333e-09, + 9.33901134203552e-09 + ], + "gamma_dfa": 0.042181356100627454, + "acc_eval": 0.1201171875, + "loss_eval": 5.786299705505371, + "epoch": 99 + }, + { + "hidden_norms": [ + 75295.7421875, + 400646208.0, + 110060504.0, + 133875616.0, + 106009536.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.8005374019812734e-08, + 1.0959412544142566e-10, + 1.0860218280228651e-10, + 1.0863632909918763e-10, + 1.0812418321792805e-10 + ], + "bp_grad_norms_F": [ + 5.0940698201884516e-06, + 2.269248788877576e-08, + 9.942581868926936e-09, + 9.57817469782185e-09, + 9.339016671106037e-09 + ], + "gamma_dfa": 0.042181452532531694, + "acc_eval": 0.1201171875, + "loss_eval": 5.786318302154541, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/h2_no_residual_full_s456.log b/results/h2_no_residual_full_s456.log new file mode 100644 index 0000000..d0f198c --- /dev/null +++ b/results/h2_no_residual_full_s456.log @@ -0,0 +1,107 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=456 +eval buffer: torch.Size([1024, 3072]) + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.696551322937012, 42.47159957885742, 42.67432403564453, 45.272701263427734, 43.449092864990234] ||g||_med=[0.0011182057205587626, 0.00021166827355045825, 0.00014748115791007876, 0.00011803740198956802, 0.00010102539090439677] acc=0.1143 + [DFA] Ep 1: ||h_L||=9.975e+03 ||g_2||=4.843e-07 acc=0.1113 gamma_dfa=0.0185 + [DFA] Ep 2: ||h_L||=4.258e+04 ||g_2||=8.536e-08 acc=0.1006 gamma_dfa=0.0173 + [DFA] Ep 3: ||h_L||=9.508e+04 ||g_2||=3.481e-08 acc=0.0801 gamma_dfa=0.0150 + [DFA] Ep 4: ||h_L||=1.685e+05 ||g_2||=1.968e-08 acc=0.0654 gamma_dfa=0.0208 + [DFA] Ep 5: ||h_L||=2.704e+05 ||g_2||=1.294e-08 acc=0.0732 gamma_dfa=0.0239 + [DFA] Ep 6: ||h_L||=4.002e+05 ||g_2||=9.634e-09 acc=0.1064 gamma_dfa=0.0241 + [DFA] Ep 7: ||h_L||=5.563e+05 ||g_2||=7.954e-09 acc=0.1123 gamma_dfa=0.0292 + [DFA] Ep 8: ||h_L||=7.605e+05 ||g_2||=6.522e-09 acc=0.1152 gamma_dfa=0.0312 + [DFA] Ep 9: ||h_L||=1.011e+06 ||g_2||=5.556e-09 acc=0.1162 gamma_dfa=0.0348 + [DFA] Ep 10: ||h_L||=1.307e+06 ||g_2||=4.731e-09 acc=0.1152 gamma_dfa=0.0403 + [DFA] Ep 11: ||h_L||=1.643e+06 ||g_2||=4.127e-09 acc=0.1162 gamma_dfa=0.0408 + [DFA] Ep 12: ||h_L||=2.047e+06 ||g_2||=3.521e-09 acc=0.1123 gamma_dfa=0.0411 + [DFA] Ep 13: ||h_L||=2.529e+06 ||g_2||=3.068e-09 acc=0.1143 gamma_dfa=0.0436 + [DFA] Ep 14: ||h_L||=3.069e+06 ||g_2||=2.661e-09 acc=0.1152 gamma_dfa=0.0434 + [DFA] Ep 15: ||h_L||=3.672e+06 ||g_2||=2.340e-09 acc=0.1123 gamma_dfa=0.0459 + [DFA] Ep 16: ||h_L||=4.363e+06 ||g_2||=2.085e-09 acc=0.1104 gamma_dfa=0.0443 + [DFA] Ep 17: ||h_L||=5.116e+06 ||g_2||=1.862e-09 acc=0.1035 gamma_dfa=0.0453 + [DFA] Ep 18: ||h_L||=5.947e+06 ||g_2||=1.664e-09 acc=0.0859 gamma_dfa=0.0454 + [DFA] Ep 19: ||h_L||=6.799e+06 ||g_2||=1.496e-09 acc=0.0762 gamma_dfa=0.0448 + [DFA] Ep 20: ||h_L||=7.803e+06 ||g_2||=1.355e-09 acc=0.0801 gamma_dfa=0.0458 + [DFA] Ep 21: ||h_L||=8.837e+06 ||g_2||=1.236e-09 acc=0.0928 gamma_dfa=0.0458 + [DFA] Ep 22: ||h_L||=9.928e+06 ||g_2||=1.132e-09 acc=0.1045 gamma_dfa=0.0462 + [DFA] Ep 23: ||h_L||=1.110e+07 ||g_2||=1.038e-09 acc=0.1055 gamma_dfa=0.0465 + [DFA] Ep 24: ||h_L||=1.236e+07 ||g_2||=9.618e-10 acc=0.1055 gamma_dfa=0.0462 + [DFA] Ep 25: ||h_L||=1.366e+07 ||g_2||=8.898e-10 acc=0.1055 gamma_dfa=0.0468 + [DFA] Ep 26: ||h_L||=1.500e+07 ||g_2||=8.268e-10 acc=0.1055 gamma_dfa=0.0475 + [DFA] Ep 27: ||h_L||=1.650e+07 ||g_2||=7.703e-10 acc=0.1064 gamma_dfa=0.0474 + [DFA] Ep 28: ||h_L||=1.811e+07 ||g_2||=7.228e-10 acc=0.1055 gamma_dfa=0.0473 + [DFA] Ep 29: ||h_L||=1.965e+07 ||g_2||=6.773e-10 acc=0.1055 gamma_dfa=0.0472 + [DFA] Ep 30: ||h_L||=2.139e+07 ||g_2||=6.385e-10 acc=0.1055 gamma_dfa=0.0478 + [DFA] Ep 31: ||h_L||=2.306e+07 ||g_2||=6.001e-10 acc=0.1055 gamma_dfa=0.0481 + [DFA] Ep 32: ||h_L||=2.490e+07 ||g_2||=5.676e-10 acc=0.1064 gamma_dfa=0.0476 + [DFA] Ep 33: ||h_L||=2.693e+07 ||g_2||=5.345e-10 acc=0.1055 gamma_dfa=0.0476 + [DFA] Ep 34: ||h_L||=2.880e+07 ||g_2||=5.057e-10 acc=0.1055 gamma_dfa=0.0481 + [DFA] Ep 35: ||h_L||=3.075e+07 ||g_2||=4.826e-10 acc=0.1055 gamma_dfa=0.0478 + [DFA] Ep 36: ||h_L||=3.269e+07 ||g_2||=4.582e-10 acc=0.1055 gamma_dfa=0.0478 + [DFA] Ep 37: ||h_L||=3.458e+07 ||g_2||=4.370e-10 acc=0.1055 gamma_dfa=0.0480 + [DFA] Ep 38: ||h_L||=3.663e+07 ||g_2||=4.178e-10 acc=0.1055 gamma_dfa=0.0481 + [DFA] Ep 39: ||h_L||=3.877e+07 ||g_2||=4.003e-10 acc=0.1055 gamma_dfa=0.0479 + [DFA] Ep 40: ||h_L||=4.085e+07 ||g_2||=3.838e-10 acc=0.1055 gamma_dfa=0.0483 + [DFA] Ep 41: ||h_L||=4.301e+07 ||g_2||=3.697e-10 acc=0.1055 gamma_dfa=0.0488 + [DFA] Ep 42: ||h_L||=4.527e+07 ||g_2||=3.547e-10 acc=0.1055 gamma_dfa=0.0488 + [DFA] Ep 43: ||h_L||=4.735e+07 ||g_2||=3.417e-10 acc=0.1055 gamma_dfa=0.0487 + [DFA] Ep 44: ||h_L||=4.957e+07 ||g_2||=3.287e-10 acc=0.1055 gamma_dfa=0.0491 + [DFA] Ep 45: ||h_L||=5.152e+07 ||g_2||=3.176e-10 acc=0.1055 gamma_dfa=0.0493 + [DFA] Ep 46: ||h_L||=5.370e+07 ||g_2||=3.079e-10 acc=0.1055 gamma_dfa=0.0490 + [DFA] Ep 47: ||h_L||=5.579e+07 ||g_2||=2.985e-10 acc=0.1055 gamma_dfa=0.0497 + [DFA] Ep 48: ||h_L||=5.788e+07 ||g_2||=2.902e-10 acc=0.1055 gamma_dfa=0.0495 + [DFA] Ep 49: ||h_L||=6.001e+07 ||g_2||=2.819e-10 acc=0.1055 gamma_dfa=0.0495 + [DFA] Ep 50: ||h_L||=6.212e+07 ||g_2||=2.740e-10 acc=0.1055 gamma_dfa=0.0500 + [DFA] Ep 51: ||h_L||=6.409e+07 ||g_2||=2.676e-10 acc=0.1055 gamma_dfa=0.0503 + [DFA] Ep 52: ||h_L||=6.611e+07 ||g_2||=2.606e-10 acc=0.1055 gamma_dfa=0.0498 + [DFA] Ep 53: ||h_L||=6.824e+07 ||g_2||=2.535e-10 acc=0.1055 gamma_dfa=0.0503 + [DFA] Ep 54: ||h_L||=7.033e+07 ||g_2||=2.483e-10 acc=0.1055 gamma_dfa=0.0506 + [DFA] Ep 55: ||h_L||=7.230e+07 ||g_2||=2.428e-10 acc=0.1055 gamma_dfa=0.0507 + [DFA] Ep 56: ||h_L||=7.415e+07 ||g_2||=2.379e-10 acc=0.1055 gamma_dfa=0.0508 + [DFA] Ep 57: ||h_L||=7.599e+07 ||g_2||=2.338e-10 acc=0.1055 gamma_dfa=0.0508 + [DFA] Ep 58: ||h_L||=7.792e+07 ||g_2||=2.293e-10 acc=0.1055 gamma_dfa=0.0510 + [DFA] Ep 59: ||h_L||=7.974e+07 ||g_2||=2.247e-10 acc=0.1055 gamma_dfa=0.0511 + [DFA] Ep 60: ||h_L||=8.161e+07 ||g_2||=2.218e-10 acc=0.1055 gamma_dfa=0.0513 + [DFA] Ep 61: ||h_L||=8.329e+07 ||g_2||=2.178e-10 acc=0.1055 gamma_dfa=0.0515 + [DFA] Ep 62: ||h_L||=8.490e+07 ||g_2||=2.139e-10 acc=0.1055 gamma_dfa=0.0518 + [DFA] Ep 63: ||h_L||=8.655e+07 ||g_2||=2.119e-10 acc=0.1055 gamma_dfa=0.0518 + [DFA] Ep 64: ||h_L||=8.808e+07 ||g_2||=2.085e-10 acc=0.1055 gamma_dfa=0.0519 + [DFA] Ep 65: ||h_L||=8.967e+07 ||g_2||=2.067e-10 acc=0.1055 gamma_dfa=0.0517 + [DFA] Ep 66: ||h_L||=9.106e+07 ||g_2||=2.040e-10 acc=0.1055 gamma_dfa=0.0519 + [DFA] Ep 67: ||h_L||=9.243e+07 ||g_2||=2.017e-10 acc=0.1055 gamma_dfa=0.0520 + [DFA] Ep 68: ||h_L||=9.373e+07 ||g_2||=1.995e-10 acc=0.1055 gamma_dfa=0.0521 + [DFA] Ep 69: ||h_L||=9.486e+07 ||g_2||=1.975e-10 acc=0.1055 gamma_dfa=0.0522 + [DFA] Ep 70: ||h_L||=9.607e+07 ||g_2||=1.956e-10 acc=0.1055 gamma_dfa=0.0521 + [DFA] Ep 71: ||h_L||=9.723e+07 ||g_2||=1.938e-10 acc=0.1055 gamma_dfa=0.0521 + [DFA] Ep 72: ||h_L||=9.818e+07 ||g_2||=1.921e-10 acc=0.1055 gamma_dfa=0.0522 + [DFA] Ep 73: ||h_L||=9.925e+07 ||g_2||=1.908e-10 acc=0.1055 gamma_dfa=0.0523 + [DFA] Ep 74: ||h_L||=1.003e+08 ||g_2||=1.891e-10 acc=0.1055 gamma_dfa=0.0523 + [DFA] Ep 75: ||h_L||=1.012e+08 ||g_2||=1.877e-10 acc=0.1055 gamma_dfa=0.0524 + [DFA] Ep 76: ||h_L||=1.020e+08 ||g_2||=1.867e-10 acc=0.1055 gamma_dfa=0.0523 + [DFA] Ep 77: ||h_L||=1.028e+08 ||g_2||=1.857e-10 acc=0.1055 gamma_dfa=0.0524 + [DFA] Ep 78: ||h_L||=1.035e+08 ||g_2||=1.846e-10 acc=0.1055 gamma_dfa=0.0524 + [DFA] Ep 79: ||h_L||=1.041e+08 ||g_2||=1.838e-10 acc=0.1055 gamma_dfa=0.0525 + [DFA] Ep 80: ||h_L||=1.047e+08 ||g_2||=1.829e-10 acc=0.1055 gamma_dfa=0.0526 + [DFA] Ep 81: ||h_L||=1.052e+08 ||g_2||=1.821e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 82: ||h_L||=1.057e+08 ||g_2||=1.815e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 83: ||h_L||=1.062e+08 ||g_2||=1.808e-10 acc=0.1055 gamma_dfa=0.0526 + [DFA] Ep 84: ||h_L||=1.066e+08 ||g_2||=1.802e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 85: ||h_L||=1.070e+08 ||g_2||=1.797e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 86: ||h_L||=1.073e+08 ||g_2||=1.794e-10 acc=0.1055 gamma_dfa=0.0527 + [DFA] Ep 87: ||h_L||=1.076e+08 ||g_2||=1.790e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 88: ||h_L||=1.079e+08 ||g_2||=1.787e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 89: ||h_L||=1.081e+08 ||g_2||=1.784e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 90: ||h_L||=1.082e+08 ||g_2||=1.782e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 91: ||h_L||=1.084e+08 ||g_2||=1.780e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 92: ||h_L||=1.085e+08 ||g_2||=1.778e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 93: ||h_L||=1.086e+08 ||g_2||=1.777e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 94: ||h_L||=1.087e+08 ||g_2||=1.776e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 95: ||h_L||=1.087e+08 ||g_2||=1.776e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 96: ||h_L||=1.087e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 97: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 98: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 99: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + [DFA] Ep 100: ||h_L||=1.088e+08 ||g_2||=1.775e-10 acc=0.1055 gamma_dfa=0.0528 + +Saved results/h2_no_residual_full_s456/snapshot_evolution_s456.json diff --git a/results/h2_no_residual_full_s456/snapshot_evolution_s456.json b/results/h2_no_residual_full_s456/snapshot_evolution_s456.json new file mode 100644 index 0000000..4070eaa --- /dev/null +++ b/results/h2_no_residual_full_s456/snapshot_evolution_s456.json @@ -0,0 +1,2749 @@ +{ + "config": { + "output_dir": "results/h2_no_residual_full_s456", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 456, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5, + "random_targets": false, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 42.47159957885742, + 42.67432403564453, + 45.272701263427734, + 43.449092864990234 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011182057205587626, + 0.00021166827355045825, + 0.00014748115791007876, + 0.00011803740198956802, + 0.00010102539090439677 + ], + "bp_grad_norms_F": [ + 0.039927296340465546, + 0.006882709916681051, + 0.004750067833811045, + 0.00377994985319674, + 0.0032426300458610058 + ], + "gamma_dfa": 0.012312270817346871, + "acc_eval": 0.1142578125, + "loss_eval": 2.3956005573272705, + "epoch": 0 + }, + { + "hidden_norms": [ + 1556.684814453125, + 6497.32177734375, + 10603.298828125, + 15776.048828125, + 9974.5771484375 + ], + "bp_grad_norms_per_sample_med": [ + 7.715180458944815e-07, + 4.893955178886245e-07, + 4.84326051264361e-07, + 4.838655058847507e-07, + 4.83024962250056e-07 + ], + "bp_grad_norms_F": [ + 4.703722152044065e-05, + 2.927827154053375e-05, + 2.886639595089946e-05, + 2.8710121114272624e-05, + 2.851033423212357e-05 + ], + "gamma_dfa": 0.018546399660408497, + "acc_eval": 0.111328125, + "loss_eval": 2.356113910675049, + "epoch": 1 + }, + { + "hidden_norms": [ + 3438.555908203125, + 41675.72265625, + 66460.0234375, + 84792.1875, + 42575.42578125 + ], + "bp_grad_norms_per_sample_med": [ + 2.2151462530928256e-07, + 8.604414603041732e-08, + 8.536036233408595e-08, + 8.52630037684321e-08, + 8.530036410547837e-08 + ], + "bp_grad_norms_F": [ + 1.8386168449069373e-05, + 6.961788585613249e-06, + 6.748253326804843e-06, + 6.721136742271483e-06, + 6.674351880064933e-06 + ], + "gamma_dfa": 0.017316466895863414, + "acc_eval": 0.1005859375, + "loss_eval": 2.356572151184082, + "epoch": 2 + }, + { + "hidden_norms": [ + 5372.435546875, + 121188.546875, + 174809.4375, + 203405.859375, + 95077.4609375 + ], + "bp_grad_norms_per_sample_med": [ + 1.2532444770840812e-07, + 3.495903300176906e-08, + 3.4808731896873724e-08, + 3.474917420476231e-08, + 3.4685903926856554e-08 + ], + "bp_grad_norms_F": [ + 1.1882418220920954e-05, + 2.7211688120587496e-06, + 2.6087484457093524e-06, + 2.602359927550424e-06, + 2.590174972283421e-06 + ], + "gamma_dfa": 0.014974067453294992, + "acc_eval": 0.080078125, + "loss_eval": 2.381472110748291, + "epoch": 3 + }, + { + "hidden_norms": [ + 7225.4375, + 258499.359375, + 333575.4375, + 364076.25, + 168464.5 + ], + "bp_grad_norms_per_sample_med": [ + 8.640306248253182e-08, + 1.9808053863812347e-08, + 1.9682946827970227e-08, + 1.9666908102067282e-08, + 1.967319640527876e-08 + ], + "bp_grad_norms_F": [ + 1.1042752703360748e-05, + 1.5015855296951486e-06, + 1.3234410971563193e-06, + 1.3206722542236093e-06, + 1.314130940954783e-06 + ], + "gamma_dfa": 0.020775633631274104, + "acc_eval": 0.0654296875, + "loss_eval": 2.458400249481201, + "epoch": 4 + }, + { + "hidden_norms": [ + 8934.6435546875, + 470048.6875, + 549725.375, + 586957.8125, + 270350.28125 + ], + "bp_grad_norms_per_sample_med": [ + 7.15417982632971e-08, + 1.303753727199819e-08, + 1.2938533799911056e-08, + 1.2922544811999614e-08, + 1.2902905410783205e-08 + ], + "bp_grad_norms_F": [ + 9.721887181513011e-06, + 9.336578727925371e-07, + 8.095747716652113e-07, + 8.079554731921235e-07, + 8.037279712880263e-07 + ], + "gamma_dfa": 0.023886571638286114, + "acc_eval": 0.0732421875, + "loss_eval": 2.553205966949463, + "epoch": 5 + }, + { + "hidden_norms": [ + 10581.7958984375, + 749584.4375, + 812141.0, + 857193.1875, + 400190.71875 + ], + "bp_grad_norms_per_sample_med": [ + 6.321820222865426e-08, + 9.664934630393418e-09, + 9.634317343909515e-09, + 9.620791274755902e-09, + 9.613222218263218e-09 + ], + "bp_grad_norms_F": [ + 7.260930487973383e-06, + 5.95286962834507e-07, + 5.624330583486881e-07, + 5.61392937470373e-07, + 5.576875423685124e-07 + ], + "gamma_dfa": 0.024110323167406023, + "acc_eval": 0.1064453125, + "loss_eval": 2.702815532684326, + "epoch": 6 + }, + { + "hidden_norms": [ + 12157.236328125, + 1101113.5, + 1131608.625, + 1175579.75, + 556328.5625 + ], + "bp_grad_norms_per_sample_med": [ + 6.076628977780274e-08, + 7.990832884274823e-09, + 7.954333192117247e-09, + 7.956207248582814e-09, + 7.94490695454897e-09 + ], + "bp_grad_norms_F": [ + 9.092925211007241e-06, + 4.779853952641133e-07, + 4.453321764685825e-07, + 4.4446503011386085e-07, + 4.4091100903642655e-07 + ], + "gamma_dfa": 0.029227681923657656, + "acc_eval": 0.1123046875, + "loss_eval": 2.943108558654785, + "epoch": 7 + }, + { + "hidden_norms": [ + 13644.7734375, + 1553127.5, + 1514848.5, + 1594542.125, + 760487.4375 + ], + "bp_grad_norms_per_sample_med": [ + 6.183345391264083e-08, + 6.574770061718027e-09, + 6.521708506568302e-09, + 6.522410611609075e-09, + 6.511657879570976e-09 + ], + "bp_grad_norms_F": [ + 1.052718380378792e-05, + 3.7946443853797973e-07, + 3.55582386646347e-07, + 3.546880407157005e-07, + 3.51142261934001e-07 + ], + "gamma_dfa": 0.031233762740157545, + "acc_eval": 0.115234375, + "loss_eval": 3.18121600151062, + "epoch": 8 + }, + { + "hidden_norms": [ + 15180.75, + 2118332.5, + 1971916.0, + 2126576.75, + 1010951.875 + ], + "bp_grad_norms_per_sample_med": [ + 6.837856147967614e-08, + 5.575389039336187e-09, + 5.5562221490390584e-09, + 5.548445258796164e-09, + 5.536703984176938e-09 + ], + "bp_grad_norms_F": [ + 1.100128883990692e-05, + 3.2698190466362576e-07, + 3.031300082056987e-07, + 3.0168610010150587e-07, + 2.9835959480806196e-07 + ], + "gamma_dfa": 0.03483391250483692, + "acc_eval": 0.1162109375, + "loss_eval": 3.5671467781066895, + "epoch": 9 + }, + { + "hidden_norms": [ + 16599.55078125, + 2766443.75, + 2507868.5, + 2746855.25, + 1307418.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.16296781888559e-08, + 4.753268889601259e-09, + 4.731485869768903e-09, + 4.728840874435036e-09, + 4.7213348786101506e-09 + ], + "bp_grad_norms_F": [ + 1.1134686246805359e-05, + 2.7916473754885374e-07, + 2.561137080192566e-07, + 2.54354034723292e-07, + 2.5102386302933155e-07 + ], + "gamma_dfa": 0.04032926296349615, + "acc_eval": 0.115234375, + "loss_eval": 3.8605642318725586, + "epoch": 10 + }, + { + "hidden_norms": [ + 18096.76171875, + 3487919.0, + 3098858.25, + 3488545.25, + 1643380.75 + ], + "bp_grad_norms_per_sample_med": [ + 7.39422816309343e-08, + 4.142685749997099e-09, + 4.12689660223009e-09, + 4.106536444226094e-09, + 4.097727934748718e-09 + ], + "bp_grad_norms_F": [ + 1.2028808669128921e-05, + 2.466808268763998e-07, + 2.2443308012043417e-07, + 2.2274194577676099e-07, + 2.1958824447665393e-07 + ], + "gamma_dfa": 0.04084749217145145, + "acc_eval": 0.1162109375, + "loss_eval": 4.266114234924316, + "epoch": 11 + }, + { + "hidden_norms": [ + 19581.2265625, + 4300652.5, + 3764740.75, + 4282907.0, + 2046749.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.486859487926267e-08, + 3.5559581945676655e-09, + 3.521152702745667e-09, + 3.5090488292865984e-09, + 3.507678369985001e-09 + ], + "bp_grad_norms_F": [ + 1.1329559129080735e-05, + 2.097379336873928e-07, + 1.916048546490856e-07, + 1.900083077543968e-07, + 1.8724767869571224e-07 + ], + "gamma_dfa": 0.041128118813503534, + "acc_eval": 0.1123046875, + "loss_eval": 4.545563220977783, + "epoch": 12 + }, + { + "hidden_norms": [ + 21009.037109375, + 5305093.0, + 4626911.0, + 5321710.0, + 2528971.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.575832938755411e-08, + 3.0991811339475817e-09, + 3.0681037710422743e-09, + 3.060007136568288e-09, + 3.054509534194949e-09 + ], + "bp_grad_norms_F": [ + 1.31506558318506e-05, + 1.8260404033298983e-07, + 1.6721619999771065e-07, + 1.6574335859331768e-07, + 1.6327113883107813e-07 + ], + "gamma_dfa": 0.04362456756643951, + "acc_eval": 0.1142578125, + "loss_eval": 5.006200790405273, + "epoch": 13 + }, + { + "hidden_norms": [ + 22418.66015625, + 6455876.5, + 5546792.0, + 6434348.0, + 3069372.75 + ], + "bp_grad_norms_per_sample_med": [ + 7.665693146918784e-08, + 2.6803985697654298e-09, + 2.6608955039364446e-09, + 2.655886177649336e-09, + 2.650993424779813e-09 + ], + "bp_grad_norms_F": [ + 1.1598707715165801e-05, + 1.584767090889727e-07, + 1.4540981396748975e-07, + 1.442050745481538e-07, + 1.419812747371907e-07 + ], + "gamma_dfa": 0.043382189120166004, + "acc_eval": 0.115234375, + "loss_eval": 5.284748077392578, + "epoch": 14 + }, + { + "hidden_norms": [ + 23927.9296875, + 7772545.0, + 6605308.0, + 7661779.0, + 3671957.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.622067954571321e-08, + 2.3548620831093103e-09, + 2.3399049364769553e-09, + 2.3347188626843263e-09, + 2.3328083909035513e-09 + ], + "bp_grad_norms_F": [ + 1.2071202945662662e-05, + 1.4146635862744006e-07, + 1.285337845047252e-07, + 1.2724865428026533e-07, + 1.2524400005986536e-07 + ], + "gamma_dfa": 0.045932179084047675, + "acc_eval": 0.1123046875, + "loss_eval": 5.692019462585449, + "epoch": 15 + }, + { + "hidden_norms": [ + 25385.748046875, + 9261487.0, + 7775942.0, + 8990953.0, + 4363130.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.712851868291182e-08, + 2.1066282052117913e-09, + 2.0846218085068813e-09, + 2.0782020548892888e-09, + 2.0737342953935922e-09 + ], + "bp_grad_norms_F": [ + 1.4093741810938809e-05, + 1.278412895544534e-07, + 1.1472226901787508e-07, + 1.1351045259289094e-07, + 1.1163785273993199e-07 + ], + "gamma_dfa": 0.04430226338445209, + "acc_eval": 0.1103515625, + "loss_eval": 6.133723258972168, + "epoch": 16 + }, + { + "hidden_norms": [ + 26846.431640625, + 10875826.0, + 9052473.0, + 10511219.0, + 5116002.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.701503079715621e-08, + 1.8753321118225585e-09, + 1.861700571481606e-09, + 1.8542083424222255e-09, + 1.8551130631649926e-09 + ], + "bp_grad_norms_F": [ + 1.3089967978885397e-05, + 1.156644771072024e-07, + 1.0296086117023151e-07, + 1.0183324405943495e-07, + 1.0014894513687977e-07 + ], + "gamma_dfa": 0.04534357553347945, + "acc_eval": 0.103515625, + "loss_eval": 6.548648834228516, + "epoch": 17 + }, + { + "hidden_norms": [ + 28266.26953125, + 12742770.0, + 10505442.0, + 12262496.0, + 5946980.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.75791733076403e-08, + 1.6816592562918231e-09, + 1.6644484679417815e-09, + 1.662164628157825e-09, + 1.6569644545327833e-09 + ], + "bp_grad_norms_F": [ + 1.3716629837290384e-05, + 1.0489808488500785e-07, + 9.319560234644086e-08, + 9.210800300252231e-08, + 9.0522433993101e-08 + ], + "gamma_dfa": 0.04543712313170545, + "acc_eval": 0.0859375, + "loss_eval": 6.933040618896484, + "epoch": 18 + }, + { + "hidden_norms": [ + 29640.484375, + 14788877.0, + 12157201.0, + 14095277.0, + 6799392.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.606816865290966e-08, + 1.512424963046044e-09, + 1.495692236730406e-09, + 1.4903339673466576e-09, + 1.4848139384682213e-09 + ], + "bp_grad_norms_F": [ + 1.3458115063258447e-05, + 9.697606628833455e-08, + 8.518442484728439e-08, + 8.402660256479066e-08, + 8.255508987531357e-08 + ], + "gamma_dfa": 0.044778631010558456, + "acc_eval": 0.076171875, + "loss_eval": 7.425451278686523, + "epoch": 19 + }, + { + "hidden_norms": [ + 31005.751953125, + 17043824.0, + 13942765.0, + 16095532.0, + 7803190.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.645277122492189e-08, + 1.3731507042535895e-09, + 1.3549177335647755e-09, + 1.3525375264222816e-09, + 1.3489699357549512e-09 + ], + "bp_grad_norms_F": [ + 1.2845624951296486e-05, + 8.864368084005037e-08, + 7.73182620150692e-08, + 7.621348885322732e-08, + 7.483793496021462e-08 + ], + "gamma_dfa": 0.045761530549498275, + "acc_eval": 0.080078125, + "loss_eval": 7.776348114013672, + "epoch": 20 + }, + { + "hidden_norms": [ + 32358.83984375, + 19344688.0, + 15897992.0, + 18375228.0, + 8836651.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.644052146815739e-08, + 1.2519073555594673e-09, + 1.235606394978106e-09, + 1.2283364325682555e-09, + 1.2260956694376546e-09 + ], + "bp_grad_norms_F": [ + 1.3093407687847503e-05, + 8.157029185440479e-08, + 7.093318998840914e-08, + 6.988454259726495e-08, + 6.859116297164292e-08 + ], + "gamma_dfa": 0.04580485462793149, + "acc_eval": 0.0927734375, + "loss_eval": 8.182464599609375, + "epoch": 21 + }, + { + "hidden_norms": [ + 33740.52734375, + 21987014.0, + 17933020.0, + 20700014.0, + 9927617.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.858014328121499e-08, + 1.141782890456966e-09, + 1.131721383273998e-09, + 1.1269319921680676e-09, + 1.1228904472915247e-09 + ], + "bp_grad_norms_F": [ + 1.2902617527288385e-05, + 7.599386009360387e-08, + 6.517191053490023e-08, + 6.410991915117847e-08, + 6.290429155342281e-08 + ], + "gamma_dfa": 0.046245397155871615, + "acc_eval": 0.1044921875, + "loss_eval": 8.578572273254395, + "epoch": 22 + }, + { + "hidden_norms": [ + 35055.48828125, + 24700796.0, + 20204280.0, + 23173254.0, + 11098732.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.840032623107618e-08, + 1.054925813370744e-09, + 1.0381229209599496e-09, + 1.033837571107199e-09, + 1.0320241328187763e-09 + ], + "bp_grad_norms_F": [ + 1.3013632269576192e-05, + 7.11033791844784e-08, + 6.033156552121e-08, + 5.929242519187028e-08, + 5.8144280501437606e-08 + ], + "gamma_dfa": 0.04646674945252016, + "acc_eval": 0.10546875, + "loss_eval": 8.944098472595215, + "epoch": 23 + }, + { + "hidden_norms": [ + 36405.48046875, + 27759312.0, + 22467726.0, + 25750832.0, + 12358187.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.77747288793762e-08, + 9.745112494741193e-10, + 9.61777768537786e-10, + 9.57246060195871e-10, + 9.547377333163354e-10 + ], + "bp_grad_norms_F": [ + 1.3124400538799819e-05, + 6.744348723941584e-08, + 5.6144159543691785e-08, + 5.510578660050669e-08, + 5.4037375463167336e-08 + ], + "gamma_dfa": 0.04619356358307414, + "acc_eval": 0.10546875, + "loss_eval": 9.376721382141113, + "epoch": 24 + }, + { + "hidden_norms": [ + 37680.57421875, + 30906478.0, + 24827362.0, + 28558372.0, + 13662978.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.0997551776818e-08, + 9.035370229781847e-10, + 8.898414227687113e-10, + 8.862885980676083e-10, + 8.829543207689028e-10 + ], + "bp_grad_norms_F": [ + 1.3445563126879279e-05, + 6.41164845660569e-08, + 5.240685041485449e-08, + 5.135610692263981e-08, + 5.02956822856504e-08 + ], + "gamma_dfa": 0.046825854369672015, + "acc_eval": 0.10546875, + "loss_eval": 9.577943801879883, + "epoch": 25 + }, + { + "hidden_norms": [ + 38936.06640625, + 34144420.0, + 27240194.0, + 31329912.0, + 14997002.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.190059475055023e-08, + 8.378591709323757e-10, + 8.267845297282861e-10, + 8.228125403242359e-10, + 8.203847046139856e-10 + ], + "bp_grad_norms_F": [ + 1.2998734746361151e-05, + 6.114981232485661e-08, + 4.876913095586133e-08, + 4.772548578557689e-08, + 4.673227849139039e-08 + ], + "gamma_dfa": 0.047515806669252925, + "acc_eval": 0.10546875, + "loss_eval": 9.88414478302002, + "epoch": 26 + }, + { + "hidden_norms": [ + 40155.01953125, + 37508168.0, + 29749186.0, + 34078604.0, + 16502834.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.168245813067188e-08, + 7.775868282600129e-10, + 7.702881665849759e-10, + 7.661091205868331e-10, + 7.637669940940839e-10 + ], + "bp_grad_norms_F": [ + 1.3017543096793815e-05, + 5.765622645981239e-08, + 4.5165805317992636e-08, + 4.418279431206429e-08, + 4.329486813503536e-08 + ], + "gamma_dfa": 0.047424486168893054, + "acc_eval": 0.1064453125, + "loss_eval": 10.275530815124512, + "epoch": 27 + }, + { + "hidden_norms": [ + 41438.58203125, + 41153480.0, + 32568028.0, + 37348624.0, + 18107524.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.174999521770587e-08, + 7.312160876793428e-10, + 7.228238008138987e-10, + 7.196194196090744e-10, + 7.171208626921555e-10 + ], + "bp_grad_norms_F": [ + 1.2991866242373362e-05, + 5.5619945982243735e-08, + 4.266198772029384e-08, + 4.1693596131153754e-08, + 4.083043592117974e-08 + ], + "gamma_dfa": 0.04726689399103634, + "acc_eval": 0.10546875, + "loss_eval": 10.532907485961914, + "epoch": 28 + }, + { + "hidden_norms": [ + 42610.61328125, + 44767372.0, + 35250536.0, + 40433388.0, + 19648566.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.25098211976183e-08, + 6.862435619758855e-10, + 6.773137606330693e-10, + 6.743952063459346e-10, + 6.720446421581983e-10 + ], + "bp_grad_norms_F": [ + 1.2943252841068897e-05, + 5.273594538834914e-08, + 4.00670607803022e-08, + 3.916983715157585e-08, + 3.8364525778433745e-08 + ], + "gamma_dfa": 0.04717689534300007, + "acc_eval": 0.10546875, + "loss_eval": 10.889819145202637, + "epoch": 29 + }, + { + "hidden_norms": [ + 43802.12109375, + 48777580.0, + 38250948.0, + 43905160.0, + 21394392.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.3824673424715e-08, + 6.459773826961168e-10, + 6.385393880314894e-10, + 6.341404623633196e-10, + 6.317291689761362e-10 + ], + "bp_grad_norms_F": [ + 1.2702556887234095e-05, + 4.966772237935402e-08, + 3.767947376331904e-08, + 3.682788829451056e-08, + 3.60615324268565e-08 + ], + "gamma_dfa": 0.04775475192582235, + "acc_eval": 0.10546875, + "loss_eval": 11.143190383911133, + "epoch": 30 + }, + { + "hidden_norms": [ + 44971.96484375, + 53001532.0, + 41286860.0, + 47327540.0, + 23064180.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.44017193912805e-08, + 6.083171188997483e-10, + 6.001447672154825e-10, + 5.973078143206578e-10, + 5.949598036458781e-10 + ], + "bp_grad_norms_F": [ + 1.2565969882416539e-05, + 4.7034244943233716e-08, + 3.557239125484557e-08, + 3.4768806500551364e-08, + 3.403641457566664e-08 + ], + "gamma_dfa": 0.04808254592353478, + "acc_eval": 0.10546875, + "loss_eval": 11.375898361206055, + "epoch": 31 + }, + { + "hidden_norms": [ + 46135.65234375, + 57315672.0, + 44360792.0, + 51011808.0, + 24900550.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.566909315277371e-08, + 5.749250520103999e-10, + 5.675590553089194e-10, + 5.655514945246409e-10, + 5.63264157538157e-10 + ], + "bp_grad_norms_F": [ + 1.2200253877381328e-05, + 4.4094601747701745e-08, + 3.3572575830476126e-08, + 3.2811797723297786e-08, + 3.210490717719949e-08 + ], + "gamma_dfa": 0.04755272905458696, + "acc_eval": 0.1064453125, + "loss_eval": 11.584449768066406, + "epoch": 32 + }, + { + "hidden_norms": [ + 47265.27734375, + 61919976.0, + 47722620.0, + 54844944.0, + 26929922.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.478352953034118e-08, + 5.391301294288553e-10, + 5.344974463028507e-10, + 5.308364858791492e-10, + 5.291052596057e-10 + ], + "bp_grad_norms_F": [ + 1.2009260899503715e-05, + 4.1767787450908145e-08, + 3.1745546635875144e-08, + 3.102580947711431e-08, + 3.037316531617762e-08 + ], + "gamma_dfa": 0.0475847675697878, + "acc_eval": 0.10546875, + "loss_eval": 11.923343658447266, + "epoch": 33 + }, + { + "hidden_norms": [ + 48342.62109375, + 66327300.0, + 51030320.0, + 58382808.0, + 28803830.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.630867398551345e-08, + 5.130093017058357e-10, + 5.057400054298e-10, + 5.023059190811807e-10, + 5.003696346150832e-10 + ], + "bp_grad_norms_F": [ + 1.1836677003884688e-05, + 3.972920481487563e-08, + 3.016906902075789e-08, + 2.9483924635087533e-08, + 2.8860545953079964e-08 + ], + "gamma_dfa": 0.04806397232459858, + "acc_eval": 0.10546875, + "loss_eval": 12.134788513183594, + "epoch": 34 + }, + { + "hidden_norms": [ + 49438.7734375, + 70923576.0, + 54371588.0, + 62839076.0, + 30745350.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.529716666316745e-08, + 4.881638981935055e-10, + 4.826159472059999e-10, + 4.801878894511447e-10, + 4.785546958707698e-10 + ], + "bp_grad_norms_F": [ + 1.1614155482675415e-05, + 3.7715466305598966e-08, + 2.8843189170402184e-08, + 2.8193024803613298e-08, + 2.7588850315396485e-08 + ], + "gamma_dfa": 0.047784373455215245, + "acc_eval": 0.10546875, + "loss_eval": 12.365730285644531, + "epoch": 35 + }, + { + "hidden_norms": [ + 50484.30859375, + 75708880.0, + 57946872.0, + 66924284.0, + 32685426.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.612364865712152e-08, + 4.650996809907326e-10, + 4.5824133376726195e-10, + 4.5511036605994093e-10, + 4.534528585953268e-10 + ], + "bp_grad_norms_F": [ + 1.1689081475196872e-05, + 3.617047283910324e-08, + 2.7491989129657668e-08, + 2.6862345237077534e-08, + 2.6283149878736367e-08 + ], + "gamma_dfa": 0.04781174083473161, + "acc_eval": 0.10546875, + "loss_eval": 12.582022666931152, + "epoch": 36 + }, + { + "hidden_norms": [ + 51533.140625, + 80717000.0, + 61608756.0, + 71031448.0, + 34583536.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.646285465374604e-08, + 4.4203954385757527e-10, + 4.369871131615355e-10, + 4.329318292750628e-10, + 4.319989088674703e-10 + ], + "bp_grad_norms_F": [ + 1.1521507985889912e-05, + 3.4413087490747785e-08, + 2.619959005301098e-08, + 2.5601275766007348e-08, + 2.505496254912032e-08 + ], + "gamma_dfa": 0.04798329665209167, + "acc_eval": 0.10546875, + "loss_eval": 12.857856750488281, + "epoch": 37 + }, + { + "hidden_norms": [ + 52583.0859375, + 85961416.0, + 65257552.0, + 74859152.0, + 36629052.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.666147977010041e-08, + 4.2343398232169704e-10, + 4.1782510784571514e-10, + 4.1457998145588704e-10, + 4.136685161082454e-10 + ], + "bp_grad_norms_F": [ + 1.1553073818504345e-05, + 3.306437434957843e-08, + 2.515412056425248e-08, + 2.4584762670087912e-08, + 2.405546162265182e-08 + ], + "gamma_dfa": 0.04809549875790253, + "acc_eval": 0.10546875, + "loss_eval": 13.005304336547852, + "epoch": 38 + }, + { + "hidden_norms": [ + 53574.21875, + 91233752.0, + 68912136.0, + 78801432.0, + 38771888.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.665335116120332e-08, + 4.0339676043998907e-10, + 4.0027073322512763e-10, + 3.982228713450553e-10, + 3.9690134512326836e-10 + ], + "bp_grad_norms_F": [ + 1.1503744644869585e-05, + 3.151562921743789e-08, + 2.405471910549295e-08, + 2.3515880798186117e-08, + 2.3014273153876275e-08 + ], + "gamma_dfa": 0.04791133257094771, + "acc_eval": 0.10546875, + "loss_eval": 13.310943603515625, + "epoch": 39 + }, + { + "hidden_norms": [ + 54515.76953125, + 96143688.0, + 72537432.0, + 83291584.0, + 40846320.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.742490109625578e-08, + 3.8639558219699666e-10, + 3.8376418709518134e-10, + 3.813957205611729e-10, + 3.8053543649496646e-10 + ], + "bp_grad_norms_F": [ + 1.1331952919135801e-05, + 3.0162087938379045e-08, + 2.3133726045898584e-08, + 2.2621049922122438e-08, + 2.2133153976255926e-08 + ], + "gamma_dfa": 0.0483476699446328, + "acc_eval": 0.10546875, + "loss_eval": 13.509955406188965, + "epoch": 40 + }, + { + "hidden_norms": [ + 55471.92578125, + 101352504.0, + 76262640.0, + 87893288.0, + 43005752.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.776105886454388e-08, + 3.722072094980433e-10, + 3.6970662642410446e-10, + 3.67776836762701e-10, + 3.6656577773186427e-10 + ], + "bp_grad_norms_F": [ + 1.1259300663368776e-05, + 2.921965247537628e-08, + 2.22886100686992e-08, + 2.178610181147178e-08, + 2.1311375775212582e-08 + ], + "gamma_dfa": 0.04882028384599835, + "acc_eval": 0.10546875, + "loss_eval": 13.669061660766602, + "epoch": 41 + }, + { + "hidden_norms": [ + 56406.1796875, + 106503480.0, + 80309328.0, + 92335120.0, + 45272116.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.741802304257362e-08, + 3.5817968035978254e-10, + 3.546553328792612e-10, + 3.5286135124934503e-10, + 3.517087177051792e-10 + ], + "bp_grad_norms_F": [ + 1.1156203981954604e-05, + 2.829144030158659e-08, + 2.1501875835383544e-08, + 2.1014004758512783e-08, + 2.056106396253199e-08 + ], + "gamma_dfa": 0.04876198567217216, + "acc_eval": 0.10546875, + "loss_eval": 13.882933616638184, + "epoch": 42 + }, + { + "hidden_norms": [ + 57307.2421875, + 111696136.0, + 84071088.0, + 96859240.0, + 47347232.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.675155527271272e-08, + 3.451815777655298e-10, + 3.4170632989827254e-10, + 3.399925063707343e-10, + 3.38884892370217e-10 + ], + "bp_grad_norms_F": [ + 1.105228056985652e-05, + 2.731184522986041e-08, + 2.0790139387827367e-08, + 2.0321502702813632e-08, + 1.9881698065660203e-08 + ], + "gamma_dfa": 0.04874728451250121, + "acc_eval": 0.10546875, + "loss_eval": 14.110960960388184, + "epoch": 43 + }, + { + "hidden_norms": [ + 58201.1015625, + 116915912.0, + 88056232.0, + 101457736.0, + 49574372.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.81610304759306e-08, + 3.3262503862374615e-10, + 3.28719912401354e-10, + 3.270855530868033e-10, + 3.2694977281089166e-10 + ], + "bp_grad_norms_F": [ + 1.09774755401304e-05, + 2.6502128491756594e-08, + 2.010280297781719e-08, + 1.964214924043972e-08, + 1.9215420365981117e-08 + ], + "gamma_dfa": 0.049133426626212895, + "acc_eval": 0.10546875, + "loss_eval": 14.251358985900879, + "epoch": 44 + }, + { + "hidden_norms": [ + 59057.046875, + 122526296.0, + 92035232.0, + 106073072.0, + 51524732.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.615387514510076e-08, + 3.1993208082781166e-10, + 3.1755734153371407e-10, + 3.1527228050443057e-10, + 3.1427349611590216e-10 + ], + "bp_grad_norms_F": [ + 1.0898848813667428e-05, + 2.5704085970801316e-08, + 1.941714167230657e-08, + 1.896907697584993e-08, + 1.8563016013217748e-08 + ], + "gamma_dfa": 0.04926633776631206, + "acc_eval": 0.10546875, + "loss_eval": 14.543952941894531, + "epoch": 45 + }, + { + "hidden_norms": [ + 59915.00390625, + 128059208.0, + 95767408.0, + 110314168.0, + 53699800.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.616160585006583e-08, + 3.10205972020583e-10, + 3.0786348470535074e-10, + 3.0548555352005735e-10, + 3.044886287550952e-10 + ], + "bp_grad_norms_F": [ + 1.0854326319531538e-05, + 2.4907375717475588e-08, + 1.8864984241417915e-08, + 1.8437393833892202e-08, + 1.8046192096221603e-08 + ], + "gamma_dfa": 0.04898433407652192, + "acc_eval": 0.10546875, + "loss_eval": 14.763640403747559, + "epoch": 46 + }, + { + "hidden_norms": [ + 60732.77734375, + 133044840.0, + 99449000.0, + 114745104.0, + 55794780.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.66734808369074e-08, + 3.0199040490508366e-10, + 2.984798519456433e-10, + 2.9689897762530393e-10, + 2.9609348306536276e-10 + ], + "bp_grad_norms_F": [ + 1.0869742254726589e-05, + 2.4187817970755532e-08, + 1.8320044148367742e-08, + 1.79040302583644e-08, + 1.7519981909686067e-08 + ], + "gamma_dfa": 0.049695645982865244, + "acc_eval": 0.10546875, + "loss_eval": 14.853147506713867, + "epoch": 47 + }, + { + "hidden_norms": [ + 61537.2265625, + 138238256.0, + 103294888.0, + 119079736.0, + 57875032.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.672164852896458e-08, + 2.937747545228575e-10, + 2.90239082767485e-10, + 2.8853816558260803e-10, + 2.880042870856414e-10 + ], + "bp_grad_norms_F": [ + 1.0855384971364401e-05, + 2.3642215296604263e-08, + 1.78662986627387e-08, + 1.745818423160017e-08, + 1.7085612924461202e-08 + ], + "gamma_dfa": 0.04945674288319424, + "acc_eval": 0.10546875, + "loss_eval": 15.014139175415039, + "epoch": 48 + }, + { + "hidden_norms": [ + 62318.859375, + 143781376.0, + 107295080.0, + 123266280.0, + 60009076.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.63586393506921e-08, + 2.853322023099736e-10, + 2.819139366394552e-10, + 2.8051430622788587e-10, + 2.796505249591519e-10 + ], + "bp_grad_norms_F": [ + 1.0763029422378168e-05, + 2.2983703829027036e-08, + 1.7385014317028435e-08, + 1.699019236411914e-08, + 1.662707127536578e-08 + ], + "gamma_dfa": 0.04949341545579955, + "acc_eval": 0.10546875, + "loss_eval": 15.234472274780273, + "epoch": 49 + }, + { + "hidden_norms": [ + 63084.12109375, + 148953776.0, + 111167488.0, + 127493184.0, + 62116584.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.690788888543466e-08, + 2.77830092265674e-10, + 2.7401189650611e-10, + 2.7265251167918336e-10, + 2.71903860538103e-10 + ], + "bp_grad_norms_F": [ + 1.0762613783299457e-05, + 2.2435919788676983e-08, + 1.6915544520657022e-08, + 1.65265419127536e-08, + 1.6172732486552377e-08 + ], + "gamma_dfa": 0.04998577304650098, + "acc_eval": 0.10546875, + "loss_eval": 15.356475830078125, + "epoch": 50 + }, + { + "hidden_norms": [ + 63822.42578125, + 153887120.0, + 114903200.0, + 131868160.0, + 64092768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.741512402821172e-08, + 2.695783041239963e-10, + 2.676055765871155e-10, + 2.6572444244976623e-10, + 2.649161723322635e-10 + ], + "bp_grad_norms_F": [ + 1.07648411358241e-05, + 2.1865258048592295e-08, + 1.6514658085498013e-08, + 1.6137914116143293e-08, + 1.5790037721785666e-08 + ], + "gamma_dfa": 0.050343112263362855, + "acc_eval": 0.10546875, + "loss_eval": 15.516284942626953, + "epoch": 51 + }, + { + "hidden_norms": [ + 64467.453125, + 158904000.0, + 118881072.0, + 136114000.0, + 66111872.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.664627415555515e-08, + 2.624416239882521e-10, + 2.6058996627220665e-10, + 2.5911758849694877e-10, + 2.584663871818549e-10 + ], + "bp_grad_norms_F": [ + 1.0719203601183835e-05, + 2.1336076017064443e-08, + 1.6169177996516737e-08, + 1.5802571695644474e-08, + 1.546756678294514e-08 + ], + "gamma_dfa": 0.04984566644998267, + "acc_eval": 0.10546875, + "loss_eval": 15.6607084274292, + "epoch": 52 + }, + { + "hidden_norms": [ + 65120.73828125, + 163883856.0, + 122702472.0, + 140198928.0, + 68242560.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.641593041147644e-08, + 2.5804472447710225e-10, + 2.5353724675269973e-10, + 2.5259389024867573e-10, + 2.520264275052142e-10 + ], + "bp_grad_norms_F": [ + 1.0724111234594602e-05, + 2.0917026333222566e-08, + 1.5751618676063117e-08, + 1.5394757468811804e-08, + 1.5069018033386783e-08 + ], + "gamma_dfa": 0.05030635162256658, + "acc_eval": 0.10546875, + "loss_eval": 15.901081085205078, + "epoch": 53 + }, + { + "hidden_norms": [ + 65754.40625, + 168991232.0, + 126758528.0, + 144376592.0, + 70329568.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.677351104324771e-08, + 2.5239485501593606e-10, + 2.4832783052097795e-10, + 2.4752053184862177e-10, + 2.4696938938362223e-10 + ], + "bp_grad_norms_F": [ + 1.0669472430890892e-05, + 2.0359754770993277e-08, + 1.542808725218947e-08, + 1.5080953374990713e-08, + 1.4761029731857889e-08 + ], + "gamma_dfa": 0.05062760764849372, + "acc_eval": 0.10546875, + "loss_eval": 16.04940414428711, + "epoch": 54 + }, + { + "hidden_norms": [ + 66360.1953125, + 173885088.0, + 130550672.0, + 148377456.0, + 72298680.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.759133862668023e-08, + 2.4686536148621485e-10, + 2.4284077526637304e-10, + 2.4196153414202115e-10, + 2.414988486965086e-10 + ], + "bp_grad_norms_F": [ + 1.0671456038835458e-05, + 1.9936877038162493e-08, + 1.5118750695819472e-08, + 1.4775524803667395e-08, + 1.4458762187530283e-08 + ], + "gamma_dfa": 0.050650376273551956, + "acc_eval": 0.10546875, + "loss_eval": 16.173294067382812, + "epoch": 55 + }, + { + "hidden_norms": [ + 66955.3671875, + 179032416.0, + 134152312.0, + 152335472.0, + 74150016.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.732155265533947e-08, + 2.4187768454808634e-10, + 2.378792995916257e-10, + 2.3684243455335263e-10, + 2.3630350454162397e-10 + ], + "bp_grad_norms_F": [ + 1.0680658306227997e-05, + 1.9686593688561516e-08, + 1.484478495683561e-08, + 1.4507179457723396e-08, + 1.4196978703751029e-08 + ], + "gamma_dfa": 0.05082969422801398, + "acc_eval": 0.10546875, + "loss_eval": 16.27086639404297, + "epoch": 56 + }, + { + "hidden_norms": [ + 67549.515625, + 183555840.0, + 137880064.0, + 156240624.0, + 75989536.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.660003913973924e-08, + 2.357370687544602e-10, + 2.33779245961685e-10, + 2.3301963136823645e-10, + 2.3250262826124413e-10 + ], + "bp_grad_norms_F": [ + 1.0663774446584284e-05, + 1.9352745184164633e-08, + 1.4566153616613065e-08, + 1.423444206949398e-08, + 1.3932280218398319e-08 + ], + "gamma_dfa": 0.05084921311936341, + "acc_eval": 0.10546875, + "loss_eval": 16.451187133789062, + "epoch": 57 + }, + { + "hidden_norms": [ + 68104.8046875, + 188812128.0, + 141342304.0, + 160268688.0, + 77916768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.660642691893372e-08, + 2.327093101550659e-10, + 2.2930106424734475e-10, + 2.2855875525529257e-10, + 2.2804760857475515e-10 + ], + "bp_grad_norms_F": [ + 1.0613769518386107e-05, + 1.899090662504932e-08, + 1.4301366313418384e-08, + 1.3975586021786057e-08, + 1.3677930787991954e-08 + ], + "gamma_dfa": 0.05096889057313092, + "acc_eval": 0.10546875, + "loss_eval": 16.63678741455078, + "epoch": 58 + }, + { + "hidden_norms": [ + 68657.515625, + 193258416.0, + 144614160.0, + 164019216.0, + 79742168.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.68742304760417e-08, + 2.289267664323802e-10, + 2.2474513916570515e-10, + 2.2393865928282963e-10, + 2.2451285275337796e-10 + ], + "bp_grad_norms_F": [ + 1.0620946341077797e-05, + 1.866202836708908e-08, + 1.4068830544999855e-08, + 1.3749051674949442e-08, + 1.3455515812665908e-08 + ], + "gamma_dfa": 0.05113464401802048, + "acc_eval": 0.10546875, + "loss_eval": 16.70541763305664, + "epoch": 59 + }, + { + "hidden_norms": [ + 69158.5, + 197991056.0, + 148074896.0, + 168001296.0, + 81613432.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.685481134307338e-08, + 2.244555652453073e-10, + 2.21766327523909e-10, + 2.2105835217889336e-10, + 2.2056727277952604e-10 + ], + "bp_grad_norms_F": [ + 1.0557047062320635e-05, + 1.836115792741566e-08, + 1.3819986932617212e-08, + 1.35067770301589e-08, + 1.3220035732786073e-08 + ], + "gamma_dfa": 0.05133810767438263, + "acc_eval": 0.10546875, + "loss_eval": 16.83820915222168, + "epoch": 60 + }, + { + "hidden_norms": [ + 69652.15625, + 202764272.0, + 151440416.0, + 171388720.0, + 83290960.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.682473406906865e-08, + 2.209017690990578e-10, + 2.178418834208884e-10, + 2.1715784725984122e-10, + 2.166662266267494e-10 + ], + "bp_grad_norms_F": [ + 1.0563057912804652e-05, + 1.8060584139334424e-08, + 1.3589187553009197e-08, + 1.3282591027063972e-08, + 1.300101715173696e-08 + ], + "gamma_dfa": 0.051503602182492614, + "acc_eval": 0.10546875, + "loss_eval": 16.996952056884766, + "epoch": 61 + }, + { + "hidden_norms": [ + 70119.3046875, + 207371568.0, + 154513392.0, + 174693904.0, + 84899272.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.754268776556273e-08, + 2.177768798627966e-10, + 2.1394505611560533e-10, + 2.1310755937697934e-10, + 2.1278181994155432e-10 + ], + "bp_grad_norms_F": [ + 1.0583677067188546e-05, + 1.7867773038915402e-08, + 1.3404712007059061e-08, + 1.3099571205543725e-08, + 1.281919193019121e-08 + ], + "gamma_dfa": 0.05178222866379656, + "acc_eval": 0.10546875, + "loss_eval": 17.03223419189453, + "epoch": 62 + }, + { + "hidden_norms": [ + 70571.765625, + 211695824.0, + 157515872.0, + 178129360.0, + 86545024.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.717323396467691e-08, + 2.1452814524813846e-10, + 2.1192504695566328e-10, + 2.1126832228102188e-10, + 2.1079131495849168e-10 + ], + "bp_grad_norms_F": [ + 1.0588292752800044e-05, + 1.7631437643217396e-08, + 1.3229322526342457e-08, + 1.2929083581525447e-08, + 1.2654436609693676e-08 + ], + "gamma_dfa": 0.0517645905201789, + "acc_eval": 0.10546875, + "loss_eval": 17.17680549621582, + "epoch": 63 + }, + { + "hidden_norms": [ + 71016.2734375, + 216131392.0, + 160371248.0, + 181552016.0, + 88083200.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.714041399571215e-08, + 2.1204836497812352e-10, + 2.0845919435075189e-10, + 2.0772163156212997e-10, + 2.0731850958188858e-10 + ], + "bp_grad_norms_F": [ + 1.0558523172221612e-05, + 1.7396088125565257e-08, + 1.3074124005640897e-08, + 1.2776619762178143e-08, + 1.2503839741384581e-08 + ], + "gamma_dfa": 0.05190763485734351, + "acc_eval": 0.10546875, + "loss_eval": 17.230438232421875, + "epoch": 64 + }, + { + "hidden_norms": [ + 71423.875, + 220276432.0, + 163188992.0, + 184901952.0, + 89669880.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.695663922253516e-08, + 2.089625000811779e-10, + 2.0665336109004784e-10, + 2.060027565198297e-10, + 2.0553812818402406e-10 + ], + "bp_grad_norms_F": [ + 1.054474341799505e-05, + 1.720214015676902e-08, + 1.2905923441053346e-08, + 1.2612286326429967e-08, + 1.2343328137376375e-08 + ], + "gamma_dfa": 0.0516790475230664, + "acc_eval": 0.10546875, + "loss_eval": 17.364524841308594, + "epoch": 65 + }, + { + "hidden_norms": [ + 71819.7265625, + 224240896.0, + 165905760.0, + 188025680.0, + 91055744.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.707031184940206e-08, + 2.0619655982656582e-10, + 2.0404426759323968e-10, + 2.0340489015335805e-10, + 2.0294699254463922e-10 + ], + "bp_grad_norms_F": [ + 1.0510210813663434e-05, + 1.6987915074651028e-08, + 1.2752495948120668e-08, + 1.2462213483388496e-08, + 1.2196251120144552e-08 + ], + "gamma_dfa": 0.05187035645940341, + "acc_eval": 0.10546875, + "loss_eval": 17.464691162109375, + "epoch": 66 + }, + { + "hidden_norms": [ + 72184.1796875, + 228069632.0, + 168371744.0, + 190844528.0, + 92434920.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.708528298484453e-08, + 2.0398974176494278e-10, + 2.0165806524641283e-10, + 2.0102944309208226e-10, + 2.0057676353157916e-10 + ], + "bp_grad_norms_F": [ + 1.0452381502545904e-05, + 1.678668404281325e-08, + 1.2599208787378302e-08, + 1.2311685892996138e-08, + 1.2049306441497265e-08 + ], + "gamma_dfa": 0.052035300293937325, + "acc_eval": 0.10546875, + "loss_eval": 17.54598045349121, + "epoch": 67 + }, + { + "hidden_norms": [ + 72520.546875, + 231382032.0, + 170794656.0, + 193581264.0, + 93730880.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.673346485466027e-08, + 2.0163908043269174e-10, + 1.9945969875756475e-10, + 1.988337966496445e-10, + 1.983077452250015e-10 + ], + "bp_grad_norms_F": [ + 1.041769064613618e-05, + 1.6600257168875032e-08, + 1.2470060539726546e-08, + 1.218627776466974e-08, + 1.1927684617774048e-08 + ], + "gamma_dfa": 0.052122256805887446, + "acc_eval": 0.10546875, + "loss_eval": 17.622678756713867, + "epoch": 68 + }, + { + "hidden_norms": [ + 72848.296875, + 234345168.0, + 172920208.0, + 196159376.0, + 94861664.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.68633378559025e-08, + 1.9926535421710412e-10, + 1.9748097601635095e-10, + 1.9686471897095714e-10, + 1.9632170888961298e-10 + ], + "bp_grad_norms_F": [ + 1.0410145478090271e-05, + 1.6476832342959824e-08, + 1.2349259392863132e-08, + 1.2067844501473246e-08, + 1.1810766586961563e-08 + ], + "gamma_dfa": 0.05221144680399448, + "acc_eval": 0.10546875, + "loss_eval": 17.67215347290039, + "epoch": 69 + }, + { + "hidden_norms": [ + 73156.28125, + 237693904.0, + 175292576.0, + 198663152.0, + 96070024.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.698025766307182e-08, + 1.9732028511132427e-10, + 1.9561376130017294e-10, + 1.950042072262903e-10, + 1.9452565946931344e-10 + ], + "bp_grad_norms_F": [ + 1.0408021807961632e-05, + 1.6299335214853272e-08, + 1.224471191108023e-08, + 1.1966841739763368e-08, + 1.1711744463127616e-08 + ], + "gamma_dfa": 0.05207514451467432, + "acc_eval": 0.10546875, + "loss_eval": 17.708881378173828, + "epoch": 70 + }, + { + "hidden_norms": [ + 73450.0390625, + 240668752.0, + 177333776.0, + 200832576.0, + 97232808.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.750691904424457e-08, + 1.9538150264342136e-10, + 1.937518478989375e-10, + 1.9322175803804242e-10, + 1.9261021944050327e-10 + ], + "bp_grad_norms_F": [ + 1.0387684596935287e-05, + 1.614511546677022e-08, + 1.2127667758932148e-08, + 1.1853135362116518e-08, + 1.1600380211973516e-08 + ], + "gamma_dfa": 0.052143561391858384, + "acc_eval": 0.10546875, + "loss_eval": 17.803735733032227, + "epoch": 71 + }, + { + "hidden_norms": [ + 73722.7890625, + 243140912.0, + 179223280.0, + 203119056.0, + 98179728.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.777691107297869e-08, + 1.936056454043822e-10, + 1.921051789866013e-10, + 1.9142704088537243e-10, + 1.908224411817372e-10 + ], + "bp_grad_norms_F": [ + 1.0383127118984703e-05, + 1.6032700500545616e-08, + 1.2034083063383605e-08, + 1.1761529528087067e-08, + 1.1511005482134351e-08 + ], + "gamma_dfa": 0.0522310700325761, + "acc_eval": 0.10546875, + "loss_eval": 17.871017456054688, + "epoch": 72 + }, + { + "hidden_norms": [ + 73977.796875, + 245601744.0, + 181134272.0, + 205298592.0, + 99248704.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.645526605732812e-08, + 1.9214441149273398e-10, + 1.908457003541031e-10, + 1.8958104530675257e-10, + 1.891580642121582e-10 + ], + "bp_grad_norms_F": [ + 1.0368045877839904e-05, + 1.593527443333187e-08, + 1.1956020173897741e-08, + 1.1683961353980976e-08, + 1.1433988866826894e-08 + ], + "gamma_dfa": 0.05229719865019433, + "acc_eval": 0.10546875, + "loss_eval": 17.842838287353516, + "epoch": 73 + }, + { + "hidden_norms": [ + 74210.2890625, + 248047296.0, + 183004848.0, + 207310784.0, + 100283200.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.702664189286224e-08, + 1.9067503131964259e-10, + 1.8910681354178394e-10, + 1.886194395117613e-10, + 1.8805811075051082e-10 + ], + "bp_grad_norms_F": [ + 1.0340887456550263e-05, + 1.5766524086302525e-08, + 1.1852850256843794e-08, + 1.1584752712678892e-08, + 1.1337309757664116e-08 + ], + "gamma_dfa": 0.05227879187441431, + "acc_eval": 0.10546875, + "loss_eval": 17.977331161499023, + "epoch": 74 + }, + { + "hidden_norms": [ + 74442.2578125, + 250302768.0, + 184669344.0, + 209343920.0, + 101168016.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.73824319569394e-08, + 1.8929384448806985e-10, + 1.8772923493504123e-10, + 1.8724671813075133e-10, + 1.8670247292629227e-10 + ], + "bp_grad_norms_F": [ + 1.0353242942073848e-05, + 1.5672505071506748e-08, + 1.1772779195950989e-08, + 1.1506068098299238e-08, + 1.1260493870679511e-08 + ], + "gamma_dfa": 0.05237349838716909, + "acc_eval": 0.10546875, + "loss_eval": 18.03546905517578, + "epoch": 75 + }, + { + "hidden_norms": [ + 74647.3203125, + 252406032.0, + 186061376.0, + 211037200.0, + 101960680.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.6925361131307e-08, + 1.881417382998407e-10, + 1.867033888602876e-10, + 1.8579758565007154e-10, + 1.8538144630486642e-10 + ], + "bp_grad_norms_F": [ + 1.0341693268856034e-05, + 1.5606824277369924e-08, + 1.1714643477489517e-08, + 1.1449987624700952e-08, + 1.1205665728653003e-08 + ], + "gamma_dfa": 0.05233656561176758, + "acc_eval": 0.10546875, + "loss_eval": 18.052072525024414, + "epoch": 76 + }, + { + "hidden_norms": [ + 74842.0859375, + 254511632.0, + 187492928.0, + 212704224.0, + 102757816.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.698394537987042e-08, + 1.8709332694211156e-10, + 1.8572142435058225e-10, + 1.8484298813792321e-10, + 1.8442962435027965e-10 + ], + "bp_grad_norms_F": [ + 1.0342246241634712e-05, + 1.552284167871676e-08, + 1.1652745435242196e-08, + 1.1389352572166445e-08, + 1.114572434346428e-08 + ], + "gamma_dfa": 0.05241188171203248, + "acc_eval": 0.10546875, + "loss_eval": 18.086322784423828, + "epoch": 77 + }, + { + "hidden_norms": [ + 75024.015625, + 256539408.0, + 188878192.0, + 214226816.0, + 103471288.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.701635323404844e-08, + 1.8604462415083844e-10, + 1.84622400700718e-10, + 1.8390608480522985e-10, + 1.834675189549273e-10 + ], + "bp_grad_norms_F": [ + 1.032539876177907e-05, + 1.5453247570462736e-08, + 1.1593147775101897e-08, + 1.133172844447472e-08, + 1.1090729223894868e-08 + ], + "gamma_dfa": 0.05239276264910586, + "acc_eval": 0.10546875, + "loss_eval": 18.168014526367188, + "epoch": 78 + }, + { + "hidden_norms": [ + 75180.9609375, + 258451104.0, + 190004976.0, + 215740128.0, + 104133768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.704767395784074e-08, + 1.8524454192814233e-10, + 1.8379993360628788e-10, + 1.8304618931708205e-10, + 1.8256345046818723e-10 + ], + "bp_grad_norms_F": [ + 1.0337872481613886e-05, + 1.5379262308101715e-08, + 1.1539456501452605e-08, + 1.127898041630715e-08, + 1.103767743870776e-08 + ], + "gamma_dfa": 0.052515600953483954, + "acc_eval": 0.10546875, + "loss_eval": 18.164344787597656, + "epoch": 79 + }, + { + "hidden_norms": [ + 75327.796875, + 260127200.0, + 191027072.0, + 216985472.0, + 104684240.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.744654422798703e-08, + 1.8438454929547987e-10, + 1.8290086112315862e-10, + 1.8214722785625526e-10, + 1.8167076176744956e-10 + ], + "bp_grad_norms_F": [ + 1.032766067510238e-05, + 1.5304989275932712e-08, + 1.14842633180956e-08, + 1.122501380734775e-08, + 1.098510349351045e-08 + ], + "gamma_dfa": 0.05257981286558788, + "acc_eval": 0.10546875, + "loss_eval": 18.223249435424805, + "epoch": 80 + }, + { + "hidden_norms": [ + 75454.5703125, + 261646176.0, + 192111600.0, + 218110816.0, + 105216432.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.775589321885491e-08, + 1.8362063258781092e-10, + 1.8213851260551195e-10, + 1.8139376112280559e-10, + 1.809180305567537e-10 + ], + "bp_grad_norms_F": [ + 1.032176169246668e-05, + 1.5236809147722852e-08, + 1.1438899605309416e-08, + 1.1181004566651609e-08, + 1.0941747952131209e-08 + ], + "gamma_dfa": 0.052668574411654845, + "acc_eval": 0.10546875, + "loss_eval": 18.2590389251709, + "epoch": 81 + }, + { + "hidden_norms": [ + 75578.140625, + 263041184.0, + 193033856.0, + 219211776.0, + 105729752.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.755376512681323e-08, + 1.830409435132907e-10, + 1.8150429770269483e-10, + 1.807565902511854e-10, + 1.8044568617092693e-10 + ], + "bp_grad_norms_F": [ + 1.0324319191568065e-05, + 1.5187332280675037e-08, + 1.1401711574876572e-08, + 1.1144490663639317e-08, + 1.0905955249995714e-08 + ], + "gamma_dfa": 0.05269488821795676, + "acc_eval": 0.10546875, + "loss_eval": 18.284685134887695, + "epoch": 82 + }, + { + "hidden_norms": [ + 75686.9765625, + 264364192.0, + 193939856.0, + 220289456.0, + 106222280.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.723260691567702e-08, + 1.8233220488994561e-10, + 1.808086180776769e-10, + 1.8018871117408963e-10, + 1.7971832355634376e-10 + ], + "bp_grad_norms_F": [ + 1.0300875146640465e-05, + 1.5149137055914252e-08, + 1.1367639274340036e-08, + 1.1110781628076438e-08, + 1.0873751676854226e-08 + ], + "gamma_dfa": 0.05262827526894398, + "acc_eval": 0.10546875, + "loss_eval": 18.32525634765625, + "epoch": 83 + }, + { + "hidden_norms": [ + 75782.5703125, + 265506368.0, + 194623696.0, + 221062096.0, + 106625800.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.738180667933193e-08, + 1.8182351457785018e-10, + 1.8023170456071824e-10, + 1.796851972768465e-10, + 1.7919579708980393e-10 + ], + "bp_grad_norms_F": [ + 1.0303671842848416e-05, + 1.510927916115179e-08, + 1.133329874392075e-08, + 1.107721647741755e-08, + 1.0840857100902213e-08 + ], + "gamma_dfa": 0.0526832842733711, + "acc_eval": 0.10546875, + "loss_eval": 18.358993530273438, + "epoch": 84 + }, + { + "hidden_norms": [ + 75869.921875, + 266527792.0, + 195260000.0, + 221772592.0, + 107003056.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.824529373896439e-08, + 1.8133940182796238e-10, + 1.7974224886252443e-10, + 1.7921185369029757e-10, + 1.7870449564583168e-10 + ], + "bp_grad_norms_F": [ + 1.0309514436812606e-05, + 1.506138680440472e-08, + 1.129713478320582e-08, + 1.1042018854823255e-08, + 1.080576872425354e-08 + ], + "gamma_dfa": 0.052798322300077416, + "acc_eval": 0.10546875, + "loss_eval": 18.391273498535156, + "epoch": 85 + }, + { + "hidden_norms": [ + 75944.28125, + 267298400.0, + 195821152.0, + 222463360.0, + 107333864.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.755981895092191e-08, + 1.8102987164869688e-10, + 1.793504234015586e-10, + 1.788625914045383e-10, + 1.7835513621555776e-10 + ], + "bp_grad_norms_F": [ + 1.0287751138093881e-05, + 1.502210977832874e-08, + 1.1278022071792293e-08, + 1.1023718826663753e-08, + 1.0788149040763528e-08 + ], + "gamma_dfa": 0.05272912958753295, + "acc_eval": 0.10546875, + "loss_eval": 18.391714096069336, + "epoch": 86 + }, + { + "hidden_norms": [ + 76007.421875, + 268045776.0, + 196358640.0, + 223064400.0, + 107612040.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.762406622508934e-08, + 1.807102384399073e-10, + 1.7898976745200912e-10, + 1.785393638487065e-10, + 1.7802226359719953e-10 + ], + "bp_grad_norms_F": [ + 1.0287554687238298e-05, + 1.4994483876762388e-08, + 1.1257166754319314e-08, + 1.1003281841226453e-08, + 1.0768073543943046e-08 + ], + "gamma_dfa": 0.052773734016227536, + "acc_eval": 0.10546875, + "loss_eval": 18.410842895507812, + "epoch": 87 + }, + { + "hidden_norms": [ + 76064.7109375, + 268696256.0, + 196819616.0, + 223570480.0, + 107852768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758166814004653e-08, + 1.8037309146290426e-10, + 1.7866680357414566e-10, + 1.782173991715652e-10, + 1.7768413129726213e-10 + ], + "bp_grad_norms_F": [ + 1.0283758456353098e-05, + 1.4970940043212977e-08, + 1.1237919927964413e-08, + 1.0984368081778939e-08, + 1.0749558576605978e-08 + ], + "gamma_dfa": 0.05277359033061657, + "acc_eval": 0.10546875, + "loss_eval": 18.423473358154297, + "epoch": 88 + }, + { + "hidden_norms": [ + 76113.765625, + 269233728.0, + 197204896.0, + 224016384.0, + 108068584.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.767738535198077e-08, + 1.800838783649894e-10, + 1.7838196197939027e-10, + 1.7793383433328813e-10, + 1.7738220614571532e-10 + ], + "bp_grad_norms_F": [ + 1.0285043572366703e-05, + 1.4949996796076448e-08, + 1.1221012563567001e-08, + 1.096789947752086e-08, + 1.0733534949736168e-08 + ], + "gamma_dfa": 0.05277923475659918, + "acc_eval": 0.10546875, + "loss_eval": 18.44818878173828, + "epoch": 89 + }, + { + "hidden_norms": [ + 76154.09375, + 269669792.0, + 197538960.0, + 224391824.0, + 108235960.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.767518266949992e-08, + 1.7989677802976445e-10, + 1.7819240527572333e-10, + 1.777451658080409e-10, + 1.771848640030882e-10 + ], + "bp_grad_norms_F": [ + 1.029091072268784e-05, + 1.4940461312562547e-08, + 1.1209391637123645e-08, + 1.0956426876873593e-08, + 1.0722061460910481e-08 + ], + "gamma_dfa": 0.05281960548018105, + "acc_eval": 0.10546875, + "loss_eval": 18.45142364501953, + "epoch": 90 + }, + { + "hidden_norms": [ + 76187.59375, + 270051616.0, + 197844384.0, + 224727824.0, + 108387672.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.763404224509941e-08, + 1.7972098809160286e-10, + 1.780089131653284e-10, + 1.7756210390906801e-10, + 1.7699951226912702e-10 + ], + "bp_grad_norms_F": [ + 1.0288421435689088e-05, + 1.4926607505572065e-08, + 1.1199507987669222e-08, + 1.0946849648973966e-08, + 1.0712753351072024e-08 + ], + "gamma_dfa": 0.05281454947544262, + "acc_eval": 0.10546875, + "loss_eval": 18.456693649291992, + "epoch": 91 + }, + { + "hidden_norms": [ + 76216.3125, + 270347840.0, + 198067872.0, + 225002016.0, + 108500144.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.769242754169682e-08, + 1.795031345785958e-10, + 1.7781580374798267e-10, + 1.773555469153365e-10, + 1.7679230301936855e-10 + ], + "bp_grad_norms_F": [ + 1.0288722478435375e-05, + 1.4910959578173788e-08, + 1.1187878179441668e-08, + 1.0935604422002143e-08, + 1.070183497375865e-08 + ], + "gamma_dfa": 0.052812248992267996, + "acc_eval": 0.10546875, + "loss_eval": 18.479557037353516, + "epoch": 92 + }, + { + "hidden_norms": [ + 76238.2890625, + 270583392.0, + 198231920.0, + 225197232.0, + 108588960.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.765692172119088e-08, + 1.794125820131498e-10, + 1.7771174809499968e-10, + 1.7726634049530787e-10, + 1.7670596930141613e-10 + ], + "bp_grad_norms_F": [ + 1.0287496479577385e-05, + 1.490491285949247e-08, + 1.1181702674889493e-08, + 1.0929432470163647e-08, + 1.0695790031434171e-08 + ], + "gamma_dfa": 0.052826936458586715, + "acc_eval": 0.10546875, + "loss_eval": 18.482463836669922, + "epoch": 93 + }, + { + "hidden_norms": [ + 76254.984375, + 270769600.0, + 198360864.0, + 225341792.0, + 108654560.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.761775660559579e-08, + 1.7933368678946238e-10, + 1.776363084404764e-10, + 1.7719105349645048e-10, + 1.766297247352e-10 + ], + "bp_grad_norms_F": [ + 1.0286962606187444e-05, + 1.4897207911701571e-08, + 1.1177347936097703e-08, + 1.0925224280811108e-08, + 1.0691623586467358e-08 + ], + "gamma_dfa": 0.052814016249612905, + "acc_eval": 0.10546875, + "loss_eval": 18.48452377319336, + "epoch": 94 + }, + { + "hidden_norms": [ + 76267.0, + 270906656.0, + 198453952.0, + 225448800.0, + 108703144.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.761757186448449e-08, + 1.792699738656367e-10, + 1.7757639803051006e-10, + 1.771305185860328e-10, + 1.7656787143494057e-10 + ], + "bp_grad_norms_F": [ + 1.0286720680596773e-05, + 1.4893439370666783e-08, + 1.1173768577066312e-08, + 1.0921708870625935e-08, + 1.0688168572414725e-08 + ], + "gamma_dfa": 0.05281054192164447, + "acc_eval": 0.10546875, + "loss_eval": 18.48675537109375, + "epoch": 95 + }, + { + "hidden_norms": [ + 76274.53125, + 270996800.0, + 198521872.0, + 225534016.0, + 108737184.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.757600511444252e-08, + 1.7921109041196814e-10, + 1.7751719538772193e-10, + 1.7707224575502778e-10, + 1.7651151373865304e-10 + ], + "bp_grad_norms_F": [ + 1.0285029929946177e-05, + 1.4889327104583572e-08, + 1.1170673275273657e-08, + 1.09186730767874e-08, + 1.0685286433442798e-08 + ], + "gamma_dfa": 0.052804862934863195, + "acc_eval": 0.10546875, + "loss_eval": 18.492807388305664, + "epoch": 96 + }, + { + "hidden_norms": [ + 76278.6171875, + 271041184.0, + 198554096.0, + 225570960.0, + 108751040.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758564717936679e-08, + 1.791868459166679e-10, + 1.7749526848298558e-10, + 1.770504159948061e-10, + 1.7648858763319453e-10 + ], + "bp_grad_norms_F": [ + 1.028558563120896e-05, + 1.4887539201424715e-08, + 1.1169264624300013e-08, + 1.091728041302531e-08, + 1.068388577607493e-08 + ], + "gamma_dfa": 0.052804886450758204, + "acc_eval": 0.10546875, + "loss_eval": 18.49222183227539, + "epoch": 97 + }, + { + "hidden_norms": [ + 76282.2109375, + 271081440.0, + 198586512.0, + 225606800.0, + 108767848.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758451741641693e-08, + 1.7916516881211209e-10, + 1.7747517344623986e-10, + 1.7702975196876025e-10, + 1.764676044180291e-10 + ], + "bp_grad_norms_F": [ + 1.028525730362162e-05, + 1.488619361111887e-08, + 1.1168157953989066e-08, + 1.0916189729925918e-08, + 1.0682827955577068e-08 + ], + "gamma_dfa": 0.05280597397359088, + "acc_eval": 0.10546875, + "loss_eval": 18.493602752685547, + "epoch": 98 + }, + { + "hidden_norms": [ + 76284.046875, + 271101920.0, + 198601280.0, + 225624992.0, + 108775912.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758536296227248e-08, + 1.7915657846145905e-10, + 1.7746643043992094e-10, + 1.7702135590713652e-10, + 1.7645920835640538e-10 + ], + "bp_grad_norms_F": [ + 1.028511906042695e-05, + 1.488560208429135e-08, + 1.1167605507012013e-08, + 1.0915637282948865e-08, + 1.0682285278562631e-08 + ], + "gamma_dfa": 0.05280651607608888, + "acc_eval": 0.10546875, + "loss_eval": 18.494029998779297, + "epoch": 99 + }, + { + "hidden_norms": [ + 76284.0703125, + 271101952.0, + 198601472.0, + 225625280.0, + 108776088.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758680536402608e-08, + 1.7915803562917887e-10, + 1.7746806801888226e-10, + 1.7702275756370511e-10, + 1.7646061001297397e-10 + ], + "bp_grad_norms_F": [ + 1.0285211828886531e-05, + 1.488571665930749e-08, + 1.1167688107605045e-08, + 1.0915716330828218e-08, + 1.0682358109193046e-08 + ], + "gamma_dfa": 0.052806626496021636, + "acc_eval": 0.10546875, + "loss_eval": 18.493879318237305, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/h2_no_residual_s42.log b/results/h2_no_residual_s42.log new file mode 100644 index 0000000..1fd6037 --- /dev/null +++ b/results/h2_no_residual_s42.log @@ -0,0 +1,16 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=42 +eval buffer: torch.Size([1024, 3072]) + +=== BP training === + [BP] Ep 0: ||h||_med=[8.718070030212402, 4.280222415924072, 4.422238349914551, 4.604765892028809, 4.6893696784973145] ||g||_med=[0.0010339331347495317, 0.0009070215164683759, 0.0008196940761990845, 0.000755702203605324, 0.0006969328387640417] acc=0.1123 + [BP] Ep 1: ||h_L||=2.659e+01 ||g_2||=8.531e-05 acc=0.0576 + [BP] Ep 2: ||h_L||=3.938e+01 ||g_2||=6.031e-05 acc=0.0576 + [BP] Ep 3: ||h_L||=4.631e+01 ||g_2||=5.228e-05 acc=0.0664 + [BP] Ep 4: ||h_L||=5.721e+01 ||g_2||=4.597e-05 acc=0.0625 + [BP] Ep 5: ||h_L||=6.593e+01 ||g_2||=4.147e-05 acc=0.0664 + [BP] Ep 6: ||h_L||=7.175e+01 ||g_2||=3.982e-05 acc=0.0762 + [BP] Ep 7: ||h_L||=8.016e+01 ||g_2||=3.737e-05 acc=0.0820 + [BP] Ep 8: ||h_L||=8.979e+01 ||g_2||=3.617e-05 acc=0.0781 + [BP] Ep 9: ||h_L||=1.020e+02 ||g_2||=3.456e-05 acc=0.0752 + [BP] Ep 10: ||h_L||=1.159e+02 ||g_2||=3.380e-05 acc=0.0752 + [BP] Ep 11: ||h_L||=1.185e+02 ||g_2||=3.288e-05 acc=0.0840 diff --git a/results/h2_smoke_w0.1/snapshot_evolution_s42.json b/results/h2_smoke_w0.1/snapshot_evolution_s42.json new file mode 100644 index 0000000..d085d3c --- /dev/null +++ b/results/h2_smoke_w0.1/snapshot_evolution_s42.json @@ -0,0 +1,237 @@ +{ + "config": { + "output_dir": "results/h2_smoke_w0.1", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.560444831848145, + 8.845171928405762, + 9.21005916595459, + 9.379204750061035 + ], + "bp_grad_norms_per_sample_med": [ + 0.001055641332641244, + 0.0007215326768346131, + 0.0005827629356645048, + 0.0004979022196494043, + 0.00043998067849315703 + ], + "bp_grad_norms_F": [ + 0.036981210112571716, + 0.023669881746172905, + 0.018871067091822624, + 0.016073165461421013, + 0.014115042984485626 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.4311001300811768, + "epoch": 0 + }, + { + "hidden_norms": [ + 85.71797180175781, + 28.746126174926758, + 27.666101455688477, + 31.958999633789062, + 39.62472915649414 + ], + "bp_grad_norms_per_sample_med": [ + 8.686084765940905e-05, + 8.580532448831946e-05, + 8.54266545502469e-05, + 8.48824274726212e-05, + 8.353861630894244e-05 + ], + "bp_grad_norms_F": [ + 0.003033322049304843, + 0.002979709068313241, + 0.0029494145419448614, + 0.002918587066233158, + 0.0028573593590408564 + ], + "gamma_dfa": NaN, + "acc_eval": 0.05859375, + "loss_eval": 2.529827356338501, + "epoch": 1 + }, + { + "hidden_norms": [ + 103.60254669189453, + 33.103458404541016, + 32.14752197265625, + 38.19721984863281, + 48.121864318847656 + ], + "bp_grad_norms_per_sample_med": [ + 7.112277671694756e-05, + 7.050936983432621e-05, + 7.047054532449692e-05, + 6.984646461205557e-05, + 6.839916750323027e-05 + ], + "bp_grad_norms_F": [ + 0.002462180098518729, + 0.0024272387381643057, + 0.002406709361821413, + 0.002380331512540579, + 0.0023274135310202837 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0703125, + "loss_eval": 2.518604278564453, + "epoch": 2 + }, + { + "hidden_norms": [ + 99.88206481933594, + 32.27016830444336, + 29.376516342163086, + 35.85775375366211, + 44.175907135009766 + ], + "bp_grad_norms_per_sample_med": [ + 7.549120346084237e-05, + 7.506681140512228e-05, + 7.482277578674257e-05, + 7.426074444083497e-05, + 7.269046182045713e-05 + ], + "bp_grad_norms_F": [ + 0.002598837483674288, + 0.00256195105612278, + 0.002536388346925378, + 0.0025058977771550417, + 0.002439383417367935 + ], + "gamma_dfa": NaN, + "acc_eval": 0.072265625, + "loss_eval": 2.5117571353912354, + "epoch": 3 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.560444831848145, + 8.845171928405762, + 9.21005916595459, + 9.379204750061035 + ], + "bp_grad_norms_per_sample_med": [ + 0.001055641332641244, + 0.0007215326768346131, + 0.0005827629356645048, + 0.0004979022196494043, + 0.00043998067849315703 + ], + "bp_grad_norms_F": [ + 0.036981210112571716, + 0.023669881746172905, + 0.018871067091822624, + 0.016073165461421013, + 0.014115042984485626 + ], + "gamma_dfa": 0.0034602322848513722, + "acc_eval": 0.09375, + "loss_eval": 2.4311001300811768, + "epoch": 0 + }, + { + "hidden_norms": [ + 1321.57177734375, + 5876.37109375, + 5211.20947265625, + 5922.93798828125, + 3697.69580078125 + ], + "bp_grad_norms_per_sample_med": [ + 1.0980336355714826e-06, + 8.924058079173847e-07, + 8.845478305374854e-07, + 8.81322591794742e-07, + 8.844919534567453e-07 + ], + "bp_grad_norms_F": [ + 7.150410965550691e-05, + 5.026865619583987e-05, + 4.9243793910136446e-05, + 4.888495459454134e-05, + 4.859357068198733e-05 + ], + "gamma_dfa": 0.03524830285459757, + "acc_eval": 0.1181640625, + "loss_eval": 2.2935099601745605, + "epoch": 1 + }, + { + "hidden_norms": [ + 2543.9384765625, + 26885.123046875, + 22657.53515625, + 23760.638671875, + 13455.5205078125 + ], + "bp_grad_norms_per_sample_med": [ + 3.232785559248441e-07, + 2.0931234701038193e-07, + 2.086635788600688e-07, + 2.0885721596641815e-07, + 2.086642325593857e-07 + ], + "bp_grad_norms_F": [ + 3.009554711752571e-05, + 1.4969685253163334e-05, + 1.4619089597545099e-05, + 1.4558195289282594e-05, + 1.4452642062678933e-05 + ], + "gamma_dfa": 0.03537877253256738, + "acc_eval": 0.1201171875, + "loss_eval": 2.3101487159729004, + "epoch": 2 + }, + { + "hidden_norms": [ + 2961.771484375, + 39258.7265625, + 31789.115234375, + 32956.20703125, + 18197.2578125 + ], + "bp_grad_norms_per_sample_med": [ + 2.570918979927228e-07, + 1.4994434138770885e-07, + 1.4976241402564483e-07, + 1.4952657068079134e-07, + 1.4944804149763513e-07 + ], + "bp_grad_norms_F": [ + 2.3238537323777564e-05, + 1.1003003237419762e-05, + 1.0661849046300631e-05, + 1.0592500984785147e-05, + 1.0497028597455937e-05 + ], + "gamma_dfa": 0.03636467596516013, + "acc_eval": 0.12109375, + "loss_eval": 2.3122406005859375, + "epoch": 3 + } + ] +} \ No newline at end of file diff --git a/results/h2_smoke_w0.2/snapshot_evolution_s42.json b/results/h2_smoke_w0.2/snapshot_evolution_s42.json new file mode 100644 index 0000000..a98f5da --- /dev/null +++ b/results/h2_smoke_w0.2/snapshot_evolution_s42.json @@ -0,0 +1,237 @@ +{ + "config": { + "output_dir": "results/h2_smoke_w0.2", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.2 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 17.12088966369629, + 17.690689086914062, + 18.420406341552734, + 18.75864601135254 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010638737585395575, + 0.00045698368921875954, + 0.0003363286959938705, + 0.0002763723023235798, + 0.0002378255157964304 + ], + "bp_grad_norms_F": [ + 0.03763078525662422, + 0.015000421553850174, + 0.010959738865494728, + 0.008936461992561817, + 0.007658911868929863 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0859375, + "loss_eval": 2.4382002353668213, + "epoch": 0 + }, + { + "hidden_norms": [ + 85.67359161376953, + 53.38432693481445, + 47.44037628173828, + 55.29991149902344, + 67.34859466552734 + ], + "bp_grad_norms_per_sample_med": [ + 8.009114390006289e-05, + 7.683139119762927e-05, + 7.53635322325863e-05, + 7.400008325930685e-05, + 7.128623110475019e-05 + ], + "bp_grad_norms_F": [ + 0.0027135731652379036, + 0.0025544750969856977, + 0.0024875544477254152, + 0.0024266208056360483, + 0.0023267678916454315 + ], + "gamma_dfa": NaN, + "acc_eval": 0.083984375, + "loss_eval": 2.4839837551116943, + "epoch": 1 + }, + { + "hidden_norms": [ + 103.92682647705078, + 59.23755645751953, + 52.980411529541016, + 64.2865982055664, + 78.33065032958984 + ], + "bp_grad_norms_per_sample_med": [ + 6.883802416268736e-05, + 6.662087980657816e-05, + 6.507965008495376e-05, + 6.394806405296549e-05, + 6.143032078398392e-05 + ], + "bp_grad_norms_F": [ + 0.0023220409639179707, + 0.002212206134572625, + 0.0021602711640298367, + 0.0021026749163866043, + 0.002004916314035654 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.4874913692474365, + "epoch": 2 + }, + { + "hidden_norms": [ + 99.67398834228516, + 58.03565216064453, + 49.116390228271484, + 60.295406341552734, + 73.20696258544922 + ], + "bp_grad_norms_per_sample_med": [ + 7.312109664781019e-05, + 7.063996599754319e-05, + 6.898775609442964e-05, + 6.728436710545793e-05, + 6.445571489166468e-05 + ], + "bp_grad_norms_F": [ + 0.002473062602803111, + 0.0023518132511526346, + 0.0022898896131664515, + 0.002222386421635747, + 0.002102817641571164 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.4926531314849854, + "epoch": 3 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 17.12088966369629, + 17.690689086914062, + 18.420406341552734, + 18.75864601135254 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010638737585395575, + 0.00045698368921875954, + 0.0003363286959938705, + 0.0002763723023235798, + 0.0002378255157964304 + ], + "bp_grad_norms_F": [ + 0.03763078525662422, + 0.015000421553850174, + 0.010959738865494728, + 0.008936461992561817, + 0.007658911868929863 + ], + "gamma_dfa": 0.0037797510012751445, + "acc_eval": 0.0859375, + "loss_eval": 2.4382002353668213, + "epoch": 0 + }, + { + "hidden_norms": [ + 1258.0216064453125, + 5942.1240234375, + 4878.22021484375, + 5972.6494140625, + 4135.04931640625 + ], + "bp_grad_norms_per_sample_med": [ + 1.158710347226588e-06, + 8.974735692390823e-07, + 8.935384698816051e-07, + 8.949773473432288e-07, + 8.903299999474257e-07 + ], + "bp_grad_norms_F": [ + 6.218944326974452e-05, + 4.8492554924450815e-05, + 4.7771758545422927e-05, + 4.744856778415851e-05, + 4.708760025096126e-05 + ], + "gamma_dfa": 0.039906812366098166, + "acc_eval": 0.1259765625, + "loss_eval": 2.2913613319396973, + "epoch": 1 + }, + { + "hidden_norms": [ + 2455.668212890625, + 26613.791015625, + 20806.90234375, + 23305.125, + 14706.8408203125 + ], + "bp_grad_norms_per_sample_med": [ + 3.5421919619693654e-07, + 2.1852616782780387e-07, + 2.1860738286250125e-07, + 2.179439917426862e-07, + 2.1746768652519677e-07 + ], + "bp_grad_norms_F": [ + 3.6695244489237666e-05, + 1.5090728993527591e-05, + 1.4612215636589099e-05, + 1.4485378414974548e-05, + 1.4331568308989517e-05 + ], + "gamma_dfa": 0.03681188588961959, + "acc_eval": 0.1416015625, + "loss_eval": 2.3159337043762207, + "epoch": 2 + }, + { + "hidden_norms": [ + 2871.099853515625, + 38200.73828125, + 28961.662109375, + 32314.5390625, + 19539.51953125 + ], + "bp_grad_norms_per_sample_med": [ + 2.831942822467681e-07, + 1.5707844625012513e-07, + 1.5655700735806022e-07, + 1.5635474426289875e-07, + 1.559963891395455e-07 + ], + "bp_grad_norms_F": [ + 2.7198082534596324e-05, + 1.122839967138134e-05, + 1.0740075595094822e-05, + 1.0607479453028645e-05, + 1.046583474817453e-05 + ], + "gamma_dfa": 0.036901777144521475, + "acc_eval": 0.1435546875, + "loss_eval": 2.321805477142334, + "epoch": 3 + } + ] +} \ No newline at end of file diff --git a/results/h2_smoke_w0.5/snapshot_evolution_s42.json b/results/h2_smoke_w0.5/snapshot_evolution_s42.json new file mode 100644 index 0000000..8c75ebd --- /dev/null +++ b/results/h2_smoke_w0.5/snapshot_evolution_s42.json @@ -0,0 +1,237 @@ +{ + "config": { + "output_dir": "results/h2_smoke_w0.5", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 42.802223205566406, + 44.22697067260742, + 46.05121994018555, + 46.896766662597656 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010791289387270808, + 0.0002035950165009126, + 0.00014324457151815295, + 0.00011542177526280284, + 9.846547618508339e-05 + ], + "bp_grad_norms_F": [ + 0.0380445197224617, + 0.00666962843388319, + 0.0046500470489263535, + 0.003719294909387827, + 0.003155440790578723 + ], + "gamma_dfa": NaN, + "acc_eval": 0.080078125, + "loss_eval": 2.446239709854126, + "epoch": 0 + }, + { + "hidden_norms": [ + 86.00836944580078, + 130.30899047851562, + 107.6886215209961, + 127.31951141357422, + 155.31224060058594 + ], + "bp_grad_norms_per_sample_med": [ + 5.636421337840147e-05, + 4.504464232013561e-05, + 4.254864325048402e-05, + 4.0549883124185726e-05, + 3.8371628761524335e-05 + ], + "bp_grad_norms_F": [ + 0.0019479888724163175, + 0.0014867106219753623, + 0.0013919975608587265, + 0.001322419848293066, + 0.0012390650808811188 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1435546875, + "loss_eval": 2.293787717819214, + "epoch": 1 + }, + { + "hidden_norms": [ + 103.2545166015625, + 142.36724853515625, + 117.42737579345703, + 145.57473754882812, + 174.0562744140625 + ], + "bp_grad_norms_per_sample_med": [ + 5.0501937948865816e-05, + 4.213622378301807e-05, + 3.962606206187047e-05, + 3.741410546354018e-05, + 3.486485002213158e-05 + ], + "bp_grad_norms_F": [ + 0.001744136679917574, + 0.0013844756176695228, + 0.0012931021628901362, + 0.0012163385981693864, + 0.0011240089079365134 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1640625, + "loss_eval": 2.2804112434387207, + "epoch": 2 + }, + { + "hidden_norms": [ + 99.97102355957031, + 140.33131408691406, + 110.34066772460938, + 136.7115936279297, + 163.25784301757812 + ], + "bp_grad_norms_per_sample_med": [ + 5.4715037549613044e-05, + 4.477328184293583e-05, + 4.2219675378873944e-05, + 3.9974820538191125e-05, + 3.672601087600924e-05 + ], + "bp_grad_norms_F": [ + 0.0019211760954931378, + 0.0015042650047689676, + 0.0013935193419456482, + 0.0013014256255701184, + 0.0011887947330251336 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1630859375, + "loss_eval": 2.294424057006836, + "epoch": 3 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 42.802223205566406, + 44.22697067260742, + 46.05121994018555, + 46.896766662597656 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010791289387270808, + 0.0002035950165009126, + 0.00014324457151815295, + 0.00011542177526280284, + 9.846547618508339e-05 + ], + "bp_grad_norms_F": [ + 0.0380445197224617, + 0.00666962843388319, + 0.0046500470489263535, + 0.003719294909387827, + 0.003155440790578723 + ], + "gamma_dfa": 0.004864378133788705, + "acc_eval": 0.080078125, + "loss_eval": 2.446239709854126, + "epoch": 0 + }, + { + "hidden_norms": [ + 1180.2318115234375, + 5768.2900390625, + 5472.90234375, + 6369.3427734375, + 5295.2470703125 + ], + "bp_grad_norms_per_sample_med": [ + 1.2146981589467032e-06, + 8.634061714474228e-07, + 8.587696811446222e-07, + 8.589160529481887e-07, + 8.53334995554178e-07 + ], + "bp_grad_norms_F": [ + 6.592504360014573e-05, + 4.607137088896707e-05, + 4.4360855099512264e-05, + 4.341698149801232e-05, + 4.290258584660478e-05 + ], + "gamma_dfa": 0.0467059058137238, + "acc_eval": 0.15625, + "loss_eval": 2.2713985443115234, + "epoch": 1 + }, + { + "hidden_norms": [ + 2312.98193359375, + 25168.3515625, + 22182.9609375, + 23364.205078125, + 16927.552734375 + ], + "bp_grad_norms_per_sample_med": [ + 4.0056002603705565e-07, + 2.224278716767003e-07, + 2.2240433850129193e-07, + 2.2153939482905116e-07, + 2.2145297862152802e-07 + ], + "bp_grad_norms_F": [ + 3.370734702912159e-05, + 1.619783870410174e-05, + 1.508272544015199e-05, + 1.4707649825140834e-05, + 1.4549447769240942e-05 + ], + "gamma_dfa": 0.04014483268838376, + "acc_eval": 0.1513671875, + "loss_eval": 2.315417528152466, + "epoch": 2 + }, + { + "hidden_norms": [ + 2703.50634765625, + 35877.58203125, + 30404.849609375, + 31748.2421875, + 22049.421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.239594548176683e-07, + 1.6274317715669895e-07, + 1.625548691208678e-07, + 1.6296479543598252e-07, + 1.628933432584745e-07 + ], + "bp_grad_norms_F": [ + 2.923223473771941e-05, + 1.1944111065531615e-05, + 1.1137096407765057e-05, + 1.09043749034754e-05, + 1.0791579370561522e-05 + ], + "gamma_dfa": 0.039210652525071055, + "acc_eval": 0.1484375, + "loss_eval": 2.3342530727386475, + "epoch": 3 + } + ] +} \ No newline at end of file diff --git a/results/h2_smoketest/snapshot_evolution_s42.json b/results/h2_smoketest/snapshot_evolution_s42.json new file mode 100644 index 0000000..5f09cbd --- /dev/null +++ b/results/h2_smoketest/snapshot_evolution_s42.json @@ -0,0 +1,129 @@ +{ + "config": { + "output_dir": "results/h2_smoketest", + "epochs": 1, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.05 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 4.280222415924072, + 4.422238349914551, + 4.604765892028809, + 4.6893696784973145 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010339331347495317, + 0.0009070215164683759, + 0.0008196940761990845, + 0.000755702203605324, + 0.0006969328387640417 + ], + "bp_grad_norms_F": [ + 0.036222200840711594, + 0.030558692291378975, + 0.027158580720424652, + 0.02468229830265045, + 0.022657815366983414 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1123046875, + "loss_eval": 2.414133310317993, + "epoch": 0 + }, + { + "hidden_norms": [ + 85.9231185913086, + 17.862314224243164, + 18.3341064453125, + 20.362960815429688, + 26.587692260742188 + ], + "bp_grad_norms_per_sample_med": [ + 8.575361425755545e-05, + 8.537247049389407e-05, + 8.530700870323926e-05, + 8.512997737852857e-05, + 8.473115303786471e-05 + ], + "bp_grad_norms_F": [ + 0.0030727137345820665, + 0.003054599277675152, + 0.0030425451695919037, + 0.0030279208440333605, + 0.0030008067842572927 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0576171875, + "loss_eval": 2.5138001441955566, + "epoch": 1 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 4.280222415924072, + 4.422238349914551, + 4.604765892028809, + 4.6893696784973145 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010339331347495317, + 0.0009070215164683759, + 0.0008196940761990845, + 0.000755702203605324, + 0.0006969328387640417 + ], + "bp_grad_norms_F": [ + 0.036222200840711594, + 0.030558692291378975, + 0.027158580720424652, + 0.02468229830265045, + 0.022657815366983414 + ], + "gamma_dfa": 0.004694993258453906, + "acc_eval": 0.1123046875, + "loss_eval": 2.414133310317993, + "epoch": 0 + }, + { + "hidden_norms": [ + 1363.396484375, + 5623.7373046875, + 6282.16259765625, + 6187.54150390625, + 3601.992919921875 + ], + "bp_grad_norms_per_sample_med": [ + 1.0316066436644178e-06, + 8.392997301598371e-07, + 8.332735319527274e-07, + 8.32648026971583e-07, + 8.310838666147902e-07 + ], + "bp_grad_norms_F": [ + 7.324694888666272e-05, + 4.777986396220513e-05, + 4.688410263042897e-05, + 4.647139576263726e-05, + 4.622975757229142e-05 + ], + "gamma_dfa": 0.029530375730246305, + "acc_eval": 0.1015625, + "loss_eval": 2.2971253395080566, + "epoch": 1 + } + ] +} \ No newline at end of file diff --git a/results/minimal_aux_compression/minimal_aux_compression_t5_s42.json b/results/minimal_aux_compression/minimal_aux_compression_t5_s42.json new file mode 100644 index 0000000..59a1c9f --- /dev/null +++ b/results/minimal_aux_compression/minimal_aux_compression_t5_s42.json @@ -0,0 +1,5768 @@ +{ + "args": { + "num_blocks": 4, + "d_hidden": 256, + "batch_size": 128, + "epochs": 100, + "t0": 5, + "alpha": 0.75, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "M": 4, + "seed": 42, + "gpu": 0, + "output_dir": "/home/yurenh2/fa/results/minimal_aux_compression" + }, + "dfa_ckpt_acc": 0.304, + "normmatched_target_rms": [ + 0.7896092499308573, + 0.7894034341625545, + 0.7893155885474457, + 0.7892744828825412 + ], + "continue_DFA": { + "test_acc": [ + 0.3031, + 0.3043, + 0.3078, + 0.2971, + 0.2816, + 0.3181, + 0.3104, + 0.2967, + 0.303, + 0.31, + 0.3122, + 0.316, + 0.3094, + 0.3142, + 0.2997, + 0.3197, + 0.2975, + 0.3086, + 0.3016, + 0.3011, + 0.3019, + 0.3147, + 0.3144, + 0.2963, + 0.2995, + 0.297, + 0.3034, + 0.2957, + 0.3163, + 0.3049, + 0.3046, + 0.309, + 0.3058, + 0.3184, + 0.3077, + 0.3048, + 0.3058, + 0.3098, + 0.3123, + 0.3132, + 0.3065, + 0.3037, + 0.3101, + 0.31, + 0.3103, + 0.3172, + 0.2985, + 0.3066, + 0.3083, + 0.3137, + 0.3116, + 0.2969, + 0.3123, + 0.3053, + 0.3128, + 0.3076, + 0.3072, + 0.3068, + 0.3074, + 0.3094, + 0.3194, + 0.312, + 0.3111, + 0.311, + 0.3117, + 0.3071, + 0.3082, + 0.3104, + 0.312, + 0.3114, + 0.3117, + 0.3161, + 0.311, + 0.3111, + 0.3089, + 0.3099, + 0.307, + 0.3108, + 0.3119, + 0.3106, + 0.3125, + 0.3081, + 0.3133, + 0.3109, + 0.3118, + 0.3099, + 0.3113, + 0.3112, + 0.3108, + 0.3101, + 0.3107, + 0.3105, + 0.3108, + 0.311, + 0.3111 + ], + "train_loss": [ + 1.9896479614639282, + 1.989228398399353, + 1.9913108707427978, + 1.9891952603530885, + 1.9893831426239013, + 1.9876405304718017, + 1.9879415699768066, + 1.9855383531951905, + 1.9861496739959716, + 1.9879567293548583, + 1.9880899668884278, + 1.988914436264038, + 1.9845729635620117, + 1.9882750720977784, + 1.986619080886841, + 1.986360415725708, + 1.984292981414795, + 1.9868758028411866, + 1.9862796499633788, + 1.9836064116668701, + 1.9887293506622314, + 1.987586946182251, + 1.9869858631896973, + 1.9876407931137086, + 1.9903872080993652, + 1.9870248597717286, + 1.984416696243286, + 1.9871015835952759, + 1.987274853439331, + 1.9857344278717042, + 1.9862716618347167, + 1.98514561378479, + 1.988260205154419, + 1.9840300716400145, + 1.9863889629364013, + 1.987745002822876, + 1.9889955393981933, + 1.9864666799926758, + 1.9893225020599365, + 1.9871594960784913, + 1.9884574700164794, + 1.9864218033599854, + 1.9859322482299804, + 1.9873759143829346, + 1.9861914360046387, + 1.9885319758605957, + 1.9898562560272217, + 1.985831473045349, + 1.985336185760498, + 1.9852413446807862, + 1.9856248221206665, + 1.9873600564193725, + 1.9870840522003175, + 1.9870067491149903, + 1.9869314754486085, + 1.9850653249359131, + 1.9875930228424072, + 1.987569184112549, + 1.9871658860015868, + 1.9855123371887207, + 1.9833889255523682, + 1.9880683898925782, + 1.9878030462265015, + 1.98471407623291, + 1.988103190536499, + 1.9855585750961304, + 1.9861370626831054, + 1.9858980004882814, + 1.9873674423217773, + 1.9872277666473388, + 1.9847508831787108, + 1.9853865002059936, + 1.9861437704849243, + 1.9859025341796874, + 1.9839345678329467, + 1.984999510536194, + 1.9822538426208496, + 1.984417091293335, + 1.983155788269043, + 1.983664865875244, + 1.9863640853881837, + 1.9857785580825806, + 1.9854218925476075, + 1.9845938192749024, + 1.9818547330474854, + 1.9859014357757567, + 1.983231044921875, + 1.985167163925171, + 1.9846584673690797, + 1.9843994527816773, + 1.9858917093276978, + 1.984087236328125, + 1.9825552994537354, + 1.9838171983337403, + 1.9841137975311278 + ], + "gamma": [ + [ + 6, + 0.08304189937189221 + ], + [ + 7, + 0.08198711951263249 + ], + [ + 8, + 0.08454073127359152 + ], + [ + 9, + 0.08434331172611564 + ], + [ + 10, + 0.08335044141858816 + ], + [ + 13, + 0.08535977214341983 + ], + [ + 15, + 0.08736230782233179 + ], + [ + 20, + 0.09012478915974498 + ], + [ + 25, + 0.09021505803684704 + ], + [ + 35, + 0.09383204276673496 + ], + [ + 45, + 0.09757547511253506 + ], + [ + 55, + 0.09976769518107176 + ], + [ + 65, + 0.10113811318296939 + ], + [ + 75, + 0.10125958314165473 + ], + [ + 85, + 0.10157915914896876 + ], + [ + 95, + 0.10157413315027952 + ], + [ + 100, + 0.10160211031325161 + ] + ], + "rho": [ + [ + 6, + 0.015308302594348788 + ], + [ + 7, + -0.00024611176922917366 + ], + [ + 8, + 0.028694706736132503 + ], + [ + 9, + 0.017990151420235634 + ], + [ + 10, + 0.007663325406610966 + ], + [ + 13, + 0.0028579640202224255 + ], + [ + 15, + 0.013683738186955452 + ], + [ + 20, + 0.005488905240781605 + ], + [ + 25, + 0.009160608984529972 + ], + [ + 35, + 0.004546445794403553 + ], + [ + 45, + -0.006887141382321715 + ], + [ + 55, + 0.0014273221604526043 + ], + [ + 65, + 0.004843547940254211 + ], + [ + 75, + -0.0008459403179585934 + ], + [ + 85, + 0.0030805536080151796 + ], + [ + 95, + 0.009379950352013111 + ], + [ + 100, + -0.006648134032730013 + ] + ], + "alpha_eff": [ + [ + 6, + 0.0 + ], + [ + 7, + 0.0 + ], + [ + 8, + 0.0 + ], + [ + 9, + 0.0 + ], + [ + 10, + 0.0 + ], + [ + 11, + 0.0 + ], + [ + 12, + 0.0 + ], + [ + 13, + 0.0 + ], + [ + 14, + 0.0 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + }, + "blend_random_trainable": { + "test_acc": [ + 0.304, + 0.3076, + 0.3108, + 0.3041, + 0.3098, + 0.3099, + 0.3038, + 0.297, + 0.2967, + 0.305, + 0.3156, + 0.3146, + 0.321, + 0.3105, + 0.3088, + 0.3038, + 0.3162, + 0.3148, + 0.3115, + 0.3031, + 0.3083, + 0.32, + 0.3081, + 0.3096, + 0.3084, + 0.3109, + 0.313, + 0.3187, + 0.31, + 0.3164, + 0.3185, + 0.3129, + 0.3139, + 0.3129, + 0.3216, + 0.3134, + 0.3204, + 0.3199, + 0.314, + 0.3219, + 0.3155, + 0.3138, + 0.3172, + 0.3154, + 0.3138, + 0.3156, + 0.3221, + 0.3134, + 0.3155, + 0.318, + 0.3154, + 0.3213, + 0.3228, + 0.3151, + 0.3185, + 0.3175, + 0.3256, + 0.3221, + 0.3152, + 0.3185, + 0.3232, + 0.3244, + 0.3207, + 0.3285, + 0.3137, + 0.3157, + 0.3232, + 0.3224, + 0.3229, + 0.3179, + 0.3202, + 0.326, + 0.321, + 0.3218, + 0.3149, + 0.3252, + 0.3187, + 0.3223, + 0.3203, + 0.3219, + 0.3252, + 0.3245, + 0.3237, + 0.3215, + 0.3219, + 0.3214, + 0.3212, + 0.3208, + 0.3207, + 0.3215, + 0.3208, + 0.3209, + 0.3207, + 0.3211, + 0.3212 + ], + "train_loss": [ + 1.9875820624542235, + 1.984858465499878, + 1.9837525555801392, + 1.9818363088226318, + 1.9856461972427368, + 1.9782102161026, + 1.9760711154174804, + 1.9777770901489258, + 1.975443967514038, + 1.976013292541504, + 1.9727115103149413, + 1.969586827430725, + 1.9730798572158814, + 1.9704905807876587, + 1.9703517753601074, + 1.9711850595092772, + 1.9702121339416503, + 1.972580355758667, + 1.9681320180511475, + 1.9686706248474122, + 1.9683358684539796, + 1.9668307958602906, + 1.9643502359008789, + 1.965956339035034, + 1.9685641189575196, + 1.9635703317642212, + 1.9627861168670655, + 1.9650380011367798, + 1.9642291540527343, + 1.9642311791992189, + 1.9646381041717529, + 1.9633978008651733, + 1.9658650427246094, + 1.9637716662597657, + 1.9667017318725586, + 1.962588292388916, + 1.9642483969116211, + 1.963774356918335, + 1.9637555825424193, + 1.966401972732544, + 1.9644542486572265, + 1.9629163044738769, + 1.9644242834854126, + 1.9674142376327515, + 1.9655234298706055, + 1.9619557665252685, + 1.9633433204650879, + 1.9618017944717407, + 1.961913779373169, + 1.9628275882339477, + 1.9626629904174804, + 1.959987710533142, + 1.963222172012329, + 1.9608874097061157, + 1.9631134511566162, + 1.96072896484375, + 1.9636458055877686, + 1.9607766639709472, + 1.9610338224029542, + 1.9611924673843384, + 1.962102650718689, + 1.9620676553344727, + 1.9624957943725585, + 1.9585958462142945, + 1.9600954289245605, + 1.9600101694107055, + 1.9582736966323853, + 1.9630938558197022, + 1.9602874573135376, + 1.9607704308319092, + 1.9604313027954101, + 1.9593016355133057, + 1.961487769317627, + 1.9581396647644043, + 1.9602671353530883, + 1.9591305192565918, + 1.9604460619354247, + 1.9608135815429688, + 1.9591818682861328, + 1.956793077659607, + 1.960898640060425, + 1.9563995078277587, + 1.9601803003311158, + 1.956558929977417, + 1.9553365264129638, + 1.9587519913482665, + 1.9584099251556397, + 1.958340239944458, + 1.9584214044570922, + 1.9551129587554932, + 1.9588654565429688, + 1.960626877746582, + 1.9583866863250732, + 1.955967247581482, + 1.9612910549163818 + ], + "gamma": [ + [ + 6, + 0.019220562127884477 + ], + [ + 7, + 0.03108229034114629 + ], + [ + 8, + 0.018241118639707565 + ], + [ + 9, + 0.034495080122724175 + ], + [ + 10, + 0.028780929278582335 + ], + [ + 13, + 0.030122535827104002 + ], + [ + 15, + 0.02802148787304759 + ], + [ + 20, + 0.03149552864488214 + ], + [ + 25, + 0.03785618720576167 + ], + [ + 35, + 0.021021342370659113 + ], + [ + 45, + 0.03360021597472951 + ], + [ + 55, + 0.026182003552094102 + ], + [ + 65, + 0.028913337620906532 + ], + [ + 75, + 0.028639126277994365 + ], + [ + 85, + 0.030121456366032362 + ], + [ + 95, + 0.03247612394625321 + ], + [ + 100, + 0.022932072111871094 + ] + ], + "rho": [ + [ + 6, + 0.013808809919282794 + ], + [ + 7, + 0.03821952547878027 + ], + [ + 8, + 0.0360131417401135 + ], + [ + 9, + 0.004150372929871082 + ], + [ + 10, + 0.013662770157679915 + ], + [ + 13, + 0.028151119186077267 + ], + [ + 15, + -0.0075449212454259396 + ], + [ + 20, + 0.0036099848803132772 + ], + [ + 25, + 0.000372566981241107 + ], + [ + 35, + 0.015148252947255969 + ], + [ + 45, + -0.001252165180630982 + ], + [ + 55, + -0.004500149516388774 + ], + [ + 65, + 0.020315622678026557 + ], + [ + 75, + -0.005173317855224013 + ], + [ + 85, + -0.002073251875117421 + ], + [ + 95, + 0.012416869401931763 + ], + [ + 100, + -0.006122617865912616 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499197681564169 + ], + [ + 7, + 0.7498578762844952 + ], + [ + 8, + 0.7497999109492675 + ], + [ + 9, + 0.7497192773113324 + ], + [ + 10, + 0.7496842012884236 + ], + [ + 11, + 0.7496251981136395 + ], + [ + 12, + 0.749583628394037 + ], + [ + 13, + 0.7495581218904329 + ], + [ + 14, + 0.7495461848578033 + ], + [ + 15, + 0.749573789654497 + ], + [ + 16, + 0.7495078820260268 + ], + [ + 17, + 0.7494844798218633 + ], + [ + 18, + 0.7494460918088632 + ], + [ + 19, + 0.7494516167979163 + ], + [ + 20, + 0.7494209521942866 + ], + [ + 21, + 0.7494175843359755 + ], + [ + 22, + 0.7494194415266225 + ], + [ + 23, + 0.7494112317089004 + ], + [ + 24, + 0.7494132065753276 + ], + [ + 25, + 0.7494000991283181 + ], + [ + 26, + 0.7493913367051803 + ], + [ + 27, + 0.7493884842858975 + ], + [ + 28, + 0.7493755115783163 + ], + [ + 29, + 0.7493806287495052 + ], + [ + 30, + 0.7494016796762221 + ], + [ + 31, + 0.7493717711870365 + ], + [ + 32, + 0.749390029861711 + ], + [ + 33, + 0.7493999407109747 + ], + [ + 34, + 0.7493989022517102 + ], + [ + 35, + 0.7493795023296775 + ], + [ + 36, + 0.7493802135569222 + ], + [ + 37, + 0.74938156352573 + ], + [ + 38, + 0.7493928756541923 + ], + [ + 39, + 0.7493847808816975 + ], + [ + 40, + 0.7494038315175888 + ], + [ + 41, + 0.7493898131837181 + ], + [ + 42, + 0.7493857565571695 + ], + [ + 43, + 0.7493881993609323 + ], + [ + 44, + 0.7493968115497678 + ], + [ + 45, + 0.7493927498805746 + ], + [ + 46, + 0.7493963496195201 + ], + [ + 47, + 0.749385830666834 + ], + [ + 48, + 0.7493898922894369 + ], + [ + 49, + 0.7494094214602504 + ], + [ + 50, + 0.7493919284640196 + ], + [ + 51, + 0.7493724687303878 + ], + [ + 52, + 0.7493753754192403 + ], + [ + 53, + 0.7494169509817146 + ], + [ + 54, + 0.7494090969012233 + ], + [ + 55, + 0.749400978844211 + ], + [ + 56, + 0.7494047934457866 + ], + [ + 57, + 0.7494084815304891 + ], + [ + 58, + 0.7493952180905741 + ], + [ + 59, + 0.7493953983915104 + ], + [ + 60, + 0.7493957553341601 + ], + [ + 61, + 0.7493888248335011 + ], + [ + 62, + 0.7494101782890408 + ], + [ + 63, + 0.7494018681681134 + ], + [ + 64, + 0.7493975554113989 + ], + [ + 65, + 0.749402005689373 + ], + [ + 66, + 0.749388448551595 + ], + [ + 67, + 0.749378292937364 + ], + [ + 68, + 0.7493893777192285 + ], + [ + 69, + 0.7494020640612745 + ], + [ + 70, + 0.749388113256205 + ], + [ + 71, + 0.7493949761765804 + ], + [ + 72, + 0.7493872273422472 + ], + [ + 73, + 0.7493686665131345 + ], + [ + 74, + 0.7494086878510853 + ], + [ + 75, + 0.7493987049175213 + ], + [ + 76, + 0.7494035104924066 + ], + [ + 77, + 0.7494085798421963 + ], + [ + 78, + 0.7494012236175737 + ], + [ + 79, + 0.7493965643903735 + ], + [ + 80, + 0.7493722388926175 + ], + [ + 81, + 0.7493855664728786 + ], + [ + 82, + 0.7494076422037731 + ], + [ + 83, + 0.7493981861235621 + ], + [ + 84, + 0.7493902518791544 + ], + [ + 85, + 0.7493864440294339 + ], + [ + 86, + 0.7493949116123264 + ], + [ + 87, + 0.749393934029398 + ], + [ + 88, + 0.749385337987517 + ], + [ + 89, + 0.7493765470260315 + ], + [ + 90, + 0.7493792753959445 + ], + [ + 91, + 0.7493811654692877 + ], + [ + 92, + 0.7493927875353597 + ], + [ + 93, + 0.7494018052648254 + ], + [ + 94, + 0.7493991205092052 + ], + [ + 95, + 0.7494021873821667 + ], + [ + 96, + 0.7493917296459803 + ], + [ + 97, + 0.7493875192016652 + ], + [ + 98, + 0.7493879653352852 + ], + [ + 99, + 0.7493900474601058 + ], + [ + 100, + 0.7493940854326728 + ] + ] + }, + "blend_zero_target_trainable": { + "test_acc": [ + 0.264, + 0.2781, + 0.2795, + 0.2619, + 0.2655, + 0.2574, + 0.2514, + 0.2542, + 0.2466, + 0.259, + 0.264, + 0.2723, + 0.2761, + 0.2633, + 0.2566, + 0.2678, + 0.2485, + 0.2296, + 0.2162, + 0.1917, + 0.2184, + 0.2065, + 0.1931, + 0.2059, + 0.1663, + 0.1954, + 0.1922, + 0.1855, + 0.2072, + 0.1851, + 0.1741, + 0.1939, + 0.2083, + 0.2042, + 0.1954, + 0.1935, + 0.1993, + 0.205, + 0.2011, + 0.2087, + 0.2126, + 0.2141, + 0.2116, + 0.218, + 0.2072, + 0.2151, + 0.2189, + 0.21, + 0.2135, + 0.2176, + 0.2167, + 0.2213, + 0.2093, + 0.2129, + 0.2022, + 0.2056, + 0.2059, + 0.2057, + 0.2057, + 0.1849, + 0.2026, + 0.2112, + 0.1995, + 0.2044, + 0.1936, + 0.1937, + 0.2087, + 0.2021, + 0.2024, + 0.2016, + 0.2045, + 0.2056, + 0.2069, + 0.2041, + 0.1967, + 0.2015, + 0.2022, + 0.2002, + 0.2001, + 0.2013, + 0.2039, + 0.2041, + 0.2051, + 0.2007, + 0.2061, + 0.2013, + 0.2014, + 0.2032, + 0.2028, + 0.2033, + 0.2034, + 0.2023, + 0.2023, + 0.2031, + 0.203 + ], + "train_loss": [ + 2.003432984466553, + 2.0404958644104005, + 2.05170421913147, + 2.0512914763641357, + 2.059718384246826, + 2.056018392791748, + 2.0574035197448732, + 2.0550795609283448, + 2.051431663131714, + 2.05087917678833, + 2.048379221496582, + 2.0444970846939086, + 2.0427867864608764, + 2.0435575288391115, + 2.0456857122802736, + 2.0441513802337647, + 2.059211141204834, + 2.094487442703247, + 2.120898944854736, + 2.1411775353240965, + 2.1573567083740235, + 2.1730971395111083, + 2.1813291581726073, + 2.1853540766906736, + 2.18426385635376, + 2.1859450843048096, + 2.188995297317505, + 2.1879526950073243, + 2.1853000207519533, + 2.184229321975708, + 2.185366726226807, + 2.1810081949615476, + 2.17667474029541, + 2.1741380378723143, + 2.1705066053009032, + 2.1679501496124267, + 2.161978765106201, + 2.157980567855835, + 2.155652809371948, + 2.1513871308898924, + 2.1485144862365724, + 2.1452884986877443, + 2.1404634771728515, + 2.1402083478546143, + 2.1359153479003905, + 2.131035371170044, + 2.129794978027344, + 2.127242118988037, + 2.12495826461792, + 2.1216389994812013, + 2.1218640398406983, + 2.1189474866485596, + 2.117184839553833, + 2.12220953918457, + 2.1290039992523195, + 2.134818592529297, + 2.139795846862793, + 2.144669624786377, + 2.147829578704834, + 2.1512765794372557, + 2.152941629180908, + 2.1555648081207277, + 2.1558456703186035, + 2.154955834350586, + 2.1563889036560058, + 2.1574053646850584, + 2.157794552078247, + 2.158604030303955, + 2.1575727156829836, + 2.1577176335144044, + 2.1552623760986327, + 2.15590681930542, + 2.1562809659576416, + 2.1556343312072754, + 2.154660927200317, + 2.154556582107544, + 2.1544403926086426, + 2.1531307109832762, + 2.153617290649414, + 2.1533555097198485, + 2.153312416534424, + 2.152898409576416, + 2.1517363874053954, + 2.150981352081299, + 2.1505518492889406, + 2.150823607788086, + 2.150866351776123, + 2.148874746017456, + 2.150503429489136, + 2.1488629806518555, + 2.1504575192260744, + 2.1508920285797117, + 2.1497586909484863, + 2.1493976766967773, + 2.1510607133483886 + ], + "gamma": [ + [ + 6, + 0.03389458020683378 + ], + [ + 7, + 0.032111093460116535 + ], + [ + 8, + 0.03044863895047456 + ], + [ + 9, + 0.027433430892415345 + ], + [ + 10, + 0.03774541278835386 + ], + [ + 13, + 0.028504844522103667 + ], + [ + 15, + 0.03287511027883738 + ], + [ + 20, + 0.030300902930321172 + ], + [ + 25, + 0.0219054170884192 + ], + [ + 35, + 0.022474667755886912 + ], + [ + 45, + 0.0220179446041584 + ], + [ + 55, + 0.015417475253343582 + ], + [ + 65, + 0.012031457619741559 + ], + [ + 75, + 0.008347300812602043 + ], + [ + 85, + 0.016150177223607898 + ], + [ + 95, + 0.015004270651843399 + ], + [ + 100, + 0.011660999851301312 + ] + ], + "rho": [ + [ + 6, + -0.010524745099246502 + ], + [ + 7, + 0.004101772676222026 + ], + [ + 8, + 0.014873296488076448 + ], + [ + 9, + 0.004569279495626688 + ], + [ + 10, + -0.016330178827047348 + ], + [ + 13, + 0.00018126238137483597 + ], + [ + 15, + -0.01115548168309033 + ], + [ + 20, + -0.003041449934244156 + ], + [ + 25, + 0.015354603994637728 + ], + [ + 35, + -0.004682793049141765 + ], + [ + 45, + 0.012765995226800442 + ], + [ + 55, + 0.0006810068152844906 + ], + [ + 65, + 0.0004903898807242513 + ], + [ + 75, + 0.0011397527996450663 + ], + [ + 85, + -0.007209937088191509 + ], + [ + 95, + -1.2403237633407116e-05 + ], + [ + 100, + 0.012036159634590149 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7497110973373646 + ], + [ + 7, + 0.7495407175006196 + ], + [ + 8, + 0.7495014650438155 + ], + [ + 9, + 0.7494394919805796 + ], + [ + 10, + 0.7492695388180962 + ], + [ + 11, + 0.7493654889004079 + ], + [ + 12, + 0.7492565472070247 + ], + [ + 13, + 0.7493716493675475 + ], + [ + 14, + 0.7488066993907092 + ], + [ + 15, + 0.7491013538795988 + ], + [ + 16, + 0.7488933707912518 + ], + [ + 17, + 0.7494522288524024 + ], + [ + 18, + 0.7485868275958928 + ], + [ + 19, + 0.7473422431339624 + ], + [ + 20, + 0.7487962612259776 + ], + [ + 21, + 0.7494983161370045 + ], + [ + 22, + 0.7488975791216388 + ], + [ + 23, + 0.7480469713157275 + ], + [ + 24, + 0.7476437599827086 + ], + [ + 25, + 0.7474300097150289 + ], + [ + 26, + 0.747822986596431 + ], + [ + 27, + 0.7467118602425042 + ], + [ + 28, + 0.7471092996894162 + ], + [ + 29, + 0.7474470807519938 + ], + [ + 30, + 0.7476479569684252 + ], + [ + 31, + 0.7451283529728077 + ], + [ + 32, + 0.7458003003360094 + ], + [ + 33, + 0.7479835072001517 + ], + [ + 34, + 0.7446984605538471 + ], + [ + 35, + 0.7472124552272632 + ], + [ + 36, + 0.7463556332882426 + ], + [ + 37, + 0.7478376971321143 + ], + [ + 38, + 0.7478406578000478 + ], + [ + 39, + 0.7452850328116474 + ], + [ + 40, + 0.7466762376670545 + ], + [ + 41, + 0.7465009125588701 + ], + [ + 42, + 0.7450841557621256 + ], + [ + 43, + 0.7475184980092098 + ], + [ + 44, + 0.7454323403700487 + ], + [ + 45, + 0.7466811337346811 + ], + [ + 46, + 0.7465945785710588 + ], + [ + 47, + 0.746418668302273 + ], + [ + 48, + 0.7436489486425888 + ], + [ + 49, + 0.7450323294196143 + ], + [ + 50, + 0.7452192867013743 + ], + [ + 51, + 0.7464475260063141 + ], + [ + 52, + 0.7446866001113734 + ], + [ + 53, + 0.7448524841779364 + ], + [ + 54, + 0.7455440347145722 + ], + [ + 55, + 0.7457388396571264 + ], + [ + 56, + 0.7454119647928196 + ], + [ + 57, + 0.7430682626389489 + ], + [ + 58, + 0.7474565595948314 + ], + [ + 59, + 0.7423278495791585 + ], + [ + 60, + 0.7405472765991656 + ], + [ + 61, + 0.7395458773278126 + ], + [ + 62, + 0.7372895911825251 + ], + [ + 63, + 0.7363498697758593 + ], + [ + 64, + 0.7361875591915609 + ], + [ + 65, + 0.7349399572004071 + ], + [ + 66, + 0.7349707856961266 + ], + [ + 67, + 0.7322439808492792 + ], + [ + 68, + 0.7370521675143109 + ], + [ + 69, + 0.7386382624403232 + ], + [ + 70, + 0.7359472410416439 + ], + [ + 71, + 0.7353025986822335 + ], + [ + 72, + 0.7422242868818804 + ], + [ + 73, + 0.7423497206892272 + ], + [ + 74, + 0.7448571186644266 + ], + [ + 75, + 0.7423834255487499 + ], + [ + 76, + 0.7442281775254069 + ], + [ + 77, + 0.7435052675407173 + ], + [ + 78, + 0.7432126276523632 + ], + [ + 79, + 0.7438013154978188 + ], + [ + 80, + 0.7422217812382554 + ], + [ + 81, + 0.7440913565942923 + ], + [ + 82, + 0.7431837126395141 + ], + [ + 83, + 0.7428475916511187 + ], + [ + 84, + 0.7431000264451493 + ], + [ + 85, + 0.7437450935657974 + ], + [ + 86, + 0.7448235077650524 + ], + [ + 87, + 0.7427219708609096 + ], + [ + 88, + 0.7446693593127022 + ], + [ + 89, + 0.7085648437424285 + ], + [ + 90, + 0.740787975062913 + ], + [ + 91, + 0.7435331734982812 + ], + [ + 92, + 0.7441944409139527 + ], + [ + 93, + 0.7442299607020697 + ], + [ + 94, + 0.7442485650183557 + ], + [ + 95, + 0.7442345753614953 + ], + [ + 96, + 0.7439078810239492 + ], + [ + 97, + 0.7440106065482555 + ], + [ + 98, + 0.7447251286476685 + ], + [ + 99, + 0.6997242281014505 + ], + [ + 100, + 0.6615523455523286 + ] + ] + }, + "blend_zero_target_normmatched": { + "test_acc": [ + 0.2866, + 0.282, + 0.2812, + 0.2836, + 0.2808, + 0.2778, + 0.267, + 0.26, + 0.2562, + 0.2612, + 0.2792, + 0.2825, + 0.2852, + 0.2714, + 0.2702, + 0.2641, + 0.2735, + 0.2716, + 0.2446, + 0.2401, + 0.2261, + 0.2183, + 0.2018, + 0.213, + 0.1616, + 0.2083, + 0.1808, + 0.17, + 0.196, + 0.1803, + 0.174, + 0.1809, + 0.1913, + 0.1739, + 0.1978, + 0.178, + 0.1755, + 0.185, + 0.197, + 0.2071, + 0.1986, + 0.1997, + 0.2037, + 0.1986, + 0.206, + 0.2072, + 0.2205, + 0.204, + 0.221, + 0.2224, + 0.2128, + 0.2231, + 0.1855, + 0.2021, + 0.2, + 0.1953, + 0.2023, + 0.2001, + 0.2051, + 0.1695, + 0.1874, + 0.203, + 0.183, + 0.1933, + 0.1868, + 0.1933, + 0.197, + 0.1996, + 0.2037, + 0.1967, + 0.2036, + 0.1976, + 0.1993, + 0.2006, + 0.1876, + 0.1986, + 0.1962, + 0.1986, + 0.2006, + 0.1912, + 0.1982, + 0.205, + 0.2028, + 0.1982, + 0.2017, + 0.2023, + 0.2016, + 0.2036, + 0.2019, + 0.2028, + 0.2031, + 0.2029, + 0.2027, + 0.2025, + 0.2024 + ], + "train_loss": [ + 2.0053810136413572, + 2.041295912704468, + 2.0512937017822264, + 2.053422501525879, + 2.0592232944488527, + 2.0548282941436766, + 2.05423579788208, + 2.0632657752227783, + 2.060771167755127, + 2.056736230392456, + 2.0528232559204103, + 2.0485662706756593, + 2.0494049028778076, + 2.048429629974365, + 2.0481020497894287, + 2.0484046691894533, + 2.0441742082214356, + 2.0480171503067015, + 2.063710992202759, + 2.0992287350463865, + 2.1267570765686035, + 2.1412508248901365, + 2.146205220413208, + 2.1534790293884276, + 2.158313088378906, + 2.1622572157287596, + 2.164492923126221, + 2.1671857472991944, + 2.1656103144836427, + 2.167160799713135, + 2.1723063859558107, + 2.1732035494995117, + 2.1731792053985597, + 2.170966181488037, + 2.1706438542175293, + 2.1692603215789794, + 2.1665657765197754, + 2.1672782804870607, + 2.1647318984222412, + 2.163161800994873, + 2.1622354071807863, + 2.1623518823242187, + 2.1588726734924317, + 2.160354369506836, + 2.1577954167175295, + 2.1540362316131594, + 2.153853145523071, + 2.1522259687805176, + 2.151134018096924, + 2.1495489282989504, + 2.151202033081055, + 2.1525076805114747, + 2.154239734420776, + 2.158012287521362, + 2.162692668609619, + 2.1647850951385497, + 2.168344123535156, + 2.1698388371276853, + 2.171119987869263, + 2.1744665003204346, + 2.1771156128692626, + 2.180222715072632, + 2.183630125198364, + 2.182013426513672, + 2.1836937813568116, + 2.182101170425415, + 2.183056134490967, + 2.185867686767578, + 2.182726886138916, + 2.183416725234985, + 2.18278630607605, + 2.182796475982666, + 2.1808603149414063, + 2.179879749679565, + 2.181025611343384, + 2.1796674224853514, + 2.1807386072540282, + 2.1793438794708253, + 2.1803506465148925, + 2.1796112225341795, + 2.178861034927368, + 2.178344298248291, + 2.178040598297119, + 2.1764233238220214, + 2.1758622844696043, + 2.177035397949219, + 2.177131224822998, + 2.175055715484619, + 2.1750781156921386, + 2.1741144459533692, + 2.1753570489501954, + 2.1760255853271486, + 2.1760116576385498, + 2.1750786515045166, + 2.177204143218994 + ], + "gamma": [ + [ + 6, + 0.032760744099505246 + ], + [ + 7, + 0.03356296959100291 + ], + [ + 8, + 0.03529427613830194 + ], + [ + 9, + 0.03668428759556264 + ], + [ + 10, + 0.032860312261618674 + ], + [ + 13, + 0.03368683677399531 + ], + [ + 15, + 0.03394245891831815 + ], + [ + 20, + 0.03203312022378668 + ], + [ + 25, + 0.030271637078840286 + ], + [ + 35, + 0.014803529251366854 + ], + [ + 45, + 0.023266919946763664 + ], + [ + 55, + 0.0193672813475132 + ], + [ + 65, + 0.008843706636980642 + ], + [ + 75, + 0.01770660956390202 + ], + [ + 85, + 0.017078267177566886 + ], + [ + 95, + 0.019479279697407037 + ], + [ + 100, + 0.013533162360545248 + ] + ], + "rho": [ + [ + 6, + 0.008696502249222249 + ], + [ + 7, + -0.014632533071562648 + ], + [ + 8, + 0.0014590504579246044 + ], + [ + 9, + 0.019048720016144216 + ], + [ + 10, + 0.002272033249028027 + ], + [ + 13, + 0.00363256991840899 + ], + [ + 15, + -0.0008845720440149307 + ], + [ + 20, + -0.0013811918906867504 + ], + [ + 25, + -0.0008659022860229015 + ], + [ + 35, + 4.157889634370804e-06 + ], + [ + 45, + 0.005909497383981943 + ], + [ + 55, + -0.0021812813356518745 + ], + [ + 65, + -0.0036668083630502224 + ], + [ + 75, + 0.0019832749385386705 + ], + [ + 85, + -0.0003587682731449604 + ], + [ + 95, + 0.0025006418582051992 + ], + [ + 100, + -0.0003044707700610161 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7497102366961352 + ], + [ + 7, + 0.7496117878894093 + ], + [ + 8, + 0.7493668366630404 + ], + [ + 9, + 0.7494885253400894 + ], + [ + 10, + 0.7493006036787342 + ], + [ + 11, + 0.749507307622937 + ], + [ + 12, + 0.7489157461784136 + ], + [ + 13, + 0.7484369725912149 + ], + [ + 14, + 0.7491493989675917 + ], + [ + 15, + 0.7491947136943565 + ], + [ + 16, + 0.7489663992747633 + ], + [ + 17, + 0.7492430082735069 + ], + [ + 18, + 0.7479519284173322 + ], + [ + 19, + 0.7490517895834745 + ], + [ + 20, + 0.7484701280239605 + ], + [ + 21, + 0.74903092534869 + ], + [ + 22, + 0.7473644629390265 + ], + [ + 23, + 0.7494644840448654 + ], + [ + 24, + 0.748960534840753 + ], + [ + 25, + 0.7483511507690959 + ], + [ + 26, + 0.7479331988196185 + ], + [ + 27, + 0.7475201299801273 + ], + [ + 28, + 0.7469163964983162 + ], + [ + 29, + 0.7465724689237111 + ], + [ + 30, + 0.7463302567909254 + ], + [ + 31, + 0.7465513386415606 + ], + [ + 32, + 0.7474534738876192 + ], + [ + 33, + 0.7478912888643996 + ], + [ + 34, + 0.7462201697635631 + ], + [ + 35, + 0.7470943867621369 + ], + [ + 36, + 0.7444033970460742 + ], + [ + 37, + 0.7445381349531562 + ], + [ + 38, + 0.7467094160155424 + ], + [ + 39, + 0.7471418977436385 + ], + [ + 40, + 0.7468045466743071 + ], + [ + 41, + 0.7476849137928582 + ], + [ + 42, + 0.7453636446201087 + ], + [ + 43, + 0.7454549215666408 + ], + [ + 44, + 0.7468388575782224 + ], + [ + 45, + 0.7469884602426576 + ], + [ + 46, + 0.7471925785241396 + ], + [ + 47, + 0.7465119294092779 + ], + [ + 48, + 0.747185893816065 + ], + [ + 49, + 0.745718881971195 + ], + [ + 50, + 0.7452120083006145 + ], + [ + 51, + 0.7469803062502717 + ], + [ + 52, + 0.7428619281265142 + ], + [ + 53, + 0.7444926098917032 + ], + [ + 54, + 0.7441734065874468 + ], + [ + 55, + 0.7478602155222444 + ], + [ + 56, + 0.7429932759166155 + ], + [ + 57, + 0.7385215321278118 + ], + [ + 58, + 0.7374059694144435 + ], + [ + 59, + 0.7357296586926964 + ], + [ + 60, + 0.7347909031655697 + ], + [ + 61, + 0.7328087811513545 + ], + [ + 62, + 0.7288583480260555 + ], + [ + 63, + 0.7301279724503908 + ], + [ + 64, + 0.7319453293685294 + ], + [ + 65, + 0.7403276468203419 + ], + [ + 66, + 0.7321262214944909 + ], + [ + 67, + 0.7402790505349546 + ], + [ + 68, + 0.7361369243833945 + ], + [ + 69, + 0.7399826715782402 + ], + [ + 70, + 0.7385633677318512 + ], + [ + 71, + 0.7425509271044789 + ], + [ + 72, + 0.7410376088263465 + ], + [ + 73, + 0.7414316062436253 + ], + [ + 74, + 0.7423208572562254 + ], + [ + 75, + 0.7392775755613968 + ], + [ + 76, + 0.7423138959603065 + ], + [ + 77, + 0.7440436578416467 + ], + [ + 78, + 0.7417742672783044 + ], + [ + 79, + 0.7350923971954704 + ], + [ + 80, + 0.740331853535796 + ], + [ + 81, + 0.7403988790156416 + ], + [ + 82, + 0.74129861644223 + ], + [ + 83, + 0.7436739568445836 + ], + [ + 84, + 0.7436813696502542 + ], + [ + 85, + 0.7439240254755711 + ], + [ + 86, + 0.7437693353790671 + ], + [ + 87, + 0.7424159035007266 + ], + [ + 88, + 0.7412607206475597 + ], + [ + 89, + 0.7438216074109935 + ], + [ + 90, + 0.7441292943903884 + ], + [ + 91, + 0.7439333557153369 + ], + [ + 92, + 0.744267398988157 + ], + [ + 93, + 0.7414080338200553 + ], + [ + 94, + 0.662589780026837 + ], + [ + 95, + 0.6103594363078234 + ], + [ + 96, + 0.7080672370124097 + ], + [ + 97, + 0.6981383092536529 + ], + [ + 98, + 0.6739209545836329 + ], + [ + 99, + 0.6362291510318147 + ], + [ + 100, + 0.6540743195648167 + ] + ] + }, + "blend_perlayer_vector": { + "test_acc": [ + 0.3014, + 0.3091, + 0.3161, + 0.3138, + 0.3037, + 0.3046, + 0.3131, + 0.3115, + 0.2915, + 0.3185, + 0.3216, + 0.3119, + 0.3172, + 0.303, + 0.3201, + 0.3214, + 0.3286, + 0.3219, + 0.3216, + 0.3198, + 0.3209, + 0.3261, + 0.3199, + 0.3192, + 0.309, + 0.3095, + 0.3278, + 0.3126, + 0.3186, + 0.3137, + 0.3159, + 0.3185, + 0.3245, + 0.3079, + 0.3228, + 0.3072, + 0.3225, + 0.3238, + 0.3216, + 0.307, + 0.3216, + 0.3226, + 0.3168, + 0.3162, + 0.314, + 0.3111, + 0.3091, + 0.3163, + 0.3185, + 0.3108, + 0.3226, + 0.3224, + 0.326, + 0.3153, + 0.32, + 0.3186, + 0.3202, + 0.3143, + 0.3179, + 0.3175, + 0.316, + 0.3179, + 0.3194, + 0.3259, + 0.3205, + 0.3149, + 0.3241, + 0.3204, + 0.3167, + 0.3175, + 0.3158, + 0.314, + 0.3206, + 0.3172, + 0.3194, + 0.3168, + 0.3173, + 0.3163, + 0.3181, + 0.3158, + 0.3175, + 0.3171, + 0.3165, + 0.3189, + 0.3184, + 0.3169, + 0.3171, + 0.3181, + 0.3175, + 0.3177, + 0.318, + 0.3184, + 0.3178, + 0.3178, + 0.3179 + ], + "train_loss": [ + 1.9994929840087892, + 1.9909435724639892, + 1.9911939218902588, + 1.9807739561462403, + 1.9746150674438476, + 1.9764668709564208, + 1.975018363647461, + 1.9737896001815796, + 1.9739441508483886, + 1.9663956859588623, + 1.9689143822860717, + 1.9658036951446534, + 1.9667480603027343, + 1.9674083672332763, + 1.964588031463623, + 1.9619441661834718, + 1.9664774893569947, + 1.9652658667755127, + 1.9653460961532592, + 1.9660338995742799, + 1.966213752784729, + 1.9687189400863647, + 1.9702468350219726, + 1.9715557425689698, + 1.9705856410980225, + 1.9700196152496339, + 1.9696489532852173, + 1.972307102279663, + 1.9681650104141235, + 1.9746904849624634, + 1.9716557328033448, + 1.970906025238037, + 1.9725887395858765, + 1.9706830628967285, + 1.9751151922225951, + 1.977521953353882, + 1.9779337515640258, + 1.9787398273086547, + 1.9779761680603027, + 1.975472740097046, + 1.9720595486068726, + 1.9750176905059815, + 1.9728286672592164, + 1.9735189740753174, + 1.9700484294891358, + 1.9663869178009032, + 1.970880456314087, + 1.9700935790252685, + 1.969158224258423, + 1.9686299856567382, + 1.9682164820098877, + 1.9658004427719116, + 1.9688281896209716, + 1.9674775586318969, + 1.9676536360931396, + 1.9619322258758545, + 1.964151021347046, + 1.9621918587875367, + 1.962152914199829, + 1.9639425127792358, + 1.9638695216369628, + 1.9604027495574952, + 1.9605082215118408, + 1.9634784563827514, + 1.9594726029205323, + 1.9596597722625733, + 1.9628461597061158, + 1.9617521169281005, + 1.9619831213760377, + 1.9604441236877441, + 1.9610664263534545, + 1.960748560256958, + 1.963457571182251, + 1.9597577194595337, + 1.9599701406478882, + 1.9587874462509156, + 1.9594787602233887, + 1.9586531242370606, + 1.960344973449707, + 1.9590771360015868, + 1.9615441747665405, + 1.9583571487808227, + 1.9579783059692384, + 1.9601671183013916, + 1.9585991205215454, + 1.9578000702667235, + 1.957329704208374, + 1.9584047491836547, + 1.961261401901245, + 1.9607749820327758, + 1.953811019744873, + 1.9586621810913085, + 1.956612640991211, + 1.9581326139068604, + 1.9590486404037475 + ], + "gamma": [ + [ + 6, + 0.02758424769854173 + ], + [ + 7, + 0.02514540360425599 + ], + [ + 8, + 0.02798356593120843 + ], + [ + 9, + 0.029024130548350513 + ], + [ + 10, + 0.02441626461222768 + ], + [ + 13, + 0.026506584195885807 + ], + [ + 15, + 0.025264176714699715 + ], + [ + 20, + 0.024162075715139508 + ], + [ + 25, + 0.028284745756536722 + ], + [ + 35, + 0.026664523931685835 + ], + [ + 45, + 0.02932862620218657 + ], + [ + 55, + 0.024880344019038603 + ], + [ + 65, + 0.03438053181162104 + ], + [ + 75, + 0.030886002001352608 + ], + [ + 85, + 0.0240993500337936 + ], + [ + 95, + 0.0330632771801902 + ], + [ + 100, + 0.032676345988875255 + ] + ], + "rho": [ + [ + 6, + -0.00015322724357247353 + ], + [ + 7, + 0.009105906821787357 + ], + [ + 8, + 0.00440916046500206 + ], + [ + 9, + 0.013502348680049181 + ], + [ + 10, + 0.018625129014253616 + ], + [ + 13, + -0.012899965571705252 + ], + [ + 15, + 0.01508733443915844 + ], + [ + 20, + 0.010009644087404013 + ], + [ + 25, + 0.017516383668407798 + ], + [ + 35, + -0.0034965425729751587 + ], + [ + 45, + 0.009483097353950143 + ], + [ + 55, + 0.007973434403538704 + ], + [ + 65, + 0.016091769794002175 + ], + [ + 75, + -0.0038209278136491776 + ], + [ + 85, + -0.004151179688051343 + ], + [ + 95, + 0.004727359628304839 + ], + [ + 100, + 0.03360465099103749 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7496775136338373 + ], + [ + 7, + 0.7493848072643251 + ], + [ + 8, + 0.7493969820019624 + ], + [ + 9, + 0.7493779152086678 + ], + [ + 10, + 0.7493805607606816 + ], + [ + 11, + 0.7493858277202536 + ], + [ + 12, + 0.7493563667065243 + ], + [ + 13, + 0.7493739172881089 + ], + [ + 14, + 0.7493865152293538 + ], + [ + 15, + 0.7493799567737963 + ], + [ + 16, + 0.7493893793529548 + ], + [ + 17, + 0.7493935108297147 + ], + [ + 18, + 0.74937751457295 + ], + [ + 19, + 0.7493662596795336 + ], + [ + 20, + 0.7493579343807725 + ], + [ + 21, + 0.749376258570811 + ], + [ + 22, + 0.7493780597076252 + ], + [ + 23, + 0.7493718220015017 + ], + [ + 24, + 0.7493692390237389 + ], + [ + 25, + 0.7493817670563111 + ], + [ + 26, + 0.74934943246719 + ], + [ + 27, + 0.7493683354978263 + ], + [ + 28, + 0.7493750063356389 + ], + [ + 29, + 0.7493796536392181 + ], + [ + 30, + 0.7493815981479246 + ], + [ + 31, + 0.7493623953227052 + ], + [ + 32, + 0.7493714793640737 + ], + [ + 33, + 0.7493764149643402 + ], + [ + 34, + 0.7493924611144313 + ], + [ + 35, + 0.7493682567855126 + ], + [ + 36, + 0.7493617466290655 + ], + [ + 37, + 0.7493704769253654 + ], + [ + 38, + 0.749364511476785 + ], + [ + 39, + 0.7493487010999397 + ], + [ + 40, + 0.7493669261600524 + ], + [ + 41, + 0.7493560475686346 + ], + [ + 42, + 0.7493803044479502 + ], + [ + 43, + 0.7493788648584025 + ], + [ + 44, + 0.7493798778374525 + ], + [ + 45, + 0.7493651396584137 + ], + [ + 46, + 0.7493552045661347 + ], + [ + 47, + 0.7493729246021084 + ], + [ + 48, + 0.7493537313829601 + ], + [ + 49, + 0.7493827162435386 + ], + [ + 50, + 0.7493576430091816 + ], + [ + 51, + 0.7493604521014898 + ], + [ + 52, + 0.7493745756303004 + ], + [ + 53, + 0.7493613106607291 + ], + [ + 54, + 0.7493819623812891 + ], + [ + 55, + 0.7493775018999356 + ], + [ + 56, + 0.7493898504865194 + ], + [ + 57, + 0.7493854228839159 + ], + [ + 58, + 0.7493921795264545 + ], + [ + 59, + 0.7493614757989889 + ], + [ + 60, + 0.7493846420331053 + ], + [ + 61, + 0.7493759850668327 + ], + [ + 62, + 0.7494039517917349 + ], + [ + 63, + 0.7493645538488906 + ], + [ + 64, + 0.7493858809378218 + ], + [ + 65, + 0.749382843410981 + ], + [ + 66, + 0.7493601441202046 + ], + [ + 67, + 0.7493684406388421 + ], + [ + 68, + 0.749374369432499 + ], + [ + 69, + 0.7493906263596096 + ], + [ + 70, + 0.7493647075621254 + ], + [ + 71, + 0.7493811987237541 + ], + [ + 72, + 0.7493655957605927 + ], + [ + 73, + 0.7493640673929639 + ], + [ + 74, + 0.749398196804206 + ], + [ + 75, + 0.7493917599647075 + ], + [ + 76, + 0.7493809179743072 + ], + [ + 77, + 0.749353315616542 + ], + [ + 78, + 0.749385558142852 + ], + [ + 79, + 0.749366959825757 + ], + [ + 80, + 0.7493677037146079 + ], + [ + 81, + 0.7493588560245095 + ], + [ + 82, + 0.7493731044418906 + ], + [ + 83, + 0.749372858756826 + ], + [ + 84, + 0.7493648726008507 + ], + [ + 85, + 0.7493626112188468 + ], + [ + 86, + 0.7493844679969018 + ], + [ + 87, + 0.7493600602773467 + ], + [ + 88, + 0.749374010047192 + ], + [ + 89, + 0.7493398289894967 + ], + [ + 90, + 0.7493728568131478 + ], + [ + 91, + 0.7493648528938069 + ], + [ + 92, + 0.749379987144675 + ], + [ + 93, + 0.749379012553428 + ], + [ + 94, + 0.7493564874397597 + ], + [ + 95, + 0.7493693097759272 + ], + [ + 96, + 0.749372332695717 + ], + [ + 97, + 0.7493727628665475 + ], + [ + 98, + 0.7493753051079124 + ], + [ + 99, + 0.7493838413921884 + ], + [ + 100, + 0.7493817605382551 + ] + ] + }, + "blend_random_freeze_after_1": { + "test_acc": [ + 0.3063, + 0.2032, + 0.1273, + 0.1407, + 0.1227, + 0.1319, + 0.1227, + 0.1423, + 0.1406, + 0.1236, + 0.1189, + 0.1452, + 0.1251, + 0.1218, + 0.1289, + 0.1275, + 0.1214, + 0.1205, + 0.1383, + 0.1194, + 0.1175, + 0.1348, + 0.1399, + 0.1337, + 0.1299, + 0.1347, + 0.1261, + 0.1214, + 0.1429, + 0.1205, + 0.1292, + 0.14, + 0.1265, + 0.1458, + 0.125, + 0.122, + 0.1374, + 0.1398, + 0.1335, + 0.1295, + 0.1391, + 0.1338, + 0.1271, + 0.1384, + 0.1451, + 0.146, + 0.1351, + 0.1455, + 0.1192, + 0.124, + 0.1355, + 0.1205, + 0.1245, + 0.143, + 0.1442, + 0.1276, + 0.1451, + 0.1287, + 0.145, + 0.1261, + 0.1444, + 0.1342, + 0.1202, + 0.1272, + 0.1398, + 0.1416, + 0.1185, + 0.1345, + 0.141, + 0.1406, + 0.1437, + 0.1351, + 0.1352, + 0.1454, + 0.1427, + 0.1334, + 0.1436, + 0.1433, + 0.143, + 0.1176, + 0.1329, + 0.133, + 0.1345, + 0.1346, + 0.1349, + 0.1442, + 0.1458, + 0.143, + 0.1443, + 0.1416, + 0.1432, + 0.1435, + 0.1437, + 0.1438, + 0.1438 + ], + "train_loss": [ + 1.9885120925903321, + 2.0761205434417724, + 2.230262163696289, + 2.2778841004943846, + 2.2938861424255372, + 2.295684944229126, + 2.297641329574585, + 2.298973360443115, + 2.294463068695068, + 2.296937135620117, + 2.296987574005127, + 2.295542655105591, + 2.2948559199523926, + 2.29499972946167, + 2.2935732513427736, + 2.293764686279297, + 2.2939922271728515, + 2.2954816610717774, + 2.293695736236572, + 2.293420573272705, + 2.292508361053467, + 2.292823321685791, + 2.2922408909606933, + 2.2910657302093504, + 2.2923990909576415, + 2.291787723312378, + 2.2910885387420654, + 2.2904720906066895, + 2.2900661878204347, + 2.290612805328369, + 2.2922181576538088, + 2.2916324267578125, + 2.2893353955078126, + 2.2892222313690187, + 2.2895913304138182, + 2.2891984420776366, + 2.2897861616516115, + 2.288906211013794, + 2.287695652923584, + 2.2881334494781496, + 2.288540917892456, + 2.288068819885254, + 2.2882668949890137, + 2.289553168182373, + 2.28741283493042, + 2.287084792022705, + 2.287241609802246, + 2.286262402496338, + 2.287431600341797, + 2.2859934727478026, + 2.2863884370422363, + 2.2855619835662844, + 2.285059044265747, + 2.285717262420654, + 2.2851440204620364, + 2.2853235563659666, + 2.285508095550537, + 2.284884995803833, + 2.2841670207214357, + 2.2842117460632325, + 2.2844207135772705, + 2.284843815765381, + 2.2833426860809327, + 2.2847967240142824, + 2.2843006983184813, + 2.2830437184906005, + 2.2828539336395264, + 2.283909013595581, + 2.283869965133667, + 2.2835022590637206, + 2.283671631164551, + 2.2828954322052004, + 2.2837038899230957, + 2.2823268105316163, + 2.2824643184661864, + 2.282547272720337, + 2.2829145204162598, + 2.2820186660003663, + 2.2827925469207764, + 2.282179147338867, + 2.282109367904663, + 2.2820095054626464, + 2.2816736547851564, + 2.2822063021850587, + 2.2824253468322753, + 2.2817126638793943, + 2.2823937452697756, + 2.281291566543579, + 2.282202901000977, + 2.2823980027770996, + 2.281220394439697, + 2.2813532514190675, + 2.2817853865051267, + 2.281285207366943, + 2.2816215362548826 + ], + "gamma": [ + [ + 6, + 0.0226771094603464 + ], + [ + 7, + 0.018273803289048374 + ], + [ + 8, + 0.022315494250506163 + ], + [ + 9, + 0.02100165915908292 + ], + [ + 10, + 0.016694228834239766 + ], + [ + 13, + 0.0118214536778396 + ], + [ + 15, + 0.008569155354052782 + ], + [ + 20, + 0.005392427754486562 + ], + [ + 25, + 0.00896685284897103 + ], + [ + 35, + 0.005980721532523603 + ], + [ + 45, + 0.007969904990005716 + ], + [ + 55, + 0.006948693706092968 + ], + [ + 65, + 0.006855892404971087 + ], + [ + 75, + 0.006548671450985921 + ], + [ + 85, + 0.005674670293529971 + ], + [ + 95, + 0.006074464247149081 + ], + [ + 100, + 0.006020089146772989 + ] + ], + "rho": [ + [ + 6, + 0.005136748077347875 + ], + [ + 7, + 0.013638765143696219 + ], + [ + 8, + 0.0026725411880761385 + ], + [ + 9, + -4.764541517943144e-05 + ], + [ + 10, + 0.002810525242239237 + ], + [ + 13, + -0.0014697947772219777 + ], + [ + 15, + 0.007574135437607765 + ], + [ + 20, + 9.234785102307796e-05 + ], + [ + 25, + 0.0022132452577352524 + ], + [ + 35, + 0.0025958193000406027 + ], + [ + 45, + -0.0014452249743044376 + ], + [ + 55, + -0.006561175920069218 + ], + [ + 65, + 0.006800537463277578 + ], + [ + 75, + 0.0004066654946655035 + ], + [ + 85, + -0.00431265402585268 + ], + [ + 95, + 0.00305967777967453 + ], + [ + 100, + -0.006211055442690849 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499212197100755 + ], + [ + 7, + 0.7499024856318292 + ], + [ + 8, + 0.7499319673934342 + ], + [ + 9, + 0.7499395970672296 + ], + [ + 10, + 0.7499431338929365 + ], + [ + 11, + 0.7499451968801987 + ], + [ + 12, + 0.7499465867049562 + ], + [ + 13, + 0.7499476422536362 + ], + [ + 14, + 0.7499484656371325 + ], + [ + 15, + 0.7499491977198112 + ], + [ + 16, + 0.7499498216952964 + ], + [ + 17, + 0.7499503794749826 + ], + [ + 18, + 0.7499508528867302 + ], + [ + 19, + 0.7499512869664006 + ], + [ + 20, + 0.7499516601427744 + ], + [ + 21, + 0.7499519864052889 + ], + [ + 22, + 0.7499523064733358 + ], + [ + 23, + 0.7499526089508433 + ], + [ + 24, + 0.749952882354241 + ], + [ + 25, + 0.7499531608515829 + ], + [ + 26, + 0.7499534033295001 + ], + [ + 27, + 0.7499536259687262 + ], + [ + 28, + 0.7499538391637108 + ], + [ + 29, + 0.7499540315490518 + ], + [ + 30, + 0.7499542277574561 + ], + [ + 31, + 0.7499544090025009 + ], + [ + 32, + 0.749954588810981 + ], + [ + 33, + 0.7499547605309729 + ], + [ + 34, + 0.7499549214785973 + ], + [ + 35, + 0.749955081906797 + ], + [ + 36, + 0.7499552256254782 + ], + [ + 37, + 0.7499553760836208 + ], + [ + 38, + 0.7499555201660311 + ], + [ + 39, + 0.7499556578726498 + ], + [ + 40, + 0.7499558101880698 + ], + [ + 41, + 0.7499559520076509 + ], + [ + 42, + 0.7499560894172485 + ], + [ + 43, + 0.7499562191698678 + ], + [ + 44, + 0.7499563382921131 + ], + [ + 45, + 0.7499564438303168 + ], + [ + 46, + 0.7499565391022466 + ], + [ + 47, + 0.7499566237337427 + ], + [ + 48, + 0.7499567041709162 + ], + [ + 49, + 0.7499567712266514 + ], + [ + 50, + 0.7499568361920005 + ], + [ + 51, + 0.749956898750056 + ], + [ + 52, + 0.7499569438134133 + ], + [ + 53, + 0.7499569908254526 + ], + [ + 54, + 0.7499570420350408 + ], + [ + 55, + 0.7499570775301238 + ], + [ + 56, + 0.7499571016564673 + ], + [ + 57, + 0.7499571459746414 + ], + [ + 58, + 0.7499571891869481 + ], + [ + 59, + 0.7499572110038194 + ], + [ + 60, + 0.749957236354002 + ], + [ + 61, + 0.7499572662894795 + ], + [ + 62, + 0.7499572911271395 + ], + [ + 63, + 0.7499573173336485 + ], + [ + 64, + 0.7499573392179685 + ], + [ + 65, + 0.749957359288327 + ], + [ + 66, + 0.749957377204341 + ], + [ + 67, + 0.749957394189893 + ], + [ + 68, + 0.749957415460572 + ], + [ + 69, + 0.7499574298905061 + ], + [ + 70, + 0.7499574504969908 + ], + [ + 71, + 0.7499574570612607 + ], + [ + 72, + 0.7499574808032011 + ], + [ + 73, + 0.7499574914435875 + ], + [ + 74, + 0.7499575046833561 + ], + [ + 75, + 0.7499575174477293 + ], + [ + 76, + 0.7499575343827153 + ], + [ + 77, + 0.7499575338567375 + ], + [ + 78, + 0.7499575504747613 + ], + [ + 79, + 0.7499575599418454 + ], + [ + 80, + 0.7499575676658329 + ], + [ + 81, + 0.7499575752145811 + ], + [ + 82, + 0.74995758071355 + ], + [ + 83, + 0.7499575876654663 + ], + [ + 84, + 0.7499575940948701 + ], + [ + 85, + 0.7499575954603194 + ], + [ + 86, + 0.7499576004871666 + ], + [ + 87, + 0.7499575992228616 + ], + [ + 88, + 0.7499576131908711 + ], + [ + 89, + 0.7499576097857281 + ], + [ + 90, + 0.7499576155374349 + ], + [ + 91, + 0.7499576194786625 + ], + [ + 92, + 0.7499576219937862 + ], + [ + 93, + 0.7499576193168133 + ], + [ + 94, + 0.7499576203215673 + ], + [ + 95, + 0.7499576204193835 + ], + [ + 96, + 0.7499576158408036 + ], + [ + 97, + 0.7499576177929302 + ], + [ + 98, + 0.7499576268251236 + ], + [ + 99, + 0.7499576217915709 + ], + [ + 100, + 0.7499576206351348 + ] + ] + }, + "blend_random_freeze_after_5": { + "test_acc": [ + 0.3057, + 0.3121, + 0.3176, + 0.3081, + 0.3076, + 0.2275, + 0.1555, + 0.1352, + 0.1333, + 0.1123, + 0.1447, + 0.1549, + 0.1184, + 0.131, + 0.1215, + 0.1274, + 0.121, + 0.1214, + 0.1219, + 0.1173, + 0.117, + 0.1384, + 0.1364, + 0.1385, + 0.1269, + 0.124, + 0.1228, + 0.1189, + 0.1414, + 0.1208, + 0.1269, + 0.1394, + 0.12, + 0.1429, + 0.1241, + 0.1209, + 0.1378, + 0.1362, + 0.1326, + 0.1277, + 0.1372, + 0.1136, + 0.128, + 0.1333, + 0.1416, + 0.142, + 0.1323, + 0.125, + 0.1194, + 0.1136, + 0.1338, + 0.1253, + 0.1243, + 0.1417, + 0.1427, + 0.1245, + 0.1446, + 0.1173, + 0.1155, + 0.1251, + 0.1435, + 0.1346, + 0.1229, + 0.1181, + 0.141, + 0.1418, + 0.118, + 0.1345, + 0.14, + 0.1457, + 0.1436, + 0.1352, + 0.1345, + 0.145, + 0.1421, + 0.1342, + 0.1345, + 0.1407, + 0.1431, + 0.118, + 0.1345, + 0.1354, + 0.1332, + 0.118, + 0.1353, + 0.1333, + 0.144, + 0.1421, + 0.1439, + 0.1289, + 0.1445, + 0.1411, + 0.1421, + 0.143, + 0.143 + ], + "train_loss": [ + 1.986709086303711, + 1.9856938624572753, + 1.9857408505249023, + 1.9869411079406738, + 1.9924460929107666, + 2.065664505157471, + 2.188273988494873, + 2.2466244148254395, + 2.271299695587158, + 2.28955681350708, + 2.297678905792236, + 2.2992174604034425, + 2.300583914337158, + 2.300704315338135, + 2.29892277053833, + 2.29928806098938, + 2.299401301345825, + 2.3006060648345947, + 2.2990310078430176, + 2.298429386138916, + 2.297889120941162, + 2.2977303551483153, + 2.2972964846801758, + 2.2962034020233153, + 2.296949835205078, + 2.297126563796997, + 2.2956148274993895, + 2.294817444534302, + 2.294436751174927, + 2.2950318000030516, + 2.296592710418701, + 2.295585599975586, + 2.2933802742004397, + 2.293261420288086, + 2.293370549621582, + 2.29287371963501, + 2.293215133666992, + 2.2926715459442137, + 2.2913270640563965, + 2.2918275312042238, + 2.2921436554718015, + 2.2917427026367188, + 2.2918095041656494, + 2.293215352859497, + 2.290927030715942, + 2.2903220557403565, + 2.2907896925354003, + 2.289483503417969, + 2.290825044403076, + 2.2892746055603026, + 2.290025728302002, + 2.2888286866760255, + 2.2882002299499513, + 2.2888796851348876, + 2.288195140609741, + 2.2884540342712403, + 2.2888086296081545, + 2.287996703338623, + 2.287258808746338, + 2.287319690093994, + 2.287380068283081, + 2.2877273332214356, + 2.2862229296875, + 2.287708251419067, + 2.2872046815490723, + 2.2860105876159666, + 2.2856850257110595, + 2.286888239746094, + 2.286637530593872, + 2.2864006828308105, + 2.2864431773376466, + 2.285773974761963, + 2.2863538861083983, + 2.2849072905731203, + 2.2852252075195314, + 2.285120125808716, + 2.285544990386963, + 2.284608533935547, + 2.285385781326294, + 2.2849736070251465, + 2.284644779510498, + 2.284583871459961, + 2.284174046859741, + 2.284768877105713, + 2.2850564936828612, + 2.284282191696167, + 2.2848409812927244, + 2.2838416215515136, + 2.2848528610229493, + 2.2848921446228028, + 2.2837032903289796, + 2.283878885421753, + 2.28442051902771, + 2.283711439285278, + 2.284164406585693 + ], + "gamma": [ + [ + 6, + 0.03155870421323925 + ], + [ + 7, + 0.030853431904688478 + ], + [ + 8, + 0.02669353107921779 + ], + [ + 9, + 0.04021082253893837 + ], + [ + 10, + 0.02785447984933853 + ], + [ + 13, + 0.009877135511487722 + ], + [ + 15, + 0.013345680315978825 + ], + [ + 20, + 0.01822983069723705 + ], + [ + 25, + 0.02449846071203865 + ], + [ + 35, + 0.008210629923269153 + ], + [ + 45, + 0.013970461225426334 + ], + [ + 55, + 0.013153882991474575 + ], + [ + 65, + 0.012924989430075584 + ], + [ + 75, + 0.01255605021270867 + ], + [ + 85, + 0.010964347789496287 + ], + [ + 95, + 0.011661061071279732 + ], + [ + 100, + 0.01153306716068414 + ] + ], + "rho": [ + [ + 6, + -0.00038986606523394585 + ], + [ + 7, + 0.003939110552892089 + ], + [ + 8, + -0.008288708748295903 + ], + [ + 9, + 0.006352564319968224 + ], + [ + 10, + 0.003459762316197157 + ], + [ + 13, + -0.0020975149236619473 + ], + [ + 15, + -0.002305691596120596 + ], + [ + 20, + -0.0023182069417089224 + ], + [ + 25, + -0.009444743394851685 + ], + [ + 35, + 0.002495761029422283 + ], + [ + 45, + -0.003406036412343383 + ], + [ + 55, + -0.00597015954554081 + ], + [ + 65, + -0.008500710129737854 + ], + [ + 75, + -0.0017160457791760564 + ], + [ + 85, + -0.00019435398280620575 + ], + [ + 95, + -0.005632538348436356 + ], + [ + 100, + 0.010569632984697819 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499212107796505 + ], + [ + 7, + 0.7498528185962008 + ], + [ + 8, + 0.7497876571533472 + ], + [ + 9, + 0.7497269655928557 + ], + [ + 10, + 0.7496997642722671 + ], + [ + 11, + 0.7496945326114705 + ], + [ + 12, + 0.7497726365416734 + ], + [ + 13, + 0.7498108788064575 + ], + [ + 14, + 0.7498236977077778 + ], + [ + 15, + 0.749829508716111 + ], + [ + 16, + 0.7498335861585433 + ], + [ + 17, + 0.7498370685320528 + ], + [ + 18, + 0.7498402778006952 + ], + [ + 19, + 0.7498432276623289 + ], + [ + 20, + 0.7498458081573879 + ], + [ + 21, + 0.7498480619416539 + ], + [ + 22, + 0.7498499112601706 + ], + [ + 23, + 0.7498514802587081 + ], + [ + 24, + 0.7498528096051518 + ], + [ + 25, + 0.7498540019321015 + ], + [ + 26, + 0.7498550528840675 + ], + [ + 27, + 0.7498559698539567 + ], + [ + 28, + 0.7498567911115943 + ], + [ + 29, + 0.749857566886694 + ], + [ + 30, + 0.7498583052715652 + ], + [ + 31, + 0.7498590404228719 + ], + [ + 32, + 0.749859714970948 + ], + [ + 33, + 0.7498603463670913 + ], + [ + 34, + 0.7498608917921542 + ], + [ + 35, + 0.7498613438542885 + ], + [ + 36, + 0.7498617154807191 + ], + [ + 37, + 0.7498619536148421 + ], + [ + 38, + 0.7498620909216565 + ], + [ + 39, + 0.7498621543267309 + ], + [ + 40, + 0.749862060406788 + ], + [ + 41, + 0.7498618841088817 + ], + [ + 42, + 0.7498616681490198 + ], + [ + 43, + 0.7498613902038908 + ], + [ + 44, + 0.7498610584144705 + ], + [ + 45, + 0.7498607010313652 + ], + [ + 46, + 0.7498603161791532 + ], + [ + 47, + 0.7498599164455008 + ], + [ + 48, + 0.7498595232666123 + ], + [ + 49, + 0.7498590958460849 + ], + [ + 50, + 0.7498586592021772 + ], + [ + 51, + 0.7498582383751307 + ], + [ + 52, + 0.749857847542827 + ], + [ + 53, + 0.7498573739407272 + ], + [ + 54, + 0.7498569834772216 + ], + [ + 55, + 0.7498566489428903 + ], + [ + 56, + 0.7498562327888529 + ], + [ + 57, + 0.7498558698686884 + ], + [ + 58, + 0.7498555493443314 + ], + [ + 59, + 0.7498552811370571 + ], + [ + 60, + 0.7498549487912574 + ], + [ + 61, + 0.7498546960468907 + ], + [ + 62, + 0.7498544060062654 + ], + [ + 63, + 0.7498541988974751 + ], + [ + 64, + 0.7498539576374978 + ], + [ + 65, + 0.7498537409716542 + ], + [ + 66, + 0.7498535307747923 + ], + [ + 67, + 0.7498533419195366 + ], + [ + 68, + 0.7498531947832188 + ], + [ + 69, + 0.749853023106332 + ], + [ + 70, + 0.7498528461986017 + ], + [ + 71, + 0.749852717577081 + ], + [ + 72, + 0.7498525422243073 + ], + [ + 73, + 0.7498524360618399 + ], + [ + 74, + 0.749852326241415 + ], + [ + 75, + 0.7498522140626529 + ], + [ + 76, + 0.7498521204452114 + ], + [ + 77, + 0.7498520311237458 + ], + [ + 78, + 0.7498519479769574 + ], + [ + 79, + 0.7498518422828333 + ], + [ + 80, + 0.7498517599526828 + ], + [ + 81, + 0.7498517247145857 + ], + [ + 82, + 0.7498516684949844 + ], + [ + 83, + 0.7498516197832401 + ], + [ + 84, + 0.74985155412182 + ], + [ + 85, + 0.7498515355900542 + ], + [ + 86, + 0.7498514845196694 + ], + [ + 87, + 0.7498514612905921 + ], + [ + 88, + 0.7498514061403054 + ], + [ + 89, + 0.7498513745431571 + ], + [ + 90, + 0.7498513783864412 + ], + [ + 91, + 0.7498513570437203 + ], + [ + 92, + 0.7498513428884045 + ], + [ + 93, + 0.7498513538717607 + ], + [ + 94, + 0.7498513209180501 + ], + [ + 95, + 0.7498513234252093 + ], + [ + 96, + 0.7498513092258868 + ], + [ + 97, + 0.749851332383995 + ], + [ + 98, + 0.74985129756099 + ], + [ + 99, + 0.7498512950098275 + ], + [ + 100, + 0.7498513107344179 + ] + ] + }, + "blend_random_freeze_after_10": { + "test_acc": [ + 0.3068, + 0.3136, + 0.3192, + 0.3089, + 0.3114, + 0.3063, + 0.3078, + 0.3036, + 0.2979, + 0.3096, + 0.2179, + 0.1748, + 0.1378, + 0.1336, + 0.1181, + 0.1128, + 0.1455, + 0.1036, + 0.129, + 0.1169, + 0.1216, + 0.1377, + 0.1299, + 0.1349, + 0.124, + 0.1225, + 0.1224, + 0.1163, + 0.1391, + 0.1219, + 0.1258, + 0.1357, + 0.1209, + 0.1412, + 0.1213, + 0.1178, + 0.1351, + 0.1348, + 0.1311, + 0.1239, + 0.1283, + 0.1147, + 0.1267, + 0.121, + 0.1391, + 0.1416, + 0.1322, + 0.1233, + 0.12, + 0.1156, + 0.1346, + 0.1335, + 0.1221, + 0.1394, + 0.1402, + 0.1256, + 0.142, + 0.1091, + 0.1168, + 0.124, + 0.1168, + 0.1326, + 0.1237, + 0.1144, + 0.139, + 0.1395, + 0.1163, + 0.1333, + 0.1373, + 0.1413, + 0.1409, + 0.1342, + 0.1332, + 0.1423, + 0.1397, + 0.1334, + 0.1183, + 0.1317, + 0.1406, + 0.1178, + 0.1332, + 0.1331, + 0.1324, + 0.1128, + 0.132, + 0.1302, + 0.1405, + 0.1402, + 0.1403, + 0.1155, + 0.1419, + 0.1408, + 0.1299, + 0.1294, + 0.1298 + ], + "train_loss": [ + 1.9881320515441894, + 1.9870186071777343, + 1.9866066049194335, + 1.9788966651153563, + 1.983320122642517, + 1.9800231924819947, + 1.9782171863555909, + 1.9803499440002441, + 1.9775104429626464, + 1.978521219139099, + 2.055931195602417, + 2.1806510187530517, + 2.2426024320220947, + 2.2739720858764647, + 2.2868179563903808, + 2.2959177317047117, + 2.2989520695495607, + 2.301827975311279, + 2.3013604727935792, + 2.300691455078125, + 2.3002707484436034, + 2.2999929568481443, + 2.2992140190124513, + 2.2985281761932375, + 2.298954692993164, + 2.299465831298828, + 2.2978392871856688, + 2.297249239654541, + 2.2968861849212647, + 2.2975925408935547, + 2.299312409133911, + 2.298013726577759, + 2.2960053624725343, + 2.2958316496276856, + 2.295717995529175, + 2.29549167678833, + 2.2956369426727297, + 2.295159391708374, + 2.2939567210388185, + 2.294398659133911, + 2.2947351665496827, + 2.2943758375549317, + 2.2943764640808104, + 2.2959127186584474, + 2.293632814407349, + 2.292774415283203, + 2.29338448928833, + 2.2919403810119627, + 2.293427130661011, + 2.2917928271484374, + 2.2928208229064944, + 2.291327280807495, + 2.290728750305176, + 2.2914211921691896, + 2.290752984085083, + 2.2909728344726563, + 2.2913581065368653, + 2.2904867668914797, + 2.2898236507415772, + 2.2899002440643312, + 2.289705597457886, + 2.290143021392822, + 2.28862012840271, + 2.2900324601745607, + 2.2896193817901613, + 2.2885303899383547, + 2.2881026596069334, + 2.289370965118408, + 2.2890094148254394, + 2.2887696474456787, + 2.288681288909912, + 2.2881503539276125, + 2.288611475830078, + 2.2871972442626953, + 2.287553341674805, + 2.287350797958374, + 2.2876590617370605, + 2.286870872344971, + 2.2875029762268064, + 2.287281789703369, + 2.286849340667725, + 2.286843361053467, + 2.286285085296631, + 2.286966771469116, + 2.2872533617401123, + 2.2865214878082276, + 2.2868791717529295, + 2.285948681564331, + 2.2870913939666746, + 2.2869653445434572, + 2.285891586151123, + 2.2860418113708496, + 2.2865823564910888, + 2.2858644956970213, + 2.286282457962036 + ], + "gamma": [ + [ + 6, + 0.03577435575425625 + ], + [ + 7, + 0.02594527183100581 + ], + [ + 8, + 0.019803995557595044 + ], + [ + 9, + 0.023345530848018825 + ], + [ + 10, + 0.028913925169035792 + ], + [ + 13, + 0.0333862743282225 + ], + [ + 15, + 0.028461035108193755 + ], + [ + 20, + 0.013225269212853163 + ], + [ + 25, + 0.026851321141293738 + ], + [ + 35, + 0.01460943155871064 + ], + [ + 45, + 0.0214682377356894 + ], + [ + 55, + 0.01993026031232148 + ], + [ + 65, + 0.019510357384092458 + ], + [ + 75, + 0.019181935362439617 + ], + [ + 85, + 0.017001007566932458 + ], + [ + 95, + 0.01799813916977655 + ], + [ + 100, + 0.017798602316588585 + ] + ], + "rho": [ + [ + 6, + 0.008851037011481822 + ], + [ + 7, + 0.010623326292261481 + ], + [ + 8, + 0.006243920885026455 + ], + [ + 9, + 0.018517075921408832 + ], + [ + 10, + 0.019994840724393725 + ], + [ + 13, + -0.003194989636540413 + ], + [ + 15, + 0.013649753760546446 + ], + [ + 20, + 0.0033422389533370733 + ], + [ + 25, + -0.0046805706806480885 + ], + [ + 35, + -0.006440741941332817 + ], + [ + 45, + -0.006845635827630758 + ], + [ + 55, + 0.00424462603405118 + ], + [ + 65, + 0.008816015906631947 + ], + [ + 75, + -0.004470052197575569 + ], + [ + 85, + -0.00485114473849535 + ], + [ + 95, + 0.003956635016947985 + ], + [ + 100, + -0.009871503338217735 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499193180455133 + ], + [ + 7, + 0.7498498951928352 + ], + [ + 8, + 0.7497853275435375 + ], + [ + 9, + 0.7497583213788145 + ], + [ + 10, + 0.7496802137700671 + ], + [ + 11, + 0.7496336473357863 + ], + [ + 12, + 0.7495944234730211 + ], + [ + 13, + 0.7495856134523137 + ], + [ + 14, + 0.7495378145517163 + ], + [ + 15, + 0.7495203656557123 + ], + [ + 16, + 0.749595675138455 + ], + [ + 17, + 0.7496260288222706 + ], + [ + 18, + 0.7496405775473204 + ], + [ + 19, + 0.7496439416568822 + ], + [ + 20, + 0.7496436035869247 + ], + [ + 21, + 0.7496418566541048 + ], + [ + 22, + 0.7496398332785688 + ], + [ + 23, + 0.7496378150693942 + ], + [ + 24, + 0.7496360547295424 + ], + [ + 25, + 0.7496347410096641 + ], + [ + 26, + 0.7496337641962749 + ], + [ + 27, + 0.749633142211968 + ], + [ + 28, + 0.7496326525979851 + ], + [ + 29, + 0.7496323165710145 + ], + [ + 30, + 0.7496321006433524 + ], + [ + 31, + 0.7496319818274026 + ], + [ + 32, + 0.7496320191619597 + ], + [ + 33, + 0.7496322547896026 + ], + [ + 34, + 0.7496326005447648 + ], + [ + 35, + 0.749633079285126 + ], + [ + 36, + 0.7496336269858973 + ], + [ + 37, + 0.7496342560321766 + ], + [ + 38, + 0.7496349100853218 + ], + [ + 39, + 0.7496355510132134 + ], + [ + 40, + 0.7496362531526267 + ], + [ + 41, + 0.7496369420344482 + ], + [ + 42, + 0.7496375791497651 + ], + [ + 43, + 0.7496382069287194 + ], + [ + 44, + 0.7496388242679449 + ], + [ + 45, + 0.7496393759112324 + ], + [ + 46, + 0.7496399419288853 + ], + [ + 47, + 0.7496404388552795 + ], + [ + 48, + 0.7496409375102326 + ], + [ + 49, + 0.7496413907226306 + ], + [ + 50, + 0.7496418546650437 + ], + [ + 51, + 0.7496423077489263 + ], + [ + 52, + 0.749642663069428 + ], + [ + 53, + 0.749643060698477 + ], + [ + 54, + 0.7496434160776027 + ], + [ + 55, + 0.7496436851345508 + ], + [ + 56, + 0.7496439725611305 + ], + [ + 57, + 0.7496443179024123 + ], + [ + 58, + 0.7496445984967786 + ], + [ + 59, + 0.7496447819587829 + ], + [ + 60, + 0.7496450557382539 + ], + [ + 61, + 0.7496452667699693 + ], + [ + 62, + 0.7496454587106002 + ], + [ + 63, + 0.7496456532096109 + ], + [ + 64, + 0.7496458126259359 + ], + [ + 65, + 0.7496459772222902 + ], + [ + 66, + 0.7496461469941117 + ], + [ + 67, + 0.7496462543422839 + ], + [ + 68, + 0.7496463845246278 + ], + [ + 69, + 0.7496464831191557 + ], + [ + 70, + 0.7496466277675442 + ], + [ + 71, + 0.7496467035339424 + ], + [ + 72, + 0.7496468599431467 + ], + [ + 73, + 0.7496468933974064 + ], + [ + 74, + 0.7496469773700104 + ], + [ + 75, + 0.7496470592440312 + ], + [ + 76, + 0.7496471400320178 + ], + [ + 77, + 0.7496471817124153 + ], + [ + 78, + 0.749647239774908 + ], + [ + 79, + 0.7496472965021626 + ], + [ + 80, + 0.7496473676715285 + ], + [ + 81, + 0.7496473739817566 + ], + [ + 82, + 0.749647428403859 + ], + [ + 83, + 0.7496474899750082 + ], + [ + 84, + 0.7496475077123036 + ], + [ + 85, + 0.7496475029501258 + ], + [ + 86, + 0.7496475523423989 + ], + [ + 87, + 0.749647543193304 + ], + [ + 88, + 0.7496476452948474 + ], + [ + 89, + 0.7496476172122094 + ], + [ + 90, + 0.7496476359495764 + ], + [ + 91, + 0.7496476560422746 + ], + [ + 92, + 0.7496476677099678 + ], + [ + 93, + 0.7496476121010561 + ], + [ + 94, + 0.7496476771397894 + ], + [ + 95, + 0.7496476691809392 + ], + [ + 96, + 0.7496476473565865 + ], + [ + 97, + 0.7496476403332835 + ], + [ + 98, + 0.7496476870492047 + ], + [ + 99, + 0.7496476723095268 + ], + [ + 100, + 0.7496476678215215 + ] + ] + } +} \ No newline at end of file diff --git a/results/online_shallow/scan_s42.json b/results/online_shallow/scan_s42.json new file mode 100644 index 0000000..b3dfeea --- /dev/null +++ b/results/online_shallow/scan_s42.json @@ -0,0 +1,422 @@ +[ + { + "method": "dfa", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.3116, + "mean_gamma": 0.10076353600015864, + "mean_rho": -0.00476757250726223, + "mean_nudge": -3.260793164372444e-07, + "per_layer_gamma": [ + 0.42987197637557983, + 0.002452872460708022, + -0.014306485652923584, + -0.014964219182729721 + ], + "per_layer_rho": [ + -0.01907029002904892, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -1.3024546205997467e-06, + -1.862645149230957e-09, + 0.0, + 0.0 + ] + }, + { + "method": "sb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.1737, + "mean_gamma": 0.02469697833294049, + "mean_rho": -0.012663604691624641, + "mean_nudge": -1.6051344573497772e-06, + "per_layer_gamma": [ + 0.02607825957238674, + 0.049343302845954895, + 0.002323275664821267, + 0.021043075248599052 + ], + "per_layer_rho": [ + -0.050654418766498566, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -6.420537829399109e-06, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.0, + "term_grad_weight": 1.0, + "test_acc": 0.1546, + "mean_gamma": 0.010205775421354701, + "mean_rho": 0.0012211860157549381, + "mean_nudge": -5.587935447692871e-09, + "per_layer_gamma": [ + 0.028749946504831314, + 0.012085458263754845, + 5.072341991763096e-06, + -1.7375425159116276e-05 + ], + "per_layer_rho": [ + 0.0048847440630197525, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -2.2351741790771484e-08, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.0, + "term_grad_weight": 4.0, + "test_acc": 0.1169, + "mean_gamma": 0.004216111148707569, + "mean_rho": 0.00741030735662207, + "mean_nudge": -7.916241884231567e-09, + "per_layer_gamma": [ + 0.0018346477299928665, + 0.019228298217058182, + -0.002127251587808132, + -0.0020712497644126415 + ], + "per_layer_rho": [ + 0.03154653310775757, + -0.001905303681269288, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -2.60770320892334e-08, + -5.587935447692871e-09, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.05, + "term_grad_weight": 1.0, + "test_acc": 0.1049, + "mean_gamma": -0.0009609744556655642, + "mean_rho": 0.0024358099326491356, + "mean_nudge": 3.259629011154175e-09, + "per_layer_gamma": [ + -0.004597642458975315, + -3.2639800338074565e-06, + 0.0004314985126256943, + 0.0003255101037211716 + ], + "per_layer_rho": [ + 0.009743239730596542, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + 1.30385160446167e-08, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.05, + "term_grad_weight": 4.0, + "test_acc": 0.1798, + "mean_gamma": 0.06056667093071155, + "mean_rho": 0.03483579680323601, + "mean_nudge": -1.0756775736808777e-06, + "per_layer_gamma": [ + 0.2081003189086914, + 0.033366840332746506, + 0.0005531693459488451, + 0.00024635513545945287 + ], + "per_layer_rho": [ + 0.13934318721294403, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -4.302710294723511e-06, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.283, + "mean_gamma": 0.17921950668096542, + "mean_rho": 0.008699589408934116, + "mean_nudge": -8.21426510810852e-07, + "per_layer_gamma": [ + 0.5069771409034729, + 0.05348020792007446, + 0.07490736246109009, + 0.08151331543922424 + ], + "per_layer_rho": [ + 0.034798357635736465, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -3.285706043243408e-06, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 4.0, + "test_acc": 0.2854, + "mean_gamma": 0.18741484452039003, + "mean_rho": 0.0021140535827726126, + "mean_nudge": -8.436618372797966e-07, + "per_layer_gamma": [ + 0.5276610851287842, + 0.046022433787584305, + 0.08646765351295471, + 0.08950820565223694 + ], + "per_layer_rho": [ + 0.00845621433109045, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -3.3746473491191864e-06, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_deltaL", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.0, + "term_grad_weight": 1.0, + "test_acc": 0.0953, + "mean_gamma": 0.00023498532198695798, + "mean_rho": -0.002640543971210718, + "mean_nudge": 4.190951585769653e-09, + "per_layer_gamma": [ + 0.0009388166945427656, + 1.1305664884275757e-06, + -2.059467707482554e-09, + -3.91361565377224e-09 + ], + "per_layer_rho": [ + -0.010562175884842873, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + 1.6763806343078613e-08, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_deltaL", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.0, + "term_grad_weight": 4.0, + "test_acc": 0.1084, + "mean_gamma": -0.000962152166505803, + "mean_rho": -0.006210822146385908, + "mean_nudge": 9.313225746154785e-10, + "per_layer_gamma": [ + -0.003848549909889698, + -5.8880857523035957e-08, + 4.6535258979574223e-10, + -3.4062858089711767e-10 + ], + "per_layer_rho": [ + -0.024843288585543633, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + 3.725290298461914e-09, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_deltaL", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.05, + "term_grad_weight": 1.0, + "test_acc": 0.1092, + "mean_gamma": 0.009919490943730125, + "mean_rho": -0.008342609740793705, + "mean_nudge": -2.3283064365386963e-10, + "per_layer_gamma": [ + 0.03979068249464035, + -0.0001326934725511819, + 2.563164889579639e-05, + -5.6568960644654e-06 + ], + "per_layer_rho": [ + -0.03337043896317482, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -9.313225746154785e-10, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_deltaL", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.05, + "term_grad_weight": 4.0, + "test_acc": 0.1155, + "mean_gamma": -0.0010879231473768236, + "mean_rho": -0.0036583333276212215, + "mean_nudge": 3.725290298461914e-09, + "per_layer_gamma": [ + -0.004351496696472168, + -1.6072939956757182e-07, + -2.6652518414493898e-08, + -8.51111714439412e-09 + ], + "per_layer_rho": [ + -0.014633333310484886, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + 1.4901161193847656e-08, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_deltaL", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.1851, + "mean_gamma": 0.0015729351434856653, + "mean_rho": 0.0014943215064704418, + "mean_nudge": -7.450580596923828e-09, + "per_layer_gamma": [ + -0.0012846197932958603, + 0.005665094591677189, + 0.004892412573099136, + -0.0029811467975378036 + ], + "per_layer_rho": [ + 0.005977286025881767, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -2.9802322387695312e-08, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_deltaL", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 4.0, + "test_acc": 0.1706, + "mean_gamma": 0.007908080180641264, + "mean_rho": -0.014252320863306522, + "mean_nudge": -6.565824151039124e-08, + "per_layer_gamma": [ + 0.020493682473897934, + -0.0016250908374786377, + 0.002295387675985694, + 0.010468341410160065 + ], + "per_layer_rho": [ + -0.01426580548286438, + -0.04274347797036171, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -2.6263296604156494e-07, + 0.0, + 0.0, + 0.0 + ] + } +] \ No newline at end of file diff --git a/results/online_shallow_3seed/scan_s123.json b/results/online_shallow_3seed/scan_s123.json new file mode 100644 index 0000000..ad5d91d --- /dev/null +++ b/results/online_shallow_3seed/scan_s123.json @@ -0,0 +1,62 @@ +[ + { + "method": "dfa", + "L": 4, + "d_hidden": 256, + "seed": 123, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.3106, + "mean_gamma": 0.11738517042249441, + "mean_rho": 0.005885639227926731, + "mean_nudge": -4.444736987352371e-07, + "per_layer_gamma": [ + 0.4517223834991455, + 0.012923447415232658, + 0.004009386524558067, + 0.0008854642510414124 + ], + "per_layer_rho": [ + 0.023542556911706924, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -1.7816200852394104e-06, + 3.725290298461914e-09, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 123, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.2753, + "mean_gamma": 0.17617796920239925, + "mean_rho": 0.0019302130676805973, + "mean_nudge": -7.422640919685364e-07, + "per_layer_gamma": [ + 0.5222728252410889, + 0.043591007590293884, + 0.0659613385796547, + 0.07288670539855957 + ], + "per_layer_rho": [ + 0.022736016660928726, + 0.0, + -0.015015164390206337, + 0.0 + ], + "per_layer_nudge": [ + -2.9690563678741455e-06, + 0.0, + 0.0, + 0.0 + ] + } +] \ No newline at end of file diff --git a/results/online_shallow_3seed/scan_s42.json b/results/online_shallow_3seed/scan_s42.json new file mode 100644 index 0000000..624919b --- /dev/null +++ b/results/online_shallow_3seed/scan_s42.json @@ -0,0 +1,62 @@ +[ + { + "method": "dfa", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.3116, + "mean_gamma": 0.10076353600015864, + "mean_rho": -0.00476757250726223, + "mean_nudge": -3.260793164372444e-07, + "per_layer_gamma": [ + 0.42987197637557983, + 0.002452872460708022, + -0.014306485652923584, + -0.014964219182729721 + ], + "per_layer_rho": [ + -0.01907029002904892, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -1.3024546205997467e-06, + -1.862645149230957e-09, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.283, + "mean_gamma": 0.17921950668096542, + "mean_rho": 0.008699589408934116, + "mean_nudge": -8.21426510810852e-07, + "per_layer_gamma": [ + 0.5069771409034729, + 0.05348020792007446, + 0.07490736246109009, + 0.08151331543922424 + ], + "per_layer_rho": [ + 0.034798357635736465, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -3.285706043243408e-06, + 0.0, + 0.0, + 0.0 + ] + } +] \ No newline at end of file diff --git a/results/online_shallow_3seed/scan_s456.json b/results/online_shallow_3seed/scan_s456.json new file mode 100644 index 0000000..09327b1 --- /dev/null +++ b/results/online_shallow_3seed/scan_s456.json @@ -0,0 +1,62 @@ +[ + { + "method": "dfa", + "L": 4, + "d_hidden": 256, + "seed": 456, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.297, + "mean_gamma": 0.09892195643624291, + "mean_rho": -0.004888533148914576, + "mean_nudge": -3.1944364309310913e-07, + "per_layer_gamma": [ + 0.3969520926475525, + -0.0020016406197100878, + -0.0031630932353436947, + 0.003900466952472925 + ], + "per_layer_rho": [ + -0.019554132595658302, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -1.2777745723724365e-06, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "cb_eT", + "L": 4, + "d_hidden": 256, + "seed": 456, + "warmup_ratio": 0.2, + "term_grad_weight": 1.0, + "test_acc": 0.2893, + "mean_gamma": 0.23417379707098007, + "mean_rho": -0.002338360995054245, + "mean_nudge": -5.409820005297661e-07, + "per_layer_gamma": [ + 0.41382449865341187, + 0.12546014785766602, + 0.1961553394794464, + 0.201255202293396 + ], + "per_layer_rho": [ + -0.00935344398021698, + 0.0, + 0.0, + 0.0 + ], + "per_layer_nudge": [ + -2.1639280021190643e-06, + 0.0, + 0.0, + 0.0 + ] + } +] \ No newline at end of file diff --git a/results/online_vec_pilot/pilot_s42.json b/results/online_vec_pilot/pilot_s42.json new file mode 100644 index 0000000..989a2d9 --- /dev/null +++ b/results/online_vec_pilot/pilot_s42.json @@ -0,0 +1,177 @@ +[ + { + "method": "dfa", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_weight": 1.0, + "M": 4, + "test_acc": 0.3116, + "mean_gamma": 0.10076353600015864, + "mean_rho": -0.00476757250726223, + "mean_nudge": -3.260793164372444e-07, + "per_layer_gamma": [ + 0.42987197637557983, + 0.002452872460708022, + -0.014306485652923584, + -0.014964219182729721 + ], + "per_layer_rho": [ + -0.01907029002904892, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.0, + "term_weight": 1.0, + "M": 4, + "test_acc": 0.1585, + "mean_gamma": 0.0070959172576294804, + "mean_rho": 0.004696090705692768, + "mean_nudge": 1.6298145055770874e-09, + "per_layer_gamma": [ + 0.02838953770697117, + -1.1787886251113378e-05, + 1.5722671378171071e-06, + 4.346942660049535e-06 + ], + "per_layer_rho": [ + 0.018784362822771072, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.0, + "term_weight": 4.0, + "M": 4, + "test_acc": 0.1547, + "mean_gamma": -0.004175424227696567, + "mean_rho": 0.007184227928519249, + "mean_nudge": -3.725290298461914e-09, + "per_layer_gamma": [ + -0.016694847494363785, + -1.839158903749194e-05, + 5.305797913024435e-06, + 6.2363747019844595e-06 + ], + "per_layer_rho": [ + 0.028736911714076996, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.05, + "term_weight": 1.0, + "M": 4, + "test_acc": 0.1301, + "mean_gamma": 0.0003392250334854907, + "mean_rho": -0.006982688792049885, + "mean_nudge": 2.561137080192566e-09, + "per_layer_gamma": [ + 0.0014179275603964925, + 2.4803875930956565e-06, + -5.080455230199732e-05, + -1.270326174562797e-05 + ], + "per_layer_rho": [ + -0.02793075516819954, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.05, + "term_weight": 4.0, + "M": 4, + "test_acc": 0.1585, + "mean_gamma": 0.001455232677017193, + "mean_rho": -0.004349564202129841, + "mean_nudge": 2.3283064365386963e-10, + "per_layer_gamma": [ + 0.005935228429734707, + -4.2289950215490535e-05, + -2.683553066162858e-05, + -4.517224078881554e-05 + ], + "per_layer_rho": [ + -0.017398256808519363, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_weight": 1.0, + "M": 4, + "test_acc": 0.2425, + "mean_gamma": 0.0011495156340970425, + "mean_rho": 0.00014320318587124348, + "mean_nudge": -8.847564458847046e-09, + "per_layer_gamma": [ + 0.004161187447607517, + 8.946975140133873e-05, + 0.00017050666792783886, + 0.00017689866945147514 + ], + "per_layer_rho": [ + 0.0005728127434849739, + 0.0, + 0.0, + 0.0 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "d": 256, + "seed": 42, + "warmup_ratio": 0.2, + "term_weight": 4.0, + "M": 4, + "test_acc": 0.1985, + "mean_gamma": 0.0039006864826660603, + "mean_rho": 0.0011303124483674765, + "mean_nudge": -1.234002411365509e-08, + "per_layer_gamma": [ + 0.014948057942092419, + 0.0001860432676039636, + 0.00021447567269206047, + 0.00025416904827579856 + ], + "per_layer_rho": [ + 0.004521249793469906, + 0.0, + 0.0, + 0.0 + ] + } +] \ No newline at end of file diff --git a/results/optionA_random_targets_s42.log b/results/optionA_random_targets_s42.log new file mode 100644 index 0000000..a3a42dd --- /dev/null +++ b/results/optionA_random_targets_s42.log @@ -0,0 +1,107 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=42 +eval buffer: torch.Size([1024, 3072]) + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652] ||g||_med=[0.0010068593546748161, 0.000997236929833889, 0.0009934091940522194, 0.0009870644425973296, 0.0009829498594626784] acc=0.1152 + [DFA] Ep 1: ||h_L||=1.616e+03 ||g_2||=5.122e-06 acc=0.0781 gamma_dfa=-0.0195 + [DFA] Ep 2: ||h_L||=1.391e+04 ||g_2||=5.878e-07 acc=0.0752 gamma_dfa=-0.0282 + [DFA] Ep 3: ||h_L||=4.246e+04 ||g_2||=1.870e-07 acc=0.1045 gamma_dfa=-0.0381 + [DFA] Ep 4: ||h_L||=9.624e+04 ||g_2||=8.071e-08 acc=0.1035 gamma_dfa=-0.0378 + [DFA] Ep 5: ||h_L||=1.850e+05 ||g_2||=4.153e-08 acc=0.0742 gamma_dfa=-0.0436 + [DFA] Ep 6: ||h_L||=3.073e+05 ||g_2||=2.394e-08 acc=0.0947 gamma_dfa=-0.0448 + [DFA] Ep 7: ||h_L||=4.777e+05 ||g_2||=1.513e-08 acc=0.1084 gamma_dfa=-0.0455 + [DFA] Ep 8: ||h_L||=6.985e+05 ||g_2||=1.015e-08 acc=0.1279 gamma_dfa=-0.0395 + [DFA] Ep 9: ||h_L||=9.675e+05 ||g_2||=7.060e-09 acc=0.0869 gamma_dfa=-0.0190 + [DFA] Ep 10: ||h_L||=1.307e+06 ||g_2||=5.129e-09 acc=0.1045 gamma_dfa=-0.0181 + [DFA] Ep 11: ||h_L||=1.716e+06 ||g_2||=3.838e-09 acc=0.1113 gamma_dfa=-0.0240 + [DFA] Ep 12: ||h_L||=2.196e+06 ||g_2||=2.895e-09 acc=0.0879 gamma_dfa=-0.0201 + [DFA] Ep 13: ||h_L||=2.781e+06 ||g_2||=2.258e-09 acc=0.0703 gamma_dfa=-0.0132 + [DFA] Ep 14: ||h_L||=3.421e+06 ||g_2||=1.784e-09 acc=0.1006 gamma_dfa=-0.0058 + [DFA] Ep 15: ||h_L||=4.226e+06 ||g_2||=1.396e-09 acc=0.0889 gamma_dfa=-0.0100 + [DFA] Ep 16: ||h_L||=5.056e+06 ||g_2||=1.131e-09 acc=0.0889 gamma_dfa=-0.0037 + [DFA] Ep 17: ||h_L||=5.866e+06 ||g_2||=9.453e-10 acc=0.0986 gamma_dfa=-0.0099 + [DFA] Ep 18: ||h_L||=6.858e+06 ||g_2||=7.787e-10 acc=0.0996 gamma_dfa=-0.0063 + [DFA] Ep 19: ||h_L||=8.041e+06 ||g_2||=6.544e-10 acc=0.1104 gamma_dfa=-0.0087 + [DFA] Ep 20: ||h_L||=9.318e+06 ||g_2||=5.474e-10 acc=0.1045 gamma_dfa=-0.0098 + [DFA] Ep 21: ||h_L||=1.077e+07 ||g_2||=4.567e-10 acc=0.0898 gamma_dfa=0.0014 + [DFA] Ep 22: ||h_L||=1.231e+07 ||g_2||=3.877e-10 acc=0.0928 gamma_dfa=-0.0015 + [DFA] Ep 23: ||h_L||=1.395e+07 ||g_2||=3.320e-10 acc=0.1006 gamma_dfa=-0.0039 + [DFA] Ep 24: ||h_L||=1.562e+07 ||g_2||=2.862e-10 acc=0.0889 gamma_dfa=-0.0053 + [DFA] Ep 25: ||h_L||=1.753e+07 ||g_2||=2.498e-10 acc=0.0811 gamma_dfa=-0.0011 + [DFA] Ep 26: ||h_L||=1.959e+07 ||g_2||=2.162e-10 acc=0.0752 gamma_dfa=0.0000 + [DFA] Ep 27: ||h_L||=2.174e+07 ||g_2||=1.882e-10 acc=0.1240 gamma_dfa=-0.0094 + [DFA] Ep 28: ||h_L||=2.396e+07 ||g_2||=1.655e-10 acc=0.0996 gamma_dfa=0.0049 + [DFA] Ep 29: ||h_L||=2.643e+07 ||g_2||=1.463e-10 acc=0.1191 gamma_dfa=-0.0017 + [DFA] Ep 30: ||h_L||=2.888e+07 ||g_2||=1.314e-10 acc=0.1348 gamma_dfa=-0.0005 + [DFA] Ep 31: ||h_L||=3.160e+07 ||g_2||=1.169e-10 acc=0.1182 gamma_dfa=-0.0009 + [DFA] Ep 32: ||h_L||=3.433e+07 ||g_2||=1.024e-10 acc=0.1025 gamma_dfa=-0.0034 + [DFA] Ep 33: ||h_L||=3.693e+07 ||g_2||=9.115e-11 acc=0.1270 gamma_dfa=0.0007 + [DFA] Ep 34: ||h_L||=3.970e+07 ||g_2||=8.221e-11 acc=0.1055 gamma_dfa=0.0019 + [DFA] Ep 35: ||h_L||=4.276e+07 ||g_2||=7.299e-11 acc=0.0928 gamma_dfa=0.0005 + [DFA] Ep 36: ||h_L||=4.573e+07 ||g_2||=6.667e-11 acc=0.1152 gamma_dfa=-0.0008 + [DFA] Ep 37: ||h_L||=4.878e+07 ||g_2||=6.093e-11 acc=0.1250 gamma_dfa=-0.0022 + [DFA] Ep 38: ||h_L||=5.207e+07 ||g_2||=5.443e-11 acc=0.0859 gamma_dfa=-0.0001 + [DFA] Ep 39: ||h_L||=5.511e+07 ||g_2||=4.958e-11 acc=0.1230 gamma_dfa=-0.0013 + [DFA] Ep 40: ||h_L||=5.806e+07 ||g_2||=4.578e-11 acc=0.0781 gamma_dfa=-0.0016 + [DFA] Ep 41: ||h_L||=6.145e+07 ||g_2||=4.278e-11 acc=0.0664 gamma_dfa=0.0003 + [DFA] Ep 42: ||h_L||=6.473e+07 ||g_2||=3.890e-11 acc=0.0889 gamma_dfa=0.0044 + [DFA] Ep 43: ||h_L||=6.815e+07 ||g_2||=3.522e-11 acc=0.1064 gamma_dfa=-0.0026 + [DFA] Ep 44: ||h_L||=7.139e+07 ||g_2||=3.238e-11 acc=0.1396 gamma_dfa=0.0011 + [DFA] Ep 45: ||h_L||=7.456e+07 ||g_2||=3.018e-11 acc=0.1191 gamma_dfa=0.0015 + [DFA] Ep 46: ||h_L||=7.814e+07 ||g_2||=2.801e-11 acc=0.1377 gamma_dfa=0.0007 + [DFA] Ep 47: ||h_L||=8.133e+07 ||g_2||=2.622e-11 acc=0.0869 gamma_dfa=0.0035 + [DFA] Ep 48: ||h_L||=8.473e+07 ||g_2||=2.505e-11 acc=0.0752 gamma_dfa=0.0013 + [DFA] Ep 49: ||h_L||=8.819e+07 ||g_2||=2.312e-11 acc=0.1094 gamma_dfa=0.0011 + [DFA] Ep 50: ||h_L||=9.170e+07 ||g_2||=2.175e-11 acc=0.0986 gamma_dfa=-0.0012 + [DFA] Ep 51: ||h_L||=9.510e+07 ||g_2||=2.029e-11 acc=0.1211 gamma_dfa=0.0001 + [DFA] Ep 52: ||h_L||=9.809e+07 ||g_2||=1.951e-11 acc=0.0820 gamma_dfa=0.0010 + [DFA] Ep 53: ||h_L||=1.015e+08 ||g_2||=1.830e-11 acc=0.0869 gamma_dfa=-0.0033 + [DFA] Ep 54: ||h_L||=1.046e+08 ||g_2||=1.751e-11 acc=0.0898 gamma_dfa=-0.0003 + [DFA] Ep 55: ||h_L||=1.076e+08 ||g_2||=1.678e-11 acc=0.0869 gamma_dfa=-0.0005 + [DFA] Ep 56: ||h_L||=1.111e+08 ||g_2||=1.598e-11 acc=0.1162 gamma_dfa=0.0029 + [DFA] Ep 57: ||h_L||=1.142e+08 ||g_2||=1.499e-11 acc=0.0840 gamma_dfa=-0.0001 + [DFA] Ep 58: ||h_L||=1.171e+08 ||g_2||=1.418e-11 acc=0.0811 gamma_dfa=0.0050 + [DFA] Ep 59: ||h_L||=1.202e+08 ||g_2||=1.351e-11 acc=0.1338 gamma_dfa=-0.0011 + [DFA] Ep 60: ||h_L||=1.230e+08 ||g_2||=1.301e-11 acc=0.1504 gamma_dfa=-0.0020 + [DFA] Ep 61: ||h_L||=1.257e+08 ||g_2||=1.253e-11 acc=0.1123 gamma_dfa=0.0018 + [DFA] Ep 62: ||h_L||=1.285e+08 ||g_2||=1.209e-11 acc=0.0986 gamma_dfa=0.0013 + [DFA] Ep 63: ||h_L||=1.312e+08 ||g_2||=1.186e-11 acc=0.1152 gamma_dfa=0.0017 + [DFA] Ep 64: ||h_L||=1.337e+08 ||g_2||=1.152e-11 acc=0.0996 gamma_dfa=0.0023 + [DFA] Ep 65: ||h_L||=1.359e+08 ||g_2||=1.100e-11 acc=0.0762 gamma_dfa=-0.0017 + [DFA] Ep 66: ||h_L||=1.382e+08 ||g_2||=1.057e-11 acc=0.1162 gamma_dfa=-0.0007 + [DFA] Ep 67: ||h_L||=1.405e+08 ||g_2||=1.041e-11 acc=0.0781 gamma_dfa=0.0021 + [DFA] Ep 68: ||h_L||=1.424e+08 ||g_2||=1.026e-11 acc=0.1074 gamma_dfa=-0.0026 + [DFA] Ep 69: ||h_L||=1.445e+08 ||g_2||=9.974e-12 acc=0.0986 gamma_dfa=0.0005 + [DFA] Ep 70: ||h_L||=1.466e+08 ||g_2||=9.732e-12 acc=0.0889 gamma_dfa=-0.0003 + [DFA] Ep 71: ||h_L||=1.482e+08 ||g_2||=9.569e-12 acc=0.1143 gamma_dfa=-0.0020 + [DFA] Ep 72: ||h_L||=1.499e+08 ||g_2||=9.471e-12 acc=0.1055 gamma_dfa=-0.0012 + [DFA] Ep 73: ||h_L||=1.517e+08 ||g_2||=9.353e-12 acc=0.1201 gamma_dfa=-0.0021 + [DFA] Ep 74: ||h_L||=1.533e+08 ||g_2||=9.077e-12 acc=0.0908 gamma_dfa=0.0005 + [DFA] Ep 75: ||h_L||=1.546e+08 ||g_2||=8.996e-12 acc=0.1133 gamma_dfa=-0.0005 + [DFA] Ep 76: ||h_L||=1.558e+08 ||g_2||=8.988e-12 acc=0.0830 gamma_dfa=-0.0013 + [DFA] Ep 77: ||h_L||=1.571e+08 ||g_2||=8.877e-12 acc=0.0781 gamma_dfa=0.0009 + [DFA] Ep 78: ||h_L||=1.583e+08 ||g_2||=8.694e-12 acc=0.0645 gamma_dfa=0.0014 + [DFA] Ep 79: ||h_L||=1.594e+08 ||g_2||=8.523e-12 acc=0.1074 gamma_dfa=0.0008 + [DFA] Ep 80: ||h_L||=1.603e+08 ||g_2||=8.436e-12 acc=0.0703 gamma_dfa=-0.0008 + [DFA] Ep 81: ||h_L||=1.612e+08 ||g_2||=8.381e-12 acc=0.0938 gamma_dfa=-0.0033 + [DFA] Ep 82: ||h_L||=1.620e+08 ||g_2||=8.330e-12 acc=0.1240 gamma_dfa=0.0004 + [DFA] Ep 83: ||h_L||=1.628e+08 ||g_2||=8.371e-12 acc=0.0859 gamma_dfa=0.0011 + [DFA] Ep 84: ||h_L||=1.634e+08 ||g_2||=8.219e-12 acc=0.0850 gamma_dfa=0.0004 + [DFA] Ep 85: ||h_L||=1.640e+08 ||g_2||=8.202e-12 acc=0.0840 gamma_dfa=0.0002 + [DFA] Ep 86: ||h_L||=1.645e+08 ||g_2||=8.157e-12 acc=0.1064 gamma_dfa=0.0000 + [DFA] Ep 87: ||h_L||=1.650e+08 ||g_2||=8.125e-12 acc=0.0850 gamma_dfa=-0.0002 + [DFA] Ep 88: ||h_L||=1.654e+08 ||g_2||=8.098e-12 acc=0.0820 gamma_dfa=0.0013 + [DFA] Ep 89: ||h_L||=1.657e+08 ||g_2||=8.072e-12 acc=0.1182 gamma_dfa=-0.0002 + [DFA] Ep 90: ||h_L||=1.660e+08 ||g_2||=8.044e-12 acc=0.1084 gamma_dfa=-0.0005 + [DFA] Ep 91: ||h_L||=1.662e+08 ||g_2||=8.025e-12 acc=0.1250 gamma_dfa=-0.0016 + [DFA] Ep 92: ||h_L||=1.664e+08 ||g_2||=8.020e-12 acc=0.1250 gamma_dfa=-0.0005 + [DFA] Ep 93: ||h_L||=1.665e+08 ||g_2||=8.012e-12 acc=0.1201 gamma_dfa=-0.0009 + [DFA] Ep 94: ||h_L||=1.667e+08 ||g_2||=8.013e-12 acc=0.1240 gamma_dfa=-0.0010 + [DFA] Ep 95: ||h_L||=1.667e+08 ||g_2||=8.007e-12 acc=0.1240 gamma_dfa=-0.0007 + [DFA] Ep 96: ||h_L||=1.668e+08 ||g_2||=8.006e-12 acc=0.1240 gamma_dfa=-0.0004 + [DFA] Ep 97: ||h_L||=1.668e+08 ||g_2||=8.007e-12 acc=0.1240 gamma_dfa=-0.0003 + [DFA] Ep 98: ||h_L||=1.669e+08 ||g_2||=8.005e-12 acc=0.1240 gamma_dfa=-0.0003 + [DFA] Ep 99: ||h_L||=1.669e+08 ||g_2||=8.004e-12 acc=0.1240 gamma_dfa=-0.0003 + [DFA] Ep 100: ||h_L||=1.669e+08 ||g_2||=8.004e-12 acc=0.1240 gamma_dfa=-0.0004 + +Saved results/optionA_random_targets_s42/snapshot_evolution_s42.json diff --git a/results/optionA_random_targets_s42/snapshot_evolution_s42.json b/results/optionA_random_targets_s42/snapshot_evolution_s42.json new file mode 100644 index 0000000..9a24e69 --- /dev/null +++ b/results/optionA_random_targets_s42/snapshot_evolution_s42.json @@ -0,0 +1,2749 @@ +{ + "config": { + "output_dir": "results/optionA_random_targets_s42", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": false, + "w2_std": 0.01, + "random_targets": true, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": 0.007406219025142491, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 290.9817199707031, + 627.6629028320312, + 1287.7171630859375, + 1459.1513671875, + 1616.4718017578125 + ], + "bp_grad_norms_per_sample_med": [ + 5.262210834189318e-06, + 5.14477824253845e-06, + 5.1224119488324504e-06, + 5.1222677939222194e-06, + 5.123215942148818e-06 + ], + "bp_grad_norms_F": [ + 0.0008317740284837782, + 0.0008041572291404009, + 0.0007967103738337755, + 0.0007942747906781733, + 0.0007939037750475109 + ], + "gamma_dfa": -0.01952565903775394, + "acc_eval": 0.078125, + "loss_eval": 2.3129711151123047, + "epoch": 1 + }, + { + "hidden_norms": [ + 530.2883911132812, + 4770.83984375, + 10422.763671875, + 12636.15234375, + 13907.7587890625 + ], + "bp_grad_norms_per_sample_med": [ + 7.561958454971318e-07, + 5.883355242985999e-07, + 5.877673743270861e-07, + 5.877889748262533e-07, + 5.877806756870996e-07 + ], + "bp_grad_norms_F": [ + 0.00048568230704404414, + 0.0004738113493658602, + 0.0004746047197841108, + 0.00046957648009993136, + 0.00046837228001095355 + ], + "gamma_dfa": -0.02824715618044138, + "acc_eval": 0.0751953125, + "loss_eval": 2.327746868133545, + "epoch": 2 + }, + { + "hidden_norms": [ + 776.7593994140625, + 14701.5390625, + 31384.16015625, + 38395.3359375, + 42461.37890625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0913437853996584e-07, + 1.869875916327146e-07, + 1.8700784210068377e-07, + 1.870558179462023e-07, + 1.870270267545493e-07 + ], + "bp_grad_norms_F": [ + 0.0003413700615055859, + 0.0003374870866537094, + 0.0003392821818124503, + 0.00030567243811674416, + 0.0003016987757291645 + ], + "gamma_dfa": -0.038137396797537804, + "acc_eval": 0.1044921875, + "loss_eval": 2.3107361793518066, + "epoch": 3 + }, + { + "hidden_norms": [ + 968.3828125, + 37952.72265625, + 72785.1328125, + 87599.4140625, + 96238.84375 + ], + "bp_grad_norms_per_sample_med": [ + 2.4106981300064945e-07, + 8.08614899483473e-08, + 8.070540502558288e-08, + 8.066034951070833e-08, + 8.066343326618153e-08 + ], + "bp_grad_norms_F": [ + 0.0002630708331707865, + 0.00023605814203619957, + 0.00023638480342924595, + 0.00023389894340652972, + 0.00021539803128689528 + ], + "gamma_dfa": -0.037757945246994495, + "acc_eval": 0.103515625, + "loss_eval": 2.312647819519043, + "epoch": 4 + }, + { + "hidden_norms": [ + 1094.08642578125, + 78769.9453125, + 140437.5625, + 168767.5625, + 184955.890625 + ], + "bp_grad_norms_per_sample_med": [ + 1.8580334426587797e-07, + 4.146673404648027e-08, + 4.152716215344299e-08, + 4.1506435621840865e-08, + 4.150659904667009e-08 + ], + "bp_grad_norms_F": [ + 0.00017344040679745376, + 0.0001734093384584412, + 0.00017384161765221506, + 0.00017216427659150213, + 0.0001493075687903911 + ], + "gamma_dfa": -0.04355482757091522, + "acc_eval": 0.07421875, + "loss_eval": 2.3431315422058105, + "epoch": 5 + }, + { + "hidden_norms": [ + 1341.3931884765625, + 139090.921875, + 231652.84375, + 281000.15625, + 307253.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.95400020795023e-08, + 2.393203679673661e-08, + 2.393579912052246e-08, + 2.3937987592148602e-08, + 2.3940138760281116e-08 + ], + "bp_grad_norms_F": [ + 8.837149653118104e-05, + 8.386950503336266e-05, + 8.389632421312854e-05, + 8.345059177372605e-05, + 7.231948256958276e-05 + ], + "gamma_dfa": -0.044815219938755035, + "acc_eval": 0.0947265625, + "loss_eval": 2.3063740730285645, + "epoch": 6 + }, + { + "hidden_norms": [ + 1541.082763671875, + 221682.3125, + 361269.78125, + 435912.5, + 477745.59375 + ], + "bp_grad_norms_per_sample_med": [ + 8.871538881294327e-08, + 1.5129883124131993e-08, + 1.5129455022133698e-08, + 1.513093117466724e-08, + 1.5129749897369038e-08 + ], + "bp_grad_norms_F": [ + 6.570185360033065e-05, + 1.65565506904386e-05, + 1.6456760931760073e-05, + 1.2925677765451837e-05, + 1.2370261174510233e-05 + ], + "gamma_dfa": -0.0455410098657012, + "acc_eval": 0.1083984375, + "loss_eval": 2.322909355163574, + "epoch": 7 + }, + { + "hidden_norms": [ + 1785.2386474609375, + 320922.03125, + 530986.4375, + 634164.875, + 698474.0625 + ], + "bp_grad_norms_per_sample_med": [ + 4.730902603000686e-08, + 1.0146245621456274e-08, + 1.0146251838705211e-08, + 1.0143652140470749e-08, + 1.014903983076465e-08 + ], + "bp_grad_norms_F": [ + 1.1641483069979586e-05, + 5.675432475982234e-06, + 5.721857633034233e-06, + 7.849063763387676e-07, + 7.832054507161956e-07 + ], + "gamma_dfa": -0.039457285893149674, + "acc_eval": 0.1279296875, + "loss_eval": 2.3133440017700195, + "epoch": 8 + }, + { + "hidden_norms": [ + 2014.4766845703125, + 439754.375, + 730323.4375, + 876362.4375, + 967547.375 + ], + "bp_grad_norms_per_sample_med": [ + 3.3528117171499616e-08, + 7.06648384252162e-09, + 7.059930862141073e-09, + 7.054891337787694e-09, + 7.054930861727371e-09 + ], + "bp_grad_norms_F": [ + 8.620314474683255e-06, + 5.386140401242301e-06, + 5.411964593804441e-06, + 4.715600994131819e-07, + 4.707477785359515e-07 + ], + "gamma_dfa": -0.018979715649038553, + "acc_eval": 0.0869140625, + "loss_eval": 2.3219242095947266, + "epoch": 9 + }, + { + "hidden_norms": [ + 2227.54052734375, + 609797.1875, + 983513.8125, + 1188663.0, + 1307053.25 + ], + "bp_grad_norms_per_sample_med": [ + 2.0001076350695257e-08, + 5.128104607621253e-09, + 5.1290607316900605e-09, + 5.126524982301817e-09, + 5.12929876350654e-09 + ], + "bp_grad_norms_F": [ + 6.190822659846162e-06, + 3.060452399950009e-06, + 3.074174401263008e-06, + 3.294025248123944e-07, + 3.29135190213492e-07 + ], + "gamma_dfa": -0.01813346426934004, + "acc_eval": 0.1044921875, + "loss_eval": 2.331584930419922, + "epoch": 10 + }, + { + "hidden_norms": [ + 2457.193115234375, + 803897.3125, + 1286980.25, + 1553564.875, + 1716479.25 + ], + "bp_grad_norms_per_sample_med": [ + 1.729943654993349e-08, + 3.841335249887834e-09, + 3.838269257983029e-09, + 3.838585449500442e-09, + 3.837864692712856e-09 + ], + "bp_grad_norms_F": [ + 3.917093636118807e-06, + 2.7961248179053655e-06, + 2.805686108331429e-06, + 2.3621770139925502e-07, + 2.3617232614014938e-07 + ], + "gamma_dfa": -0.02396334079094231, + "acc_eval": 0.111328125, + "loss_eval": 2.3206071853637695, + "epoch": 11 + }, + { + "hidden_norms": [ + 2634.52099609375, + 1040589.8125, + 1656069.25, + 1991088.125, + 2196123.75 + ], + "bp_grad_norms_per_sample_med": [ + 2.1142980699551117e-08, + 2.8919602268473454e-09, + 2.8948958785690593e-09, + 2.8949218577878355e-09, + 2.8939526330873377e-09 + ], + "bp_grad_norms_F": [ + 2.204534575867001e-05, + 2.299454763488029e-06, + 2.206897988799028e-06, + 1.7700770627016027e-07, + 1.7689913534013613e-07 + ], + "gamma_dfa": -0.020109509699977934, + "acc_eval": 0.087890625, + "loss_eval": 2.315797805786133, + "epoch": 12 + }, + { + "hidden_norms": [ + 2877.5615234375, + 1376012.25, + 2111297.75, + 2523565.25, + 2781256.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.216429978967426e-08, + 2.2570649793607345e-09, + 2.2583199754677707e-09, + 2.258467191040836e-09, + 2.2585668890684474e-09 + ], + "bp_grad_norms_F": [ + 3.714726335601881e-05, + 2.6385948785900837e-06, + 2.600723519208259e-06, + 1.345374585071113e-07, + 1.344694169347349e-07 + ], + "gamma_dfa": -0.013240656815469265, + "acc_eval": 0.0703125, + "loss_eval": 2.3100953102111816, + "epoch": 13 + }, + { + "hidden_norms": [ + 3088.69287109375, + 1698364.75, + 2601432.25, + 3103900.5, + 3421196.25 + ], + "bp_grad_norms_per_sample_med": [ + 1.9957044017360204e-08, + 1.783974634683716e-09, + 1.783756697903982e-09, + 1.7829976384220458e-09, + 1.7823481579526401e-09 + ], + "bp_grad_norms_F": [ + 3.862057383230422e-06, + 2.0336331090220483e-06, + 2.036696969298646e-06, + 1.0464794542031086e-07, + 1.0456345478360163e-07 + ], + "gamma_dfa": -0.005813862895593047, + "acc_eval": 0.1005859375, + "loss_eval": 2.3175578117370605, + "epoch": 14 + }, + { + "hidden_norms": [ + 3303.89599609375, + 2057797.625, + 3208369.75, + 3840521.25, + 4226141.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.0653308457619914e-08, + 1.3972134560447103e-09, + 1.3960789191358458e-09, + 1.3953704858238325e-09, + 1.395240034618439e-09 + ], + "bp_grad_norms_F": [ + 3.350825500092469e-05, + 1.8437043536323472e-06, + 1.7324912278127158e-06, + 8.088576919362822e-08, + 8.08555569165037e-08 + ], + "gamma_dfa": -0.009977308567613363, + "acc_eval": 0.0888671875, + "loss_eval": 2.313873052597046, + "epoch": 15 + }, + { + "hidden_norms": [ + 3511.251708984375, + 2498907.0, + 3838076.75, + 4584989.5, + 5056157.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2424533402111138e-08, + 1.1319180037716592e-09, + 1.1314524872574339e-09, + 1.1313682213298648e-09, + 1.1311728220775308e-09 + ], + "bp_grad_norms_F": [ + 3.6209145036991686e-05, + 1.2319624147494324e-06, + 1.1622746569628362e-06, + 6.361955939837571e-08, + 6.359429960411944e-08 + ], + "gamma_dfa": -0.003661318449303508, + "acc_eval": 0.0888671875, + "loss_eval": 2.3163557052612305, + "epoch": 16 + }, + { + "hidden_norms": [ + 3775.89697265625, + 2830713.5, + 4406309.0, + 5287962.5, + 5866003.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.175260551330666e-09, + 9.454962368593556e-10, + 9.453093863243112e-10, + 9.453505755985248e-10, + 9.453685612115237e-10 + ], + "bp_grad_norms_F": [ + 7.906389510026202e-05, + 1.4282334177551093e-06, + 1.2143628964622621e-06, + 4.9730939366554594e-08, + 4.970008760096789e-08 + ], + "gamma_dfa": -0.00987274688668549, + "acc_eval": 0.0986328125, + "loss_eval": 2.310572624206543, + "epoch": 17 + }, + { + "hidden_norms": [ + 3992.62939453125, + 3305205.5, + 5135523.0, + 6172568.0, + 6858123.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.447438221674929e-09, + 7.795076806260681e-10, + 7.787387401592127e-10, + 7.785659339454298e-10, + 7.786636335715968e-10 + ], + "bp_grad_norms_F": [ + 6.625035166507587e-05, + 1.4839708910585614e-06, + 5.721043407902471e-07, + 3.443057750018852e-08, + 3.4421322681055244e-08 + ], + "gamma_dfa": -0.006256722612306476, + "acc_eval": 0.099609375, + "loss_eval": 2.3168537616729736, + "epoch": 18 + }, + { + "hidden_norms": [ + 4142.52978515625, + 3917073.0, + 6029541.5, + 7244691.5, + 8040561.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.708185980499934e-09, + 6.548476760848132e-10, + 6.543839359274273e-10, + 6.541163166673414e-10, + 6.541419628192102e-10 + ], + "bp_grad_norms_F": [ + 8.116958838400024e-07, + 2.7829198501194696e-08, + 2.171442403664514e-08, + 2.171425173003172e-08, + 2.1709443132067463e-08 + ], + "gamma_dfa": -0.008716321433894336, + "acc_eval": 0.1103515625, + "loss_eval": 2.307344675064087, + "epoch": 19 + }, + { + "hidden_norms": [ + 4319.63134765625, + 4541538.0, + 7015912.0, + 8395939.0, + 9318214.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.706714212294628e-09, + 5.475734865534321e-10, + 5.474371511660081e-10, + 5.474699027452345e-10, + 5.470845443333872e-10 + ], + "bp_grad_norms_F": [ + 9.98826635623118e-07, + 1.9267284656621086e-08, + 1.8231443021932137e-08, + 1.8230153386866732e-08, + 1.822698791897892e-08 + ], + "gamma_dfa": -0.009770376258529723, + "acc_eval": 0.1044921875, + "loss_eval": 2.3123068809509277, + "epoch": 20 + }, + { + "hidden_norms": [ + 4493.5576171875, + 5295852.0, + 8144737.5, + 9706496.0, + 10771585.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.5074546883274706e-09, + 4.5678333338017296e-10, + 4.567042022340928e-10, + 4.5673645421295817e-10, + 4.5639386714313446e-10 + ], + "bp_grad_norms_F": [ + 7.984108947312052e-07, + 1.5798146790757528e-08, + 1.5310378742583453e-08, + 1.531174653734979e-08, + 1.5307973555422905e-08 + ], + "gamma_dfa": 0.001372043276205659, + "acc_eval": 0.08984375, + "loss_eval": 2.304574728012085, + "epoch": 21 + }, + { + "hidden_norms": [ + 4713.58544921875, + 6076811.0, + 9296267.0, + 11104688.0, + 12313681.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7650869089134176e-09, + 3.880850918402956e-10, + 3.8772021704325255e-10, + 3.877534959784157e-10, + 3.877534959784157e-10 + ], + "bp_grad_norms_F": [ + 8.055810098994698e-07, + 1.3297294820802108e-08, + 1.2999676002323213e-08, + 1.2997061205055616e-08, + 1.2994151532552678e-08 + ], + "gamma_dfa": -0.001540843746624887, + "acc_eval": 0.0927734375, + "loss_eval": 2.3001956939697266, + "epoch": 22 + }, + { + "hidden_norms": [ + 4932.0283203125, + 6808919.0, + 10515250.0, + 12614906.0, + 13952134.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.722823604945802e-09, + 3.3205604932362576e-10, + 3.3200522886467354e-10, + 3.319224339826121e-10, + 3.319316765892921e-10 + ], + "bp_grad_norms_F": [ + 8.157737738656579e-07, + 1.1298772584211747e-08, + 1.1099826835447857e-08, + 1.1101125352297458e-08, + 1.1098639340900718e-08 + ], + "gamma_dfa": -0.0038606239249929786, + "acc_eval": 0.1005859375, + "loss_eval": 2.3065578937530518, + "epoch": 23 + }, + { + "hidden_norms": [ + 5160.6142578125, + 7539331.0, + 11751434.0, + 14133378.0, + 15619303.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.541834742686433e-09, + 2.862569903339107e-10, + 2.861809678122995e-10, + 2.8618746261699357e-10, + 2.8600946611057054e-10 + ], + "bp_grad_norms_F": [ + 5.115749672768288e-07, + 9.68886215702014e-09, + 9.564988801002983e-09, + 9.563906999687788e-09, + 9.562156400022559e-09 + ], + "gamma_dfa": -0.005291882203891873, + "acc_eval": 0.0888671875, + "loss_eval": 2.306269645690918, + "epoch": 24 + }, + { + "hidden_norms": [ + 5342.28369140625, + 8587680.0, + 13221096.0, + 15854032.0, + 17531438.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.404613562769555e-09, + 2.500546436579043e-10, + 2.498238005355091e-10, + 2.5007032555812714e-10, + 2.5000959635868014e-10 + ], + "bp_grad_norms_F": [ + 8.579532959629432e-07, + 8.395090844715014e-09, + 8.30485546998716e-09, + 8.305622856141781e-09, + 8.304008147774766e-09 + ], + "gamma_dfa": -0.0010773324174806476, + "acc_eval": 0.0810546875, + "loss_eval": 2.3139305114746094, + "epoch": 25 + }, + { + "hidden_norms": [ + 5483.166015625, + 9723498.0, + 14831751.0, + 17743800.0, + 19587500.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.163097422349438e-09, + 2.162879736422596e-10, + 2.1617001244589318e-10, + 2.1610728484500186e-10, + 2.1611390454978618e-10 + ], + "bp_grad_norms_F": [ + 8.197772558560246e-07, + 7.273167845767148e-09, + 7.203821983381431e-09, + 7.205678720367814e-09, + 7.204227880919234e-09 + ], + "gamma_dfa": 1.8637801986187696e-05, + "acc_eval": 0.0751953125, + "loss_eval": 2.313469648361206, + "epoch": 26 + }, + { + "hidden_norms": [ + 5764.373046875, + 10784341.0, + 16432148.0, + 19679324.0, + 21736526.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.4971423534813084e-09, + 1.883019018489307e-10, + 1.8820056624235804e-10, + 1.881857447649793e-10, + 1.8821781633260315e-10 + ], + "bp_grad_norms_F": [ + 7.796735417286982e-07, + 6.3456924159766e-09, + 6.269113672630056e-09, + 6.2696292602026915e-09, + 6.268407570786394e-09 + ], + "gamma_dfa": -0.009387154830619693, + "acc_eval": 0.1240234375, + "loss_eval": 2.306946277618408, + "epoch": 27 + }, + { + "hidden_norms": [ + 5953.8154296875, + 12087036.0, + 18197724.0, + 21766380.0, + 23964956.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9581326277394737e-09, + 1.6603075858601102e-10, + 1.6546233827519075e-10, + 1.654698739139704e-10, + 1.654279768725786e-10 + ], + "bp_grad_norms_F": [ + 7.887553010732518e-07, + 5.60325252862981e-09, + 5.523563828546685e-09, + 5.524424029346164e-09, + 5.523790314043708e-09 + ], + "gamma_dfa": 0.004911014751996845, + "acc_eval": 0.099609375, + "loss_eval": 2.3079466819763184, + "epoch": 28 + }, + { + "hidden_norms": [ + 6103.1767578125, + 13586370.0, + 20138950.0, + 24031604.0, + 26432166.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.675929033912894e-09, + 1.4642610735027262e-10, + 1.4630179012709021e-10, + 1.4625449462624118e-10, + 1.4625445299287776e-10 + ], + "bp_grad_norms_F": [ + 5.090974468657805e-07, + 4.923043306348518e-09, + 4.85900208957446e-09, + 4.858577984379053e-09, + 4.8580677258769356e-09 + ], + "gamma_dfa": -0.001665741903707385, + "acc_eval": 0.119140625, + "loss_eval": 2.3058736324310303, + "epoch": 29 + }, + { + "hidden_norms": [ + 6289.6884765625, + 14985982.0, + 22021216.0, + 26264438.0, + 28881832.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.36727260016778e-09, + 1.3193185433024723e-10, + 1.3139930810091016e-10, + 1.313865682917026e-10, + 1.313865821694904e-10 + ], + "bp_grad_norms_F": [ + 5.067869324193452e-07, + 4.352318949685241e-09, + 4.3002512661871606e-09, + 4.300079403662949e-09, + 4.299330669255141e-09 + ], + "gamma_dfa": -0.0004749984946101904, + "acc_eval": 0.134765625, + "loss_eval": 2.2982680797576904, + "epoch": 30 + }, + { + "hidden_norms": [ + 6523.13232421875, + 16536787.0, + 24215278.0, + 28796266.0, + 31602218.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.811848170443e-09, + 1.1650350129066567e-10, + 1.168874996793079e-10, + 1.1678497058298376e-10, + 1.1676350164524507e-10 + ], + "bp_grad_norms_F": [ + 1.0699311587814009e-06, + 3.859509600800948e-09, + 3.8213117115049045e-09, + 3.820499028250879e-09, + 3.8199492458090845e-09 + ], + "gamma_dfa": -0.0009061050368472934, + "acc_eval": 0.1181640625, + "loss_eval": 2.3070034980773926, + "epoch": 31 + }, + { + "hidden_norms": [ + 6718.77001953125, + 18189110.0, + 26350528.0, + 31306452.0, + 34333380.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.6170128286651106e-09, + 1.026562307382406e-10, + 1.0235094716204429e-10, + 1.0229352781498946e-10, + 1.0229320168697598e-10 + ], + "bp_grad_norms_F": [ + 7.658765639462217e-07, + 3.4193439191199104e-09, + 3.3851728087341826e-09, + 3.3853084779877918e-09, + 3.3853269076900006e-09 + ], + "gamma_dfa": -0.003424330148845911, + "acc_eval": 0.1025390625, + "loss_eval": 2.307239532470703, + "epoch": 32 + }, + { + "hidden_norms": [ + 6883.12548828125, + 19488106.0, + 28346706.0, + 33685484.0, + 36926260.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.087009980973221e-09, + 9.127182343249274e-11, + 9.115138505100262e-11, + 9.112680748879498e-11, + 9.108464676943484e-11 + ], + "bp_grad_norms_F": [ + 6.505949841084657e-07, + 3.0607936185589324e-09, + 3.031910944528704e-09, + 3.0311655407899707e-09, + 3.030735440390231e-09 + ], + "gamma_dfa": 0.0007484849775210023, + "acc_eval": 0.126953125, + "loss_eval": 2.299861431121826, + "epoch": 33 + }, + { + "hidden_norms": [ + 7075.13671875, + 20968554.0, + 30458362.0, + 36184532.0, + 39704584.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7312005990154375e-09, + 8.229845277485381e-11, + 8.220574915229761e-11, + 8.216692604090525e-11, + 8.216703706320772e-11 + ], + "bp_grad_norms_F": [ + 5.460973966364691e-07, + 2.7569984073494425e-09, + 2.731066262029458e-09, + 2.7299451588191914e-09, + 2.7297459848085737e-09 + ], + "gamma_dfa": 0.0019178662332706153, + "acc_eval": 0.10546875, + "loss_eval": 2.304497241973877, + "epoch": 34 + }, + { + "hidden_norms": [ + 7259.11181640625, + 23033338.0, + 32925422.0, + 39030248.0, + 42756800.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.3574480973186382e-09, + 7.317867145584245e-11, + 7.298522203269542e-11, + 7.29523316755909e-11, + 7.295326148737402e-11 + ], + "bp_grad_norms_F": [ + 9.340447491013038e-07, + 2.4876549709063056e-09, + 2.468606430383602e-09, + 2.468798498966862e-09, + 2.4683108890144467e-09 + ], + "gamma_dfa": 0.0004995002527721226, + "acc_eval": 0.0927734375, + "loss_eval": 2.316316604614258, + "epoch": 35 + }, + { + "hidden_norms": [ + 7421.775390625, + 24686730.0, + 35197740.0, + 41724168.0, + 45731128.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6613123099418203e-09, + 6.675621860852132e-11, + 6.666651952702551e-11, + 6.660563073301873e-11, + 6.660502011035518e-11 + ], + "bp_grad_norms_F": [ + 5.461850491883524e-07, + 2.235697182939589e-09, + 2.218524031150082e-09, + 2.2181974035362373e-09, + 2.217934280679401e-09 + ], + "gamma_dfa": -0.0007714751118328422, + "acc_eval": 0.115234375, + "loss_eval": 2.299975872039795, + "epoch": 36 + }, + { + "hidden_norms": [ + 7595.57861328125, + 26510854.0, + 37595356.0, + 44555964.0, + 48780100.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.225840178837757e-09, + 6.114001666057689e-11, + 6.093330007228559e-11, + 6.092592402806574e-11, + 6.092682608427324e-11 + ], + "bp_grad_norms_F": [ + 5.346724947230541e-07, + 2.03656935759966e-09, + 2.023372358550546e-09, + 2.0227952646223457e-09, + 2.022433331916318e-09 + ], + "gamma_dfa": -0.002239674242446199, + "acc_eval": 0.125, + "loss_eval": 2.301793336868286, + "epoch": 37 + }, + { + "hidden_norms": [ + 7750.2373046875, + 28535444.0, + 40272040.0, + 47577320.0, + 52073104.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8177556126985905e-09, + 5.451538873102457e-11, + 5.443305875485471e-11, + 5.4429814821954636e-11, + 5.4436097990384624e-11 + ], + "bp_grad_norms_F": [ + 4.054070359416073e-07, + 1.8392830591906772e-09, + 1.8223703657227475e-09, + 1.8226138376320478e-09, + 1.8224435294200703e-09 + ], + "gamma_dfa": -7.494278543163091e-05, + "acc_eval": 0.0859375, + "loss_eval": 2.3060522079467773, + "epoch": 38 + }, + { + "hidden_norms": [ + 7842.494140625, + 30102162.0, + 42567964.0, + 50335104.0, + 55107076.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.4601239106681874e-09, + 4.961669269887281e-11, + 4.958486399253559e-11, + 4.9537509511088373e-11, + 4.9538078500388494e-11 + ], + "bp_grad_norms_F": [ + 3.688643346322351e-07, + 1.6754320153467006e-09, + 1.6663495028268471e-09, + 1.6659863488754922e-09, + 1.6657608625791909e-09 + ], + "gamma_dfa": -0.0012932312965858728, + "acc_eval": 0.123046875, + "loss_eval": 2.305074691772461, + "epoch": 39 + }, + { + "hidden_norms": [ + 7978.84033203125, + 31648130.0, + 44751680.0, + 52999412.0, + 58060848.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.122314324282115e-09, + 4.579963838735601e-11, + 4.578180889946992e-11, + 4.577443632469702e-11, + 4.57794635533304e-11 + ], + "bp_grad_norms_F": [ + 5.346829539121245e-07, + 1.5462353619710711e-09, + 1.5314658430298778e-09, + 1.5317623835997551e-09, + 1.531660798193002e-09 + ], + "gamma_dfa": -0.0015878456179052591, + "acc_eval": 0.078125, + "loss_eval": 2.311302661895752, + "epoch": 40 + }, + { + "hidden_norms": [ + 8110.69677734375, + 33538538.0, + 47405844.0, + 56144432.0, + 61445208.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.846236801801183e-09, + 4.287940835734361e-11, + 4.277651843853647e-11, + 4.270922504545638e-11, + 4.270716419396692e-11 + ], + "bp_grad_norms_F": [ + 6.336174465104705e-07, + 1.4277677928831167e-09, + 1.411427863473591e-09, + 1.4113960000727843e-09, + 1.4115042468176853e-09 + ], + "gamma_dfa": 0.0003075850836466998, + "acc_eval": 0.06640625, + "loss_eval": 2.3155269622802734, + "epoch": 41 + }, + { + "hidden_norms": [ + 8218.2890625, + 35439168.0, + 50034100.0, + 59178108.0, + 64727180.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5490064786405355e-09, + 3.9022073766714627e-11, + 3.8900438426026085e-11, + 3.885531826841593e-11, + 3.885488111809998e-11 + ], + "bp_grad_norms_F": [ + 4.209731514492887e-07, + 1.29418675776094e-09, + 1.2822323203209862e-09, + 1.282524864087975e-09, + 1.282538297786573e-09 + ], + "gamma_dfa": 0.004402266175020486, + "acc_eval": 0.0888671875, + "loss_eval": 2.3072235584259033, + "epoch": 42 + }, + { + "hidden_norms": [ + 8356.0576171875, + 37748524.0, + 52921432.0, + 62358388.0, + 68150840.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.2101902530380357e-09, + 3.5293011568793276e-11, + 3.5220604210906004e-11, + 3.520495353570574e-11, + 3.5206077636518174e-11 + ], + "bp_grad_norms_F": [ + 4.58017922255749e-07, + 1.1915447517552025e-09, + 1.1833590773946412e-09, + 1.1830882939989351e-09, + 1.183062092735554e-09 + ], + "gamma_dfa": -0.0026363012730143964, + "acc_eval": 0.1064453125, + "loss_eval": 2.301530361175537, + "epoch": 43 + }, + { + "hidden_norms": [ + 8468.8984375, + 39503084.0, + 55376920.0, + 65278316.0, + 71385032.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8453949479635412e-09, + 3.246405921863982e-11, + 3.238384560511065e-11, + 3.2375737507583935e-11, + 3.2377513864423335e-11 + ], + "bp_grad_norms_F": [ + 4.802472517440037e-07, + 1.1004476219156345e-09, + 1.0926821669698938e-09, + 1.092572032845851e-09, + 1.0924769977549431e-09 + ], + "gamma_dfa": 0.0010803540208144113, + "acc_eval": 0.1396484375, + "loss_eval": 2.3026890754699707, + "epoch": 44 + }, + { + "hidden_norms": [ + 8563.8193359375, + 41138400.0, + 57739148.0, + 68164040.0, + 74560624.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7058150447724074e-09, + 3.018212416106003e-11, + 3.0175469761806184e-11, + 3.0169026998816406e-11, + 3.017583058428919e-11 + ], + "bp_grad_norms_F": [ + 4.471017973628477e-07, + 1.0233066616294195e-09, + 1.0133889283281405e-09, + 1.0129664884672707e-09, + 1.0129456162744077e-09 + ], + "gamma_dfa": 0.001452172189601697, + "acc_eval": 0.119140625, + "loss_eval": 2.3021607398986816, + "epoch": 45 + }, + { + "hidden_norms": [ + 8657.7607421875, + 43261356.0, + 60519764.0, + 71481504.0, + 78138984.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.013100575126714e-09, + 2.8044349828504345e-11, + 2.8007120927986406e-11, + 2.800258289137325e-11, + 2.7994129583874816e-11 + ], + "bp_grad_norms_F": [ + 4.194439213733858e-07, + 9.434407699515646e-10, + 9.384462096306834e-10, + 9.380274335057948e-10, + 9.378612331190084e-10 + ], + "gamma_dfa": 0.0007094524626154453, + "acc_eval": 0.1376953125, + "loss_eval": 2.2962775230407715, + "epoch": 46 + }, + { + "hidden_norms": [ + 8790.2177734375, + 45091320.0, + 63046644.0, + 74457320.0, + 81331192.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.4347481808462135e-09, + 2.630745274401214e-11, + 2.622063850765688e-11, + 2.6189189705760896e-11, + 2.618921746133651e-11 + ], + "bp_grad_norms_F": [ + 7.371211836471048e-07, + 8.928198735880244e-10, + 8.842627741145748e-10, + 8.843225596244508e-10, + 8.844897037008081e-10 + ], + "gamma_dfa": 0.0035163145803380758, + "acc_eval": 0.0869140625, + "loss_eval": 2.308018207550049, + "epoch": 47 + }, + { + "hidden_norms": [ + 8908.1201171875, + 47254860.0, + 65723668.0, + 77611024.0, + 84728680.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7307127670184173e-09, + 2.504270402159392e-11, + 2.5052317859097784e-11, + 2.5023790331535345e-11, + 2.5014615379070904e-11 + ], + "bp_grad_norms_F": [ + 6.292835905696847e-07, + 8.318437605403517e-10, + 8.267081463841919e-10, + 8.263784656570294e-10, + 8.262315831508715e-10 + ], + "gamma_dfa": 0.0013402553158812225, + "acc_eval": 0.0751953125, + "loss_eval": 2.3012595176696777, + "epoch": 48 + }, + { + "hidden_norms": [ + 9040.81640625, + 49197456.0, + 68364032.0, + 80749512.0, + 88194248.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2460811271708394e-09, + 2.3192125303550526e-11, + 2.3115362055015076e-11, + 2.3076223223950088e-11, + 2.3076362001828166e-11 + ], + "bp_grad_norms_F": [ + 4.4760727746506745e-07, + 7.767143594961112e-10, + 7.696474568774647e-10, + 7.699579307463011e-10, + 7.697840698206448e-10 + ], + "gamma_dfa": 0.0011345145248924382, + "acc_eval": 0.109375, + "loss_eval": 2.3025381565093994, + "epoch": 49 + }, + { + "hidden_norms": [ + 9096.951171875, + 51418580.0, + 71253736.0, + 84008288.0, + 91700160.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.652081027536667e-09, + 2.1794503701766388e-11, + 2.1752362064364483e-11, + 2.1721518680961616e-11, + 2.1714638767655892e-11 + ], + "bp_grad_norms_F": [ + 4.2562598423501186e-07, + 7.30644378332812e-10, + 7.245531952193573e-10, + 7.24433568688454e-10, + 7.243706190429577e-10 + ], + "gamma_dfa": -0.0012115467980038375, + "acc_eval": 0.0986328125, + "loss_eval": 2.3028664588928223, + "epoch": 50 + }, + { + "hidden_norms": [ + 9195.421875, + 53477960.0, + 73949888.0, + 87218208.0, + 95104784.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.0763821773073232e-09, + 2.0283105056639883e-11, + 2.0292134292332342e-11, + 2.0280107454473395e-11, + 2.0280043269704784e-11 + ], + "bp_grad_norms_F": [ + 4.4348283267936495e-07, + 6.856579193303958e-10, + 6.817193476393868e-10, + 6.813303254915581e-10, + 6.81267153801457e-10 + ], + "gamma_dfa": 0.00014059534441912547, + "acc_eval": 0.12109375, + "loss_eval": 2.300283432006836, + "epoch": 51 + }, + { + "hidden_norms": [ + 9354.1484375, + 54696328.0, + 76135840.0, + 89854944.0, + 98086680.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.338345073127357e-09, + 1.9446970075942538e-11, + 1.951434153157905e-11, + 1.9502762252376904e-11, + 1.950522555971279e-11 + ], + "bp_grad_norms_F": [ + 7.923298426248948e-07, + 6.581531986071809e-10, + 6.558240617238198e-10, + 6.55002219129841e-10, + 6.549716324855126e-10 + ], + "gamma_dfa": 0.0009868293709587306, + "acc_eval": 0.08203125, + "loss_eval": 2.308971405029297, + "epoch": 52 + }, + { + "hidden_norms": [ + 9396.91796875, + 56824088.0, + 78830128.0, + 92998112.0, + 101473056.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5743603087869928e-09, + 1.830174033157217e-11, + 1.83033917883213e-11, + 1.828929195590856e-11, + 1.8287725500609753e-11 + ], + "bp_grad_norms_F": [ + 5.051292646385264e-07, + 6.139382335845767e-10, + 6.081654624345845e-10, + 6.082383485761511e-10, + 6.080949632725208e-10 + ], + "gamma_dfa": -0.0033112295641331, + "acc_eval": 0.0869140625, + "loss_eval": 2.3057596683502197, + "epoch": 53 + }, + { + "hidden_norms": [ + 9468.728515625, + 58575712.0, + 81144072.0, + 95889464.0, + 104606984.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8610024632437216e-09, + 1.757114766187673e-11, + 1.7507960359264274e-11, + 1.7509681204952443e-11, + 1.751184267040351e-11 + ], + "bp_grad_norms_F": [ + 4.554808015200251e-07, + 5.796045865480437e-10, + 5.748747033962331e-10, + 5.745580122784588e-10, + 5.745347531060929e-10 + ], + "gamma_dfa": -0.0003432991070440039, + "acc_eval": 0.08984375, + "loss_eval": 2.298818588256836, + "epoch": 54 + }, + { + "hidden_norms": [ + 9555.708984375, + 60407900.0, + 83458520.0, + 98574208.0, + 107551688.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.279448629849412e-09, + 1.684081346597921e-11, + 1.677817607070864e-11, + 1.677138462830019e-11, + 1.677173851188929e-11 + ], + "bp_grad_norms_F": [ + 4.388069214655843e-07, + 5.62806412585104e-10, + 5.561613392046638e-10, + 5.564256833068271e-10, + 5.564126381862877e-10 + ], + "gamma_dfa": -0.0005112638318678364, + "acc_eval": 0.0869140625, + "loss_eval": 2.3081560134887695, + "epoch": 55 + }, + { + "hidden_norms": [ + 9638.900390625, + 62801376.0, + 86421992.0, + 101967032.0, + 111112024.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.658361892253879e-09, + 1.6043997727588355e-11, + 1.598270821245862e-11, + 1.5972815084475123e-11, + 1.5974208067426332e-11 + ], + "bp_grad_norms_F": [ + 3.7533030194936146e-07, + 5.26626853236678e-10, + 5.223827481692922e-10, + 5.223168009216295e-10, + 5.222874355226281e-10 + ], + "gamma_dfa": 0.0029356127051869407, + "acc_eval": 0.1162109375, + "loss_eval": 2.2985568046569824, + "epoch": 56 + }, + { + "hidden_norms": [ + 9718.0244140625, + 64624960.0, + 89000072.0, + 104851280.0, + 114205744.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.292640661176847e-09, + 1.499218110767586e-11, + 1.4987202451299808e-11, + 1.4976865234106462e-11, + 1.497728503718765e-11 + ], + "bp_grad_norms_F": [ + 2.8470327606555657e-07, + 5.047448570216773e-10, + 4.990237667534814e-10, + 4.992751767574077e-10, + 4.992522506519492e-10 + ], + "gamma_dfa": -5.288697866490111e-05, + "acc_eval": 0.083984375, + "loss_eval": 2.308565139770508, + "epoch": 57 + }, + { + "hidden_norms": [ + 9801.466796875, + 66401824.0, + 91302272.0, + 107465608.0, + 117121048.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6839835081938759e-09, + 1.4242066727343516e-11, + 1.4184016808305167e-11, + 1.417683158366767e-11, + 1.41777934878351e-11 + ], + "bp_grad_norms_F": [ + 4.110351881081442e-07, + 4.848813572877475e-10, + 4.80424644511146e-10, + 4.804525666202153e-10, + 4.804344699849139e-10 + ], + "gamma_dfa": 0.005033881159761222, + "acc_eval": 0.0810546875, + "loss_eval": 2.3111414909362793, + "epoch": 58 + }, + { + "hidden_norms": [ + 9890.490234375, + 68205280.0, + 93614360.0, + 110285296.0, + 120199864.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.280599737363275e-09, + 1.3558537972913065e-11, + 1.3508410535989501e-11, + 1.350657866799887e-11, + 1.3504152657217716e-11 + ], + "bp_grad_norms_F": [ + 2.917624613019143e-07, + 4.580297252587684e-10, + 4.5511858171032316e-10, + 4.5487102973140736e-10, + 4.548312837471258e-10 + ], + "gamma_dfa": -0.0010600784517009743, + "acc_eval": 0.1337890625, + "loss_eval": 2.3005125522613525, + "epoch": 59 + }, + { + "hidden_norms": [ + 9970.1796875, + 70070560.0, + 95841760.0, + 112873624.0, + 122957488.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5372191297657878e-09, + 1.2977110705469919e-11, + 1.3014193021854137e-11, + 1.301157879357584e-11, + 1.301332045594572e-11 + ], + "bp_grad_norms_F": [ + 3.609145835525851e-07, + 4.4097417384314497e-10, + 4.391887409305184e-10, + 4.386717655791017e-10, + 4.3868858545792477e-10 + ], + "gamma_dfa": -0.0019604496665124316, + "acc_eval": 0.150390625, + "loss_eval": 2.2972958087921143, + "epoch": 60 + }, + { + "hidden_norms": [ + 10013.4111328125, + 71841280.0, + 98034728.0, + 115420424.0, + 125712432.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.980667851952944e-09, + 1.2545815081255185e-11, + 1.2525404324836842e-11, + 1.2530108027541953e-11, + 1.2529619702883465e-11 + ], + "bp_grad_norms_F": [ + 4.7472269670834066e-07, + 4.2379699749517385e-10, + 4.224821603671103e-10, + 4.2210435147183034e-10, + 4.2200473671094585e-10 + ], + "gamma_dfa": 0.001835448889323743, + "acc_eval": 0.1123046875, + "loss_eval": 2.301358222961426, + "epoch": 61 + }, + { + "hidden_norms": [ + 10096.0283203125, + 73830392.0, + 100452376.0, + 118091624.0, + 128521440.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0877483358484596e-09, + 1.2145178092393127e-11, + 1.2089194229014666e-11, + 1.2089107492840867e-11, + 1.2089683421034891e-11 + ], + "bp_grad_norms_F": [ + 3.47462531635756e-07, + 4.1091860469855135e-10, + 4.074744708315592e-10, + 4.072828740930845e-10, + 4.072460701998182e-10 + ], + "gamma_dfa": 0.001284073296119459, + "acc_eval": 0.0986328125, + "loss_eval": 2.306840419769287, + "epoch": 62 + }, + { + "hidden_norms": [ + 10180.875, + 75552776.0, + 102509640.0, + 120544920.0, + 131168024.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.552231787549374e-09, + 1.1890774823108963e-11, + 1.1859568882499616e-11, + 1.1871844653177366e-11, + 1.187336080149537e-11 + ], + "bp_grad_norms_F": [ + 3.4558294714770454e-07, + 3.966963146861957e-10, + 3.9473879720475225e-10, + 3.9452693889607815e-10, + 3.9439784771388986e-10 + ], + "gamma_dfa": 0.0016765635373303667, + "acc_eval": 0.115234375, + "loss_eval": 2.298762798309326, + "epoch": 63 + }, + { + "hidden_norms": [ + 10240.1455078125, + 77067560.0, + 104630624.0, + 122945856.0, + 133711672.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7201819968448717e-09, + 1.1546708901521985e-11, + 1.1524695260611839e-11, + 1.1516852575776948e-11, + 1.1515758832625345e-11 + ], + "bp_grad_norms_F": [ + 4.471509669201623e-07, + 3.9150541142340956e-10, + 3.873180665081577e-10, + 3.8728689699674135e-10, + 3.8727610007782687e-10 + ], + "gamma_dfa": 0.00234126152281533, + "acc_eval": 0.099609375, + "loss_eval": 2.3141303062438965, + "epoch": 64 + }, + { + "hidden_norms": [ + 10319.01171875, + 78272792.0, + 106212480.0, + 124890544.0, + 135898992.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.082502087967896e-09, + 1.1041124611810282e-11, + 1.099913302798905e-11, + 1.099662808728974e-11, + 1.0998860676403321e-11 + ], + "bp_grad_norms_F": [ + 2.724834757827921e-07, + 3.732617270824079e-10, + 3.7087055648754585e-10, + 3.705740991843953e-10, + 3.7055333801383483e-10 + ], + "gamma_dfa": -0.0016588781545578968, + "acc_eval": 0.076171875, + "loss_eval": 2.301309585571289, + "epoch": 65 + }, + { + "hidden_norms": [ + 10393.1220703125, + 79820272.0, + 108085488.0, + 127064000.0, + 138196272.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1938173782866102e-09, + 1.0600672249727605e-11, + 1.0572632179461916e-11, + 1.0572812590703418e-11, + 1.0572290438937149e-11 + ], + "bp_grad_norms_F": [ + 2.4229757400462404e-07, + 3.608289500522943e-10, + 3.590567010380852e-10, + 3.5867539494027767e-10, + 3.5869879289052164e-10 + ], + "gamma_dfa": -0.0006768384373572189, + "acc_eval": 0.1162109375, + "loss_eval": 2.300891876220703, + "epoch": 66 + }, + { + "hidden_norms": [ + 10441.87109375, + 81050488.0, + 109770584.0, + 129123352.0, + 140471120.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.23911914062802e-09, + 1.040783778605281e-11, + 1.0406573172638822e-11, + 1.0404551352427571e-11, + 1.0400711542013497e-11 + ], + "bp_grad_norms_F": [ + 3.1678638379162294e-07, + 3.529202208252258e-10, + 3.508623114267806e-10, + 3.5074002036061813e-10, + 3.507301671312746e-10 + ], + "gamma_dfa": 0.002077823784929933, + "acc_eval": 0.078125, + "loss_eval": 2.302239179611206, + "epoch": 67 + }, + { + "hidden_norms": [ + 10470.16796875, + 82310688.0, + 111439184.0, + 131022848.0, + 142428160.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5865209146426196e-09, + 1.0226258208290151e-11, + 1.02605328747285e-11, + 1.0260522466387645e-11, + 1.0260643897030963e-11 + ], + "bp_grad_norms_F": [ + 3.3883526384670404e-07, + 3.5046832103091674e-10, + 3.5014954824497124e-10, + 3.4966474160569305e-10, + 3.496121170343258e-10 + ], + "gamma_dfa": -0.0026201284417766146, + "acc_eval": 0.107421875, + "loss_eval": 2.298029661178589, + "epoch": 68 + }, + { + "hidden_norms": [ + 10513.3203125, + 83437016.0, + 113127648.0, + 132967152.0, + 144543232.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.473118955938276e-10, + 1.0023389236668567e-11, + 9.974353808173131e-12, + 9.973816911257316e-12, + 9.97038302613662e-12 + ], + "bp_grad_norms_F": [ + 2.5441801199121983e-07, + 3.393485770164517e-10, + 3.373779589033177e-10, + 3.371187218270677e-10, + 3.370881351827393e-10 + ], + "gamma_dfa": 0.0005034620153310243, + "acc_eval": 0.0986328125, + "loss_eval": 2.301563262939453, + "epoch": 69 + }, + { + "hidden_norms": [ + 10551.1669921875, + 84680168.0, + 114672840.0, + 134819488.0, + 146567616.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0249410209439702e-09, + 9.764996970751394e-12, + 9.731633034137932e-12, + 9.726664786102734e-12, + 9.72637768936746e-12 + ], + "bp_grad_norms_F": [ + 2.863991426238499e-07, + 3.3205654892398684e-10, + 3.300854312104917e-10, + 3.3006170019334036e-10, + 3.300271445016989e-10 + ], + "gamma_dfa": -0.00030547842834494077, + "acc_eval": 0.0888671875, + "loss_eval": 2.3098697662353516, + "epoch": 70 + }, + { + "hidden_norms": [ + 10571.28515625, + 85669488.0, + 115961600.0, + 136359216.0, + 148233216.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3427733369653083e-09, + 9.57579241595008e-12, + 9.569240365381315e-12, + 9.571362799554173e-12, + 9.572694199821985e-12 + ], + "bp_grad_norms_F": [ + 3.248615314532799e-07, + 3.252469404912972e-10, + 3.2484867573678855e-10, + 3.24500371018388e-10, + 3.244539636959587e-10 + ], + "gamma_dfa": -0.0020247000393283088, + "acc_eval": 0.1142578125, + "loss_eval": 2.2976913452148438, + "epoch": 71 + }, + { + "hidden_norms": [ + 10612.2607421875, + 86644544.0, + 117219120.0, + 137880144.0, + 149864576.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2906055113504067e-09, + 9.509206790048186e-12, + 9.47129093903376e-12, + 9.464854247576149e-12, + 9.465737221825421e-12 + ], + "bp_grad_norms_F": [ + 2.801213554448623e-07, + 3.198223630374031e-10, + 3.183240893100958e-10, + 3.1834490599180754e-10, + 3.1827357416247537e-10 + ], + "gamma_dfa": -0.001203124011226464, + "acc_eval": 0.10546875, + "loss_eval": 2.3055059909820557, + "epoch": 72 + }, + { + "hidden_norms": [ + 10637.9248046875, + 87766232.0, + 118693968.0, + 139534048.0, + 151658064.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.839014827202504e-10, + 9.328608198411192e-12, + 9.353431223990682e-12, + 9.345346545230893e-12, + 9.345603284305337e-12 + ], + "bp_grad_norms_F": [ + 2.646772543357656e-07, + 3.13234327364853e-10, + 3.120789182631256e-10, + 3.1186964122298377e-10, + 3.118231783894032e-10 + ], + "gamma_dfa": -0.0021326720525394194, + "acc_eval": 0.1201171875, + "loss_eval": 2.3003604412078857, + "epoch": 73 + }, + { + "hidden_norms": [ + 10656.4482421875, + 88713800.0, + 119968392.0, + 141039184.0, + 153268816.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.779404980785444e-10, + 9.102603219790506e-12, + 9.076880740088722e-12, + 9.072962867118228e-12, + 9.071843970476223e-12 + ], + "bp_grad_norms_F": [ + 2.0230599773185531e-07, + 3.0828151142969773e-10, + 3.0691377217451077e-10, + 3.067752996077644e-10, + 3.0672925310781807e-10 + ], + "gamma_dfa": 0.00048369063733844087, + "acc_eval": 0.0908203125, + "loss_eval": 2.3012309074401855, + "epoch": 74 + }, + { + "hidden_norms": [ + 10672.1494140625, + 89505176.0, + 120986568.0, + 142222336.0, + 154574096.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.261312272634825e-10, + 9.015565204106846e-12, + 8.995597669536615e-12, + 8.994238513693187e-12, + 8.993757127928603e-12 + ], + "bp_grad_norms_F": [ + 2.1154608020879095e-07, + 3.072229692868689e-10, + 3.052531283298521e-10, + 3.0519622939984004e-10, + 3.051366936901445e-10 + ], + "gamma_dfa": -0.0005316346723702736, + "acc_eval": 0.11328125, + "loss_eval": 2.3040223121643066, + "epoch": 75 + }, + { + "hidden_norms": [ + 10723.896484375, + 90374152.0, + 122032824.0, + 143367616.0, + 155819504.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.261785617274086e-10, + 8.993932334999677e-12, + 8.987987437647504e-12, + 8.987462683796021e-12, + 8.98797182513622e-12 + ], + "bp_grad_norms_F": [ + 1.5789649410180573e-07, + 3.019114402924572e-10, + 3.00178187861988e-10, + 2.999948345294712e-10, + 2.9999083772658253e-10 + ], + "gamma_dfa": -0.0012852016006945632, + "acc_eval": 0.0830078125, + "loss_eval": 2.3029680252075195, + "epoch": 76 + }, + { + "hidden_norms": [ + 10752.4677734375, + 91243824.0, + 123139408.0, + 144679744.0, + 157141888.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0187789500903932e-09, + 8.908308986310676e-12, + 8.877474276525188e-12, + 8.871863313442141e-12, + 8.872454854147449e-12 + ], + "bp_grad_norms_F": [ + 2.2995939730208192e-07, + 2.996720371850614e-10, + 2.9733623896355255e-10, + 2.9736765827514944e-10, + 2.9736227369348e-10 + ], + "gamma_dfa": 0.0009152928978437558, + "acc_eval": 0.078125, + "loss_eval": 2.3087785243988037, + "epoch": 77 + }, + { + "hidden_norms": [ + 10774.716796875, + 91815512.0, + 124004224.0, + 145694656.0, + 158276032.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.046535660000131e-10, + 8.72336057555767e-12, + 8.693952675831174e-12, + 8.687773590809744e-12, + 8.688093647291062e-12 + ], + "bp_grad_norms_F": [ + 1.826059730092311e-07, + 2.946680122128953e-10, + 2.92846163985061e-10, + 2.9275293300656813e-10, + 2.927521280948753e-10 + ], + "gamma_dfa": 0.0014372464029293042, + "acc_eval": 0.064453125, + "loss_eval": 2.3071916103363037, + "epoch": 78 + }, + { + "hidden_norms": [ + 10790.939453125, + 92420488.0, + 124895360.0, + 146715424.0, + 159350832.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.62354623873307e-10, + 8.534323421571788e-12, + 8.523472726229553e-12, + 8.523020830764061e-12, + 8.520370173292768e-12 + ], + "bp_grad_norms_F": [ + 2.139736210438059e-07, + 2.9157729009021693e-10, + 2.8999641576987756e-10, + 2.899117335086743e-10, + 2.898933315620411e-10 + ], + "gamma_dfa": 0.0007644326506124344, + "acc_eval": 0.107421875, + "loss_eval": 2.307311534881592, + "epoch": 79 + }, + { + "hidden_norms": [ + 10804.537109375, + 93059200.0, + 125634128.0, + 147548304.0, + 160277184.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.631766802378536e-10, + 8.465870365848005e-12, + 8.435890007374436e-12, + 8.433719868305989e-12, + 8.432757096776822e-12 + ], + "bp_grad_norms_F": [ + 1.5449778345555387e-07, + 2.894649520079895e-10, + 2.876322513500895e-10, + 2.8752078495841715e-10, + 2.8753605052500575e-10 + ], + "gamma_dfa": -0.0008484880891046487, + "acc_eval": 0.0703125, + "loss_eval": 2.3064723014831543, + "epoch": 80 + }, + { + "hidden_norms": [ + 10826.3466796875, + 93631016.0, + 126376416.0, + 148363712.0, + 161162256.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.068867630659724e-10, + 8.39008376662953e-12, + 8.381075347618783e-12, + 8.379246949075103e-12, + 8.377123647540508e-12 + ], + "bp_grad_norms_F": [ + 1.5745726500426827e-07, + 2.870276794020299e-10, + 2.8557434195164433e-10, + 2.853116076728668e-10, + 2.853256519941283e-10 + ], + "gamma_dfa": -0.0032648725573380943, + "acc_eval": 0.09375, + "loss_eval": 2.301131248474121, + "epoch": 81 + }, + { + "hidden_norms": [ + 10839.0986328125, + 94148792.0, + 127019560.0, + 149143280.0, + 162023376.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.829024042278917e-10, + 8.344799677650894e-12, + 8.329600897916123e-12, + 8.328910477972684e-12, + 8.32927910671133e-12 + ], + "bp_grad_norms_F": [ + 1.0639800507306063e-07, + 2.8474167468317546e-10, + 2.829097234258171e-10, + 2.8278687724814233e-10, + 2.827818257333803e-10 + ], + "gamma_dfa": 0.0004431852612469811, + "acc_eval": 0.1240234375, + "loss_eval": 2.302319049835205, + "epoch": 82 + }, + { + "hidden_norms": [ + 10845.5009765625, + 94622624.0, + 127620392.0, + 149820912.0, + 162751232.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.976296597014596e-10, + 8.380781311989605e-12, + 8.37097405281817e-12, + 8.368299109218214e-12, + 8.368221046661795e-12 + ], + "bp_grad_norms_F": [ + 1.5657094820653583e-07, + 2.842148183468396e-10, + 2.8250898842507866e-10, + 2.8236088467359366e-10, + 2.8235377924623606e-10 + ], + "gamma_dfa": 0.0011154523126606364, + "acc_eval": 0.0859375, + "loss_eval": 2.3030214309692383, + "epoch": 83 + }, + { + "hidden_norms": [ + 10858.826171875, + 95010072.0, + 128124352.0, + 150449040.0, + 163406224.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.707155303902312e-10, + 8.22641173930938e-12, + 8.219256872332714e-12, + 8.215187211058073e-12, + 8.215540227285434e-12 + ], + "bp_grad_norms_F": [ + 1.3043053570527263e-07, + 2.814159738573352e-10, + 2.796477494015903e-10, + 2.795675912992124e-10, + 2.7956112425009394e-10 + ], + "gamma_dfa": 0.00044634643927565776, + "acc_eval": 0.0849609375, + "loss_eval": 2.3043744564056396, + "epoch": 84 + }, + { + "hidden_norms": [ + 10870.2197265625, + 95329544.0, + 128596424.0, + 150994576.0, + 163991392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.56519053063198e-10, + 8.213814177426837e-12, + 8.202234898224692e-12, + 8.199945063236402e-12, + 8.200029197324987e-12 + ], + "bp_grad_norms_F": [ + 1.2775484492522082e-07, + 2.8084765069102957e-10, + 2.791658848533274e-10, + 2.790815634146071e-10, + 2.7906171817804193e-10 + ], + "gamma_dfa": 0.00020755327568622306, + "acc_eval": 0.083984375, + "loss_eval": 2.3030991554260254, + "epoch": 85 + }, + { + "hidden_norms": [ + 10879.8818359375, + 95701368.0, + 129014928.0, + 151496160.0, + 164549552.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.791080475743172e-10, + 8.169613423258948e-12, + 8.157244844875233e-12, + 8.15449097135712e-12, + 8.153281869094364e-12 + ], + "bp_grad_norms_F": [ + 1.5473247572117543e-07, + 2.7922636425259384e-10, + 2.774635243785184e-10, + 2.7745489239450194e-10, + 2.774172003228159e-10 + ], + "gamma_dfa": 3.1085157388588414e-05, + "acc_eval": 0.1064453125, + "loss_eval": 2.303433418273926, + "epoch": 86 + }, + { + "hidden_norms": [ + 10884.3349609375, + 95902000.0, + 129303088.0, + 151867408.0, + 164970960.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.919178953066705e-10, + 8.147189520246734e-12, + 8.125238329381723e-12, + 8.123910398560863e-12, + 8.123323194664245e-12 + ], + "bp_grad_norms_F": [ + 9.07293014051902e-08, + 2.7798055524108634e-10, + 2.7618457520972584e-10, + 2.761503803405674e-10, + 2.7613575315221794e-10 + ], + "gamma_dfa": -0.0002183817014156375, + "acc_eval": 0.0849609375, + "loss_eval": 2.304762363433838, + "epoch": 87 + }, + { + "hidden_norms": [ + 10897.5751953125, + 96208496.0, + 129661472.0, + 152266096.0, + 165380960.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.258827817655742e-10, + 8.113974769852206e-12, + 8.097599847600723e-12, + 8.095455729384415e-12, + 8.095571955857306e-12 + ], + "bp_grad_norms_F": [ + 1.5276340548098233e-07, + 2.7692478865581904e-10, + 2.752131300631788e-10, + 2.751227301533987e-10, + 2.751290584246391e-10 + ], + "gamma_dfa": 0.0012931385499541648, + "acc_eval": 0.08203125, + "loss_eval": 2.3039329051971436, + "epoch": 88 + }, + { + "hidden_norms": [ + 10904.84375, + 96462512.0, + 129958240.0, + 152599856.0, + 165729872.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.247893786197722e-10, + 8.085110705935428e-12, + 8.072378702983496e-12, + 8.07249319473291e-12, + 8.071344807791814e-12 + ], + "bp_grad_norms_F": [ + 1.0969206698518974e-07, + 2.758918649092834e-10, + 2.7459995388667835e-10, + 2.7444016503785917e-10, + 2.7442872974070553e-10 + ], + "gamma_dfa": -0.00021380887119448744, + "acc_eval": 0.1181640625, + "loss_eval": 2.3010976314544678, + "epoch": 89 + }, + { + "hidden_norms": [ + 10912.2958984375, + 96621360.0, + 130177664.0, + 152860160.0, + 166016640.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.230118005350448e-10, + 8.057754116719273e-12, + 8.04393184006269e-12, + 8.043486016129364e-12, + 8.04203491994171e-12 + ], + "bp_grad_norms_F": [ + 1.1847043168700111e-07, + 2.7523416878949547e-10, + 2.739179438826511e-10, + 2.7376986788674174e-10, + 2.7375315903022113e-10 + ], + "gamma_dfa": -0.00048403643450001255, + "acc_eval": 0.1083984375, + "loss_eval": 2.3003616333007812, + "epoch": 90 + }, + { + "hidden_norms": [ + 10917.05859375, + 96728752.0, + 130332528.0, + 153046592.0, + 166225136.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.476303216982558e-10, + 8.051880343029616e-12, + 8.02496437357636e-12, + 8.026921141657262e-12, + 8.025202898054307e-12 + ], + "bp_grad_norms_F": [ + 9.623265384561819e-08, + 2.746256555496984e-10, + 2.7323307505433547e-10, + 2.730623227531481e-10, + 2.73067457534637e-10 + ], + "gamma_dfa": -0.0015982053701009136, + "acc_eval": 0.125, + "loss_eval": 2.3003616333007812, + "epoch": 91 + }, + { + "hidden_norms": [ + 10923.0517578125, + 96870376.0, + 130487432.0, + 153217872.0, + 166403392.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7786268558548386e-10, + 8.030507682443844e-12, + 8.02036388691807e-12, + 8.021478446751384e-12, + 8.020081126991485e-12 + ], + "bp_grad_norms_F": [ + 8.926052430524578e-08, + 2.743367200075397e-10, + 2.7284480230704844e-10, + 2.726960879328999e-10, + 2.7270555258418483e-10 + ], + "gamma_dfa": -0.0004921842846670188, + "acc_eval": 0.125, + "loss_eval": 2.300823211669922, + "epoch": 92 + }, + { + "hidden_norms": [ + 10922.423828125, + 96967520.0, + 130610968.0, + 153345712.0, + 166543008.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.468065084584083e-10, + 8.020029952648944e-12, + 8.011922722483966e-12, + 8.012338188756463e-12, + 8.013246316496137e-12 + ], + "bp_grad_norms_F": [ + 1.1504861419098233e-07, + 2.742139570965918e-10, + 2.7267893498716944e-10, + 2.725325520813726e-10, + 2.725419612215063e-10 + ], + "gamma_dfa": -0.0009440958092454821, + "acc_eval": 0.1201171875, + "loss_eval": 2.3005006313323975, + "epoch": 93 + }, + { + "hidden_norms": [ + 10924.3486328125, + 97010512.0, + 130686240.0, + 153444928.0, + 166653632.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.0347483687419583e-10, + 8.026363428059735e-12, + 8.013480504165393e-12, + 8.012077980235066e-12, + 8.010573107619656e-12 + ], + "bp_grad_norms_F": [ + 9.41274009846893e-08, + 2.740666027456484e-10, + 2.725613068577104e-10, + 2.7241114919362985e-10, + 2.7241911504383154e-10 + ], + "gamma_dfa": -0.0009883725906547625, + "acc_eval": 0.1240234375, + "loss_eval": 2.3007426261901855, + "epoch": 94 + }, + { + "hidden_norms": [ + 10926.5390625, + 97067000.0, + 130754976.0, + 153525008.0, + 166741232.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.34201924415234e-10, + 8.020669198249841e-12, + 8.007470554682872e-12, + 8.006251911440998e-12, + 8.004616067203152e-12 + ], + "bp_grad_norms_F": [ + 9.773965103931914e-08, + 2.7412291880857254e-10, + 2.725366043954125e-10, + 2.7240124045313507e-10, + 2.724127867725912e-10 + ], + "gamma_dfa": -0.0006572065904038027, + "acc_eval": 0.1240234375, + "loss_eval": 2.3012468814849854, + "epoch": 95 + }, + { + "hidden_norms": [ + 10928.3896484375, + 97092400.0, + 130798760.0, + 153578400.0, + 166798624.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.0636483067402196e-10, + 8.025032895153661e-12, + 8.005560624135821e-12, + 8.006460078258115e-12, + 8.00502199249653e-12 + ], + "bp_grad_norms_F": [ + 9.727948935278619e-08, + 2.740962179448303e-10, + 2.725039638384885e-10, + 2.72373013032734e-10, + 2.723824221728677e-10 + ], + "gamma_dfa": -0.0003809257905231789, + "acc_eval": 0.1240234375, + "loss_eval": 2.3011176586151123, + "epoch": 96 + }, + { + "hidden_norms": [ + 10928.3759765625, + 97099208.0, + 130815104.0, + 153601264.0, + 166826208.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.9727551803814265e-10, + 8.031460045632155e-12, + 8.006649163116997e-12, + 8.006433190044238e-12, + 8.007052486325161e-12 + ], + "bp_grad_norms_F": [ + 8.93527598577748e-08, + 2.7405827607296374e-10, + 2.7247276657149655e-10, + 2.723416214767127e-10, + 2.723492820155826e-10 + ], + "gamma_dfa": -0.00030210223485482857, + "acc_eval": 0.1240234375, + "loss_eval": 2.301220178604126, + "epoch": 97 + }, + { + "hidden_norms": [ + 10928.6552734375, + 97115416.0, + 130835856.0, + 153625952.0, + 166852032.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.794573821824798e-10, + 8.030101757150465e-12, + 8.005353324680442e-12, + 8.005096585605997e-12, + 8.00570807563128e-12 + ], + "bp_grad_norms_F": [ + 8.692392583498076e-08, + 2.739931892481451e-10, + 2.724127867725912e-10, + 2.7228078125496324e-10, + 2.7228858057171124e-10 + ], + "gamma_dfa": -0.00032888483474380337, + "acc_eval": 0.1240234375, + "loss_eval": 2.3012919425964355, + "epoch": 98 + }, + { + "hidden_norms": [ + 10928.8115234375, + 97125048.0, + 130846640.0, + 153637296.0, + 166864480.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7600883517896477e-10, + 8.028339278098873e-12, + 8.003602121331443e-12, + 8.003305483617051e-12, + 8.003913504195381e-12 + ], + "bp_grad_norms_F": [ + 8.798993178515957e-08, + 2.7396546142810507e-10, + 2.7238306055110684e-10, + 2.7225180443402053e-10, + 2.7225932619501236e-10 + ], + "gamma_dfa": -0.0003425047798373271, + "acc_eval": 0.1240234375, + "loss_eval": 2.301285743713379, + "epoch": 99 + }, + { + "hidden_norms": [ + 10928.8310546875, + 97125584.0, + 130847152.0, + 153637792.0, + 166864928.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7847944223123875e-10, + 8.028382646185772e-12, + 8.003642019971391e-12, + 8.00335752532133e-12, + 8.003966413261399e-12 + ], + "bp_grad_norms_F": [ + 8.822269847996722e-08, + 2.739633520043583e-10, + 2.7238253319517014e-10, + 2.7225077747772275e-10, + 2.7225843801659266e-10 + ], + "gamma_dfa": -0.0003516010765451938, + "acc_eval": 0.1240234375, + "loss_eval": 2.301274299621582, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/optionA_smoke/snapshot_evolution_s42.json b/results/optionA_smoke/snapshot_evolution_s42.json new file mode 100644 index 0000000..86fedde --- /dev/null +++ b/results/optionA_smoke/snapshot_evolution_s42.json @@ -0,0 +1,130 @@ +{ + "config": { + "output_dir": "results/optionA_smoke", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": false, + "w2_std": 0.01, + "random_targets": true, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": 0.007406219025142491, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 290.9817199707031, + 627.6629028320312, + 1287.7171630859375, + 1459.1513671875, + 1616.4718017578125 + ], + "bp_grad_norms_per_sample_med": [ + 5.262210834189318e-06, + 5.14477824253845e-06, + 5.1224119488324504e-06, + 5.1222677939222194e-06, + 5.123215942148818e-06 + ], + "bp_grad_norms_F": [ + 0.0008317740284837782, + 0.0008041572291404009, + 0.0007967103738337755, + 0.0007942747906781733, + 0.0007939037750475109 + ], + "gamma_dfa": -0.01952565903775394, + "acc_eval": 0.078125, + "loss_eval": 2.3129711151123047, + "epoch": 1 + }, + { + "hidden_norms": [ + 467.1022644042969, + 3057.49267578125, + 7424.37353515625, + 8857.5537109375, + 9767.6162109375 + ], + "bp_grad_norms_per_sample_med": [ + 9.694709888208308e-07, + 8.50241519856354e-07, + 8.498120678268606e-07, + 8.498261649947381e-07, + 8.499836781084014e-07 + ], + "bp_grad_norms_F": [ + 0.0005667012883350253, + 0.0005514815566129982, + 0.0005513231735676527, + 0.0005382975214160979, + 0.0005368698039092124 + ], + "gamma_dfa": -0.02370089991018176, + "acc_eval": 0.0810546875, + "loss_eval": 2.320453643798828, + "epoch": 2 + }, + { + "hidden_norms": [ + 524.08203125, + 4883.1953125, + 11064.0263671875, + 13177.29296875, + 14508.083984375 + ], + "bp_grad_norms_per_sample_med": [ + 6.069666369512561e-07, + 5.623286938316596e-07, + 5.621984087156306e-07, + 5.621164973490522e-07, + 5.620748311230273e-07 + ], + "bp_grad_norms_F": [ + 0.0005193821853026748, + 0.0004981618840247393, + 0.0004926337860524654, + 0.0004888861440122128, + 0.0004883570945821702 + ], + "gamma_dfa": -0.024675255175679922, + "acc_eval": 0.0712890625, + "loss_eval": 2.3067145347595215, + "epoch": 3 + } + ] +} \ No newline at end of file diff --git a/results/optionEP_random_targets_full.log b/results/optionEP_random_targets_full.log new file mode 100644 index 0000000..0316f6a --- /dev/null +++ b/results/optionEP_random_targets_full.log @@ -0,0 +1,7 @@ +[ep_random s=42] Training EP beta=0.5 T=20 alpha=0.1 + Ep 20: acc=0.0996 + Ep 40: acc=0.0631 + Ep 60: acc=0.0555 + Ep 80: acc=0.0669 + Ep 100: acc=0.0808 +[ep_random s=42] acc=0.0808 Γ=-0.0003 ρ=-0.0056 nse=0.7162 diff --git a/results/optionEP_random_targets_full/ep_random_s42.json b/results/optionEP_random_targets_full/ep_random_s42.json new file mode 100644 index 0000000..15c8f89 --- /dev/null +++ b/results/optionEP_random_targets_full/ep_random_s42.json @@ -0,0 +1,23 @@ +{ + "method": "ep_random", + "seed": 42, + "acc": 0.0808, + "Gamma": -0.00029538582612076425, + "rho": -0.005596753908321261, + "naive_StateErr": 0.7161955833435059, + "gammas_per_layer": [ + 0.0, + 0.0018188292160630226, + 1.8913333406089805e-05, + -0.0030192858539521694 + ], + "rhos_per_layer": [ + 0.0, + 0.010634900070726871, + 0.0, + -0.03302191570401192 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +} \ No newline at end of file diff --git a/results/optionEP_smoke/ep_random_s42.json b/results/optionEP_smoke/ep_random_s42.json new file mode 100644 index 0000000..c6cbbf0 --- /dev/null +++ b/results/optionEP_smoke/ep_random_s42.json @@ -0,0 +1,23 @@ +{ + "method": "ep_random", + "seed": 42, + "acc": 0.1265, + "Gamma": 0.00786564577720128, + "rho": 0.00806531310081482, + "naive_StateErr": 1.4184660911560059, + "gammas_per_layer": [ + 0.0, + 0.0019382296595722437, + 0.0007031346904113889, + 0.028821218758821487 + ], + "rhos_per_layer": [ + 0.0, + 0.0, + 0.0, + 0.03226125240325928 + ], + "beta": 0.5, + "T_nudge": 20, + "alpha_nudge": 0.1 +} \ No newline at end of file diff --git a/results/optionSBCB_random_targets_s42.log b/results/optionSBCB_random_targets_s42.log new file mode 100644 index 0000000..8c08124 --- /dev/null +++ b/results/optionSBCB_random_targets_s42.log @@ -0,0 +1,36 @@ +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- State Bridge --- + [SB] Epoch 1: loss=2.3230, train=0.0991, test=0.1088, state_err=0.1329 + [SB] Epoch 10: loss=2.3119, train=0.1013, test=0.1006, state_err=0.0093 + [SB] Epoch 20: loss=2.3074, train=0.1005, test=0.0925, state_err=0.0028 + [SB] Epoch 30: loss=2.3057, train=0.0977, test=0.0999, state_err=0.1014 + [SB] Epoch 40: loss=2.3052, train=0.1000, test=0.0998, state_err=0.0015 + [SB] Epoch 50: loss=2.3054, train=0.0998, test=0.0946, state_err=0.0032 + [SB] Epoch 60: loss=2.3046, train=0.0990, test=0.1000, state_err=0.0014 + [SB] Epoch 70: loss=2.3035, train=0.1014, test=0.0980, state_err=0.0009 + [SB] Epoch 80: loss=2.3029, train=0.0996, test=0.0993, state_err=0.0004 + [SB] Epoch 90: loss=2.3027, train=0.1008, test=0.0999, state_err=0.0004 + [SB] Epoch 100: loss=2.3026, train=0.1006, test=0.0998, state_err=0.0003 + Final test acc: 0.0998 + +--- Credit Bridge --- + [CB] Warmup phase: 20 epochs (DFA fallback + value net training) + [CB] Epoch 1 (warmup): loss=2.3207, train=0.0995, test=0.0998, vloss=0.360249 + [CB] Epoch 10 (warmup): loss=2.3105, train=0.0983, test=0.1014, vloss=0.015749 + [CB] Epoch 20 (warmup): loss=2.3073, train=0.0997, test=0.1000, vloss=0.010331 + [CB] Epoch 30 (blend=0.50): loss=2.3055, train=0.1029, test=0.1000, vloss=0.005910 + [CB] Epoch 40 (blend=1.00): loss=2.3037, train=0.1006, test=0.0993, vloss=0.001187 + [CB] Epoch 50 (blend=1.00): loss=2.3034, train=0.0978, test=0.0911, vloss=0.000232 + [CB] Epoch 60 (blend=1.00): loss=2.3031, train=0.0997, test=0.1149, vloss=0.000103 + [CB] Epoch 70 (blend=1.00): loss=2.3028, train=0.1001, test=0.0758, vloss=0.000054 + [CB] Epoch 80 (blend=1.00): loss=2.3027, train=0.0996, test=0.1083, vloss=0.000021 + [CB] Epoch 90 (blend=1.00): loss=2.3027, train=0.0976, test=0.0858, vloss=0.000024 + [CB] Epoch 100 (blend=1.00): loss=2.3026, train=0.0990, test=0.0853, vloss=0.000002 + Final test acc: 0.0853 + +All results saved to results/optionSBCB_random_targets_s42/results_cifar10.json diff --git a/results/optionSBCB_random_targets_s42/results_cifar10.json b/results/optionSBCB_random_targets_s42/results_cifar10.json new file mode 100644 index 0000000..1fe6e59 --- /dev/null +++ b/results/optionSBCB_random_targets_s42/results_cifar10.json @@ -0,0 +1,996 @@ +{ + "42": { + "state_bridge": { + "log": { + "train_loss": [ + 2.32298729019165, + 2.3185904444122314, + 2.3158486935424807, + 2.3151270526123047, + 2.3153048554992677, + 2.313692629928589, + 2.3122592738342287, + 2.3125808728790282, + 2.313471165390015, + 2.3118894706726074, + 2.3125988877868653, + 2.3099629015350343, + 2.31041740196228, + 2.3091588230133056, + 2.3091439936828615, + 2.3106198542785643, + 2.3083640133666994, + 2.3086931996154787, + 2.309051240081787, + 2.3074020581054686, + 2.3068838215637206, + 2.307295061187744, + 2.3084519975280764, + 2.307104247512817, + 2.3071147785949706, + 2.3060205638122557, + 2.306451601409912, + 2.306119982833862, + 2.3060072847747803, + 2.305727400512695, + 2.306379800872803, + 2.3064919486999513, + 2.305928258132935, + 2.3056776414489746, + 2.3055357105255125, + 2.3050391822052, + 2.3047298907470704, + 2.3049536168670652, + 2.304167579269409, + 2.3051955548858643, + 2.305130446929932, + 2.305691002731323, + 2.3054561265563964, + 2.3053656420898436, + 2.3066579315948488, + 2.307786160964966, + 2.30552385055542, + 2.3060861295318604, + 2.3058279441833496, + 2.3054451098632813, + 2.3063634481811524, + 2.3052050663757324, + 2.3048459218597412, + 2.3044755393981933, + 2.3043885823059083, + 2.304098957672119, + 2.3039053114318846, + 2.304439072341919, + 2.3049430378723144, + 2.304635962142944, + 2.3039317012023925, + 2.3042490730285645, + 2.3039936375427246, + 2.3039682440185545, + 2.3040738610839844, + 2.3039017552185057, + 2.303662957687378, + 2.303627054824829, + 2.303579069137573, + 2.303518524169922, + 2.3034945246887206, + 2.3033056853485108, + 2.3032505568695067, + 2.3031821016693117, + 2.3032670336151124, + 2.3031894248199465, + 2.3030360176849367, + 2.30285311958313, + 2.3028978575897217, + 2.3029318421173097, + 2.302868471298218, + 2.3028548345947266, + 2.3028144734191893, + 2.3028969371795656, + 2.302703039703369, + 2.302848923034668, + 2.3027575202941897, + 2.3027942278289797, + 2.3028129412078857, + 2.3027255848693846, + 2.3026459377288817, + 2.3026881690979004, + 2.3025801965332033, + 2.3026949546813964, + 2.302636395187378, + 2.302556064605713, + 2.3025378968048096, + 2.302605783843994, + 2.3026791831207274, + 2.3026494352722167 + ], + "train_acc": [ + 0.09906, + 0.09794, + 0.10148, + 0.10038, + 0.10258, + 0.09924, + 0.10072, + 0.10158, + 0.10112, + 0.10128, + 0.10144, + 0.09974, + 0.1014, + 0.09986, + 0.10036, + 0.09864, + 0.0989, + 0.101, + 0.1003, + 0.10046, + 0.10232, + 0.1005, + 0.09898, + 0.10104, + 0.10058, + 0.0996, + 0.09946, + 0.09874, + 0.10022, + 0.09774, + 0.09808, + 0.09882, + 0.10142, + 0.1015, + 0.10032, + 0.09838, + 0.09716, + 0.09878, + 0.10184, + 0.09998, + 0.10034, + 0.0989, + 0.09914, + 0.1004, + 0.1008, + 0.09762, + 0.10064, + 0.0989, + 0.09826, + 0.09978, + 0.10004, + 0.10138, + 0.10118, + 0.10056, + 0.09994, + 0.09978, + 0.10034, + 0.0988, + 0.0996, + 0.09896, + 0.10002, + 0.0988, + 0.10028, + 0.09918, + 0.09862, + 0.10198, + 0.10266, + 0.09906, + 0.09944, + 0.10142, + 0.09912, + 0.09904, + 0.10118, + 0.10022, + 0.10228, + 0.09686, + 0.1019, + 0.10114, + 0.104, + 0.09958, + 0.10062, + 0.10074, + 0.0992, + 0.09988, + 0.0999, + 0.09896, + 0.09954, + 0.09946, + 0.09852, + 0.10076, + 0.09788, + 0.0983, + 0.10424, + 0.09984, + 0.0976, + 0.10156, + 0.10294, + 0.10108, + 0.09884, + 0.1006 + ], + "test_acc": [ + 0.1088, + 0.138, + 0.0905, + 0.1056, + 0.1109, + 0.0922, + 0.1103, + 0.1, + 0.0998, + 0.1006, + 0.1, + 0.0959, + 0.1026, + 0.0999, + 0.1, + 0.1018, + 0.1, + 0.1003, + 0.1075, + 0.0925, + 0.1001, + 0.1, + 0.1, + 0.1003, + 0.1, + 0.1003, + 0.0999, + 0.0955, + 0.1005, + 0.0999, + 0.1029, + 0.1001, + 0.1017, + 0.1, + 0.0937, + 0.1056, + 0.1015, + 0.1001, + 0.0968, + 0.0998, + 0.1, + 0.1083, + 0.0852, + 0.1079, + 0.0999, + 0.1108, + 0.0996, + 0.1001, + 0.104, + 0.0946, + 0.1036, + 0.1, + 0.0929, + 0.0997, + 0.1017, + 0.0993, + 0.1002, + 0.1, + 0.0892, + 0.1, + 0.0943, + 0.099, + 0.1061, + 0.1089, + 0.0843, + 0.0881, + 0.1148, + 0.1, + 0.1065, + 0.098, + 0.1, + 0.1, + 0.1039, + 0.0974, + 0.1001, + 0.1, + 0.1, + 0.0975, + 0.1078, + 0.0993, + 0.1, + 0.1098, + 0.1, + 0.1, + 0.0999, + 0.1011, + 0.1044, + 0.0855, + 0.0975, + 0.0999, + 0.0848, + 0.0864, + 0.1, + 0.0999, + 0.1039, + 0.094, + 0.0998, + 0.1002, + 0.0998, + 0.0998 + ], + "state_pred_error": [ + 0.13290744504570962, + 0.05252796378970146, + 0.05407449979066849, + 0.012723014710843562, + 0.03147433119058609, + 0.0455251266348362, + 0.01910994484335184, + 0.019099523594379424, + 0.015751069682836533, + 0.0093136414475739, + 0.005163116856366396, + 0.003956335656419396, + 0.004066170732825994, + 0.003421303847208619, + 0.020249373012185098, + 0.006719221432805061, + 0.007660316131561994, + 0.007611995658054948, + 0.004069334329739213, + 0.0028237356878444554, + 0.005142735574692488, + 0.003180019078627229, + 0.001071608488690108, + 0.0007959920338075608, + 0.000777043921276927, + 0.0015644667147099972, + 0.0020243185171112416, + 0.0013769650426506996, + 0.0008027051600441337, + 0.10135034220349044, + 0.3592664433415234, + 0.0031333496563881636, + 0.0029901706556975842, + 0.003235732616111636, + 0.0025980014257133005, + 0.0019967163011431694, + 0.0017620279234647751, + 0.0009231308926269412, + 0.0011702621114999055, + 0.001455627773553133, + 0.0028734958547353743, + 0.00217839173682034, + 0.001414939113482833, + 0.002224961518794298, + 0.005019752886593342, + 0.0033501896389573813, + 0.0018752670540288091, + 0.002304783008992672, + 0.0020676382119581105, + 0.0032032441549003123, + 0.004387096659913659, + 0.0027462033197283744, + 0.002064991759210825, + 0.0015633385695517064, + 0.0011060501547902823, + 0.0007784349711425603, + 0.0012399623063206672, + 0.0022491385858505963, + 0.0017803974036499858, + 0.0013839073456265033, + 0.0010726766408234835, + 0.0013289928095042705, + 0.0012933978212624788, + 0.0013343172781541944, + 0.001423728218227625, + 0.001325902522802353, + 0.0014321199620887636, + 0.0011931503067910672, + 0.001112698319144547, + 0.0009289030161872506, + 0.0009111916594952345, + 0.0007278604841418565, + 0.0006102696084231138, + 0.0006784520456194877, + 0.0007001932211592794, + 0.0006026263131946325, + 0.0005048922867048532, + 0.0005200714689865708, + 0.000486190369669348, + 0.0004406700743548572, + 0.00040038736144080755, + 0.00039187494518235324, + 0.0003871953769773245, + 0.00034735567714087667, + 0.0003704729523416609, + 0.00034192379067651927, + 0.00037344998602289705, + 0.0004422298234142363, + 0.000440553223779425, + 0.00043767732299864295, + 0.0004164460501912981, + 0.00045337298782542347, + 0.00044001577839720995, + 0.00043210198022890835, + 0.00040001162990927695, + 0.0003860502710286528, + 0.00038501776825636627, + 0.0003684677713084966, + 0.00036683685765601695, + 0.00033739448758307843 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6627534627914429, + 0.03649301826953888, + 0.043565794825553894, + 0.048895061016082764 + ], + "perturbation_rho": [ + 0.03883039206266403, + -0.04418192803859711, + -0.003731100121513009, + 0.02374821901321411 + ], + "nudging": { + "0.001": [ + -1.434236764907837e-07, + -9.313225746154785e-09, + -1.862645149230957e-09, + -1.862645149230957e-09 + ], + "0.003": [ + -4.2282044887542725e-07, + -7.450580596923828e-09, + -3.725290298461914e-09, + -3.725290298461914e-09 + ], + "0.01": [ + -1.4491379261016846e-06, + -1.30385160446167e-08, + -7.450580596923828e-09, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 1560.4844970703125, + 310652.0, + 331761.15625, + 353089.875, + 360185.46875 + ], + "bp_grad_norms_per_layer": [ + 1.1365173691046948e-07, + 3.573703466486222e-08, + 3.5727047986711113e-08, + 3.5704797340940786e-08, + 3.5682791832414296e-08 + ] + }, + "drift": { + "embed.weight": 13.043507815424693, + "embed.bias": 29.86588313039489, + "blocks.0.ln.weight": 0.5166860818862915, + "blocks.0.w1.weight": 19.360717044257658, + "blocks.0.w1.bias": 29.004801946636565, + "blocks.0.w2.weight": 48.30789617700896, + "blocks.1.ln.weight": 0.7842006087303162, + "blocks.1.w1.weight": 11.791182182499824, + "blocks.1.w1.bias": 14.273464699248207, + "blocks.1.w2.weight": 28.503463313166364, + "blocks.2.ln.weight": 0.8836206793785095, + "blocks.2.w1.weight": 14.733152570313322, + "blocks.2.w1.bias": 17.480997129225248, + "blocks.2.w2.weight": 27.771171107294236, + "blocks.3.ln.weight": 0.665003776550293, + "blocks.3.w1.weight": 15.147301138898312, + "blocks.3.w1.bias": 21.234292438770414, + "blocks.3.w2.weight": 38.43138288142111, + "out_ln.weight": 0.7085357308387756, + "out_head.weight": 0.5498378159761019, + "out_head.bias": 0.35831333543785815 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.320697575531006, + 2.314502516784668, + 2.314460542755127, + 2.312608349685669, + 2.3133283112335206, + 2.3133729998779295, + 2.312248833694458, + 2.311172733535767, + 2.3115486805725096, + 2.3104688677978515, + 2.3109971079254152, + 2.310881831817627, + 2.310004387893677, + 2.309491654586792, + 2.3095546392822266, + 2.3100841890716555, + 2.3085610353088377, + 2.308080646286011, + 2.3075632568359374, + 2.307347955932617, + 2.3074126527404784, + 2.307658705368042, + 2.3073503659057617, + 2.306713535614014, + 2.306330997467041, + 2.3061688971710206, + 2.3063255101776123, + 2.3057255418395997, + 2.3053788011932372, + 2.3054862889862062, + 2.3051065019226074, + 2.3045800858306884, + 2.304553623123169, + 2.3046239949035643, + 2.3046455932617187, + 2.3043140906524657, + 2.304565064620972, + 2.303868224029541, + 2.3041190071105957, + 2.3036934986114503, + 2.303684545669556, + 2.3032837171173095, + 2.303525014038086, + 2.3033674309539793, + 2.3034363243865967, + 2.303352096710205, + 2.303193058547974, + 2.303125846862793, + 2.3031477342224123, + 2.303350806045532, + 2.3033111126708983, + 2.303525471343994, + 2.3034460102844236, + 2.303145178375244, + 2.3032577839660644, + 2.3030932935333253, + 2.3031362072753905, + 2.303055979385376, + 2.302980875701904, + 2.3030779765319824, + 2.302983999786377, + 2.303044497756958, + 2.3030930955505373, + 2.303104384841919, + 2.3030656214141847, + 2.3030314892578123, + 2.302923185272217, + 2.3029102128601076, + 2.3028630736541746, + 2.3028233364105226, + 2.3029996464538574, + 2.302821640625, + 2.302850316848755, + 2.3029183795928954, + 2.30286163772583, + 2.3028460260772703, + 2.302827332229614, + 2.302656623458862, + 2.3028156612396242, + 2.302746138534546, + 2.3027149549102783, + 2.302699661560059, + 2.30270656539917, + 2.302787049484253, + 2.3026862089538573, + 2.3026845347595213, + 2.3026778645324706, + 2.3026780055236817, + 2.302643309173584, + 2.302685669555664, + 2.302650958709717, + 2.3026181773376466, + 2.3025860111236574, + 2.3026244691467284, + 2.3026082512664794, + 2.3026506772613526, + 2.3025857417297364, + 2.3026533776855467, + 2.3026109131622317, + 2.302595517349243 + ], + "train_acc": [ + 0.09946, + 0.09898, + 0.10092, + 0.10138, + 0.09744, + 0.10108, + 0.10086, + 0.09928, + 0.10138, + 0.09826, + 0.09894, + 0.10066, + 0.09984, + 0.10064, + 0.10108, + 0.09942, + 0.10004, + 0.09876, + 0.10062, + 0.09968, + 0.0996, + 0.09952, + 0.09828, + 0.1006, + 0.10106, + 0.10024, + 0.0999, + 0.09796, + 0.09978, + 0.10288, + 0.10014, + 0.10054, + 0.09818, + 0.09922, + 0.10078, + 0.1016, + 0.0993, + 0.10042, + 0.09788, + 0.10064, + 0.10094, + 0.10018, + 0.102, + 0.10154, + 0.09986, + 0.09978, + 0.0998, + 0.09948, + 0.10142, + 0.09782, + 0.10038, + 0.097, + 0.10054, + 0.1011, + 0.09966, + 0.10024, + 0.09916, + 0.1009, + 0.10136, + 0.0997, + 0.1003, + 0.09868, + 0.10006, + 0.09862, + 0.0986, + 0.09998, + 0.09918, + 0.10112, + 0.10032, + 0.10014, + 0.0994, + 0.10032, + 0.09924, + 0.10002, + 0.09714, + 0.10214, + 0.10122, + 0.1002, + 0.10022, + 0.0996, + 0.10258, + 0.10096, + 0.09934, + 0.09812, + 0.1009, + 0.10174, + 0.10068, + 0.09948, + 0.10072, + 0.09762, + 0.09764, + 0.0989, + 0.09824, + 0.09884, + 0.09932, + 0.0999, + 0.1005, + 0.0972, + 0.09852, + 0.099 + ], + "test_acc": [ + 0.0998, + 0.105, + 0.0966, + 0.1001, + 0.1042, + 0.1092, + 0.0987, + 0.1, + 0.0995, + 0.1014, + 0.0901, + 0.0984, + 0.1149, + 0.1106, + 0.1288, + 0.1322, + 0.1, + 0.1, + 0.0927, + 0.1, + 0.1046, + 0.1, + 0.0683, + 0.1077, + 0.0896, + 0.1, + 0.1048, + 0.1, + 0.1, + 0.1, + 0.0971, + 0.1009, + 0.0991, + 0.1045, + 0.0855, + 0.1, + 0.1023, + 0.0922, + 0.1022, + 0.0993, + 0.1114, + 0.0996, + 0.1237, + 0.1385, + 0.1, + 0.0661, + 0.1128, + 0.1112, + 0.0981, + 0.0911, + 0.1011, + 0.0916, + 0.0717, + 0.1276, + 0.1143, + 0.0922, + 0.1152, + 0.1013, + 0.1008, + 0.1149, + 0.1003, + 0.1007, + 0.0784, + 0.1047, + 0.0972, + 0.0939, + 0.1092, + 0.1107, + 0.0959, + 0.0758, + 0.1089, + 0.1093, + 0.1152, + 0.1, + 0.0862, + 0.0776, + 0.1, + 0.0923, + 0.0801, + 0.1083, + 0.0871, + 0.1008, + 0.0629, + 0.0892, + 0.0987, + 0.1172, + 0.0854, + 0.1082, + 0.0948, + 0.0858, + 0.1101, + 0.1043, + 0.1139, + 0.0968, + 0.0853, + 0.1046, + 0.0855, + 0.0841, + 0.0853, + 0.0853 + ], + "value_loss": [ + 0.36024896956682206, + 0.03183852453351021, + 0.025451152555942536, + 0.021708431544005872, + 0.02077318694293499, + 0.020753964634239674, + 0.021235586476922034, + 0.01893643991112709, + 0.018619907104372977, + 0.015749295738935472, + 0.016165131821632386, + 0.01627982610166073, + 0.01576672645226121, + 0.013386324182450771, + 0.01423095471471548, + 0.014466542360335588, + 0.012401664460375906, + 0.011147678565084935, + 0.011141861658394337, + 0.010330630984306335, + 0.009658805636167526, + 0.008585796424597501, + 0.008594671681523324, + 0.007982810129523277, + 0.007645617132037878, + 0.008022303429841995, + 0.008005152634829283, + 0.0059666380059719085, + 0.005986212073117495, + 0.005909559334218502, + 0.004877746372818947, + 0.003636553997769952, + 0.003040616886168718, + 0.003947440829202533, + 0.00315660555139184, + 0.0029034065799415113, + 0.002512122514247894, + 0.0016924809731543064, + 0.001678440686389804, + 0.0011873630691319704, + 0.0009388955864496529, + 0.0009610869230516255, + 0.0006362878701463341, + 0.0004323156377952546, + 0.0003630236568301916, + 0.00036932898109778763, + 0.00033574777004309, + 0.0002565739982156083, + 0.0001863192752469331, + 0.00023190321479924024, + 0.00026786222354508935, + 0.00033428026146255436, + 0.00027582604380790144, + 0.0001974007376888767, + 0.0001375103883445263, + 0.0004384587158355862, + 0.0039204689223319295, + 0.004382409224770963, + 0.0006871034290734678, + 0.00010320373967755585, + 0.00014435500147752463, + 9.740317803341896e-05, + 8.956539701670409e-05, + 9.767239448963665e-05, + 8.177875839173793e-05, + 6.697170453844591e-05, + 4.722151418682188e-05, + 5.749972769990564e-05, + 6.388362684287131e-05, + 5.368636809522286e-05, + 3.949314116733149e-05, + 4.417577457614243e-05, + 4.6873606223380194e-05, + 3.221075773006305e-05, + 2.8231028532609345e-05, + 2.298405951121822e-05, + 2.5732159098843112e-05, + 2.1224372125871013e-05, + 3.2635308437165804e-05, + 2.130895388283534e-05, + 1.289501101593487e-05, + 1.5379936417157296e-05, + 1.4666962435876485e-05, + 1.298599345231196e-05, + 1.1551605327113065e-05, + 6.440735349897295e-06, + 5.332033502490958e-06, + 4.883227497921326e-06, + 8.978629974124487e-05, + 2.4204184894333592e-05, + 4.545561687118606e-06, + 3.5889826984202956e-06, + 4.1601734295545614e-06, + 4.2137386921967846e-06, + 3.875532386446139e-06, + 3.4998742312018293e-06, + 2.6388491396210154e-06, + 2.4725526066322344e-06, + 2.2455400646140332e-06, + 2.4813705806445795e-06 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.025305092334747314, + 0.0009738511289469898, + -0.00010878710600081831, + -7.289459063031245e-07 + ], + "perturbation_rho": [ + 0.014444086700677872, + -0.042073216289281845, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + 1.862645149230957e-09, + -1.862645149230957e-09, + 0.0, + 0.0 + ], + "0.003": [ + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -1.862645149230957e-09, + -7.450580596923828e-09, + 0.0, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 5692.50634765625, + 459013.09375, + 91032032.0, + 125105208.0, + 138335232.0 + ], + "bp_grad_norms_per_layer": [ + 1.7060839407889716e-09, + 7.58920010168751e-11, + 7.270677115922553e-11, + 7.273436714028136e-11, + 7.270117147184507e-11 + ] + }, + "drift": { + "embed.weight": 45.86434101884337, + "embed.bias": 113.35733240852751, + "blocks.0.ln.weight": 4.421970367431641, + "blocks.0.w1.weight": 97.06686933355363, + "blocks.0.w1.bias": 47.28995503044106, + "blocks.0.w2.weight": 146.57679653697483, + "blocks.1.ln.weight": 4.999883651733398, + "blocks.1.w1.weight": 137.2272615608869, + "blocks.1.w1.bias": 138.63656460889115, + "blocks.1.w2.weight": 171.87600316053306, + "blocks.2.ln.weight": 4.91436243057251, + "blocks.2.w1.weight": 133.27781391246944, + "blocks.2.w1.bias": 128.21395802713855, + "blocks.2.w2.weight": 175.64976178971338, + "blocks.3.ln.weight": 4.6856255531311035, + "blocks.3.w1.weight": 118.23222583929504, + "blocks.3.w1.bias": 115.15562764222817, + "blocks.3.w2.weight": 152.30494494545084, + "out_ln.weight": 0.6381078958511353, + "out_head.weight": 0.7641696600790421, + "out_head.bias": 0.4448472934844991 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/optionSBCB_random_targets_s42", + "methods": [ + "state_bridge", + "credit_bridge" + ], + "random_targets": true, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/optionSBCB_smoke/results_cifar10.json b/results/optionSBCB_smoke/results_cifar10.json new file mode 100644 index 0000000..c2ab728 --- /dev/null +++ b/results/optionSBCB_smoke/results_cifar10.json @@ -0,0 +1,220 @@ +{ + "42": { + "state_bridge": { + "log": { + "train_loss": [ + 2.32298729019165, + 2.3135665228271485, + 2.3065665995025633 + ], + "train_acc": [ + 0.09906, + 0.09972, + 0.09984 + ], + "test_acc": [ + 0.1088, + 0.0958, + 0.1037 + ], + "state_pred_error": [ + 0.13290744504570962, + 0.04644830721378326, + 0.02964444874405861 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.02890743687748909, + 0.029086019843816757, + 0.02471546083688736, + 0.02299082651734352 + ], + "perturbation_rho": [ + 0.06398507952690125, + 0.03261129930615425, + -0.0327291414141655, + 0.03132244944572449 + ], + "nudging": { + "0.001": [ + -8.400529623031616e-07, + -5.029141902923584e-07, + -2.8870999813079834e-07, + -1.3969838619232178e-07 + ], + "0.003": [ + -2.5480985641479492e-06, + -1.559033989906311e-06, + -7.82310962677002e-07, + -4.7497451305389404e-07 + ], + "0.01": [ + -8.374452590942383e-06, + -5.166977643966675e-06, + -2.5797635316848755e-06, + -1.5459954738616943e-06 + ] + }, + "hidden_norms_per_layer": [ + 382.91375732421875, + 1350.580810546875, + 2999.959716796875, + 4744.67626953125, + 6224.6923828125 + ], + "bp_grad_norms_per_layer": [ + 1.2822482858609874e-05, + 1.0445839507156052e-05, + 1.0443974133522715e-05, + 1.04420678326278e-05, + 1.0443762221257202e-05 + ] + }, + "drift": { + "embed.weight": 3.211158219942791, + "embed.bias": 7.062613177208634, + "blocks.0.ln.weight": 0.21760645508766174, + "blocks.0.w1.weight": 2.8678529976663016, + "blocks.0.w1.bias": 3.956961082186717, + "blocks.0.w2.weight": 9.394435771614729, + "blocks.1.ln.weight": 0.18258990347385406, + "blocks.1.w1.weight": 2.21922766779391, + "blocks.1.w1.bias": 2.8283530013194156, + "blocks.1.w2.weight": 7.529057036338004, + "blocks.2.ln.weight": 0.1940218061208725, + "blocks.2.w1.weight": 2.6529854316910684, + "blocks.2.w1.bias": 3.025569884204286, + "blocks.2.w2.weight": 8.47631449731586, + "blocks.3.ln.weight": 0.1730765700340271, + "blocks.3.w1.weight": 2.41631876651548, + "blocks.3.w1.bias": 2.7588911555760287, + "blocks.3.w2.weight": 7.962227392442747, + "out_ln.weight": 0.03852882981300354, + "out_head.weight": 0.2597139888044846, + "out_head.bias": 0.22334529177207701 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.320697575531006, + 2.3160406340026856, + 2.307044482879639 + ], + "train_acc": [ + 0.09946, + 0.09836, + 0.10142 + ], + "test_acc": [ + 0.0998, + 0.1055, + 0.0925 + ], + "value_loss": [ + 0.36024896956682206, + 0.6458554600691795, + 0.018822102856636047 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.0007630798500031233, + -0.009494196623563766, + -0.009180156514048576, + -0.007028202060610056 + ], + "perturbation_rho": [ + -0.014483902603387833, + 0.01178690791130066, + -0.011402066797018051, + 0.02756977453827858 + ], + "nudging": { + "0.001": [ + -4.284083843231201e-08, + 6.146728992462158e-08, + 4.842877388000488e-08, + 3.91155481338501e-08 + ], + "0.003": [ + -1.4528632164001465e-07, + 1.5459954738616943e-07, + 1.471489667892456e-07, + 6.891787052154541e-08 + ], + "0.01": [ + -4.637986421585083e-07, + 6.239861249923706e-07, + 4.6193599700927734e-07, + 2.998858690261841e-07 + ] + }, + "hidden_norms_per_layer": [ + 1157.2740478515625, + 10477.9150390625, + 16051.2392578125, + 19347.453125, + 19974.22265625 + ], + "bp_grad_norms_per_layer": [ + 4.064333097630879e-06, + 3.1959411899151746e-06, + 3.1822878554521594e-06, + 3.1774463877809467e-06, + 3.1793581456440734e-06 + ] + }, + "drift": { + "embed.weight": 7.825915877663139, + "embed.bias": 10.392833847164916, + "blocks.0.ln.weight": 0.32047849893569946, + "blocks.0.w1.weight": 6.762743850808533, + "blocks.0.w1.bias": 8.151214078637885, + "blocks.0.w2.weight": 17.774887825977164, + "blocks.1.ln.weight": 0.28780925273895264, + "blocks.1.w1.weight": 6.646412153864217, + "blocks.1.w1.bias": 7.28996940865764, + "blocks.1.w2.weight": 16.59156331214822, + "blocks.2.ln.weight": 0.30320411920547485, + "blocks.2.w1.weight": 6.002501250935489, + "blocks.2.w1.bias": 5.318388908944272, + "blocks.2.w2.weight": 16.00213789556674, + "blocks.3.ln.weight": 0.24688510596752167, + "blocks.3.w1.weight": 3.6772500170447437, + "blocks.3.w1.bias": 4.008142009024597, + "blocks.3.w2.weight": 13.91740354386689, + "out_ln.weight": 0.03830864652991295, + "out_head.weight": 0.3261551698718769, + "out_head.bias": 0.2861540512185052 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 3, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/optionSBCB_smoke", + "methods": [ + "state_bridge", + "credit_bridge" + ], + "random_targets": true, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/periodic_refit/periodic_refit_s42.json b/results/periodic_refit/periodic_refit_s42.json new file mode 100644 index 0000000..c94ebd5 --- /dev/null +++ b/results/periodic_refit/periodic_refit_s42.json @@ -0,0 +1,414 @@ +{ + "DFA_only": { + "test_acc": [ + 0.3006, + 0.3039, + 0.2971, + 0.2915, + 0.2946, + 0.3055, + 0.3016, + 0.3071, + 0.2983, + 0.2891, + 0.2938, + 0.3097, + 0.2861, + 0.3091, + 0.3089, + 0.2942, + 0.3116, + 0.2963, + 0.2971, + 0.3065, + 0.3158, + 0.299, + 0.2948, + 0.3057, + 0.2977, + 0.3158, + 0.3065, + 0.2975, + 0.3125, + 0.306, + 0.3041, + 0.2915, + 0.2928, + 0.3004, + 0.3148, + 0.307, + 0.297, + 0.3043, + 0.3047, + 0.3002, + 0.3159, + 0.3159, + 0.3046, + 0.2984, + 0.3016, + 0.3024, + 0.29, + 0.3164, + 0.3004, + 0.3073, + 0.3154, + 0.3014, + 0.3072, + 0.3075, + 0.3181, + 0.2923, + 0.306, + 0.3055, + 0.3096, + 0.3027, + 0.3036, + 0.308, + 0.3097, + 0.3109, + 0.3127, + 0.3129, + 0.3155, + 0.3164, + 0.3102, + 0.3021, + 0.3138, + 0.313, + 0.3097, + 0.3088, + 0.3115, + 0.3157, + 0.3126, + 0.311, + 0.309, + 0.3091, + 0.304, + 0.3102, + 0.311, + 0.3136, + 0.3116, + 0.3114, + 0.3108, + 0.3112, + 0.3152, + 0.3077, + 0.3121, + 0.3119, + 0.3122, + 0.3115, + 0.3114, + 0.3118, + 0.3114, + 0.3116, + 0.3116, + 0.3116 + ], + "train_loss": [ + 2.0318866732025147, + 2.0057224438476564, + 2.000193025856018, + 1.9955825387573243, + 1.9903357116699218, + 1.9887702255249022, + 1.9901456210327149, + 1.9876038012313844, + 1.9891375769424438, + 1.9916579194641113, + 1.9882932608032227, + 1.9864958861541748, + 1.989747982635498, + 1.987270903930664, + 1.9892830609512329, + 1.9896244260025024, + 1.9903675205230713, + 1.9884116526794433, + 1.9885369082641602, + 1.986256969833374, + 1.987841325416565, + 1.9860659005355834, + 1.9870660667419433, + 1.9887021855926514, + 1.9881466793823241, + 1.987437709274292, + 1.9851161840438842, + 1.9871229264068604, + 1.987296971054077, + 1.9865425718688965, + 1.985583653526306, + 1.9873635176086426, + 1.9880531158828736, + 1.986221237449646, + 1.9857749569702148, + 1.9882853355407715, + 1.9866280360412598, + 1.98623606010437, + 1.9872347016906737, + 1.9890095454406738, + 1.987217137069702, + 1.9882683947753905, + 1.9873427893066407, + 1.9894943984985352, + 1.9865683745956422, + 1.9856433502197266, + 1.9884860709381103, + 1.9900159615325927, + 1.9878518949127197, + 1.98708917388916, + 1.9877159860992433, + 1.9865355113220216, + 1.9874952691268921, + 1.988472138748169, + 1.9888839432525636, + 1.9876802584075928, + 1.987925719909668, + 1.9862554049301147, + 1.9863393670272826, + 1.9889370369720458, + 1.9876346451187135, + 1.9845583619689942, + 1.9870499811553954, + 1.987435880508423, + 1.9854575398254395, + 1.985907090988159, + 1.9861144110870361, + 1.9871188342666626, + 1.9862679552841187, + 1.9887662117004394, + 1.9872093386840821, + 1.9860852742004393, + 1.9862465969085694, + 1.986481220550537, + 1.9852113827896118, + 1.9885292751312256, + 1.9848377563476562, + 1.986888662185669, + 1.9864294763183594, + 1.9865412310028077, + 1.985109836578369, + 1.9869044762802124, + 1.984938102722168, + 1.9856962964248657, + 1.9853763344573974, + 1.984437050552368, + 1.984452505493164, + 1.9845013403320313, + 1.9867055741119384, + 1.9862973651123046, + 1.9845818555450438, + 1.9843991091156006, + 1.9876228217315675, + 1.985638127822876, + 1.985604430923462, + 1.9853035695648193, + 1.9835245191192628, + 1.9839755685806275, + 1.9846243866729736, + 1.9842720232391358 + ] + }, + "refit_K5_R1_a0.75": { + "test_acc": [ + 0.1174, + 0.133, + 0.1408, + 0.1299, + 0.1397, + 0.1242, + 0.1374, + 0.1382, + 0.1362, + 0.1362, + 0.1332, + 0.1381, + 0.1413, + 0.1457, + 0.1236, + 0.1283, + 0.1224, + 0.1352, + 0.1431, + 0.1407, + 0.1265, + 0.1247, + 0.1428, + 0.1407, + 0.1215, + 0.1337, + 0.1252, + 0.1433, + 0.146, + 0.1341, + 0.1441, + 0.136, + 0.1196, + 0.1119, + 0.1387, + 0.1314, + 0.1263, + 0.1146, + 0.1256, + 0.1274, + 0.1334, + 0.1301, + 0.1341, + 0.1234, + 0.1186, + 0.1318, + 0.1217, + 0.127, + 0.1237, + 0.1179, + 0.1343, + 0.1077, + 0.1398, + 0.1378, + 0.122, + 0.123, + 0.129, + 0.141, + 0.1183, + 0.1148, + 0.1417, + 0.1245, + 0.1442, + 0.1332, + 0.1309, + 0.1328, + 0.1246, + 0.1427, + 0.1444, + 0.1255, + 0.1286, + 0.1172, + 0.1151, + 0.1281, + 0.1317, + 0.1159, + 0.1241, + 0.1315, + 0.1304, + 0.1316, + 0.132, + 0.142, + 0.1192, + 0.1292, + 0.1154, + 0.135, + 0.1253, + 0.1306, + 0.1387, + 0.1401, + 0.125, + 0.1319, + 0.1406, + 0.1317, + 0.1395, + 0.1405, + 0.1389, + 0.1404, + 0.14, + 0.1399 + ], + "train_loss": [ + 2.2922492407226565, + 2.303223536987305, + 2.297322120132446, + 2.2908322675323487, + 2.2916210280609133, + 2.291199165649414, + 2.292368500289917, + 2.2919790600585936, + 2.2932819635009767, + 2.291942204589844, + 2.2920562203216552, + 2.292144420928955, + 2.291042411804199, + 2.2911525618743895, + 2.289652233123779, + 2.292079990386963, + 2.29080831741333, + 2.2901196612548826, + 2.2909918134307863, + 2.2910345366668703, + 2.290270492095947, + 2.291422851638794, + 2.2929677319335937, + 2.2916940523529052, + 2.2927628204345702, + 2.2935196813964844, + 2.2930270182037353, + 2.291781602096558, + 2.2911440320587158, + 2.2910533695983886, + 2.2924093311309814, + 2.2931985846710203, + 2.2921073666381835, + 2.2925245095062254, + 2.293268418502808, + 2.291532369232178, + 2.290545958404541, + 2.2910766479492186, + 2.290808622894287, + 2.290147826538086, + 2.290089402923584, + 2.2919920152282716, + 2.2909375720977785, + 2.2912671838378906, + 2.291217657546997, + 2.2908856577301027, + 2.2912476402282715, + 2.2905492133331298, + 2.290840171356201, + 2.2898812239074706, + 2.289819273147583, + 2.289929093093872, + 2.2888978022766113, + 2.289257996673584, + 2.2891055699920653, + 2.288888888473511, + 2.288564768753052, + 2.2889565814971924, + 2.288644219055176, + 2.2885153662872315, + 2.2883075208282473, + 2.288591046142578, + 2.287981568374634, + 2.2882171091461183, + 2.2874768580627443, + 2.287058499908447, + 2.2877427760314943, + 2.2876212321472167, + 2.286393500213623, + 2.2868061962890627, + 2.2863689573669435, + 2.286908480758667, + 2.286366832733154, + 2.2867871881866457, + 2.287365332946777, + 2.2860294148254394, + 2.286066697845459, + 2.2859441703796386, + 2.285769623260498, + 2.285296831588745, + 2.285918746032715, + 2.286178753890991, + 2.285149822845459, + 2.284917789764404, + 2.285303730926514, + 2.28559301864624, + 2.2857230437469482, + 2.285581053314209, + 2.28521455368042, + 2.2851917591094972, + 2.2861509452819826, + 2.284609991760254, + 2.2853968709564207, + 2.2851967042541506, + 2.2849537175750734, + 2.2850700605010985, + 2.285350464324951, + 2.285402466278076, + 2.2850866062927246, + 2.2854909355163575 + ] + } +} \ No newline at end of file diff --git a/results/prefit_threshold/prefit_curve_t5_s42.json b/results/prefit_threshold/prefit_curve_t5_s42.json new file mode 100644 index 0000000..5cce540 --- /dev/null +++ b/results/prefit_threshold/prefit_curve_t5_s42.json @@ -0,0 +1,330 @@ +{ + "dfa_cont_final": 0.3107, + "dfa_cont_acc20": 0.3071, + "results": [ + { + "E_prefit": 0, + "branch": "blend_075", + "gamma_frozen": -0.004854517173953354, + "rho_frozen": 0.013503444148227572, + "nudge_frozen": 6.938353180885315e-08, + "final_acc": 0.3237, + "acc_at_20": 0.3162, + "diff_final": 0.013000000000000012, + "diff_acc20": 0.009099999999999997, + "test_acc": [ + 0.3062, + 0.3035, + 0.3071, + 0.3023, + 0.2972, + 0.3146, + 0.3089, + 0.2936, + 0.3063, + 0.3115, + 0.3006, + 0.3113, + 0.3214, + 0.321, + 0.3162, + 0.3085, + 0.3096, + 0.3176, + 0.3176, + 0.323, + 0.313, + 0.3147, + 0.3195, + 0.3169, + 0.3099, + 0.3074, + 0.3086, + 0.3209, + 0.3024, + 0.3131, + 0.3174, + 0.3141, + 0.3244, + 0.3188, + 0.3253, + 0.3237, + 0.3188, + 0.3253, + 0.3222, + 0.3159, + 0.3254, + 0.3314, + 0.3196, + 0.3184, + 0.3242, + 0.3239, + 0.3194, + 0.3171, + 0.322, + 0.3185, + 0.3257, + 0.3221, + 0.323, + 0.3251, + 0.3221, + 0.3145, + 0.3177, + 0.3223, + 0.3228, + 0.3243, + 0.3263, + 0.3255, + 0.3191, + 0.3178, + 0.3259, + 0.3221, + 0.3225, + 0.3236, + 0.3217, + 0.3244, + 0.3183, + 0.3224, + 0.3226, + 0.3182, + 0.3207, + 0.3177, + 0.3249, + 0.321, + 0.3232, + 0.3241, + 0.3237, + 0.3241, + 0.3235, + 0.3241, + 0.3247, + 0.3242, + 0.3231, + 0.3236, + 0.3237, + 0.3239, + 0.3242, + 0.3236, + 0.3235, + 0.3237, + 0.3237 + ] + }, + { + "E_prefit": 15, + "branch": "blend_075", + "gamma_frozen": 0.0019898422178812325, + "rho_frozen": 0.010547585785388947, + "nudge_frozen": -7.2177499532699585e-09, + "final_acc": 0.3228, + "acc_at_20": 0.3196, + "diff_final": 0.0121, + "diff_acc20": 0.012500000000000011, + "test_acc": [ + 0.2986, + 0.3119, + 0.3106, + 0.3062, + 0.296, + 0.3146, + 0.3114, + 0.3012, + 0.3097, + 0.3134, + 0.3223, + 0.3308, + 0.3023, + 0.3168, + 0.3196, + 0.3047, + 0.3028, + 0.3218, + 0.3243, + 0.3202, + 0.3063, + 0.3167, + 0.3224, + 0.3196, + 0.312, + 0.3206, + 0.3291, + 0.3138, + 0.3163, + 0.3264, + 0.3215, + 0.3244, + 0.3249, + 0.3197, + 0.3212, + 0.3205, + 0.3192, + 0.3209, + 0.3175, + 0.3208, + 0.317, + 0.3192, + 0.3203, + 0.32, + 0.3148, + 0.3272, + 0.3211, + 0.3198, + 0.3203, + 0.3265, + 0.3233, + 0.3208, + 0.317, + 0.3255, + 0.3244, + 0.319, + 0.3207, + 0.3218, + 0.3259, + 0.3243, + 0.3221, + 0.3221, + 0.3221, + 0.3221, + 0.3212, + 0.3192, + 0.3207, + 0.3194, + 0.3193, + 0.3221, + 0.3205, + 0.3235, + 0.3243, + 0.3222, + 0.323, + 0.3249, + 0.3214, + 0.3194, + 0.3237, + 0.3228, + 0.3234, + 0.3229, + 0.3231, + 0.3236, + 0.3229, + 0.3249, + 0.3232, + 0.3235, + 0.3232, + 0.3235, + 0.3234, + 0.3231, + 0.323, + 0.3227, + 0.3228 + ] + }, + { + "E_prefit": 60, + "branch": "blend_075", + "gamma_frozen": -0.0008711532718734816, + "rho_frozen": -0.00878655374981463, + "nudge_frozen": -1.6298145055770874e-09, + "final_acc": 0.3246, + "acc_at_20": 0.3097, + "diff_final": 0.013900000000000023, + "diff_acc20": 0.002599999999999991, + "test_acc": [ + 0.2959, + 0.3026, + 0.3108, + 0.3105, + 0.3015, + 0.3061, + 0.3003, + 0.3037, + 0.3141, + 0.3155, + 0.3226, + 0.3122, + 0.3242, + 0.302, + 0.3097, + 0.3137, + 0.3212, + 0.3207, + 0.3169, + 0.3074, + 0.3198, + 0.3212, + 0.3141, + 0.3153, + 0.3154, + 0.3234, + 0.3269, + 0.3219, + 0.3125, + 0.3247, + 0.3184, + 0.3113, + 0.3203, + 0.325, + 0.3189, + 0.3259, + 0.3228, + 0.3266, + 0.3249, + 0.32, + 0.3221, + 0.3257, + 0.3244, + 0.3248, + 0.3271, + 0.3233, + 0.3212, + 0.3138, + 0.3182, + 0.3181, + 0.3221, + 0.3208, + 0.3302, + 0.3187, + 0.3172, + 0.3241, + 0.3163, + 0.3293, + 0.3244, + 0.3241, + 0.3231, + 0.3266, + 0.3236, + 0.3165, + 0.3223, + 0.3233, + 0.3204, + 0.3202, + 0.3254, + 0.3231, + 0.3255, + 0.32, + 0.3237, + 0.3245, + 0.3264, + 0.3217, + 0.3257, + 0.3257, + 0.3232, + 0.3257, + 0.3268, + 0.3238, + 0.324, + 0.3249, + 0.3241, + 0.3235, + 0.3247, + 0.3248, + 0.3244, + 0.3241, + 0.3244, + 0.3248, + 0.3246, + 0.3246, + 0.3246 + ] + } + ] +} \ No newline at end of file diff --git a/results/resmlp_frozen_blocks_s123.log b/results/resmlp_frozen_blocks_s123.log new file mode 100644 index 0000000..728da12 --- /dev/null +++ b/results/resmlp_frozen_blocks_s123.log @@ -0,0 +1,73 @@ +Device: cuda:0, seed=123, epochs=100 + +=== BP shallow (ResMLP num_blocks=0), seed=123 === + n_params: 789770 (789770 trainable) + [BP-shallow] ep 1: test_acc=0.3507 + [BP-shallow] ep 10: test_acc=0.3744 + [BP-shallow] ep 20: test_acc=0.3604 + [BP-shallow] ep 30: test_acc=0.3518 + [BP-shallow] ep 40: test_acc=0.3535 + [BP-shallow] ep 50: test_acc=0.3613 + [BP-shallow] ep 60: test_acc=0.3631 + [BP-shallow] ep 70: test_acc=0.3709 + [BP-shallow] ep 80: test_acc=0.3828 + [BP-shallow] ep 90: test_acc=0.3832 + [BP-shallow] ep 100: test_acc=0.3841 +FINAL BP-shallow: 0.3841 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=123 === + n_params: 1318154 (789770 trainable) + [BP-frozen] ep 1: test_acc=0.3517 + [BP-frozen] ep 10: test_acc=0.3653 + [BP-frozen] ep 20: test_acc=0.3538 + [BP-frozen] ep 30: test_acc=0.3501 + [BP-frozen] ep 40: test_acc=0.3558 + [BP-frozen] ep 50: test_acc=0.3528 + [BP-frozen] ep 60: test_acc=0.3701 + [BP-frozen] ep 70: test_acc=0.3750 + [BP-frozen] ep 80: test_acc=0.3855 + [BP-frozen] ep 90: test_acc=0.3855 + [BP-frozen] ep 100: test_acc=0.3896 +FINAL BP-frozen-blocks: 0.3896 + +=== DFA shallow (ResMLP num_blocks=0), seed=123 === + n_params: 789770 (789770 trainable) + [DFA-shallow] ep 1: test_acc=0.3348 + [DFA-shallow] ep 10: test_acc=0.3457 + [DFA-shallow] ep 20: test_acc=0.3484 + [DFA-shallow] ep 30: test_acc=0.3323 + [DFA-shallow] ep 40: test_acc=0.3442 + [DFA-shallow] ep 50: test_acc=0.3460 + [DFA-shallow] ep 60: test_acc=0.3469 + [DFA-shallow] ep 70: test_acc=0.3427 + [DFA-shallow] ep 80: test_acc=0.3432 + [DFA-shallow] ep 90: test_acc=0.3485 + [DFA-shallow] ep 100: test_acc=0.3485 +FINAL DFA-shallow: 0.3485 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=123 === + n_params: 1318154 (789770 trainable) + [DFA-frozen] ep 1: test_acc=0.3182 + [DFA-frozen] ep 10: test_acc=0.3388 + [DFA-frozen] ep 20: test_acc=0.3429 + [DFA-frozen] ep 30: test_acc=0.3286 + [DFA-frozen] ep 40: test_acc=0.3372 + [DFA-frozen] ep 50: test_acc=0.3281 + [DFA-frozen] ep 60: test_acc=0.3417 + [DFA-frozen] ep 70: test_acc=0.3483 + [DFA-frozen] ep 80: test_acc=0.3469 + [DFA-frozen] ep 90: test_acc=0.3479 + [DFA-frozen] ep 100: test_acc=0.3497 +FINAL DFA-frozen-blocks: 0.3497 + +=== ResMLP frozen/shallow baseline summary, seed=123 === + BP-shallow: 0.3841 + BP-frozen: 0.3896 + DFA-shallow: 0.3485 + DFA-frozen: 0.3497 + +Compare to trainable 4-block ResMLP (3-seed mean): BP=0.609, DFA=0.308 + +Interpretation: + If DFA-frozen ≈ DFA-trainable (0.308): blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) diff --git a/results/resmlp_frozen_blocks_s42.log b/results/resmlp_frozen_blocks_s42.log new file mode 100644 index 0000000..238c955 --- /dev/null +++ b/results/resmlp_frozen_blocks_s42.log @@ -0,0 +1,73 @@ +Device: cuda:0, seed=42, epochs=100 + +=== BP shallow (ResMLP num_blocks=0), seed=42 === + n_params: 789770 (789770 trainable) + [BP-shallow] ep 1: test_acc=0.3469 + [BP-shallow] ep 10: test_acc=0.3740 + [BP-shallow] ep 20: test_acc=0.3640 + [BP-shallow] ep 30: test_acc=0.3514 + [BP-shallow] ep 40: test_acc=0.3523 + [BP-shallow] ep 50: test_acc=0.3618 + [BP-shallow] ep 60: test_acc=0.3721 + [BP-shallow] ep 70: test_acc=0.3734 + [BP-shallow] ep 80: test_acc=0.3811 + [BP-shallow] ep 90: test_acc=0.3883 + [BP-shallow] ep 100: test_acc=0.3872 +FINAL BP-shallow: 0.3872 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=42 === + n_params: 1318154 (789770 trainable) + [BP-frozen] ep 1: test_acc=0.3520 + [BP-frozen] ep 10: test_acc=0.3668 + [BP-frozen] ep 20: test_acc=0.3510 + [BP-frozen] ep 30: test_acc=0.3530 + [BP-frozen] ep 40: test_acc=0.3570 + [BP-frozen] ep 50: test_acc=0.3626 + [BP-frozen] ep 60: test_acc=0.3644 + [BP-frozen] ep 70: test_acc=0.3766 + [BP-frozen] ep 80: test_acc=0.3840 + [BP-frozen] ep 90: test_acc=0.3847 + [BP-frozen] ep 100: test_acc=0.3890 +FINAL BP-frozen-blocks: 0.3890 + +=== DFA shallow (ResMLP num_blocks=0), seed=42 === + n_params: 789770 (789770 trainable) + [DFA-shallow] ep 1: test_acc=0.3219 + [DFA-shallow] ep 10: test_acc=0.3410 + [DFA-shallow] ep 20: test_acc=0.3375 + [DFA-shallow] ep 30: test_acc=0.3356 + [DFA-shallow] ep 40: test_acc=0.3456 + [DFA-shallow] ep 50: test_acc=0.3427 + [DFA-shallow] ep 60: test_acc=0.3434 + [DFA-shallow] ep 70: test_acc=0.3452 + [DFA-shallow] ep 80: test_acc=0.3479 + [DFA-shallow] ep 90: test_acc=0.3463 + [DFA-shallow] ep 100: test_acc=0.3469 +FINAL DFA-shallow: 0.3469 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=42 === + n_params: 1318154 (789770 trainable) + [DFA-frozen] ep 1: test_acc=0.3255 + [DFA-frozen] ep 10: test_acc=0.3376 + [DFA-frozen] ep 20: test_acc=0.3414 + [DFA-frozen] ep 30: test_acc=0.3434 + [DFA-frozen] ep 40: test_acc=0.3422 + [DFA-frozen] ep 50: test_acc=0.3399 + [DFA-frozen] ep 60: test_acc=0.3422 + [DFA-frozen] ep 70: test_acc=0.3493 + [DFA-frozen] ep 80: test_acc=0.3474 + [DFA-frozen] ep 90: test_acc=0.3448 + [DFA-frozen] ep 100: test_acc=0.3460 +FINAL DFA-frozen-blocks: 0.3460 + +=== ResMLP frozen/shallow baseline summary, seed=42 === + BP-shallow: 0.3872 + BP-frozen: 0.3890 + DFA-shallow: 0.3469 + DFA-frozen: 0.3460 + +Compare to trainable 4-block ResMLP (3-seed mean): BP=0.609, DFA=0.308 + +Interpretation: + If DFA-frozen ≈ DFA-trainable (0.308): blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) diff --git a/results/resmlp_frozen_blocks_s456.log b/results/resmlp_frozen_blocks_s456.log new file mode 100644 index 0000000..5bd1b66 --- /dev/null +++ b/results/resmlp_frozen_blocks_s456.log @@ -0,0 +1,73 @@ +Device: cuda:0, seed=456, epochs=100 + +=== BP shallow (ResMLP num_blocks=0), seed=456 === + n_params: 789770 (789770 trainable) + [BP-shallow] ep 1: test_acc=0.3545 + [BP-shallow] ep 10: test_acc=0.3636 + [BP-shallow] ep 20: test_acc=0.3572 + [BP-shallow] ep 30: test_acc=0.3514 + [BP-shallow] ep 40: test_acc=0.3629 + [BP-shallow] ep 50: test_acc=0.3623 + [BP-shallow] ep 60: test_acc=0.3711 + [BP-shallow] ep 70: test_acc=0.3766 + [BP-shallow] ep 80: test_acc=0.3875 + [BP-shallow] ep 90: test_acc=0.3875 + [BP-shallow] ep 100: test_acc=0.3876 +FINAL BP-shallow: 0.3876 + +=== BP frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=456 === + n_params: 1318154 (789770 trainable) + [BP-frozen] ep 1: test_acc=0.3593 + [BP-frozen] ep 10: test_acc=0.3696 + [BP-frozen] ep 20: test_acc=0.3515 + [BP-frozen] ep 30: test_acc=0.3541 + [BP-frozen] ep 40: test_acc=0.3574 + [BP-frozen] ep 50: test_acc=0.3567 + [BP-frozen] ep 60: test_acc=0.3724 + [BP-frozen] ep 70: test_acc=0.3777 + [BP-frozen] ep 80: test_acc=0.3861 + [BP-frozen] ep 90: test_acc=0.3894 + [BP-frozen] ep 100: test_acc=0.3881 +FINAL BP-frozen-blocks: 0.3881 + +=== DFA shallow (ResMLP num_blocks=0), seed=456 === + n_params: 789770 (789770 trainable) + [DFA-shallow] ep 1: test_acc=0.3246 + [DFA-shallow] ep 10: test_acc=0.3453 + [DFA-shallow] ep 20: test_acc=0.3426 + [DFA-shallow] ep 30: test_acc=0.3498 + [DFA-shallow] ep 40: test_acc=0.3431 + [DFA-shallow] ep 50: test_acc=0.3549 + [DFA-shallow] ep 60: test_acc=0.3494 + [DFA-shallow] ep 70: test_acc=0.3534 + [DFA-shallow] ep 80: test_acc=0.3494 + [DFA-shallow] ep 90: test_acc=0.3507 + [DFA-shallow] ep 100: test_acc=0.3519 +FINAL DFA-shallow: 0.3519 + +=== DFA frozen-blocks (ResMLP num_blocks=4, blocks frozen), seed=456 === + n_params: 1318154 (789770 trainable) + [DFA-frozen] ep 1: test_acc=0.3283 + [DFA-frozen] ep 10: test_acc=0.3427 + [DFA-frozen] ep 20: test_acc=0.3425 + [DFA-frozen] ep 30: test_acc=0.3481 + [DFA-frozen] ep 40: test_acc=0.3329 + [DFA-frozen] ep 50: test_acc=0.3425 + [DFA-frozen] ep 60: test_acc=0.3519 + [DFA-frozen] ep 70: test_acc=0.3556 + [DFA-frozen] ep 80: test_acc=0.3507 + [DFA-frozen] ep 90: test_acc=0.3508 + [DFA-frozen] ep 100: test_acc=0.3510 +FINAL DFA-frozen-blocks: 0.3510 + +=== ResMLP frozen/shallow baseline summary, seed=456 === + BP-shallow: 0.3876 + BP-frozen: 0.3881 + DFA-shallow: 0.3519 + DFA-frozen: 0.3510 + +Compare to trainable 4-block ResMLP (3-seed mean): BP=0.609, DFA=0.308 + +Interpretation: + If DFA-frozen ≈ DFA-trainable (0.308): blocks are passengers, walk-back parallels ViT + If DFA-frozen << DFA-trainable: ResMLP DFA actually trains the blocks (interesting contrast with ViT) diff --git a/results/resnet_baseline_s42.log b/results/resnet_baseline_s42.log new file mode 100644 index 0000000..10175be --- /dev/null +++ b/results/resnet_baseline_s42.log @@ -0,0 +1,6 @@ +Device: cuda:0, seed=42, epochs=60 + +=== BP trainable (SmallResNet num_blocks=4), seed=42 === + n_params: 298442 (298442 trainable) + [BP-trainable] ep 1: test_acc=0.5045 + [BP-trainable] ep 10: test_acc=0.7700 diff --git a/results/resnet_frozen_blocks_s42.log b/results/resnet_frozen_blocks_s42.log new file mode 100644 index 0000000..2c9e352 --- /dev/null +++ b/results/resnet_frozen_blocks_s42.log @@ -0,0 +1,5 @@ +Device: cuda:0, seed=42, epochs=30 + +=== BP trainable (SmallResNet num_blocks=4), seed=42 === + n_params: 75498 (75498 trainable) + [BP-trainable] ep 1: test_acc=0.4618 diff --git a/results/resnet_protocol_validation.json b/results/resnet_protocol_validation.json new file mode 100644 index 0000000..c2c8ee5 --- /dev/null +++ b/results/resnet_protocol_validation.json @@ -0,0 +1,2999 @@ +{ + "42": { + "bp": { + "log": { + "train_loss": [ + 1.4754980445098878, + 1.1327733042144776, + 0.9823549256706238, + 0.8884939163589477, + 0.8080494424057006, + 0.7429164674949646, + 0.691338694820404, + 0.6396145434761047, + 0.6058105169486999, + 0.5681285029792785, + 0.5410099887466431, + 0.5156902655792236, + 0.48821864374160767, + 0.4693263840675354, + 0.44821343361854554, + 0.4341135684013367, + 0.4153518598937988, + 0.4031775716972351, + 0.3901845865726471, + 0.37803070536613465, + 0.36493089889526364, + 0.3530925098323822, + 0.34134404032707216, + 0.32737062341690065, + 0.3201012042999268, + 0.30783499921798707, + 0.3018397808456421, + 0.297964332113266, + 0.2811221259975433, + 0.2744342702102661, + 0.26620709442138674, + 0.2572384280967712, + 0.24901132754325866, + 0.2451383338546753, + 0.23960787649154663, + 0.22755484651565552, + 0.21933056587219238, + 0.2154020707654953, + 0.20710637582778932, + 0.20213108753204345, + 0.19146164437294005, + 0.18917329798221588, + 0.17772054873466492, + 0.17262119786262511, + 0.17501190958976745, + 0.16236323578834533, + 0.15728484272003174, + 0.1503485471725464, + 0.14705612461566925, + 0.1391956588745117, + 0.13705069701194764, + 0.1280645592546463, + 0.12542680257797242, + 0.11884177312612533, + 0.11983791782855988, + 0.11101757476329803, + 0.10580061419487, + 0.09929067412376404, + 0.09622357261061669, + 0.09204819278240203, + 0.09021267262935638, + 0.08517345870494843, + 0.08284438428878785, + 0.07769702455043792, + 0.07526010594129562, + 0.07193764674186706, + 0.06778959328889847, + 0.06626685544013977, + 0.061662050495147704, + 0.062233254585266115, + 0.05574440080881119, + 0.05430667734146118, + 0.050687168483734134, + 0.05152127984762192, + 0.047372261435985566, + 0.045812105536460875, + 0.04105121579051018, + 0.041827005530595776, + 0.03994967749714851, + 0.03859664423584938, + 0.03739786517620087, + 0.03536494743227959, + 0.03402860813319683, + 0.032672048892974856, + 0.033726132349967956, + 0.032082007769942286, + 0.03033736688375473, + 0.030522687734365464, + 0.02902250618815422, + 0.027636773591041566, + 0.028686479598283767, + 0.027951767029762268, + 0.027169395470619202, + 0.026654738742113115, + 0.02677365488886833, + 0.026482253704667093, + 0.024927393090724944, + 0.02497604925274849, + 0.026100769642591476, + 0.025896823017597197 + ], + "train_acc": [ + 0.45964, + 0.59478, + 0.64942, + 0.68564, + 0.7155, + 0.74002, + 0.759, + 0.778, + 0.79062, + 0.8042, + 0.8139, + 0.82322, + 0.83096, + 0.83878, + 0.84706, + 0.85214, + 0.85686, + 0.86174, + 0.86592, + 0.87024, + 0.87432, + 0.87884, + 0.88326, + 0.8879, + 0.88992, + 0.89312, + 0.89666, + 0.89684, + 0.90298, + 0.90614, + 0.90778, + 0.91138, + 0.91432, + 0.91484, + 0.91664, + 0.92094, + 0.92352, + 0.92584, + 0.92802, + 0.92958, + 0.93406, + 0.9351, + 0.93924, + 0.94048, + 0.93892, + 0.94464, + 0.94534, + 0.9487, + 0.94968, + 0.95276, + 0.9528, + 0.9574, + 0.95744, + 0.96078, + 0.96016, + 0.96282, + 0.9647, + 0.96816, + 0.96838, + 0.9708, + 0.97036, + 0.97234, + 0.97322, + 0.9746, + 0.97646, + 0.97678, + 0.97904, + 0.9792, + 0.98132, + 0.9807, + 0.98392, + 0.98454, + 0.98496, + 0.98534, + 0.98722, + 0.98734, + 0.98918, + 0.98902, + 0.98994, + 0.9903, + 0.99048, + 0.99146, + 0.99194, + 0.99266, + 0.99138, + 0.99328, + 0.99318, + 0.99348, + 0.99398, + 0.99464, + 0.99392, + 0.99424, + 0.99436, + 0.99462, + 0.99468, + 0.9945, + 0.9953, + 0.9954, + 0.99516, + 0.9948 + ], + "test_acc": [ + 0.506, + 0.6221, + 0.6134, + 0.6653, + 0.6809, + 0.6845, + 0.7282, + 0.715, + 0.758, + 0.7538, + 0.742, + 0.7841, + 0.7783, + 0.79, + 0.762, + 0.7896, + 0.7946, + 0.8012, + 0.8066, + 0.8337, + 0.8222, + 0.8306, + 0.8369, + 0.8343, + 0.8176, + 0.7976, + 0.836, + 0.8464, + 0.8087, + 0.8516, + 0.8444, + 0.8347, + 0.8414, + 0.83, + 0.8454, + 0.8373, + 0.8399, + 0.8572, + 0.854, + 0.8572, + 0.8496, + 0.8496, + 0.8686, + 0.8571, + 0.8517, + 0.8432, + 0.8515, + 0.864, + 0.8615, + 0.8668, + 0.8367, + 0.8333, + 0.8594, + 0.8709, + 0.8679, + 0.8613, + 0.8689, + 0.87, + 0.8732, + 0.8701, + 0.8585, + 0.8654, + 0.8618, + 0.8735, + 0.8626, + 0.8751, + 0.8694, + 0.8685, + 0.8749, + 0.8727, + 0.8751, + 0.8761, + 0.8726, + 0.8775, + 0.8688, + 0.8762, + 0.876, + 0.8711, + 0.8691, + 0.8771, + 0.875, + 0.8739, + 0.8748, + 0.8751, + 0.8764, + 0.8764, + 0.8761, + 0.8759, + 0.8763, + 0.8784, + 0.8768, + 0.8771, + 0.8766, + 0.875, + 0.8766, + 0.876, + 0.8764, + 0.8783, + 0.8774, + 0.8769 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "bp_grad_norms_per_layer": [ + 3.9082557634628756e-08, + 5.067175123940615e-08, + 3.265608228275596e-08, + 1.1308735281545523e-08, + 3.1019329327364176e-09 + ], + "hidden_norms_per_layer": [ + 1.630630612373352, + 2.3162124156951904, + 4.237359523773193, + 9.196452140808105, + 17.93486213684082 + ] + } + }, + "fa": { + "log": { + "train_loss": [ + 1.8298806344604492, + 1.688780364112854, + 1.647813285560608, + 1.632948429145813, + 1.6219196771621704, + 1.597323589477539, + 1.6194571055603026, + 1.5867001958465576, + 1.5856347469329835, + 1.5822649958419799, + 1.567199764328003, + 1.5595971042633057, + 1.555942633628845, + 1.5450387216186523, + 1.5443615267181396, + 1.5423453115463257, + 1.5377392181777954, + 1.5742749130630493, + 1.5323925372695923, + 1.5202843558502197, + 1.5258193575286865, + 1.5040335019302369, + 1.507170670814514, + 1.5143084545516967, + 1.4983913586807251, + 1.4908056282806397, + 1.5053773770904542, + 1.4907385025787354, + 1.4826300627517701, + 1.466815757484436, + 1.4698192767333984, + 1.4639443017578124, + 1.459072035560608, + 1.4483210107040405, + 1.455411272239685, + 1.4497789043807983, + 1.44592253200531, + 1.462750799331665, + 1.4582938319778442, + 1.4474501207733155, + 1.4522054817199708, + 1.4697525200653077, + 1.4576213805389404, + 1.4627395877838134, + 1.4435660293197632, + 1.4565714419937135, + 1.4885323392486571, + 1.4720177228546143, + 1.477506584815979, + 1.4671536804962158, + 1.4733956943511963, + 1.4923374033355712, + 1.4908088668823243, + 1.4986677370834351, + 1.506933953514099, + 1.4915515749359132, + 1.5066200190734864, + 1.5074671340179444, + 1.5117018646621705, + 1.5098506378555299, + 1.52632337348938, + 1.5084018962860108, + 1.4978013104248047, + 1.4830269091033936, + 1.475912446899414, + 1.49930527469635, + 1.5067418698883057, + 1.512999187850952, + 1.517277278137207, + 1.5063294620513916, + 1.5280411059951782, + 1.5010698389434813, + 1.5042574712753296, + 1.5221018926620484, + 1.5003190943527223, + 1.502483357963562, + 1.494799020462036, + 1.5052326755142211, + 1.5050663613891602, + 1.519798519821167, + 1.5059367882919312, + 1.5141305075836182, + 1.5212347466278076, + 1.5083724868011474, + 1.5028382047271729, + 1.52472865776062, + 1.5356733351898193, + 1.5201873098373413, + 1.566948963356018, + 1.5514922919464111, + 1.558815823059082, + 1.5491892823028564, + 1.575247833518982, + 1.5376620474624634, + 1.5292223310852051, + 1.5172099410247804, + 1.5145379526138305, + 1.5038220858764648, + 1.50547469871521, + 1.5119369091033936 + ], + "train_acc": [ + 0.31842, + 0.37374, + 0.39324, + 0.40182, + 0.40412, + 0.4211, + 0.41732, + 0.42548, + 0.42548, + 0.4254, + 0.43404, + 0.43838, + 0.44018, + 0.44176, + 0.4438, + 0.44488, + 0.44962, + 0.4329, + 0.45138, + 0.45352, + 0.45012, + 0.45828, + 0.45946, + 0.45388, + 0.45988, + 0.46518, + 0.45762, + 0.462, + 0.46632, + 0.46964, + 0.4709, + 0.47326, + 0.47348, + 0.4779, + 0.47418, + 0.47572, + 0.47944, + 0.47124, + 0.47294, + 0.4799, + 0.47656, + 0.47036, + 0.476, + 0.47532, + 0.48174, + 0.47684, + 0.4653, + 0.47198, + 0.4682, + 0.47048, + 0.4705, + 0.46424, + 0.46426, + 0.4617, + 0.46056, + 0.4619, + 0.45984, + 0.45824, + 0.45614, + 0.45822, + 0.45278, + 0.45816, + 0.46198, + 0.46712, + 0.46686, + 0.45834, + 0.4546, + 0.45078, + 0.45096, + 0.45758, + 0.4504, + 0.45786, + 0.4551, + 0.45058, + 0.45946, + 0.45886, + 0.46094, + 0.45682, + 0.4567, + 0.45352, + 0.45318, + 0.45374, + 0.45124, + 0.45422, + 0.45768, + 0.45028, + 0.4471, + 0.45038, + 0.4322, + 0.44048, + 0.43662, + 0.43446, + 0.42868, + 0.44552, + 0.44874, + 0.45298, + 0.45436, + 0.45668, + 0.45604, + 0.45474 + ], + "test_acc": [ + 0.3207, + 0.3503, + 0.3527, + 0.3861, + 0.3942, + 0.4001, + 0.4306, + 0.4432, + 0.4478, + 0.4524, + 0.4585, + 0.465, + 0.458, + 0.4227, + 0.392, + 0.4192, + 0.3884, + 0.4038, + 0.4158, + 0.4077, + 0.3143, + 0.4095, + 0.3911, + 0.4277, + 0.403, + 0.3575, + 0.4462, + 0.4343, + 0.492, + 0.5031, + 0.4931, + 0.4969, + 0.4998, + 0.4965, + 0.4941, + 0.4774, + 0.4824, + 0.4616, + 0.4576, + 0.3687, + 0.3822, + 0.4509, + 0.3604, + 0.3934, + 0.397, + 0.3731, + 0.4169, + 0.4009, + 0.4215, + 0.456, + 0.4938, + 0.5047, + 0.492, + 0.4953, + 0.4836, + 0.477, + 0.4887, + 0.4833, + 0.4541, + 0.4727, + 0.4383, + 0.4087, + 0.4211, + 0.3786, + 0.3644, + 0.3657, + 0.3426, + 0.3886, + 0.4046, + 0.4387, + 0.4099, + 0.4625, + 0.4529, + 0.4586, + 0.485, + 0.4865, + 0.4843, + 0.4794, + 0.4679, + 0.4693, + 0.4615, + 0.4667, + 0.4192, + 0.418, + 0.4125, + 0.3571, + 0.3608, + 0.3457, + 0.3906, + 0.3725, + 0.4014, + 0.4286, + 0.4085, + 0.446, + 0.4485, + 0.4346, + 0.4817, + 0.485, + 0.495, + 0.4833 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.011285820975899696, + 0.07406313717365265, + 0.1594497561454773, + 0.44105973839759827 + ], + "bp_grad_norms_per_layer": [ + 1.3695491361431777e-05, + 1.8004903949986328e-06, + 9.99313783722755e-07, + 8.082909062068211e-07, + 5.473577857628698e-07 + ], + "hidden_norms_per_layer": [ + 50.53160095214844, + 103.4476089477539, + 149.35552978515625, + 182.89686584472656, + 189.6983184814453 + ] + } + }, + "dfa": { + "log": { + "train_loss": [ + 1.9700327950286864, + 1.7197770983886718, + 1.632392515296936, + 1.5972210712432862, + 1.5736680292129517, + 1.5405088848114015, + 1.5421941160202026, + 1.520421322631836, + 1.5005842459106444, + 1.4921242977905274, + 1.4844317977905273, + 1.483495234451294, + 1.4797166704177855, + 1.4774001663970948, + 1.4658505402374267, + 1.4566633183288573, + 1.4593217742156983, + 1.4601572839736938, + 1.4440136874389649, + 1.4463013646697997, + 1.4405934756088257, + 1.4422135416030883, + 1.422125124206543, + 1.4206480749130248, + 1.420827185935974, + 1.4188856798553466, + 1.4109822200775146, + 1.4247135849761963, + 1.4055966735458374, + 1.4032851572036744, + 1.410328683128357, + 1.4118695135116577, + 1.4036611133956909, + 1.3949691522216796, + 1.3968347528076173, + 1.3958281589126587, + 1.39325541847229, + 1.403240125617981, + 1.392686354484558, + 1.3892713842010498, + 1.382711388092041, + 1.389695151901245, + 1.3808801708602905, + 1.3848997201919555, + 1.3890845811843873, + 1.4066275939178468, + 1.3875241959381104, + 1.3897144681549072, + 1.3796721933746339, + 1.396430911216736, + 1.387675725402832, + 1.3777567819595338, + 1.3884191586303711, + 1.381468256187439, + 1.3925903015136718, + 1.3914262427520752, + 1.3773758321762084, + 1.3876502769851684, + 1.3776784436798095, + 1.3695590120315553, + 1.3830354277420045, + 1.3944670934677124, + 1.3798560680007934, + 1.3890421490478515, + 1.374452215538025, + 1.3832157874298097, + 1.3792221859359741, + 1.3865778247833251, + 1.398633239364624, + 1.383202797050476, + 1.4095420195388795, + 1.3881797384262085, + 1.3861817309188842, + 1.399900616531372, + 1.3711223928070069, + 1.3982175287628174, + 1.401219694595337, + 1.3866778911972046, + 1.3866484435272217, + 1.3840515439605714, + 1.3872028903961182, + 1.387791619644165, + 1.390064393234253, + 1.3949497409439087, + 1.385475379447937, + 1.394461077232361, + 1.3839679726409913, + 1.3870975177383422, + 1.3855371921157837, + 1.3954718680572509, + 1.3886094842147827, + 1.3855898504257202, + 1.3940177222824097, + 1.4014257174682616, + 1.3956065648269653, + 1.376382395401001, + 1.3796580749511718, + 1.3885908546829224, + 1.3941678115081788, + 1.4100037472152709 + ], + "train_acc": [ + 0.26468, + 0.37022, + 0.40486, + 0.42178, + 0.43042, + 0.44586, + 0.44794, + 0.45628, + 0.46218, + 0.46572, + 0.4714, + 0.47332, + 0.47372, + 0.4786, + 0.47742, + 0.48406, + 0.48038, + 0.48206, + 0.48642, + 0.48924, + 0.48912, + 0.48716, + 0.493, + 0.4975, + 0.49292, + 0.49658, + 0.49862, + 0.49692, + 0.50214, + 0.50136, + 0.50334, + 0.50208, + 0.50184, + 0.50406, + 0.50682, + 0.5067, + 0.50564, + 0.50384, + 0.50712, + 0.50984, + 0.513, + 0.50756, + 0.51442, + 0.51452, + 0.51248, + 0.50492, + 0.5094, + 0.51026, + 0.5129, + 0.50942, + 0.5128, + 0.51386, + 0.51294, + 0.51314, + 0.5097, + 0.51186, + 0.51472, + 0.51466, + 0.51572, + 0.51818, + 0.51692, + 0.51066, + 0.51592, + 0.51586, + 0.51642, + 0.51666, + 0.51496, + 0.51416, + 0.50964, + 0.51496, + 0.51284, + 0.51294, + 0.51454, + 0.51066, + 0.51986, + 0.5122, + 0.51132, + 0.51556, + 0.5143, + 0.51508, + 0.51314, + 0.51538, + 0.51624, + 0.51358, + 0.51708, + 0.5134, + 0.51714, + 0.51774, + 0.51886, + 0.51394, + 0.51664, + 0.51706, + 0.51338, + 0.5106, + 0.51576, + 0.51934, + 0.51794, + 0.51738, + 0.51044, + 0.51066 + ], + "test_acc": [ + 0.3153, + 0.3474, + 0.386, + 0.388, + 0.4166, + 0.4531, + 0.4665, + 0.471, + 0.4903, + 0.4845, + 0.4895, + 0.487, + 0.4829, + 0.4498, + 0.4608, + 0.4765, + 0.4157, + 0.4487, + 0.42, + 0.4166, + 0.4502, + 0.4119, + 0.3815, + 0.4482, + 0.4885, + 0.4125, + 0.4783, + 0.4813, + 0.5087, + 0.5166, + 0.5321, + 0.5214, + 0.5275, + 0.5214, + 0.5298, + 0.5097, + 0.498, + 0.5028, + 0.4919, + 0.4638, + 0.443, + 0.4517, + 0.4192, + 0.4341, + 0.4191, + 0.4345, + 0.4743, + 0.4441, + 0.4946, + 0.5211, + 0.5172, + 0.5296, + 0.5338, + 0.5327, + 0.5373, + 0.5275, + 0.5326, + 0.5287, + 0.5091, + 0.5058, + 0.5008, + 0.4079, + 0.451, + 0.4224, + 0.4662, + 0.4654, + 0.4191, + 0.4663, + 0.4364, + 0.4456, + 0.5066, + 0.5268, + 0.5368, + 0.5377, + 0.5413, + 0.5476, + 0.5292, + 0.529, + 0.536, + 0.5284, + 0.4941, + 0.5041, + 0.4917, + 0.4746, + 0.4656, + 0.4459, + 0.4626, + 0.3939, + 0.446, + 0.4554, + 0.4422, + 0.5023, + 0.4576, + 0.5104, + 0.5295, + 0.5327, + 0.5195, + 0.5494, + 0.5471, + 0.5413 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.08758166432380676, + 0.08265066146850586, + 0.12648510932922363, + 0.10309864580631256 + ], + "bp_grad_norms_per_layer": [ + 2.3419132048729807e-05, + 3.6119690776104107e-06, + 1.7736473409968312e-06, + 1.5713918628534884e-06, + 1.7539369991936837e-06 + ], + "hidden_norms_per_layer": [ + 47.25933837890625, + 109.33719635009766, + 155.00738525390625, + 191.0522918701172, + 219.52337646484375 + ] + } + }, + "frozen_acc": 0.4463 + }, + "123": { + "bp": { + "log": { + "train_loss": [ + 1.495588239517212, + 1.1326856233215332, + 0.9856092191314697, + 0.8843897874641419, + 0.8114790439987183, + 0.7456379578399658, + 0.697955235080719, + 0.654170990562439, + 0.6158091250801087, + 0.5829520724487305, + 0.5525357649230958, + 0.5250414242553711, + 0.5006515597724914, + 0.48423763071060183, + 0.46926417328834535, + 0.4528700869369507, + 0.43051134550094605, + 0.41593158436775207, + 0.4056923293495178, + 0.3909835531234741, + 0.3792208040237427, + 0.3660886435699463, + 0.3583825979232788, + 0.3472343339729309, + 0.33715820897102355, + 0.32825799531936645, + 0.31955092518806455, + 0.3038673452949524, + 0.2969187310600281, + 0.2933626782989502, + 0.27999647459983823, + 0.268520337266922, + 0.26634064863204954, + 0.2538251077890396, + 0.24892900864601136, + 0.24191651473999023, + 0.232765593996048, + 0.22151346509933473, + 0.222532262134552, + 0.21110695028305054, + 0.20780864106178285, + 0.19791428791999816, + 0.19185672250270844, + 0.18785401693344117, + 0.17802429156303406, + 0.1720601306962967, + 0.16842515460014343, + 0.16257646847724916, + 0.15610155190944672, + 0.15005135691642763, + 0.14009289414882659, + 0.1384709987258911, + 0.13156649881362914, + 0.12928588601112365, + 0.12685507180213929, + 0.1160386240530014, + 0.10782978903532028, + 0.10997594069480895, + 0.10836599202871322, + 0.09867196915149688, + 0.09783898058176041, + 0.08973311794519424, + 0.08834265770435333, + 0.08185022172212601, + 0.07984862296581269, + 0.07728323365688324, + 0.07318342950820923, + 0.06945570806026459, + 0.06800889924287797, + 0.06299814170360565, + 0.061575687782764434, + 0.056308155422210696, + 0.05341108487129211, + 0.05296990805625915, + 0.05296066891252994, + 0.04871720019578934, + 0.04586738684058189, + 0.04388664490222931, + 0.04339365641117096, + 0.04231060939252376, + 0.04077634312748909, + 0.039417545340061186, + 0.03753207321703434, + 0.037230935846567156, + 0.034856179753541945, + 0.03275925306677818, + 0.03446773986160755, + 0.032199940350055696, + 0.03195429321408272, + 0.030788076300621033, + 0.030068219158649444, + 0.030032526297569275, + 0.029710424115657805, + 0.02918463228583336, + 0.028123204150795937, + 0.02919030601501465, + 0.029277059656381606, + 0.027259378086328508, + 0.0266542486217618, + 0.028766508388519286 + ], + "train_acc": [ + 0.449, + 0.5959, + 0.6476, + 0.68514, + 0.71296, + 0.7388, + 0.7567, + 0.77474, + 0.7868, + 0.80072, + 0.80904, + 0.81816, + 0.82786, + 0.83348, + 0.8387, + 0.84456, + 0.85092, + 0.85656, + 0.86014, + 0.86546, + 0.86932, + 0.8738, + 0.87796, + 0.87998, + 0.88338, + 0.88642, + 0.89038, + 0.89488, + 0.8979, + 0.89792, + 0.90422, + 0.90792, + 0.90796, + 0.9129, + 0.91398, + 0.9169, + 0.91828, + 0.92408, + 0.92334, + 0.9273, + 0.92912, + 0.93154, + 0.93466, + 0.93544, + 0.938, + 0.94012, + 0.94162, + 0.94442, + 0.94616, + 0.94784, + 0.95244, + 0.9535, + 0.9548, + 0.95672, + 0.95636, + 0.96082, + 0.96466, + 0.96328, + 0.96326, + 0.96726, + 0.96682, + 0.97112, + 0.97136, + 0.97392, + 0.97444, + 0.97538, + 0.97714, + 0.97862, + 0.9784, + 0.98034, + 0.98176, + 0.98508, + 0.98458, + 0.98552, + 0.98558, + 0.98714, + 0.98738, + 0.98786, + 0.98852, + 0.98858, + 0.98988, + 0.9895, + 0.99064, + 0.99092, + 0.99166, + 0.99262, + 0.9916, + 0.99292, + 0.9927, + 0.99356, + 0.99404, + 0.99396, + 0.9941, + 0.9939, + 0.99516, + 0.9942, + 0.99396, + 0.99498, + 0.99516, + 0.99404 + ], + "test_acc": [ + 0.4668, + 0.4975, + 0.6427, + 0.6186, + 0.7044, + 0.6675, + 0.7212, + 0.7318, + 0.7142, + 0.7239, + 0.7613, + 0.7318, + 0.7903, + 0.7557, + 0.7618, + 0.7681, + 0.8016, + 0.8023, + 0.8207, + 0.7878, + 0.8081, + 0.8078, + 0.7974, + 0.7988, + 0.8218, + 0.8317, + 0.7977, + 0.8371, + 0.8246, + 0.8268, + 0.8343, + 0.8101, + 0.8236, + 0.8219, + 0.8504, + 0.8422, + 0.831, + 0.829, + 0.8335, + 0.8489, + 0.8335, + 0.8383, + 0.8255, + 0.8291, + 0.8579, + 0.8497, + 0.8458, + 0.8448, + 0.8602, + 0.842, + 0.8673, + 0.8624, + 0.867, + 0.8614, + 0.8556, + 0.861, + 0.843, + 0.8513, + 0.8648, + 0.8534, + 0.8559, + 0.8508, + 0.8663, + 0.8608, + 0.8662, + 0.8685, + 0.8674, + 0.8685, + 0.8683, + 0.8697, + 0.873, + 0.8691, + 0.8666, + 0.8732, + 0.8669, + 0.8759, + 0.8702, + 0.8755, + 0.8744, + 0.873, + 0.8745, + 0.8724, + 0.8718, + 0.8709, + 0.8737, + 0.8734, + 0.8763, + 0.8753, + 0.8751, + 0.8748, + 0.8747, + 0.8759, + 0.8744, + 0.8748, + 0.8741, + 0.8746, + 0.875, + 0.8757, + 0.8757, + 0.8751 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "bp_grad_norms_per_layer": [ + 6.912577532602882e-08, + 1.1992902670954209e-07, + 1.1417370160415885e-07, + 2.9605759621631478e-08, + 7.1233121623492934e-09 + ], + "hidden_norms_per_layer": [ + 1.5058701038360596, + 2.3091824054718018, + 3.9312002658843994, + 8.719876289367676, + 17.75613784790039 + ] + } + }, + "fa": { + "log": { + "train_loss": [ + 1.8659718270111083, + 1.683680397567749, + 1.612106671218872, + 1.5741597354888917, + 1.5599941147613525, + 1.5427036904144287, + 1.5440460584259033, + 1.5428195544815064, + 1.5271256440734864, + 1.5313361112594603, + 1.5289501099395753, + 1.513870721130371, + 1.5121803590393066, + 1.5032499996566773, + 1.512363984184265, + 1.5016355478668213, + 1.5096042656707764, + 1.492105902671814, + 1.4917547158050537, + 1.4900038906860351, + 1.4975745567321777, + 1.493273950843811, + 1.5052244140625, + 1.5001088582611084, + 1.5032766550445558, + 1.5210559719085692, + 1.5131746913909911, + 1.4969936119842528, + 1.5052455416107178, + 1.5028073372650146, + 1.509829647216797, + 1.5195129321670533, + 1.4970213110351562, + 1.5049412929916381, + 1.4949871908187866, + 1.4840487638092041, + 1.5036991092300416, + 1.4982619463348388, + 1.4966608276367188, + 1.5110313299179077, + 1.5175931993865968, + 1.5064766229248048, + 1.5220397052764894, + 1.5112490351104737, + 1.5147967623138427, + 1.5128357276153563, + 1.5076934622192384, + 1.5041581441879273, + 1.5137867282485962, + 1.5087187747573854, + 1.5027286514663696, + 1.5078837477111817, + 1.5078793271636963, + 1.5332094471740723, + 1.5532902967071534, + 1.531460919418335, + 1.526025957069397, + 1.545231460647583, + 1.5436910135269164, + 1.5562543505859374, + 1.592395346107483, + 1.5260646786499024, + 1.510891372642517, + 1.5131159967422485, + 1.5337466653823852, + 1.570516603012085, + 1.5490166927719116, + 1.5552853171539307, + 1.5633169314193727, + 1.5687613497543336, + 1.5776711074447631, + 1.550319636154175, + 1.5639197861099243, + 1.5420448788452148, + 1.5506871451187134, + 1.5436728594970703, + 1.544439082107544, + 1.5564761966323852, + 1.5428286236572266, + 1.5689187644577027, + 1.5568335976409913, + 1.5351758861541749, + 1.5409207321929932, + 1.5642808813858031, + 1.5521496292495727, + 1.5486036518096924, + 1.5483359182739258, + 1.5397209240722656, + 1.5328784543228149, + 1.5347419134521485, + 1.5272779167175292, + 1.5183787253189087, + 1.5255509783172607, + 1.5052685770416259, + 1.5213663787841798, + 1.4785558428573609, + 1.4870614541244507, + 1.4948050667953492, + 1.4956997775650025, + 1.5064945538711547 + ], + "train_acc": [ + 0.3056, + 0.37904, + 0.4103, + 0.42516, + 0.43474, + 0.44184, + 0.4445, + 0.44374, + 0.4478, + 0.4489, + 0.45134, + 0.45386, + 0.45748, + 0.45826, + 0.45484, + 0.45908, + 0.45536, + 0.46316, + 0.46284, + 0.46542, + 0.4616, + 0.46186, + 0.45934, + 0.45926, + 0.45776, + 0.44942, + 0.45392, + 0.4577, + 0.45366, + 0.4564, + 0.45234, + 0.4506, + 0.45694, + 0.45458, + 0.45722, + 0.46484, + 0.46076, + 0.45914, + 0.46288, + 0.45626, + 0.45278, + 0.45988, + 0.4519, + 0.45574, + 0.45572, + 0.45734, + 0.45724, + 0.4602, + 0.45514, + 0.4564, + 0.46106, + 0.45974, + 0.45838, + 0.44886, + 0.44068, + 0.45242, + 0.45194, + 0.44476, + 0.44334, + 0.44222, + 0.42254, + 0.44746, + 0.45404, + 0.45282, + 0.4468, + 0.42856, + 0.44068, + 0.43984, + 0.43342, + 0.43192, + 0.43184, + 0.43894, + 0.433, + 0.44186, + 0.4392, + 0.44028, + 0.44122, + 0.43994, + 0.4433, + 0.43554, + 0.43714, + 0.44596, + 0.44356, + 0.4375, + 0.4413, + 0.44216, + 0.44138, + 0.45042, + 0.45134, + 0.44988, + 0.45178, + 0.4552, + 0.44996, + 0.45752, + 0.45072, + 0.46666, + 0.46272, + 0.46206, + 0.45912, + 0.4544 + ], + "test_acc": [ + 0.2557, + 0.3587, + 0.3773, + 0.4178, + 0.4133, + 0.4564, + 0.453, + 0.4769, + 0.4726, + 0.4852, + 0.4752, + 0.4801, + 0.4714, + 0.4655, + 0.4422, + 0.4411, + 0.4299, + 0.3935, + 0.3857, + 0.3673, + 0.3759, + 0.4085, + 0.3923, + 0.4606, + 0.4338, + 0.359, + 0.4343, + 0.4325, + 0.447, + 0.489, + 0.4758, + 0.4802, + 0.484, + 0.482, + 0.4826, + 0.4847, + 0.4832, + 0.4697, + 0.4249, + 0.409, + 0.409, + 0.3935, + 0.3071, + 0.4144, + 0.3761, + 0.3694, + 0.3964, + 0.3913, + 0.4114, + 0.465, + 0.4863, + 0.4788, + 0.4888, + 0.4753, + 0.4704, + 0.483, + 0.492, + 0.4622, + 0.4634, + 0.4524, + 0.4046, + 0.4036, + 0.4197, + 0.4015, + 0.3201, + 0.3319, + 0.3996, + 0.2774, + 0.317, + 0.4131, + 0.4293, + 0.4107, + 0.4385, + 0.4546, + 0.4745, + 0.4664, + 0.4682, + 0.4707, + 0.4637, + 0.4634, + 0.4574, + 0.4256, + 0.3755, + 0.3476, + 0.3271, + 0.2652, + 0.3075, + 0.3732, + 0.3428, + 0.3723, + 0.3851, + 0.4178, + 0.4538, + 0.4451, + 0.4813, + 0.4791, + 0.4951, + 0.4864, + 0.474, + 0.4701 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.07231192290782928, + 0.08217933773994446, + 0.15553204715251923, + 0.4070398211479187 + ], + "bp_grad_norms_per_layer": [ + 1.9104201783193275e-05, + 2.399963932475657e-06, + 1.234139631378639e-06, + 1.0221878028460196e-06, + 7.074656309669081e-07 + ], + "hidden_norms_per_layer": [ + 55.40227127075195, + 103.83504486083984, + 151.3930206298828, + 184.45449829101562, + 189.0428466796875 + ] + } + }, + "dfa": { + "log": { + "train_loss": [ + 1.9979866750717163, + 1.7517047381591797, + 1.666371762084961, + 1.600228463973999, + 1.5743235528182984, + 1.5476901987457274, + 1.5314745957183837, + 1.5130221286010743, + 1.4985457011795045, + 1.5043407316970825, + 1.4782429806900024, + 1.4846010361099242, + 1.4903296518325806, + 1.489443695526123, + 1.4796258502960205, + 1.48433977848053, + 1.4877143989562989, + 1.4892795726776122, + 1.4888588542175294, + 1.4829449924087525, + 1.4706789566802978, + 1.4695693682861328, + 1.4745273109054566, + 1.4871982336044312, + 1.469974294166565, + 1.4704977536773682, + 1.4612956504058838, + 1.471293696861267, + 1.4503397106933593, + 1.4601988890838622, + 1.4435253295516968, + 1.447725463256836, + 1.4467037618637084, + 1.4500885382843018, + 1.455040583152771, + 1.4443602278137206, + 1.447977113723755, + 1.4414146844100952, + 1.4293622527694703, + 1.4400424856185914, + 1.4403304705047608, + 1.430347915916443, + 1.4418269156646728, + 1.4286183041763305, + 1.431903427810669, + 1.43258889087677, + 1.4342171427154542, + 1.4285272072219848, + 1.4248057216644288, + 1.4252272537231445, + 1.4247102612304687, + 1.420763522605896, + 1.427785071258545, + 1.4206389274978637, + 1.4140512529754639, + 1.430296021385193, + 1.4163820014190673, + 1.4163366886138915, + 1.4075730377578735, + 1.4129050022506713, + 1.412215914993286, + 1.4040869583511353, + 1.4064097495269776, + 1.4082780233383179, + 1.3974828253936769, + 1.3907576309585572, + 1.3999906717681885, + 1.4001604806137085, + 1.3971656357192994, + 1.3846220355606078, + 1.413904198036194, + 1.3953790336990357, + 1.407677121810913, + 1.4085192776870727, + 1.3891954959869384, + 1.3969441717147828, + 1.3953401776123047, + 1.4075214514541625, + 1.392098694076538, + 1.4014366470336914, + 1.383703885116577, + 1.3975200021362304, + 1.3966769958114624, + 1.395452327079773, + 1.3924421725082397, + 1.392994442138672, + 1.3946838153839112, + 1.3889806948471068, + 1.4011986894607544, + 1.392875761756897, + 1.3996651697540283, + 1.3918553145599366, + 1.3905788117218019, + 1.3978934088897705, + 1.395444873085022, + 1.3836221188735962, + 1.3835073752593994, + 1.3996466543579102, + 1.3921513790512086, + 1.3886110556030273 + ], + "train_acc": [ + 0.25512, + 0.35406, + 0.39256, + 0.41872, + 0.42746, + 0.44032, + 0.44904, + 0.45578, + 0.46216, + 0.46186, + 0.47208, + 0.4704, + 0.46696, + 0.46728, + 0.46982, + 0.47016, + 0.46732, + 0.47058, + 0.46704, + 0.47188, + 0.47184, + 0.47774, + 0.47564, + 0.46992, + 0.47904, + 0.47598, + 0.4805, + 0.4798, + 0.48436, + 0.4804, + 0.48658, + 0.4882, + 0.48746, + 0.48498, + 0.4856, + 0.48972, + 0.48944, + 0.4911, + 0.49712, + 0.49246, + 0.49236, + 0.49502, + 0.49186, + 0.4949, + 0.49132, + 0.49518, + 0.49632, + 0.49714, + 0.49698, + 0.4976, + 0.49764, + 0.49996, + 0.4982, + 0.50006, + 0.50194, + 0.49868, + 0.50102, + 0.5003, + 0.50452, + 0.50352, + 0.50094, + 0.50638, + 0.50562, + 0.50712, + 0.50918, + 0.51182, + 0.50668, + 0.50992, + 0.51012, + 0.51506, + 0.50606, + 0.50954, + 0.50492, + 0.50494, + 0.51098, + 0.50954, + 0.5119, + 0.50756, + 0.5122, + 0.5099, + 0.51502, + 0.51232, + 0.51182, + 0.51178, + 0.51356, + 0.51212, + 0.5126, + 0.5151, + 0.50946, + 0.51328, + 0.51028, + 0.51492, + 0.51728, + 0.51268, + 0.5116, + 0.5164, + 0.51488, + 0.51248, + 0.51738, + 0.51552 + ], + "test_acc": [ + 0.2659, + 0.3594, + 0.3468, + 0.4054, + 0.4209, + 0.4382, + 0.4645, + 0.4759, + 0.484, + 0.4903, + 0.4803, + 0.4829, + 0.4731, + 0.48, + 0.4662, + 0.4533, + 0.4632, + 0.4207, + 0.4454, + 0.4012, + 0.4227, + 0.4392, + 0.4277, + 0.4557, + 0.4545, + 0.4582, + 0.48, + 0.4613, + 0.5073, + 0.5058, + 0.5176, + 0.5158, + 0.5175, + 0.5144, + 0.504, + 0.4989, + 0.4939, + 0.4828, + 0.4713, + 0.4078, + 0.4124, + 0.4353, + 0.4391, + 0.4563, + 0.4511, + 0.4067, + 0.4166, + 0.4923, + 0.4659, + 0.5016, + 0.5189, + 0.523, + 0.5282, + 0.5231, + 0.5334, + 0.5074, + 0.5186, + 0.5232, + 0.5093, + 0.4995, + 0.467, + 0.4539, + 0.441, + 0.4158, + 0.4242, + 0.3758, + 0.4375, + 0.2489, + 0.4025, + 0.453, + 0.5135, + 0.4813, + 0.5284, + 0.5371, + 0.5471, + 0.5423, + 0.5411, + 0.5358, + 0.5337, + 0.5311, + 0.5235, + 0.4908, + 0.464, + 0.4208, + 0.4237, + 0.4022, + 0.3981, + 0.3835, + 0.3665, + 0.466, + 0.3939, + 0.4512, + 0.5103, + 0.4967, + 0.5091, + 0.5297, + 0.5453, + 0.5533, + 0.5418, + 0.548 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.09619210660457611, + 0.07335361838340759, + 0.09598866105079651, + 0.12553545832633972 + ], + "bp_grad_norms_per_layer": [ + 2.3029326257528737e-05, + 3.30211491927912e-06, + 1.7296084706686088e-06, + 1.7123409179475857e-06, + 1.822835770326492e-06 + ], + "hidden_norms_per_layer": [ + 46.774864196777344, + 112.76661682128906, + 160.17086791992188, + 191.71311950683594, + 218.50283813476562 + ] + } + }, + "frozen_acc": 0.439 + }, + "456": { + "bp": { + "log": { + "train_loss": [ + 1.5160641179275514, + 1.1373616902923585, + 0.9867977604675293, + 0.879104539604187, + 0.8026973062515259, + 0.7398024030876159, + 0.6849897325134278, + 0.6419805959129333, + 0.6066270620346069, + 0.5656318543624878, + 0.5430069333076477, + 0.5161823916244507, + 0.4938885500907898, + 0.4700241546821594, + 0.45997175704956056, + 0.4387467160606384, + 0.424728159160614, + 0.4102775760555267, + 0.39500373538017275, + 0.3853588530731201, + 0.3722192826938629, + 0.3609906807899475, + 0.35011868640899657, + 0.3387249102306366, + 0.32812179962158206, + 0.32087999514579774, + 0.3091567077445984, + 0.30012500077247617, + 0.28842351221084594, + 0.2877265364074707, + 0.27251338097572325, + 0.26745018371105195, + 0.25646164291858675, + 0.25673630625247956, + 0.24372106365203858, + 0.23358901292800904, + 0.23192961641311646, + 0.2255696634578705, + 0.21565012225151062, + 0.20677277130126953, + 0.20152188514709474, + 0.19581060210227966, + 0.19028258794784547, + 0.1841914382791519, + 0.17373496751785278, + 0.17271406743049622, + 0.16331802525043487, + 0.15863498505592347, + 0.14999562792301177, + 0.14473856409549712, + 0.14406693646430968, + 0.14047701974868773, + 0.1324915998506546, + 0.1275099449801445, + 0.12249933202266693, + 0.11727544169425964, + 0.11460136109352112, + 0.10892109509944915, + 0.10204498662948608, + 0.09586662238121033, + 0.09406495225906372, + 0.08779436621665955, + 0.087703556432724, + 0.08578594008922577, + 0.07818658845186234, + 0.07675694673776627, + 0.07220518976211548, + 0.06950767105042935, + 0.06377516150712967, + 0.06165861406207085, + 0.06159033078074455, + 0.058180121289491654, + 0.05655836649179458, + 0.05223947284221649, + 0.05033184681296349, + 0.04905604504346848, + 0.04456530170381069, + 0.04502734445810318, + 0.04437524861574173, + 0.04308886869430542, + 0.03868388356208801, + 0.03812801341593266, + 0.03718253348588944, + 0.03652035888537765, + 0.0338644351452589, + 0.03453644402831793, + 0.032784310665130614, + 0.03278352576315403, + 0.031418144221305844, + 0.030436194059848785, + 0.02994262287378311, + 0.03070086252808571, + 0.02871063878774643, + 0.030094075206518172, + 0.02943230504631996, + 0.027803415595293045, + 0.028644300409555436, + 0.028327953987121582, + 0.028030424483418463, + 0.027398860431313513 + ], + "train_acc": [ + 0.44308, + 0.59558, + 0.65168, + 0.68998, + 0.7194, + 0.7423, + 0.7602, + 0.77614, + 0.79044, + 0.80464, + 0.81352, + 0.82222, + 0.83044, + 0.83888, + 0.84234, + 0.85044, + 0.85332, + 0.859, + 0.86514, + 0.86824, + 0.87012, + 0.87526, + 0.8781, + 0.88222, + 0.8871, + 0.88816, + 0.89312, + 0.89714, + 0.89986, + 0.89924, + 0.90564, + 0.90728, + 0.9118, + 0.91082, + 0.91566, + 0.9195, + 0.91938, + 0.9218, + 0.92472, + 0.92866, + 0.93012, + 0.9323, + 0.93438, + 0.93586, + 0.94102, + 0.94056, + 0.94362, + 0.9455, + 0.94822, + 0.95118, + 0.94988, + 0.95224, + 0.95454, + 0.9569, + 0.95858, + 0.96016, + 0.96116, + 0.96306, + 0.9657, + 0.9686, + 0.96904, + 0.97188, + 0.97136, + 0.9718, + 0.97554, + 0.9755, + 0.97714, + 0.97796, + 0.98142, + 0.98202, + 0.9814, + 0.98234, + 0.9833, + 0.98538, + 0.98568, + 0.98642, + 0.98808, + 0.98796, + 0.98826, + 0.98844, + 0.99046, + 0.99028, + 0.99066, + 0.9907, + 0.99234, + 0.99216, + 0.9928, + 0.99288, + 0.9932, + 0.99352, + 0.99434, + 0.99378, + 0.99432, + 0.9936, + 0.994, + 0.99482, + 0.99412, + 0.99418, + 0.99446, + 0.99458 + ], + "test_acc": [ + 0.5183, + 0.5736, + 0.6279, + 0.6712, + 0.6831, + 0.7037, + 0.7237, + 0.7395, + 0.7255, + 0.7823, + 0.7595, + 0.7661, + 0.7836, + 0.759, + 0.7763, + 0.7452, + 0.7823, + 0.81, + 0.8002, + 0.8178, + 0.8219, + 0.7635, + 0.7796, + 0.8069, + 0.817, + 0.801, + 0.8244, + 0.8341, + 0.8304, + 0.8073, + 0.8264, + 0.8266, + 0.8423, + 0.8438, + 0.8508, + 0.8521, + 0.8528, + 0.8569, + 0.8246, + 0.847, + 0.8519, + 0.834, + 0.8514, + 0.8564, + 0.8668, + 0.8543, + 0.8501, + 0.8509, + 0.8432, + 0.8499, + 0.8521, + 0.8618, + 0.8625, + 0.8683, + 0.8661, + 0.8431, + 0.8536, + 0.8602, + 0.861, + 0.8676, + 0.8685, + 0.8694, + 0.8659, + 0.8662, + 0.8693, + 0.8665, + 0.8729, + 0.8673, + 0.8773, + 0.8757, + 0.8698, + 0.8681, + 0.8717, + 0.8755, + 0.872, + 0.8735, + 0.8739, + 0.8748, + 0.8769, + 0.877, + 0.8746, + 0.8774, + 0.8766, + 0.8746, + 0.8767, + 0.8777, + 0.8767, + 0.8767, + 0.8764, + 0.8771, + 0.8788, + 0.878, + 0.8773, + 0.8789, + 0.8774, + 0.8777, + 0.8776, + 0.8783, + 0.8783, + 0.8773 + ] + }, + "diagnostics": { + "bp_cosine": [ + 1.0, + 1.0, + 1.0, + 1.0 + ], + "bp_grad_norms_per_layer": [ + 1.1557457213484668e-07, + 1.5904217320894531e-07, + 1.3247040442365687e-07, + 3.798226444473585e-08, + 9.729313354966962e-09 + ], + "hidden_norms_per_layer": [ + 1.7021474838256836, + 2.5449094772338867, + 4.418560028076172, + 9.197453498840332, + 18.361495971679688 + ] + } + }, + "fa": { + "log": { + "train_loss": [ + 1.8388006496429443, + 1.6388477425384522, + 1.5723047241592407, + 1.5523447470474243, + 1.5415249212646485, + 1.5431161571502685, + 1.5355080755996704, + 1.5270839902877809, + 1.5336033702087402, + 1.539637003250122, + 1.54302769657135, + 1.538811323776245, + 1.5301817972564697, + 1.513635392112732, + 1.511602727394104, + 1.5054410875320434, + 1.4944276239395142, + 1.4915078888702393, + 1.505673057899475, + 1.4965799645996094, + 1.4820210153961182, + 1.470949204788208, + 1.5031878339385987, + 1.5060544648742675, + 1.5197064126205444, + 1.5097587853240966, + 1.4998890134429932, + 1.5088149597930909, + 1.5380420586013794, + 1.5479945287322998, + 1.5401077768707276, + 1.5486767250823974, + 1.5603229951858522, + 1.558787651863098, + 1.572075382347107, + 1.5438019393157958, + 1.542765788040161, + 1.5333216193389894, + 1.524303759613037, + 1.5235723961639405, + 1.5214403876495362, + 1.5204402813720703, + 1.541364458580017, + 1.5012250566864014, + 1.5124277173614502, + 1.5230836597061157, + 1.5412120163726806, + 1.5329921883392335, + 1.5200326070404053, + 1.5141836537933349, + 1.517231360168457, + 1.5352338036346436, + 1.533933445968628, + 1.5161780032348633, + 1.5225077356719972, + 1.5297851563262939, + 1.513075235671997, + 1.5052410777664185, + 1.515364197921753, + 1.5016302545166016, + 1.5332107681274414, + 1.5103576389312745, + 1.5200442121124267, + 1.5020100690078735, + 1.5109573263931275, + 1.4995048323822022, + 1.4985650747299195, + 1.4828378940200806, + 1.4779076181030273, + 1.4760516178131105, + 1.4895838101196288, + 1.4858886737823487, + 1.4851336638259887, + 1.500923940010071, + 1.4823656270599366, + 1.4936273226928711, + 1.4718116438674926, + 1.479018363571167, + 1.4953905407714845, + 1.4994900365447998, + 1.4885512816619872, + 1.480618069229126, + 1.5012863097381592, + 1.506208432044983, + 1.4944241470336914, + 1.49456167137146, + 1.5098730950164796, + 1.5051140392303466, + 1.5134692226409912, + 1.5226804944229126, + 1.5144084841918946, + 1.5232038221740722, + 1.5139210459136963, + 1.5156014365005492, + 1.52377382938385, + 1.5234981735229491, + 1.5224218480682372, + 1.5218167197036743, + 1.5318193957138062, + 1.5287795416259766 + ], + "train_acc": [ + 0.31774, + 0.3982, + 0.42496, + 0.43068, + 0.44088, + 0.44126, + 0.44228, + 0.44938, + 0.44294, + 0.44418, + 0.44554, + 0.44738, + 0.44878, + 0.45672, + 0.45624, + 0.45514, + 0.46162, + 0.46508, + 0.4537, + 0.45884, + 0.4671, + 0.47226, + 0.45796, + 0.45434, + 0.45222, + 0.45602, + 0.4592, + 0.45838, + 0.4486, + 0.4429, + 0.44742, + 0.44442, + 0.44166, + 0.44236, + 0.43566, + 0.44358, + 0.44418, + 0.44772, + 0.45104, + 0.45326, + 0.4502, + 0.45424, + 0.44642, + 0.45936, + 0.4546, + 0.45028, + 0.44218, + 0.44476, + 0.44862, + 0.45316, + 0.45018, + 0.44558, + 0.445, + 0.44918, + 0.44712, + 0.44466, + 0.45282, + 0.45582, + 0.45008, + 0.45656, + 0.44814, + 0.4574, + 0.4478, + 0.45758, + 0.45634, + 0.45834, + 0.458, + 0.4626, + 0.46408, + 0.46842, + 0.46282, + 0.46148, + 0.4641, + 0.45702, + 0.46232, + 0.46062, + 0.469, + 0.46806, + 0.45776, + 0.45832, + 0.46242, + 0.46564, + 0.45702, + 0.45586, + 0.4598, + 0.46158, + 0.45398, + 0.45968, + 0.45214, + 0.44914, + 0.45398, + 0.44604, + 0.45474, + 0.4488, + 0.44712, + 0.44762, + 0.4469, + 0.45234, + 0.4448, + 0.44538 + ], + "test_acc": [ + 0.3086, + 0.3587, + 0.3434, + 0.3477, + 0.4298, + 0.4628, + 0.4504, + 0.4734, + 0.4801, + 0.4632, + 0.4663, + 0.4767, + 0.4678, + 0.4424, + 0.4285, + 0.428, + 0.4418, + 0.3465, + 0.4019, + 0.3723, + 0.3955, + 0.3582, + 0.3886, + 0.3837, + 0.4198, + 0.4193, + 0.405, + 0.4546, + 0.4503, + 0.4776, + 0.47, + 0.4658, + 0.4401, + 0.4718, + 0.4374, + 0.4485, + 0.4589, + 0.3954, + 0.4312, + 0.406, + 0.3895, + 0.3406, + 0.338, + 0.3789, + 0.3933, + 0.3649, + 0.3774, + 0.3894, + 0.4353, + 0.4685, + 0.4606, + 0.4865, + 0.4834, + 0.4816, + 0.4656, + 0.4809, + 0.4869, + 0.4569, + 0.4697, + 0.4341, + 0.44, + 0.4354, + 0.395, + 0.3731, + 0.3257, + 0.4188, + 0.3973, + 0.3604, + 0.3774, + 0.4403, + 0.4193, + 0.4522, + 0.4503, + 0.487, + 0.4902, + 0.4957, + 0.508, + 0.4846, + 0.4724, + 0.4804, + 0.4706, + 0.4534, + 0.4274, + 0.4526, + 0.444, + 0.359, + 0.3653, + 0.3762, + 0.3793, + 0.3683, + 0.3477, + 0.4465, + 0.4061, + 0.4241, + 0.4229, + 0.4535, + 0.4707, + 0.4677, + 0.4769, + 0.474 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.058251358568668365, + 0.0052527980878949165, + 0.16866855323314667, + 0.40164506435394287 + ], + "bp_grad_norms_per_layer": [ + 1.2751997928717174e-05, + 3.002295898113516e-06, + 1.257812300536898e-06, + 8.748378945711011e-07, + 6.224869366633357e-07 + ], + "hidden_norms_per_layer": [ + 53.4076042175293, + 94.59198760986328, + 138.4558868408203, + 174.03082275390625, + 177.5882568359375 + ] + } + }, + "dfa": { + "log": { + "train_loss": [ + 1.9832865395355224, + 1.7502513399887085, + 1.6449337438201905, + 1.6053136781311035, + 1.5808841290664672, + 1.5549153183364868, + 1.5427701051330567, + 1.534728247947693, + 1.5328357236480712, + 1.5239458906555177, + 1.5125219562530519, + 1.5000166980743408, + 1.499222512741089, + 1.4927287301635743, + 1.5004344689941407, + 1.4861587203216553, + 1.4685827215576173, + 1.463277092437744, + 1.4733178770065307, + 1.4807002882003784, + 1.4656713399505614, + 1.4568580744552613, + 1.4681837302780152, + 1.4557059508895873, + 1.4571999851989745, + 1.4609215265655517, + 1.4586345113754273, + 1.4629971759796143, + 1.4590657321166993, + 1.4617421231460572, + 1.4511952079010009, + 1.461978643836975, + 1.453667638092041, + 1.4468986032104492, + 1.4443752507781982, + 1.4449514136505126, + 1.4444499270248412, + 1.4468188973999023, + 1.439971184463501, + 1.4227961892700196, + 1.4266341059494019, + 1.422662779006958, + 1.426161422729492, + 1.4228117908477784, + 1.427011708984375, + 1.4431268807220459, + 1.4146196817398071, + 1.4275095965576172, + 1.4253623778915405, + 1.4229059297561646, + 1.4180848153305055, + 1.4208539867782592, + 1.4236131421661378, + 1.4215651251983643, + 1.4113855828857422, + 1.4156936545562744, + 1.4165809607696533, + 1.4152497507095336, + 1.4176463265228272, + 1.4037966454696655, + 1.4144108854675292, + 1.4033693023681642, + 1.4085983514785767, + 1.4072367011260987, + 1.4190242646026612, + 1.4065343897628784, + 1.4055108359909059, + 1.4067657685089112, + 1.4057906729507446, + 1.4030395392608643, + 1.4049832558822632, + 1.4050726447296142, + 1.4044393698120117, + 1.4132345629882812, + 1.4143582116699218, + 1.4134309550857544, + 1.402359348526001, + 1.3989218573379516, + 1.4112048414611817, + 1.4131255010986328, + 1.3988475032043457, + 1.4039105146026611, + 1.4007704114151, + 1.4156162036895752, + 1.4040945704650878, + 1.3912679317855834, + 1.4181099109649657, + 1.4037213237762451, + 1.4149015707778931, + 1.4188450262069703, + 1.3975644765090942, + 1.4184134230804444, + 1.4000829550933838, + 1.4012997241210938, + 1.4128226322174073, + 1.4041969888687134, + 1.4022131369781494, + 1.408169732055664, + 1.4077017026901244, + 1.401384118461609 + ], + "train_acc": [ + 0.27112, + 0.36064, + 0.40478, + 0.41718, + 0.42858, + 0.44078, + 0.44306, + 0.4494, + 0.45062, + 0.45602, + 0.45942, + 0.4644, + 0.46126, + 0.46632, + 0.46514, + 0.46942, + 0.47602, + 0.48078, + 0.47528, + 0.47308, + 0.4787, + 0.48544, + 0.47896, + 0.48336, + 0.4838, + 0.4813, + 0.48428, + 0.4804, + 0.48508, + 0.4835, + 0.48618, + 0.48328, + 0.48842, + 0.49088, + 0.48918, + 0.49114, + 0.49146, + 0.4912, + 0.49384, + 0.49812, + 0.4967, + 0.49934, + 0.49922, + 0.49834, + 0.49984, + 0.4932, + 0.49898, + 0.49748, + 0.49922, + 0.5005, + 0.50234, + 0.50114, + 0.49996, + 0.50416, + 0.50542, + 0.50446, + 0.50272, + 0.50446, + 0.5037, + 0.50842, + 0.50524, + 0.5119, + 0.50634, + 0.50902, + 0.50526, + 0.50828, + 0.50806, + 0.50748, + 0.50902, + 0.51128, + 0.50924, + 0.50872, + 0.5103, + 0.50704, + 0.50846, + 0.50658, + 0.51196, + 0.5129, + 0.50898, + 0.50978, + 0.51132, + 0.50952, + 0.5122, + 0.51048, + 0.51124, + 0.51608, + 0.50632, + 0.51178, + 0.50774, + 0.507, + 0.51196, + 0.50764, + 0.51432, + 0.51292, + 0.50924, + 0.515, + 0.51512, + 0.5099, + 0.51278, + 0.51376 + ], + "test_acc": [ + 0.2675, + 0.3692, + 0.3562, + 0.3556, + 0.4334, + 0.462, + 0.4672, + 0.4809, + 0.4729, + 0.4752, + 0.494, + 0.4868, + 0.4799, + 0.4728, + 0.4611, + 0.4517, + 0.4326, + 0.351, + 0.3931, + 0.4196, + 0.4363, + 0.4205, + 0.434, + 0.448, + 0.4435, + 0.4335, + 0.4635, + 0.479, + 0.4596, + 0.4963, + 0.5133, + 0.5136, + 0.5115, + 0.5249, + 0.4836, + 0.5063, + 0.4954, + 0.452, + 0.4942, + 0.3831, + 0.41, + 0.3788, + 0.3498, + 0.4271, + 0.4629, + 0.4629, + 0.4719, + 0.4597, + 0.4492, + 0.5074, + 0.5105, + 0.517, + 0.5225, + 0.5369, + 0.5273, + 0.5189, + 0.5249, + 0.5052, + 0.5099, + 0.5056, + 0.4619, + 0.4698, + 0.4649, + 0.4008, + 0.4123, + 0.4251, + 0.3647, + 0.4546, + 0.4994, + 0.4953, + 0.4378, + 0.5049, + 0.512, + 0.5291, + 0.538, + 0.5387, + 0.5379, + 0.5368, + 0.5373, + 0.5233, + 0.5246, + 0.4641, + 0.4691, + 0.5015, + 0.4382, + 0.4761, + 0.416, + 0.464, + 0.4394, + 0.4196, + 0.3663, + 0.4529, + 0.4557, + 0.4781, + 0.5161, + 0.5182, + 0.5327, + 0.5406, + 0.5435, + 0.5315 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.09811964631080627, + 0.05562638118863106, + 0.13867022097110748, + 0.1304049789905548 + ], + "bp_grad_norms_per_layer": [ + 3.095270585617982e-05, + 3.172246806570911e-06, + 1.7334730273432797e-06, + 1.652150672271091e-06, + 1.706813350210723e-06 + ], + "hidden_norms_per_layer": [ + 47.190711975097656, + 108.21077728271484, + 148.76641845703125, + 181.61634826660156, + 217.3177947998047 + ] + } + }, + "frozen_acc": 0.4401 + } +} \ No newline at end of file diff --git a/results/resnet_protocol_validation.log b/results/resnet_protocol_validation.log new file mode 100644 index 0000000..56837e8 --- /dev/null +++ b/results/resnet_protocol_validation.log @@ -0,0 +1,161 @@ + +============================================================ +Seed 42 +============================================================ + +--- BP --- + [BP] ep 10: acc=0.7538 + [BP] ep 20: acc=0.8337 + [BP] ep 30: acc=0.8516 + [BP] ep 40: acc=0.8572 + [BP] ep 50: acc=0.8668 + [BP] ep 60: acc=0.8701 + [BP] ep 70: acc=0.8727 + [BP] ep 80: acc=0.8771 + [BP] ep 90: acc=0.8784 + [BP] ep 100: acc=0.8769 + +--- FA --- + [FA] ep 10: acc=0.4524 + [FA] ep 20: acc=0.4077 + [FA] ep 30: acc=0.5031 + [FA] ep 40: acc=0.3687 + [FA] ep 50: acc=0.4560 + [FA] ep 60: acc=0.4727 + [FA] ep 70: acc=0.4387 + [FA] ep 80: acc=0.4693 + [FA] ep 90: acc=0.3725 + [FA] ep 100: acc=0.4833 + +--- DFA --- + [DFA] ep 10: acc=0.4845 + [DFA] ep 20: acc=0.4166 + [DFA] ep 30: acc=0.5166 + [DFA] ep 40: acc=0.4638 + [DFA] ep 50: acc=0.5211 + [DFA] ep 60: acc=0.5058 + [DFA] ep 70: acc=0.4456 + [DFA] ep 80: acc=0.5284 + [DFA] ep 90: acc=0.4554 + [DFA] ep 100: acc=0.5413 + +--- Frozen --- + [Frozen] ep 10: acc=0.3769 + [Frozen] ep 20: acc=0.3981 + [Frozen] ep 30: acc=0.4072 + [Frozen] ep 40: acc=0.4203 + [Frozen] ep 50: acc=0.4224 + [Frozen] ep 60: acc=0.4352 + [Frozen] ep 70: acc=0.4428 + [Frozen] ep 80: acc=0.4420 + [Frozen] ep 90: acc=0.4432 + [Frozen] ep 100: acc=0.4463 +FINAL frozen: 0.4463 + +============================================================ +Seed 123 +============================================================ + +--- BP --- + [BP] ep 10: acc=0.7239 + [BP] ep 20: acc=0.7878 + [BP] ep 30: acc=0.8268 + [BP] ep 40: acc=0.8489 + [BP] ep 50: acc=0.8420 + [BP] ep 60: acc=0.8534 + [BP] ep 70: acc=0.8697 + [BP] ep 80: acc=0.8730 + [BP] ep 90: acc=0.8748 + [BP] ep 100: acc=0.8751 + +--- FA --- + [FA] ep 10: acc=0.4852 + [FA] ep 20: acc=0.3673 + [FA] ep 30: acc=0.4890 + [FA] ep 40: acc=0.4090 + [FA] ep 50: acc=0.4650 + [FA] ep 60: acc=0.4524 + [FA] ep 70: acc=0.4131 + [FA] ep 80: acc=0.4634 + [FA] ep 90: acc=0.3723 + [FA] ep 100: acc=0.4701 + +--- DFA --- + [DFA] ep 10: acc=0.4903 + [DFA] ep 20: acc=0.4012 + [DFA] ep 30: acc=0.5058 + [DFA] ep 40: acc=0.4078 + [DFA] ep 50: acc=0.5016 + [DFA] ep 60: acc=0.4995 + [DFA] ep 70: acc=0.4530 + [DFA] ep 80: acc=0.5311 + [DFA] ep 90: acc=0.4660 + [DFA] ep 100: acc=0.5480 + +--- Frozen --- + [Frozen] ep 10: acc=0.3516 + [Frozen] ep 20: acc=0.3915 + [Frozen] ep 30: acc=0.4120 + [Frozen] ep 40: acc=0.4210 + [Frozen] ep 50: acc=0.4253 + [Frozen] ep 60: acc=0.4300 + [Frozen] ep 70: acc=0.4313 + [Frozen] ep 80: acc=0.4385 + [Frozen] ep 90: acc=0.4382 + [Frozen] ep 100: acc=0.4390 +FINAL frozen: 0.4390 + +============================================================ +Seed 456 +============================================================ + +--- BP --- + [BP] ep 10: acc=0.7823 + [BP] ep 20: acc=0.8178 + [BP] ep 30: acc=0.8073 + [BP] ep 40: acc=0.8470 + [BP] ep 50: acc=0.8499 + [BP] ep 60: acc=0.8676 + [BP] ep 70: acc=0.8757 + [BP] ep 80: acc=0.8770 + [BP] ep 90: acc=0.8771 + [BP] ep 100: acc=0.8773 + +--- FA --- + [FA] ep 10: acc=0.4632 + [FA] ep 20: acc=0.3723 + [FA] ep 30: acc=0.4776 + [FA] ep 40: acc=0.4060 + [FA] ep 50: acc=0.4685 + [FA] ep 60: acc=0.4341 + [FA] ep 70: acc=0.4403 + [FA] ep 80: acc=0.4804 + [FA] ep 90: acc=0.3683 + [FA] ep 100: acc=0.4740 + +--- DFA --- + [DFA] ep 10: acc=0.4752 + [DFA] ep 20: acc=0.4196 + [DFA] ep 30: acc=0.4963 + [DFA] ep 40: acc=0.3831 + [DFA] ep 50: acc=0.5074 + [DFA] ep 60: acc=0.5056 + [DFA] ep 70: acc=0.4953 + [DFA] ep 80: acc=0.5233 + [DFA] ep 90: acc=0.4196 + [DFA] ep 100: acc=0.5315 + +--- Frozen --- + [Frozen] ep 10: acc=0.3576 + [Frozen] ep 20: acc=0.3920 + [Frozen] ep 30: acc=0.4083 + [Frozen] ep 40: acc=0.4102 + [Frozen] ep 50: acc=0.4163 + [Frozen] ep 60: acc=0.4304 + [Frozen] ep 70: acc=0.4391 + [Frozen] ep 80: acc=0.4400 + [Frozen] ep 90: acc=0.4363 + [Frozen] ep 100: acc=0.4401 +FINAL frozen: 0.4401 + +Saved: results/resnet_protocol_validation.json diff --git a/results/round38_cb_penalty_30ep_s123.log b/results/round38_cb_penalty_30ep_s123.log new file mode 100644 index 0000000..d636bf7 --- /dev/null +++ b/results/round38_cb_penalty_30ep_s123.log @@ -0,0 +1,15 @@ +Using device: cuda:0 + +============================================================ +Seed 123 +============================================================ + +--- Credit Bridge --- + [CB] Warmup phase: 6 epochs (DFA fallback + value net training) + [CB] Epoch 1 (warmup): loss=1.9904, train=0.2822, test=0.3362, vloss=0.650139 + [CB] Epoch 10 (blend=0.67): loss=1.9194, train=0.3203, test=0.3491, vloss=0.052320 + [CB] Epoch 20 (blend=1.00): loss=1.8683, train=0.3406, test=0.3615, vloss=0.024901 + [CB] Epoch 30 (blend=1.00): loss=1.8727, train=0.3440, test=0.3642, vloss=0.011062 + Final test acc: 0.3642 + +All results saved to results/round38_cb_penalty_30ep_s123/results_cifar10.json diff --git a/results/round38_cb_penalty_30ep_s123/results_cifar10.json b/results/round38_cb_penalty_30ep_s123/results_cifar10.json new file mode 100644 index 0000000..ae68c96 --- /dev/null +++ b/results/round38_cb_penalty_30ep_s123/results_cifar10.json @@ -0,0 +1,233 @@ +{ + "123": { + "credit_bridge": { + "log": { + "train_loss": [ + 1.9903950632476806, + 1.9436892071533203, + 1.9378673068237304, + 1.9346954096221924, + 1.9363043911361695, + 1.9327283626937866, + 1.9476709210586547, + 1.9389762512588502, + 1.9266566958236695, + 1.919404111404419, + 1.9120563073730468, + 1.9111018649291993, + 1.9005808422088624, + 1.8967266842269896, + 1.8907416219329833, + 1.882234052658081, + 1.8722203524017333, + 1.8694015215301514, + 1.8656991873168944, + 1.8682857693862915, + 1.8697387396621703, + 1.8678798027801513, + 1.8690597088241576, + 1.8677466773223876, + 1.871109571685791, + 1.8732738525009156, + 1.8745700274658204, + 1.8710524578094483, + 1.8755342425155639, + 1.8727011511993408 + ], + "train_acc": [ + 0.28218, + 0.30712, + 0.31004, + 0.3135, + 0.31522, + 0.31594, + 0.31198, + 0.31488, + 0.31484, + 0.32026, + 0.32228, + 0.32102, + 0.32762, + 0.32718, + 0.33116, + 0.33436, + 0.33864, + 0.33738, + 0.34008, + 0.34056, + 0.34068, + 0.34044, + 0.34202, + 0.34188, + 0.34192, + 0.34224, + 0.3414, + 0.343, + 0.34144, + 0.34402 + ], + "test_acc": [ + 0.3362, + 0.3403, + 0.3354, + 0.3262, + 0.3373, + 0.3421, + 0.3428, + 0.349, + 0.3517, + 0.3491, + 0.353, + 0.347, + 0.3444, + 0.3545, + 0.3505, + 0.3617, + 0.3671, + 0.363, + 0.3697, + 0.3615, + 0.3623, + 0.3666, + 0.3608, + 0.3692, + 0.3652, + 0.3677, + 0.3652, + 0.3645, + 0.364, + 0.3642 + ], + "value_loss": [ + 0.6501392752981185, + 0.19012001507282258, + 0.1075794908285141, + 0.07698172752141952, + 0.06917850073337554, + 0.05796519654870033, + 0.10017188906908035, + 0.06868275530338287, + 0.06073615624547005, + 0.05232048670530319, + 0.045059604372978214, + 0.04662440485239029, + 0.04121920494437218, + 0.044443060465455056, + 0.04122906471073628, + 0.03664021657347679, + 0.03124810820043087, + 0.0269432488912344, + 0.02596988540112972, + 0.024900869569778442, + 0.02048479182034731, + 0.018211499471366407, + 0.0170548377931118, + 0.01694579794406891, + 0.01826157638669014, + 0.014401317476630211, + 0.014872411508262157, + 0.010797930763959884, + 0.01634573257163167, + 0.01106238992586732 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6450029015541077, + 0.6589623689651489, + 0.6671799421310425, + 0.6754908561706543 + ], + "perturbation_rho": [ + 0.3963339030742645, + 0.4112011194229126, + 0.4508204460144043, + 0.49511781334877014 + ], + "nudging": { + "0.001": [ + -4.538437133305706e-05, + -4.164675556239672e-05, + -3.897584610967897e-05, + -3.720284075825475e-05 + ], + "0.003": [ + -0.00013614483759738505, + -0.00012491861707530916, + -0.00011692544649122283, + -0.00011161504517076537 + ], + "0.01": [ + -0.00045391899766400456, + -0.00041642854921519756, + -0.00038977732765488327, + -0.00037192515446804464 + ] + }, + "hidden_norms_per_layer": [ + 5795.3388671875, + 5812.16650390625, + 5825.60498046875, + 5806.94384765625, + 5834.41455078125 + ], + "bp_grad_norms_per_layer": [ + 2.1459092749864794e-05, + 2.0404753740876913e-05, + 1.9721255739568733e-05, + 1.843643985921517e-05, + 1.812805021472741e-05 + ] + }, + "drift": { + "embed.weight": 47.265920858379104, + "embed.bias": 64.03327510119414, + "blocks.0.ln.weight": 0.31550925970077515, + "blocks.0.w1.weight": 3.9393207442198896, + "blocks.0.w1.bias": 7.116536540852231, + "blocks.0.w2.weight": 18.565318744639406, + "blocks.1.ln.weight": 0.3102896213531494, + "blocks.1.w1.weight": 3.814831040782521, + "blocks.1.w1.bias": 7.074615401132259, + "blocks.1.w2.weight": 18.672674667307152, + "blocks.2.ln.weight": 0.32316333055496216, + "blocks.2.w1.weight": 3.901017267398649, + "blocks.2.w1.bias": 6.366350200102534, + "blocks.2.w2.weight": 19.721825160296877, + "blocks.3.ln.weight": 0.2990249991416931, + "blocks.3.w1.weight": 4.002164431729751, + "blocks.3.w1.bias": 5.90919777616421, + "blocks.3.w2.weight": 21.568416770540885, + "out_ln.weight": 0.09184015542268753, + "out_head.weight": 2.070435355745074, + "out_head.bias": 1.855754764316957 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 123 + ], + "gpu": 0, + "output_dir": "results/round38_cb_penalty_30ep_s123", + "methods": [ + "credit_bridge" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round38_cb_penalty_30ep_s456.log b/results/round38_cb_penalty_30ep_s456.log new file mode 100644 index 0000000..75ef274 --- /dev/null +++ b/results/round38_cb_penalty_30ep_s456.log @@ -0,0 +1,15 @@ +Using device: cuda:0 + +============================================================ +Seed 456 +============================================================ + +--- Credit Bridge --- + [CB] Warmup phase: 6 epochs (DFA fallback + value net training) + [CB] Epoch 1 (warmup): loss=1.9934, train=0.2765, test=0.3431, vloss=0.635836 + [CB] Epoch 10 (blend=0.67): loss=1.9165, train=0.3182, test=0.3451, vloss=0.059035 + [CB] Epoch 20 (blend=1.00): loss=1.8877, train=0.3323, test=0.3456, vloss=0.025170 + [CB] Epoch 30 (blend=1.00): loss=1.8695, train=0.3410, test=0.3562, vloss=0.015811 + Final test acc: 0.3562 + +All results saved to results/round38_cb_penalty_30ep_s456/results_cifar10.json diff --git a/results/round38_cb_penalty_30ep_s456/results_cifar10.json b/results/round38_cb_penalty_30ep_s456/results_cifar10.json new file mode 100644 index 0000000..50e9f4b --- /dev/null +++ b/results/round38_cb_penalty_30ep_s456/results_cifar10.json @@ -0,0 +1,233 @@ +{ + "456": { + "credit_bridge": { + "log": { + "train_loss": [ + 1.9934451489257812, + 1.9314295723724366, + 1.9235225268173217, + 1.9217069106292726, + 1.9212194289398192, + 1.916630177383423, + 1.9345502002716064, + 1.9283877908325195, + 1.9177326504898071, + 1.9165373708343505, + 1.9105737041854858, + 1.8997189542388917, + 1.891296152076721, + 1.8811385650253296, + 1.8842703173446655, + 1.8762526668930053, + 1.8802709610366821, + 1.8837381246566773, + 1.8947839934921265, + 1.8876838129425049, + 1.878063057937622, + 1.8691059185791015, + 1.8723352920913696, + 1.8673814739990235, + 1.86444116481781, + 1.8651199575424193, + 1.8679865084838867, + 1.8683458470916747, + 1.8682409041595458, + 1.8695441330337523 + ], + "train_acc": [ + 0.27654, + 0.30874, + 0.31612, + 0.3179, + 0.31686, + 0.31922, + 0.314, + 0.31612, + 0.31764, + 0.3182, + 0.31802, + 0.3238, + 0.33024, + 0.33216, + 0.33292, + 0.33354, + 0.33402, + 0.33356, + 0.33096, + 0.33232, + 0.33684, + 0.33706, + 0.33616, + 0.34138, + 0.3399, + 0.34038, + 0.34008, + 0.34048, + 0.33706, + 0.341 + ], + "test_acc": [ + 0.3431, + 0.3495, + 0.3477, + 0.356, + 0.3511, + 0.3474, + 0.3323, + 0.3466, + 0.3508, + 0.3451, + 0.341, + 0.3566, + 0.3514, + 0.3453, + 0.3491, + 0.3525, + 0.3464, + 0.3496, + 0.3429, + 0.3456, + 0.343, + 0.3448, + 0.3481, + 0.3549, + 0.3545, + 0.354, + 0.3557, + 0.355, + 0.3562, + 0.3562 + ], + "value_loss": [ + 0.6358358229446411, + 0.20003649864196776, + 0.1189081085062027, + 0.0873355598807335, + 0.07387620919823647, + 0.06212632877349854, + 0.09646473777532577, + 0.08277876357793808, + 0.06577274338841438, + 0.05903506823539734, + 0.060327464895248414, + 0.0471712444293499, + 0.05392980309844017, + 0.04334379373788834, + 0.04389793854594231, + 0.04077757358431816, + 0.03543120482087135, + 0.03244814622402191, + 0.03196794641435146, + 0.02516974647641182, + 0.018719528279304506, + 0.019053550893962382, + 0.019475930092334746, + 0.01711861621081829, + 0.015539742150306702, + 0.018024257761240007, + 0.01626725864171982, + 0.016166514835059643, + 0.015814910601973535, + 0.015810824376344682 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6528493165969849, + 0.6737558841705322, + 0.6874117851257324, + 0.6945056915283203 + ], + "perturbation_rho": [ + 0.45550960302352905, + 0.4658626317977905, + 0.4093303084373474, + 0.44921162724494934 + ], + "nudging": { + "0.001": [ + -4.855693259742111e-05, + -4.6262473915703595e-05, + -4.405167419463396e-05, + -4.2281331843696535e-05 + ], + "0.003": [ + -0.00014562674914486706, + -0.0001387652737321332, + -0.00013202497211750597, + -0.00012669814168475568 + ], + "0.01": [ + -0.00048537791008129716, + -0.00046242878306657076, + -0.00043993344297632575, + -0.00042223266791552305 + ] + }, + "hidden_norms_per_layer": [ + 5652.72998046875, + 5664.4931640625, + 5686.38916015625, + 5758.30419921875, + 5775.17431640625 + ], + "bp_grad_norms_per_layer": [ + 2.290221891598776e-05, + 2.191648854932282e-05, + 2.0994630176573992e-05, + 2.07327520911349e-05, + 2.0050258171977475e-05 + ] + }, + "drift": { + "embed.weight": 47.17655243675414, + "embed.bias": 69.22157757464541, + "blocks.0.ln.weight": 0.30546510219573975, + "blocks.0.w1.weight": 3.9210619545041143, + "blocks.0.w1.bias": 5.970693807323712, + "blocks.0.w2.weight": 18.22592321226308, + "blocks.1.ln.weight": 0.29675590991973877, + "blocks.1.w1.weight": 3.7748035547298446, + "blocks.1.w1.bias": 5.95370365502356, + "blocks.1.w2.weight": 18.273244666485375, + "blocks.2.ln.weight": 0.29545143246650696, + "blocks.2.w1.weight": 3.797978708503024, + "blocks.2.w1.bias": 6.318915016989016, + "blocks.2.w2.weight": 18.715277379402863, + "blocks.3.ln.weight": 0.29928261041641235, + "blocks.3.w1.weight": 3.9126807823570937, + "blocks.3.w1.bias": 6.287240256219296, + "blocks.3.w2.weight": 18.91014036108483, + "out_ln.weight": 0.10117902606725693, + "out_head.weight": 2.2020174609192082, + "out_head.bias": 2.0786513163395623 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 456 + ], + "gpu": 0, + "output_dir": "results/round38_cb_penalty_30ep_s456", + "methods": [ + "credit_bridge" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round38_sb_penalty_30ep_s123.log b/results/round38_sb_penalty_30ep_s123.log new file mode 100644 index 0000000..69ed527 --- /dev/null +++ b/results/round38_sb_penalty_30ep_s123.log @@ -0,0 +1,14 @@ +Using device: cuda:0 + +============================================================ +Seed 123 +============================================================ + +--- State Bridge --- + [SB] Epoch 1: loss=2.0395, train=0.2546, test=0.3128, state_err=0.2665 + [SB] Epoch 10: loss=1.7017, train=0.4005, test=0.4254, state_err=0.0904 + [SB] Epoch 20: loss=1.6233, train=0.4291, test=0.4439, state_err=0.0677 + [SB] Epoch 30: loss=1.5955, train=0.4431, test=0.4514, state_err=0.0437 + Final test acc: 0.4514 + +All results saved to results/round38_sb_penalty_30ep_s123/results_cifar10.json diff --git a/results/round38_sb_penalty_30ep_s123/results_cifar10.json b/results/round38_sb_penalty_30ep_s123/results_cifar10.json new file mode 100644 index 0000000..09d7c81 --- /dev/null +++ b/results/round38_sb_penalty_30ep_s123/results_cifar10.json @@ -0,0 +1,233 @@ +{ + "123": { + "state_bridge": { + "log": { + "train_loss": [ + 2.0394552979278564, + 1.907211668624878, + 1.8378597689056397, + 1.8050992700958253, + 1.782720252342224, + 1.7607325444793702, + 1.7526287609481812, + 1.7301886476898194, + 1.7114346005249024, + 1.7017147624969482, + 1.6891529846572877, + 1.6735555848693848, + 1.6678473961639404, + 1.6606992713165283, + 1.6562059018707276, + 1.6442966329956055, + 1.6339350330352784, + 1.637065968284607, + 1.6251955394744872, + 1.6232860974502563, + 1.62067741481781, + 1.6153102271270752, + 1.6100856274032593, + 1.6128213213348388, + 1.6058022644805907, + 1.6015477989959717, + 1.6040523609161377, + 1.6024808090591431, + 1.5986408697128296, + 1.5955050112533569 + ], + "train_acc": [ + 0.2546, + 0.31232, + 0.3415, + 0.35616, + 0.36698, + 0.37548, + 0.3775, + 0.38916, + 0.39518, + 0.40052, + 0.40288, + 0.40992, + 0.4117, + 0.4142, + 0.41554, + 0.42002, + 0.42486, + 0.42292, + 0.42918, + 0.4291, + 0.4284, + 0.4346, + 0.4362, + 0.43588, + 0.44048, + 0.44034, + 0.43952, + 0.43918, + 0.44066, + 0.4431 + ], + "test_acc": [ + 0.3128, + 0.3548, + 0.3591, + 0.378, + 0.3826, + 0.3814, + 0.4011, + 0.4028, + 0.404, + 0.4254, + 0.4276, + 0.4332, + 0.4345, + 0.4356, + 0.4316, + 0.4384, + 0.4423, + 0.4425, + 0.4369, + 0.4439, + 0.4447, + 0.4442, + 0.4483, + 0.452, + 0.453, + 0.453, + 0.4498, + 0.4524, + 0.4513, + 0.4514 + ], + "state_pred_error": [ + 0.2664960029602051, + 0.17006848256111146, + 0.1373988006401062, + 0.13497620005130767, + 0.1264824439716339, + 0.11186170087099076, + 0.10831025877714157, + 0.10117165217876434, + 0.0942336485338211, + 0.09043296098470688, + 0.08660082973480225, + 0.08747579972743988, + 0.07973947757720948, + 0.07509488174915313, + 0.07382626082420349, + 0.07346862325191497, + 0.07132561764001846, + 0.07077178321242332, + 0.06908800168275833, + 0.06767414944648743, + 0.06569002504706382, + 0.062389732856750486, + 0.05864977328658104, + 0.05680723578810692, + 0.053985064004659654, + 0.05206361443519592, + 0.0498943436563015, + 0.047763368364572525, + 0.04550520754933357, + 0.043678019300699235 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.42979174852371216, + 0.37390586733818054, + 0.32618582248687744, + 0.28139200806617737 + ], + "perturbation_rho": [ + 0.5135085582733154, + 0.5129182934761047, + 0.38893166184425354, + 0.37062373757362366 + ], + "nudging": { + "0.001": [ + -0.0003920057788491249, + -0.00025207665748894215, + -0.00018884101882576942, + -0.00014588376507163048 + ], + "0.003": [ + -0.001175526063889265, + -0.0007562476675957441, + -0.000566466711461544, + -0.00043755793012678623 + ], + "0.01": [ + -0.003914414905011654, + -0.002520129084587097, + -0.0018878313712775707, + -0.0014582867734134197 + ] + }, + "hidden_norms_per_layer": [ + 231.49375915527344, + 238.22596740722656, + 252.5166473388672, + 278.00189208984375, + 310.919189453125 + ], + "bp_grad_norms_per_layer": [ + 0.000271676923148334, + 0.00023371262068394572, + 0.00020241527818143368, + 0.000180525952600874, + 0.00017415167530998588 + ] + }, + "drift": { + "embed.weight": 6.87082720778762, + "embed.bias": 27.93003811703859, + "blocks.0.ln.weight": 0.1618085354566574, + "blocks.0.w1.weight": 3.191546927288011, + "blocks.0.w1.bias": 6.668010298438182, + "blocks.0.w2.weight": 15.615942220294206, + "blocks.1.ln.weight": 0.12653203308582306, + "blocks.1.w1.weight": 3.159400666127824, + "blocks.1.w1.bias": 7.198150324919049, + "blocks.1.w2.weight": 14.61006448474005, + "blocks.2.ln.weight": 0.1170191541314125, + "blocks.2.w1.weight": 3.2969716684544164, + "blocks.2.w1.bias": 7.019388383996979, + "blocks.2.w2.weight": 15.258183997524307, + "blocks.3.ln.weight": 0.11643991619348526, + "blocks.3.w1.weight": 3.5673772866278055, + "blocks.3.w1.bias": 6.951775133615225, + "blocks.3.w2.weight": 15.726364417935486, + "out_ln.weight": 0.21612103283405304, + "out_head.weight": 1.2186449227295404, + "out_head.bias": 1.8007506807173053 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 123 + ], + "gpu": 0, + "output_dir": "results/round38_sb_penalty_30ep_s123", + "methods": [ + "state_bridge" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round38_sb_penalty_30ep_s456.log b/results/round38_sb_penalty_30ep_s456.log new file mode 100644 index 0000000..c49aa33 --- /dev/null +++ b/results/round38_sb_penalty_30ep_s456.log @@ -0,0 +1,14 @@ +Using device: cuda:0 + +============================================================ +Seed 456 +============================================================ + +--- State Bridge --- + [SB] Epoch 1: loss=2.0369, train=0.2541, test=0.3104, state_err=0.2756 + [SB] Epoch 10: loss=1.7086, train=0.3943, test=0.4104, state_err=0.0876 + [SB] Epoch 20: loss=1.6260, train=0.4284, test=0.4459, state_err=0.0630 + [SB] Epoch 30: loss=1.5980, train=0.4412, test=0.4509, state_err=0.0424 + Final test acc: 0.4509 + +All results saved to results/round38_sb_penalty_30ep_s456/results_cifar10.json diff --git a/results/round38_sb_penalty_30ep_s456/results_cifar10.json b/results/round38_sb_penalty_30ep_s456/results_cifar10.json new file mode 100644 index 0000000..7c3b35c --- /dev/null +++ b/results/round38_sb_penalty_30ep_s456/results_cifar10.json @@ -0,0 +1,233 @@ +{ + "456": { + "state_bridge": { + "log": { + "train_loss": [ + 2.0369125997924806, + 1.9002794314575195, + 1.839365246887207, + 1.8127399161148072, + 1.7898970299911499, + 1.7758199447631835, + 1.7543362093353272, + 1.7370687340545654, + 1.7275934963989257, + 1.7085617017364503, + 1.6948483248138428, + 1.6850648455429078, + 1.6752807913208008, + 1.6712003810882567, + 1.6620737231063842, + 1.6546397353744506, + 1.6401427822113037, + 1.6391044388580323, + 1.630859147644043, + 1.6259963637542725, + 1.6214555887603759, + 1.6194580511856078, + 1.613519859046936, + 1.6123445831680299, + 1.6089352087783813, + 1.6038804431915283, + 1.6018304259872436, + 1.6036242258453368, + 1.6006233197784423, + 1.5980215132904052 + ], + "train_acc": [ + 0.25408, + 0.31238, + 0.3414, + 0.35388, + 0.36162, + 0.368, + 0.37992, + 0.38372, + 0.38852, + 0.39432, + 0.40126, + 0.40466, + 0.40538, + 0.40918, + 0.4099, + 0.41604, + 0.4201, + 0.42306, + 0.42332, + 0.42836, + 0.4309, + 0.4304, + 0.43168, + 0.43282, + 0.43744, + 0.43726, + 0.4399, + 0.43702, + 0.43884, + 0.44118 + ], + "test_acc": [ + 0.3104, + 0.3506, + 0.3735, + 0.3792, + 0.3887, + 0.3929, + 0.3976, + 0.3987, + 0.3979, + 0.4104, + 0.4137, + 0.4198, + 0.4346, + 0.4251, + 0.419, + 0.4391, + 0.4347, + 0.4468, + 0.4455, + 0.4459, + 0.4411, + 0.447, + 0.4562, + 0.455, + 0.4521, + 0.4514, + 0.4522, + 0.4531, + 0.4519, + 0.4509 + ], + "state_pred_error": [ + 0.27555840564250944, + 0.16246181419372557, + 0.14625693091392516, + 0.13436604994773865, + 0.12426637276172638, + 0.11355017890930176, + 0.10647282010555267, + 0.10073854411125183, + 0.09217885914564132, + 0.08755232047796249, + 0.08124397647857666, + 0.08034932177066803, + 0.07723198721170425, + 0.07435347493171691, + 0.07414377628564835, + 0.07049065297842026, + 0.0675844569182396, + 0.06546888866901397, + 0.06477154892683029, + 0.06301552970647811, + 0.059929636999368666, + 0.05725809707641601, + 0.05675601554989815, + 0.056774080897569655, + 0.05566476465702057, + 0.05161277118682861, + 0.0487107616519928, + 0.04572098425865173, + 0.04381731255412102, + 0.04239982622146606 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.42256492376327515, + 0.38477009534835815, + 0.31862324476242065, + 0.27332931756973267 + ], + "perturbation_rho": [ + 0.5183612704277039, + 0.45182135701179504, + 0.3981747329235077, + 0.32433199882507324 + ], + "nudging": { + "0.001": [ + -0.00040302483830600977, + -0.0002813579048961401, + -0.00019051437266170979, + -0.00014453462790697813 + ], + "0.003": [ + -0.001208781497552991, + -0.0008438715012744069, + -0.000571400043554604, + -0.000433529494330287 + ], + "0.01": [ + -0.004026009701192379, + -0.0028109778650105, + -0.001904117758385837, + -0.0014447440626099706 + ] + }, + "hidden_norms_per_layer": [ + 234.2797088623047, + 243.28529357910156, + 250.8776092529297, + 268.8158264160156, + 291.8413391113281 + ], + "bp_grad_norms_per_layer": [ + 0.0002783545642159879, + 0.0002534560626372695, + 0.0002214369596913457, + 0.00020169034542050213, + 0.00019217752560507506 + ] + }, + "drift": { + "embed.weight": 6.880160568400241, + "embed.bias": 30.878601323854713, + "blocks.0.ln.weight": 0.14636263251304626, + "blocks.0.w1.weight": 3.0733067420757636, + "blocks.0.w1.bias": 6.555792191121209, + "blocks.0.w2.weight": 14.035427054326416, + "blocks.1.ln.weight": 0.13672301173210144, + "blocks.1.w1.weight": 3.124442427959728, + "blocks.1.w1.bias": 7.090988357162414, + "blocks.1.w2.weight": 14.513611759686587, + "blocks.2.ln.weight": 0.13195334374904633, + "blocks.2.w1.weight": 3.298519491819089, + "blocks.2.w1.bias": 7.524602101872219, + "blocks.2.w2.weight": 15.233467131609643, + "blocks.3.ln.weight": 0.13041938841342926, + "blocks.3.w1.weight": 3.472952946259165, + "blocks.3.w1.bias": 7.358409158987916, + "blocks.3.w2.weight": 14.931264123351346, + "out_ln.weight": 0.2145024985074997, + "out_head.weight": 1.1640670176605314, + "out_head.bias": 1.760523224597371 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 456 + ], + "gpu": 0, + "output_dir": "results/round38_sb_penalty_30ep_s456", + "methods": [ + "state_bridge" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round38_sbcb_baseline_30ep.log b/results/round38_sbcb_baseline_30ep.log new file mode 100644 index 0000000..a9c469b --- /dev/null +++ b/results/round38_sbcb_baseline_30ep.log @@ -0,0 +1,22 @@ +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- State Bridge --- + [SB] Epoch 1: loss=2.1616, train=0.1953, test=0.2011, state_err=0.3882 + [SB] Epoch 10: loss=2.0830, train=0.1993, test=0.1873, state_err=0.0756 + [SB] Epoch 20: loss=2.0933, train=0.1943, test=0.1734, state_err=0.0021 + [SB] Epoch 30: loss=2.0812, train=0.2086, test=0.2126, state_err=0.0005 + Final test acc: 0.2126 + +--- Credit Bridge --- + [CB] Warmup phase: 6 epochs (DFA fallback + value net training) + [CB] Epoch 1 (warmup): loss=2.0397, train=0.2522, test=0.2777, vloss=0.498809 + [CB] Epoch 10 (blend=0.67): loss=2.0855, train=0.2324, test=0.2308, vloss=0.039947 + [CB] Epoch 20 (blend=1.00): loss=2.1414, train=0.1883, test=0.1824, vloss=0.012027 + [CB] Epoch 30 (blend=1.00): loss=2.1347, train=0.1973, test=0.2105, vloss=0.000746 + Final test acc: 0.2105 + +All results saved to results/round38_sbcb_baseline_30ep/results_cifar10.json diff --git a/results/round38_sbcb_baseline_30ep/results_cifar10.json b/results/round38_sbcb_baseline_30ep/results_cifar10.json new file mode 100644 index 0000000..4375072 --- /dev/null +++ b/results/round38_sbcb_baseline_30ep/results_cifar10.json @@ -0,0 +1,437 @@ +{ + "42": { + "state_bridge": { + "log": { + "train_loss": [ + 2.1615624513244627, + 2.201089162750244, + 2.182833108444214, + 2.1709032915496826, + 2.1161820389556887, + 2.2302013398742675, + 2.1329537266540526, + 2.10827269241333, + 2.0998276640319826, + 2.083012378692627, + 2.102786566772461, + 2.106615118637085, + 2.0964282553863525, + 2.0857217935943604, + 2.0992775797271728, + 2.0625892084503175, + 2.0862051232147216, + 2.1001052409362795, + 2.094951697998047, + 2.0933474546813966, + 2.0933452713775633, + 2.08693749671936, + 2.0883480770874026, + 2.086935211029053, + 2.0861202153015137, + 2.0841029391479493, + 2.082290132446289, + 2.0792110958099363, + 2.0804510121154784, + 2.081232653427124 + ], + "train_acc": [ + 0.19528, + 0.1606, + 0.17582, + 0.16834, + 0.18852, + 0.1556, + 0.17988, + 0.18368, + 0.19014, + 0.19926, + 0.19686, + 0.1923, + 0.1981, + 0.20012, + 0.19082, + 0.2146, + 0.20116, + 0.18934, + 0.19132, + 0.19428, + 0.18736, + 0.1931, + 0.19568, + 0.19958, + 0.20248, + 0.20444, + 0.2046, + 0.2062, + 0.20122, + 0.20856 + ], + "test_acc": [ + 0.2011, + 0.1577, + 0.176, + 0.1994, + 0.1896, + 0.1661, + 0.1688, + 0.181, + 0.1939, + 0.1873, + 0.1878, + 0.2058, + 0.2082, + 0.1967, + 0.2019, + 0.2005, + 0.1949, + 0.1854, + 0.1759, + 0.1734, + 0.1868, + 0.1995, + 0.1949, + 0.2007, + 0.2077, + 0.2085, + 0.2109, + 0.2079, + 0.2132, + 0.2126 + ], + "state_pred_error": [ + 0.3881664722061157, + 0.5467375702285766, + 0.4459853865337372, + 0.21270744318962098, + 0.2084006814146042, + 0.1407120229911804, + 0.19075847319602968, + 0.1764928385257721, + 0.10211428045988083, + 0.07563618842363358, + 0.05846105343937874, + 0.03846761897563934, + 0.03369148607134819, + 0.022906817595362665, + 0.015594833841919899, + 0.007780850533694029, + 0.005383170440495014, + 0.00387467138633132, + 0.0025940868555754423, + 0.0021150133569538595, + 0.001786851437687874, + 0.0014581093015894294, + 0.0012195721989311278, + 0.001029884922001511, + 0.0009008185034245252, + 0.0008114725712127983, + 0.0007245114441029728, + 0.0006559462931565941, + 0.0006020296776108444, + 0.0005471098060533404 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.2372891902923584, + 0.12591305375099182, + 0.1843540072441101, + 0.28460749983787537 + ], + "perturbation_rho": [ + 0.5516304969787598, + 0.003948327153921127, + -0.007016957737505436, + 0.0 + ], + "nudging": { + "0.001": [ + -1.981109380722046e-05, + -8.381903171539307e-09, + 0.0, + 0.0 + ], + "0.003": [ + -5.944725126028061e-05, + -1.862645149230957e-09, + 0.0, + 0.0 + ], + "0.01": [ + -0.00019809138029813766, + -1.862645149230957e-08, + 3.725290298461914e-09, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 695.4109497070312, + 561166.6875, + 5258578.5, + 12430880.0, + 9851606.0 + ], + "bp_grad_norms_per_layer": [ + 1.0803730219777208e-05, + 1.284981632210247e-08, + 9.346035056978508e-09, + 9.320208604890468e-09, + 9.30139343324754e-09 + ] + }, + "drift": { + "embed.weight": 10.683279498765518, + "embed.bias": 16.186979717078597, + "blocks.0.ln.weight": 1.8698891401290894, + "blocks.0.w1.weight": 34.012515230994815, + "blocks.0.w1.bias": 46.85058602976643, + "blocks.0.w2.weight": 124.44356621058887, + "blocks.1.ln.weight": 1.7833274602890015, + "blocks.1.w1.weight": 48.03603598766101, + "blocks.1.w1.bias": 58.602063412195584, + "blocks.1.w2.weight": 123.88140584500592, + "blocks.2.ln.weight": 2.2544941902160645, + "blocks.2.w1.weight": 66.40401175683013, + "blocks.2.w1.bias": 63.25326651988191, + "blocks.2.w2.weight": 127.01673478324264, + "blocks.3.ln.weight": 1.7423062324523926, + "blocks.3.w1.weight": 37.248001175030076, + "blocks.3.w1.bias": 38.949358252268084, + "blocks.3.w2.weight": 101.10015971156598, + "out_ln.weight": 0.1668696403503418, + "out_head.weight": 1.4905390969722283, + "out_head.bias": 1.6423172242266484 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.039658761978149, + 2.0134409933471678, + 2.00583283241272, + 2.009486458129883, + 2.008044157333374, + 2.0073662790679934, + 2.0122061133575437, + 2.040649677429199, + 2.0651579305267336, + 2.0854766065979002, + 2.099567792701721, + 2.1041016172790528, + 2.111146937561035, + 2.0936275885772706, + 2.100649955825806, + 2.1145339432525634, + 2.1261457512664794, + 2.134411395187378, + 2.138650359802246, + 2.1414046758270264, + 2.1410846240997317, + 2.140825333404541, + 2.1406545039367675, + 2.1377127909851072, + 2.138584699020386, + 2.1371214043426514, + 2.137926218109131, + 2.134101504898071, + 2.1338819580078123, + 2.134741836090088 + ], + "train_acc": [ + 0.25218, + 0.26698, + 0.27004, + 0.26836, + 0.26838, + 0.26756, + 0.26486, + 0.2526, + 0.24742, + 0.23242, + 0.22372, + 0.2182, + 0.2176, + 0.21986, + 0.21266, + 0.2051, + 0.19802, + 0.1941, + 0.1906, + 0.18834, + 0.19216, + 0.19062, + 0.1907, + 0.19222, + 0.19358, + 0.19584, + 0.1945, + 0.19384, + 0.19432, + 0.19732 + ], + "test_acc": [ + 0.2777, + 0.2762, + 0.2822, + 0.3004, + 0.3017, + 0.2837, + 0.2964, + 0.2601, + 0.2555, + 0.2308, + 0.2401, + 0.2235, + 0.1973, + 0.2062, + 0.1917, + 0.232, + 0.2137, + 0.19, + 0.182, + 0.1824, + 0.1929, + 0.191, + 0.1938, + 0.2015, + 0.2114, + 0.2172, + 0.2056, + 0.2037, + 0.2205, + 0.2105 + ], + "value_loss": [ + 0.4988088236522675, + 0.10717420438051224, + 0.08406411410808563, + 0.06901271151542664, + 0.05796313747167587, + 0.04655733848810196, + 0.043197430835962294, + 0.04390601473927498, + 0.036221856105923655, + 0.03994749122738838, + 0.038669472066164015, + 0.03699167508423328, + 0.0456404883146286, + 0.026927970384061337, + 0.02069880782365799, + 0.01933776231765747, + 0.02080854148507118, + 0.016443329193592073, + 0.013170968658924103, + 0.012027110563218594, + 0.00889115786999464, + 0.0077953302666544915, + 0.005822759210169315, + 0.004206860280707479, + 0.003205367206633091, + 0.0018577339798584581, + 0.0014363039807975292, + 0.001063295077085495, + 0.0008753935668803751, + 0.000745832763761282 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.17070117592811584, + 0.12735798954963684, + 0.21822263300418854, + 0.2762623727321625 + ], + "perturbation_rho": [ + 0.021132776513695717, + -0.006791723892092705, + 0.0, + 0.023015428334474564 + ], + "nudging": { + "0.001": [ + -7.441267371177673e-07, + -1.5925616025924683e-07, + 0.0, + 0.0 + ], + "0.003": [ + -2.280808985233307e-06, + -5.373731255531311e-07, + 0.0, + 0.0 + ], + "0.01": [ + -7.669441401958466e-06, + -1.7955899238586426e-06, + 0.0, + 1.862645149230957e-09 + ] + }, + "hidden_norms_per_layer": [ + 7008.69921875, + 7480314.5, + 66006552.0, + 65819076.0, + 67016280.0 + ], + "bp_grad_norms_per_layer": [ + 9.282441055802337e-07, + 5.1517807797551995e-09, + 4.764760141995339e-09, + 4.764532768319896e-09, + 4.767270578298621e-09 + ] + }, + "drift": { + "embed.weight": 55.317448573929425, + "embed.bias": 47.56034585553186, + "blocks.0.ln.weight": 4.106407642364502, + "blocks.0.w1.weight": 67.89937919497739, + "blocks.0.w1.bias": 55.34124320193868, + "blocks.0.w2.weight": 132.61316975770185, + "blocks.1.ln.weight": 3.4333691596984863, + "blocks.1.w1.weight": 109.26717483313107, + "blocks.1.w1.bias": 120.3421088832556, + "blocks.1.w2.weight": 196.69358325668478, + "blocks.2.ln.weight": 2.4557623863220215, + "blocks.2.w1.weight": 55.033274573984386, + "blocks.2.w1.bias": 54.84317146947108, + "blocks.2.w2.weight": 98.576185000917, + "blocks.3.ln.weight": 2.2460579872131348, + "blocks.3.w1.weight": 51.81531440048247, + "blocks.3.w1.bias": 53.49338639187709, + "blocks.3.w2.weight": 92.14827023111492, + "out_ln.weight": 0.22502917051315308, + "out_head.weight": 2.8997412886471703, + "out_head.bias": 0.4396077262245561 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/round38_sbcb_baseline_30ep", + "methods": [ + "state_bridge", + "credit_bridge" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round38_sbcb_penalty_30ep.log b/results/round38_sbcb_penalty_30ep.log new file mode 100644 index 0000000..b4a53ad --- /dev/null +++ b/results/round38_sbcb_penalty_30ep.log @@ -0,0 +1,22 @@ +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- State Bridge --- + [SB] Epoch 1: loss=2.0475, train=0.2466, test=0.2730, state_err=0.2454 + [SB] Epoch 10: loss=1.7100, train=0.3957, test=0.4162, state_err=0.0916 + [SB] Epoch 20: loss=1.6214, train=0.4307, test=0.4463, state_err=0.0700 + [SB] Epoch 30: loss=1.5901, train=0.4447, test=0.4564, state_err=0.0439 + Final test acc: 0.4564 + +--- Credit Bridge --- + [CB] Warmup phase: 6 epochs (DFA fallback + value net training) + [CB] Epoch 1 (warmup): loss=1.9964, train=0.2772, test=0.3299, vloss=0.666879 + [CB] Epoch 10 (blend=0.67): loss=1.9112, train=0.3191, test=0.3456, vloss=0.055581 + [CB] Epoch 20 (blend=1.00): loss=1.8719, train=0.3363, test=0.3546, vloss=0.020539 + [CB] Epoch 30 (blend=1.00): loss=1.8736, train=0.3438, test=0.3596, vloss=0.014528 + Final test acc: 0.3596 + +All results saved to results/round38_sbcb_penalty_30ep/results_cifar10.json diff --git a/results/round38_sbcb_penalty_30ep/results_cifar10.json b/results/round38_sbcb_penalty_30ep/results_cifar10.json new file mode 100644 index 0000000..cb030f1 --- /dev/null +++ b/results/round38_sbcb_penalty_30ep/results_cifar10.json @@ -0,0 +1,437 @@ +{ + "42": { + "state_bridge": { + "log": { + "train_loss": [ + 2.0474753201293945, + 1.916932412071228, + 1.8463650513076781, + 1.8093244620132447, + 1.7900167614746094, + 1.770258097190857, + 1.7575064269256593, + 1.745316464805603, + 1.7256561163330078, + 1.710018780593872, + 1.6960305325698852, + 1.6879396067047119, + 1.6709380169677734, + 1.6666312908172607, + 1.6575450637435913, + 1.6553003553009034, + 1.6458853662872315, + 1.6390605908966065, + 1.633693081512451, + 1.6213745572280884, + 1.6122850603866576, + 1.6089301138305665, + 1.5997764694976806, + 1.6013678260421753, + 1.6002555493545532, + 1.5937991617202758, + 1.5923587594223023, + 1.5893851773071288, + 1.5910608068466185, + 1.5901478890609742 + ], + "train_acc": [ + 0.24662, + 0.30632, + 0.34066, + 0.35354, + 0.3627, + 0.37132, + 0.37842, + 0.38224, + 0.39068, + 0.39572, + 0.39934, + 0.40442, + 0.41028, + 0.41562, + 0.4161, + 0.41766, + 0.41936, + 0.42446, + 0.42536, + 0.43068, + 0.43248, + 0.43428, + 0.43778, + 0.44052, + 0.43932, + 0.4404, + 0.44258, + 0.44194, + 0.44336, + 0.44466 + ], + "test_acc": [ + 0.273, + 0.3524, + 0.3676, + 0.3756, + 0.3906, + 0.3879, + 0.3819, + 0.3966, + 0.4068, + 0.4162, + 0.4183, + 0.4298, + 0.4321, + 0.4389, + 0.4217, + 0.4379, + 0.4363, + 0.4406, + 0.4425, + 0.4463, + 0.4538, + 0.4566, + 0.4496, + 0.4453, + 0.4486, + 0.4567, + 0.4575, + 0.4563, + 0.4565, + 0.4564 + ], + "state_pred_error": [ + 0.24535170847892762, + 0.1636493504667282, + 0.13540883115291596, + 0.12653046741724014, + 0.12561693742990493, + 0.11761465485811233, + 0.10871879986047744, + 0.10335472867965698, + 0.09837688980817795, + 0.091632712829113, + 0.0877949278664589, + 0.08455404979228974, + 0.08431078619241715, + 0.07790626471281052, + 0.0775115798163414, + 0.07608327221155167, + 0.07628034708738327, + 0.07240497077941895, + 0.07071494008302688, + 0.06996692018032075, + 0.06466230425357819, + 0.0624802718091011, + 0.058281462930440904, + 0.055862715678215026, + 0.05389112324714661, + 0.05099856609106064, + 0.04935575147509575, + 0.04708607808470726, + 0.04531161543607712, + 0.04388566305398941 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.42546752095222473, + 0.36250773072242737, + 0.31346678733825684, + 0.2606384754180908 + ], + "perturbation_rho": [ + 0.4038287401199341, + 0.44145163893699646, + 0.40815383195877075, + 0.3253956735134125 + ], + "nudging": { + "0.001": [ + -0.0003594870213419199, + -0.00023786397650837898, + -0.0001701684668660164, + -0.00012595904991030693 + ], + "0.003": [ + -0.0010785695631057024, + -0.0007136135827749968, + -0.0005104630254209042, + -0.00037785875611007214 + ], + "0.01": [ + -0.0035966814029961824, + -0.0023783869110047817, + -0.0017011994495987892, + -0.0012592736165970564 + ] + }, + "hidden_norms_per_layer": [ + 243.4176788330078, + 251.25033569335938, + 264.15234375, + 281.2754821777344, + 301.9956359863281 + ], + "bp_grad_norms_per_layer": [ + 0.00025976746110245585, + 0.00023080054961610585, + 0.0002087712928187102, + 0.0001913418382173404, + 0.00017467232828494161 + ] + }, + "drift": { + "embed.weight": 7.101831683055874, + "embed.bias": 26.55614727350677, + "blocks.0.ln.weight": 0.13280124962329865, + "blocks.0.w1.weight": 3.0818043823960677, + "blocks.0.w1.bias": 6.322237223125591, + "blocks.0.w2.weight": 14.259096230097354, + "blocks.1.ln.weight": 0.11403189599514008, + "blocks.1.w1.weight": 3.033562757580805, + "blocks.1.w1.bias": 6.850830368282527, + "blocks.1.w2.weight": 13.651065232090788, + "blocks.2.ln.weight": 0.11589953303337097, + "blocks.2.w1.weight": 3.2263993788002137, + "blocks.2.w1.bias": 6.9524991530621545, + "blocks.2.w2.weight": 14.671537599689291, + "blocks.3.ln.weight": 0.12724463641643524, + "blocks.3.w1.weight": 3.3413554165823025, + "blocks.3.w1.bias": 7.662419316475547, + "blocks.3.w2.weight": 14.679376824812177, + "out_ln.weight": 0.21895238757133484, + "out_head.weight": 1.1940135791700324, + "out_head.bias": 2.222106740649061 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 1.9963660776519776, + 1.9372394968414306, + 1.9241013562393188, + 1.9278872109222411, + 1.9258392727661133, + 1.9213631185913085, + 1.93245830078125, + 1.9319513151550294, + 1.9178282093048096, + 1.9111720166015624, + 1.9015198223876952, + 1.8905008841705322, + 1.8903594969940185, + 1.8827447821807861, + 1.8827315840911865, + 1.8831548281478883, + 1.8796609592437745, + 1.8760715311050415, + 1.874497896347046, + 1.8719314217758178, + 1.8737228869628906, + 1.8702389026260375, + 1.869253684387207, + 1.8723084658813476, + 1.8726538021087646, + 1.866847327041626, + 1.8720124649047851, + 1.8690419888305665, + 1.8700805447769164, + 1.8736286736679078 + ], + "train_acc": [ + 0.2772, + 0.30878, + 0.3143, + 0.31462, + 0.31578, + 0.31758, + 0.31572, + 0.31458, + 0.31894, + 0.31912, + 0.3223, + 0.32764, + 0.32844, + 0.33476, + 0.3338, + 0.33586, + 0.33744, + 0.3355, + 0.33672, + 0.33632, + 0.33976, + 0.33918, + 0.34024, + 0.33654, + 0.33996, + 0.34146, + 0.33952, + 0.34062, + 0.34076, + 0.34376 + ], + "test_acc": [ + 0.3299, + 0.342, + 0.3458, + 0.3319, + 0.3513, + 0.3494, + 0.3535, + 0.3477, + 0.3438, + 0.3456, + 0.3492, + 0.3432, + 0.3486, + 0.3392, + 0.3444, + 0.3448, + 0.3444, + 0.3525, + 0.3618, + 0.3546, + 0.3556, + 0.3595, + 0.3577, + 0.3559, + 0.3598, + 0.3621, + 0.3612, + 0.3592, + 0.3584, + 0.3596 + ], + "value_loss": [ + 0.666878916387558, + 0.18937870089530945, + 0.11881086151123046, + 0.08265157832622529, + 0.06769442874908448, + 0.06252522818088531, + 0.09614691172599793, + 0.07957154913902283, + 0.054948721503019334, + 0.05558138638615608, + 0.05110657853126526, + 0.046604735120534896, + 0.04109812472939491, + 0.03985793245315552, + 0.03339640676736832, + 0.03308486737549305, + 0.030077795300483705, + 0.025715462546348572, + 0.022470404601693153, + 0.020539281535744667, + 0.018625647016167642, + 0.018597659103274346, + 0.016686187164783477, + 0.016902890469133854, + 0.016258136838972568, + 0.012850605883747339, + 0.011790002823770046, + 0.011391780233085156, + 0.014738336679339409, + 0.014527755738198757 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6566677093505859, + 0.675422191619873, + 0.6851179599761963, + 0.6924338936805725 + ], + "perturbation_rho": [ + 0.4113081693649292, + 0.4249998927116394, + 0.5678677558898926, + 0.5010733604431152 + ], + "nudging": { + "0.001": [ + -5.1190661906730384e-05, + -4.658541001845151e-05, + -4.432544665178284e-05, + -4.257681575836614e-05 + ], + "0.003": [ + -0.00015361575060524046, + -0.00013976145419292152, + -0.0001330113154835999, + -0.00012775413051713258 + ], + "0.01": [ + -0.0005118446424603462, + -0.0004658599500544369, + -0.00044331286335363984, + -0.00042594311526045203 + ] + }, + "hidden_norms_per_layer": [ + 5362.49755859375, + 5384.90576171875, + 5393.5771484375, + 5410.9482421875, + 5431.09033203125 + ], + "bp_grad_norms_per_layer": [ + 2.3212431187857874e-05, + 2.1681269572582096e-05, + 2.1051570001873188e-05, + 2.0064975615241565e-05, + 1.878892544482369e-05 + ] + }, + "drift": { + "embed.weight": 44.5671938207566, + "embed.bias": 58.96553186802584, + "blocks.0.ln.weight": 0.29142487049102783, + "blocks.0.w1.weight": 3.8377129757749735, + "blocks.0.w1.bias": 6.352571784709687, + "blocks.0.w2.weight": 18.724100714811932, + "blocks.1.ln.weight": 0.2817494571208954, + "blocks.1.w1.weight": 3.743751843873518, + "blocks.1.w1.bias": 7.155651981858119, + "blocks.1.w2.weight": 18.70848603498537, + "blocks.2.ln.weight": 0.28254690766334534, + "blocks.2.w1.weight": 3.7939537187971424, + "blocks.2.w1.bias": 6.996760215683633, + "blocks.2.w2.weight": 19.26348418356461, + "blocks.3.ln.weight": 0.27882981300354004, + "blocks.3.w1.weight": 3.869420244575826, + "blocks.3.w1.bias": 7.142781074581749, + "blocks.3.w2.weight": 20.36433189495994, + "out_ln.weight": 0.09818978607654572, + "out_head.weight": 2.0291022420933946, + "out_head.bias": 2.1241749027066383 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/round38_sbcb_penalty_30ep", + "methods": [ + "state_bridge", + "credit_bridge" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round38_smoke_sbcb_pen/results_cifar10.json b/results/round38_smoke_sbcb_pen/results_cifar10.json new file mode 100644 index 0000000..f5ed9c4 --- /dev/null +++ b/results/round38_smoke_sbcb_pen/results_cifar10.json @@ -0,0 +1,213 @@ +{ + "42": { + "state_bridge": { + "log": { + "train_loss": [ + 2.0474753201293945, + 1.9117268241119385 + ], + "train_acc": [ + 0.24662, + 0.30954 + ], + "test_acc": [ + 0.273, + 0.3501 + ], + "state_pred_error": [ + 0.24535170847892762, + 0.13223054832935333 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3206905722618103, + 0.2752090096473694, + 0.24660587310791016, + 0.22906462848186493 + ], + "perturbation_rho": [ + 0.4074876010417938, + 0.2618027925491333, + 0.26648417115211487, + 0.24533966183662415 + ], + "nudging": { + "0.001": [ + -0.00024993112310767174, + -0.00019314652308821678, + -0.00016400963068008423, + -0.00015044421888887882 + ], + "0.003": [ + -0.0007498480845242739, + -0.0005794172175228596, + -0.0004920377396047115, + -0.00045136199332773685 + ], + "0.01": [ + -0.0025002574548125267, + -0.001930799102410674, + -0.001639701658859849, + -0.0015042978338897228 + ] + }, + "hidden_norms_per_layer": [ + 197.37428283691406, + 208.8948211669922, + 213.67898559570312, + 225.69448852539062, + 229.3214111328125 + ], + "bp_grad_norms_per_layer": [ + 0.0002925087173935026, + 0.00027807100559584796, + 0.0002793201128952205, + 0.0002787425764836371, + 0.00027831399347633123 + ] + }, + "drift": { + "embed.weight": 3.0943938196002705, + "embed.bias": 5.276486174790121, + "blocks.0.ln.weight": 0.041422076523303986, + "blocks.0.w1.weight": 1.2334240308956859, + "blocks.0.w1.bias": 1.7498680169137257, + "blocks.0.w2.weight": 4.629686685849745, + "blocks.1.ln.weight": 0.0331297293305397, + "blocks.1.w1.weight": 1.1419210278459624, + "blocks.1.w1.bias": 1.3133909085501447, + "blocks.1.w2.weight": 4.0167023654211755, + "blocks.2.ln.weight": 0.036234382539987564, + "blocks.2.w1.weight": 1.0949732338041316, + "blocks.2.w1.bias": 1.347265776948355, + "blocks.2.w2.weight": 3.8533434905704533, + "blocks.3.ln.weight": 0.04701152443885803, + "blocks.3.w1.weight": 1.0335121836652872, + "blocks.3.w1.bias": 1.4470639304699096, + "blocks.3.w2.weight": 3.5886411268756073, + "out_ln.weight": 0.035340577363967896, + "out_head.weight": 0.5555762293577677, + "out_head.bias": 1.3793257927193587 + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 1.9963660776519776, + 2.0451175025177 + ], + "train_acc": [ + 0.2772, + 0.26838 + ], + "test_acc": [ + 0.3299, + 0.2827 + ], + "value_loss": [ + 0.666878916387558, + 0.47583423060417174 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03980115056037903, + 0.079774409532547, + 0.1276342272758484, + 0.15156477689743042 + ], + "perturbation_rho": [ + 0.04505116492509842, + 0.14404122531414032, + 0.17026099562644958, + 0.15786880254745483 + ], + "nudging": { + "0.001": [ + -4.916917532682419e-06, + -1.4375429600477219e-05, + -1.966068521142006e-05, + -2.3062806576490402e-05 + ], + "0.003": [ + -1.4716759324073792e-05, + -4.31169755756855e-05, + -5.895830690860748e-05, + -6.919307634234428e-05 + ], + "0.01": [ + -4.905415698885918e-05, + -0.00014382274821400642, + -0.00019651977345347404, + -0.00023055588826537132 + ] + }, + "hidden_norms_per_layer": [ + 1009.140380859375, + 1082.5697021484375, + 1145.231201171875, + 1182.99951171875, + 1257.748046875 + ], + "bp_grad_norms_per_layer": [ + 6.559405301231891e-05, + 6.734106864314526e-05, + 6.742271943949163e-05, + 6.65746774757281e-05, + 6.616810424020514e-05 + ] + }, + "drift": { + "embed.weight": 7.564059143620495, + "embed.bias": 8.746969303910673, + "blocks.0.ln.weight": 0.11126699298620224, + "blocks.0.w1.weight": 1.9535038516346213, + "blocks.0.w1.bias": 1.6108819536646128, + "blocks.0.w2.weight": 7.201445067417667, + "blocks.1.ln.weight": 0.11589338630437851, + "blocks.1.w1.weight": 1.871920531155357, + "blocks.1.w1.bias": 1.7519376093645112, + "blocks.1.w2.weight": 6.716478346434812, + "blocks.2.ln.weight": 0.11303362250328064, + "blocks.2.w1.weight": 1.9497895886204863, + "blocks.2.w1.bias": 1.6654855654120733, + "blocks.2.w2.weight": 6.897888781603305, + "blocks.3.ln.weight": 0.12764930725097656, + "blocks.3.w1.weight": 2.1127271785838393, + "blocks.3.w1.bias": 1.8058662035226984, + "blocks.3.w2.weight": 7.331784125259354, + "out_ln.weight": 0.041299086064100266, + "out_head.weight": 0.9332516761578312, + "out_head.bias": 1.5418626566795017 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 2, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/round38_smoke_sbcb_pen", + "methods": [ + "state_bridge", + "credit_bridge" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round41_dfa_penalty_30ep.log b/results/round41_dfa_penalty_30ep.log new file mode 100644 index 0000000..1b1a829 --- /dev/null +++ b/results/round41_dfa_penalty_30ep.log @@ -0,0 +1,14 @@ +Using device: cuda:0 + +============================================================ +Seed 42 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=1.9962, train=0.2802, test=0.3313 + [DFA] Epoch 10: loss=1.9151, train=0.3238, test=0.3476 + [DFA] Epoch 20: loss=1.8987, train=0.3316, test=0.3590 + [DFA] Epoch 30: loss=1.8923, train=0.3405, test=0.3607 + Final test acc: 0.3607 + +All results saved to results/round41_dfa_penalty_30ep/results_cifar10.json diff --git a/results/round41_dfa_penalty_30ep/results_cifar10.json b/results/round41_dfa_penalty_30ep/results_cifar10.json new file mode 100644 index 0000000..c1ddd6e --- /dev/null +++ b/results/round41_dfa_penalty_30ep/results_cifar10.json @@ -0,0 +1,201 @@ +{ + "42": { + "dfa": { + "log": { + "train_loss": [ + 1.9962164908218383, + 1.9369539144134522, + 1.9308127733612062, + 1.9288829196548463, + 1.924676773147583, + 1.918132286529541, + 1.918223798522949, + 1.9147104105377197, + 1.9164991827011109, + 1.9150708497619628, + 1.9118981461334228, + 1.9094872266387939, + 1.905809390487671, + 1.9049867826080322, + 1.90767120262146, + 1.9046393532562256, + 1.9038504275894166, + 1.9006466190338134, + 1.8996596237182617, + 1.8986669551086426, + 1.8997121560668946, + 1.8965645993423461, + 1.8971398455047608, + 1.8969778009414673, + 1.89667788482666, + 1.8934650146484375, + 1.8900965643310548, + 1.8924740059661864, + 1.892325519180298, + 1.8923273934555054 + ], + "train_acc": [ + 0.2802, + 0.30808, + 0.31262, + 0.3156, + 0.31668, + 0.31968, + 0.3211, + 0.32238, + 0.3231, + 0.32382, + 0.32378, + 0.32668, + 0.32826, + 0.32862, + 0.32902, + 0.32944, + 0.32948, + 0.33388, + 0.33008, + 0.33162, + 0.33228, + 0.33294, + 0.33364, + 0.33536, + 0.33534, + 0.3341, + 0.33584, + 0.33624, + 0.33534, + 0.34052 + ], + "test_acc": [ + 0.3313, + 0.3463, + 0.3422, + 0.3411, + 0.3597, + 0.3549, + 0.3499, + 0.3438, + 0.3423, + 0.3476, + 0.3497, + 0.3524, + 0.3595, + 0.3521, + 0.354, + 0.3537, + 0.3588, + 0.3613, + 0.356, + 0.359, + 0.3599, + 0.3572, + 0.3615, + 0.3592, + 0.3592, + 0.3609, + 0.3578, + 0.36, + 0.3611, + 0.3607 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.33146190643310547, + 0.16347576677799225, + 0.1610197126865387, + 0.17380905151367188 + ], + "perturbation_rho": [ + 0.12955714762210846, + 0.045910485088825226, + 0.08855772018432617, + 0.06986565887928009 + ], + "nudging": { + "0.001": [ + -1.3143871910870075e-05, + -5.465932190418243e-06, + -5.55114820599556e-06, + -5.612848326563835e-06 + ], + "0.003": [ + -3.937864676117897e-05, + -1.6393139958381653e-05, + -1.6577658243477345e-05, + -1.6813864931464195e-05 + ], + "0.01": [ + -0.00013115769252181053, + -5.455967038869858e-05, + -5.524198058992624e-05, + -5.596294067800045e-05 + ] + }, + "hidden_norms_per_layer": [ + 12120.9111328125, + 12188.2958984375, + 12193.77734375, + 12198.8359375, + 12219.8369140625 + ], + "bp_grad_norms_per_layer": [ + 1.3196319741837215e-05, + 1.3040654266660567e-05, + 1.2841821444453672e-05, + 1.2863742995250504e-05, + 1.2522319593699649e-05 + ] + }, + "drift": { + "embed.weight": 92.65036012342134, + "embed.bias": 95.50366326873346, + "blocks.0.ln.weight": 0.34198617935180664, + "blocks.0.w1.weight": 3.6285842919394478, + "blocks.0.w1.bias": 6.327346232452673, + "blocks.0.w2.weight": 18.245981750960237, + "blocks.1.ln.weight": 0.3590666353702545, + "blocks.1.w1.weight": 3.60860615088841, + "blocks.1.w1.bias": 6.19502489141982, + "blocks.1.w2.weight": 17.96136875105609, + "blocks.2.ln.weight": 0.36136317253112793, + "blocks.2.w1.weight": 3.702767807151941, + "blocks.2.w1.bias": 6.508610347801663, + "blocks.2.w2.weight": 19.259072912976688, + "blocks.3.ln.weight": 0.35671475529670715, + "blocks.3.w1.weight": 3.7164720093334025, + "blocks.3.w1.bias": 6.203418611522943, + "blocks.3.w2.weight": 19.77945180777123, + "out_ln.weight": 0.16879618167877197, + "out_head.weight": 2.418863784769041, + "out_head.bias": 1.1721698518470152 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/round41_dfa_penalty_30ep", + "methods": [ + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round41_dfa_penalty_30ep_s123.log b/results/round41_dfa_penalty_30ep_s123.log new file mode 100644 index 0000000..ff0fd4f --- /dev/null +++ b/results/round41_dfa_penalty_30ep_s123.log @@ -0,0 +1,14 @@ +Using device: cuda:0 + +============================================================ +Seed 123 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=1.9918, train=0.2828, test=0.3309 + [DFA] Epoch 10: loss=1.9247, train=0.3184, test=0.3410 + [DFA] Epoch 20: loss=1.9115, train=0.3278, test=0.3600 + [DFA] Epoch 30: loss=1.9042, train=0.3314, test=0.3582 + Final test acc: 0.3582 + +All results saved to results/round41_dfa_penalty_30ep_s123/results_cifar10.json diff --git a/results/round41_dfa_penalty_30ep_s123/results_cifar10.json b/results/round41_dfa_penalty_30ep_s123/results_cifar10.json new file mode 100644 index 0000000..0bad76e --- /dev/null +++ b/results/round41_dfa_penalty_30ep_s123/results_cifar10.json @@ -0,0 +1,201 @@ +{ + "123": { + "dfa": { + "log": { + "train_loss": [ + 1.9917970180892943, + 1.9455738663482667, + 1.9412584506225585, + 1.9381972328948975, + 1.935788204345703, + 1.9355586415863038, + 1.9291299639892578, + 1.9304945249938965, + 1.9279169077301026, + 1.9247258889389038, + 1.9270652098083496, + 1.9239173442077637, + 1.920924050216675, + 1.9179519243621825, + 1.9187614895629883, + 1.9149749173736572, + 1.9101889783477783, + 1.9113776821517945, + 1.9123343227767944, + 1.9115107091522217, + 1.9105930194091796, + 1.9092110122680663, + 1.9085102457046508, + 1.9054700579071044, + 1.906116495628357, + 1.9055400652313232, + 1.9055342751312256, + 1.9067684815216064, + 1.9050640679168702, + 1.9041575216674804 + ], + "train_acc": [ + 0.2828, + 0.3048, + 0.30986, + 0.31168, + 0.31358, + 0.31522, + 0.31574, + 0.317, + 0.31914, + 0.31836, + 0.31874, + 0.31798, + 0.32148, + 0.32276, + 0.32502, + 0.3259, + 0.32756, + 0.32626, + 0.32706, + 0.32784, + 0.329, + 0.32942, + 0.32888, + 0.33042, + 0.33034, + 0.33086, + 0.33476, + 0.33214, + 0.33166, + 0.33136 + ], + "test_acc": [ + 0.3309, + 0.3491, + 0.3382, + 0.3519, + 0.3375, + 0.3487, + 0.3436, + 0.3431, + 0.3632, + 0.341, + 0.3632, + 0.3623, + 0.3531, + 0.3536, + 0.3476, + 0.3485, + 0.3662, + 0.3539, + 0.3453, + 0.36, + 0.3532, + 0.3566, + 0.3562, + 0.3639, + 0.3622, + 0.3623, + 0.3579, + 0.3541, + 0.3576, + 0.3582 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3322567343711853, + 0.10321325808763504, + 0.15636520087718964, + 0.19004486501216888 + ], + "perturbation_rho": [ + 0.18363387882709503, + 0.04898637533187866, + 0.09784461557865143, + 0.09405896812677383 + ], + "nudging": { + "0.001": [ + -1.0297924745827913e-05, + -3.0525843612849712e-06, + -4.650210030376911e-06, + -5.671870894730091e-06 + ], + "0.003": [ + -3.089715028181672e-05, + -9.163166396319866e-06, + -1.3922981452196836e-05, + -1.7057405784726143e-05 + ], + "0.01": [ + -0.00010294892126694322, + -3.057112917304039e-05, + -4.6447094064205885e-05, + -5.68098621442914e-05 + ] + }, + "hidden_norms_per_layer": [ + 13127.3251953125, + 13128.8193359375, + 13141.9501953125, + 13135.3408203125, + 13141.1806640625 + ], + "bp_grad_norms_per_layer": [ + 1.0922197361651342e-05, + 1.074585088645108e-05, + 1.0719732017605565e-05, + 1.0678052603907418e-05, + 1.0736169315350708e-05 + ] + }, + "drift": { + "embed.weight": 95.06253847427116, + "embed.bias": 69.56343057263858, + "blocks.0.ln.weight": 0.35518038272857666, + "blocks.0.w1.weight": 3.5318213424051828, + "blocks.0.w1.bias": 6.6251757142063346, + "blocks.0.w2.weight": 18.1649292755703, + "blocks.1.ln.weight": 0.37566548585891724, + "blocks.1.w1.weight": 3.577683688515039, + "blocks.1.w1.bias": 6.4976786510039295, + "blocks.1.w2.weight": 18.132601820579644, + "blocks.2.ln.weight": 0.39002206921577454, + "blocks.2.w1.weight": 3.7319215256746268, + "blocks.2.w1.bias": 6.266003010226504, + "blocks.2.w2.weight": 18.870330386369503, + "blocks.3.ln.weight": 0.35860922932624817, + "blocks.3.w1.weight": 3.790655898639472, + "blocks.3.w1.bias": 5.892665738859735, + "blocks.3.w2.weight": 20.602751226104075, + "out_ln.weight": 0.15972787141799927, + "out_head.weight": 2.3651003853179144, + "out_head.bias": 1.3627504013501806 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 123 + ], + "gpu": 0, + "output_dir": "results/round41_dfa_penalty_30ep_s123", + "methods": [ + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/round41_dfa_penalty_30ep_s456.log b/results/round41_dfa_penalty_30ep_s456.log new file mode 100644 index 0000000..92d71a4 --- /dev/null +++ b/results/round41_dfa_penalty_30ep_s456.log @@ -0,0 +1,14 @@ +Using device: cuda:0 + +============================================================ +Seed 456 +============================================================ + +--- DFA --- + [DFA] Epoch 1: loss=1.9882, train=0.2782, test=0.3368 + [DFA] Epoch 10: loss=1.9104, train=0.3209, test=0.3606 + [DFA] Epoch 20: loss=1.9019, train=0.3310, test=0.3629 + [DFA] Epoch 30: loss=1.8953, train=0.3350, test=0.3614 + Final test acc: 0.3614 + +All results saved to results/round41_dfa_penalty_30ep_s456/results_cifar10.json diff --git a/results/round41_dfa_penalty_30ep_s456/results_cifar10.json b/results/round41_dfa_penalty_30ep_s456/results_cifar10.json new file mode 100644 index 0000000..80d22fc --- /dev/null +++ b/results/round41_dfa_penalty_30ep_s456/results_cifar10.json @@ -0,0 +1,201 @@ +{ + "456": { + "dfa": { + "log": { + "train_loss": [ + 1.9882178707504272, + 1.9317677951049805, + 1.9248256610870362, + 1.9217043152618407, + 1.917682172279358, + 1.919907767944336, + 1.9130486701202392, + 1.9160204236221314, + 1.9124437686920166, + 1.910402643661499, + 1.9057467068099976, + 1.9108504774475097, + 1.9094166152572631, + 1.9078613684844972, + 1.9042421661376954, + 1.9058136753082275, + 1.9045625204467773, + 1.9027692486953736, + 1.901805549621582, + 1.9018799402236939, + 1.8972413793945313, + 1.8987792961883545, + 1.897886729812622, + 1.894330054550171, + 1.8959275032806397, + 1.8961896368408202, + 1.8971351692962646, + 1.8951918316650391, + 1.89493817653656, + 1.8952873357391358 + ], + "train_acc": [ + 0.2782, + 0.30628, + 0.31294, + 0.31586, + 0.31784, + 0.31944, + 0.32352, + 0.32056, + 0.32366, + 0.32092, + 0.32656, + 0.3254, + 0.3272, + 0.3234, + 0.32672, + 0.32684, + 0.33252, + 0.3313, + 0.32936, + 0.33102, + 0.3319, + 0.33272, + 0.33364, + 0.3357, + 0.334, + 0.3336, + 0.33476, + 0.33474, + 0.3348, + 0.33498 + ], + "test_acc": [ + 0.3368, + 0.3538, + 0.3441, + 0.3634, + 0.343, + 0.3574, + 0.341, + 0.3403, + 0.3594, + 0.3606, + 0.3628, + 0.3674, + 0.3684, + 0.3558, + 0.3637, + 0.3632, + 0.3649, + 0.3565, + 0.3631, + 0.3629, + 0.3546, + 0.3629, + 0.3594, + 0.3629, + 0.3619, + 0.3609, + 0.3623, + 0.3609, + 0.3607, + 0.3614 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.35106080770492554, + 0.12957611680030823, + 0.12942053377628326, + 0.15940426290035248 + ], + "perturbation_rho": [ + 0.17636069655418396, + 0.08117785304784775, + 0.0472814217209816, + 0.11043912172317505 + ], + "nudging": { + "0.001": [ + -1.4475401258096099e-05, + -4.396220901980996e-06, + -4.46141348220408e-06, + -5.974114174023271e-06 + ], + "0.003": [ + -4.3450010707601905e-05, + -1.3241806300356984e-05, + -1.3367069186642766e-05, + -1.7999671399593353e-05 + ], + "0.01": [ + -0.00014482333790510893, + -4.394981078803539e-05, + -4.4448592234402895e-05, + -5.99866034463048e-05 + ] + }, + "hidden_norms_per_layer": [ + 12229.544921875, + 12266.8916015625, + 12257.5791015625, + 12255.2705078125, + 12254.3017578125 + ], + "bp_grad_norms_per_layer": [ + 1.334045191470068e-05, + 1.2721701750706416e-05, + 1.251421963388566e-05, + 1.2780437828041613e-05, + 1.2897891792817973e-05 + ] + }, + "drift": { + "embed.weight": 96.08641084786761, + "embed.bias": 127.15202633956196, + "blocks.0.ln.weight": 0.3495213985443115, + "blocks.0.w1.weight": 3.6819779928624996, + "blocks.0.w1.bias": 6.228241220813173, + "blocks.0.w2.weight": 17.84445507605505, + "blocks.1.ln.weight": 0.34699368476867676, + "blocks.1.w1.weight": 3.6269651247865355, + "blocks.1.w1.bias": 6.23888543559435, + "blocks.1.w2.weight": 17.036835876989706, + "blocks.2.ln.weight": 0.3590497076511383, + "blocks.2.w1.weight": 3.638377800312274, + "blocks.2.w1.bias": 6.075326782548754, + "blocks.2.w2.weight": 17.82232398341993, + "blocks.3.ln.weight": 0.35772791504859924, + "blocks.3.w1.weight": 3.76772753341028, + "blocks.3.w1.bias": 6.390494916053956, + "blocks.3.w2.weight": 18.92297820750716, + "out_ln.weight": 0.18465575575828552, + "out_head.weight": 2.515055641320841, + "out_head.bias": 1.320315434071626 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 30, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 456 + ], + "gpu": 0, + "output_dir": "results/round41_dfa_penalty_30ep_s456", + "methods": [ + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.01, + "num_classes": 10 + } +} \ No newline at end of file diff --git a/results/scaffold_replication/replication.json b/results/scaffold_replication/replication.json new file mode 100644 index 0000000..7b0a5bb --- /dev/null +++ b/results/scaffold_replication/replication.json @@ -0,0 +1,38 @@ +{ + "dfa": { + "final": [ + 0.3102, + 0.3103, + 0.2973 + ], + "acc20": [ + 0.3126, + 0.3053, + 0.2936 + ] + }, + "perlayer": { + "final": [ + 0.3124, + 0.2985, + 0.301 + ], + "acc20": [ + 0.2988, + 0.2719, + 0.2917 + ] + }, + "vec": { + "final": [ + 0.3234, + 0.3096, + 0.307 + ], + "acc20": [ + 0.3118, + 0.2946, + 0.3036 + ] + } +} \ No newline at end of file diff --git a/results/schedule_timing/schedules_s42.json b/results/schedule_timing/schedules_s42.json new file mode 100644 index 0000000..9311a22 --- /dev/null +++ b/results/schedule_timing/schedules_s42.json @@ -0,0 +1,2018 @@ +{ + "DFA_only": { + "test_acc": [ + 0.295, + 0.3008, + 0.2999, + 0.3036, + 0.2969, + 0.2926, + 0.297, + 0.2885, + 0.3032, + 0.305, + 0.2875, + 0.2933, + 0.3094, + 0.3185, + 0.3048, + 0.3115, + 0.3062, + 0.3146, + 0.316, + 0.3075, + 0.3015, + 0.3125, + 0.3151, + 0.2991, + 0.3117, + 0.2972, + 0.3094, + 0.3015, + 0.3075, + 0.3032, + 0.3023, + 0.306, + 0.277, + 0.3008, + 0.3077, + 0.3173, + 0.3101, + 0.3089, + 0.311, + 0.3005, + 0.3062, + 0.3139, + 0.3052, + 0.3131, + 0.3016, + 0.298, + 0.2982, + 0.3035, + 0.3112, + 0.3143, + 0.3166, + 0.3021, + 0.3168, + 0.3131, + 0.311, + 0.3148, + 0.3099, + 0.2997, + 0.3138, + 0.3066, + 0.3057, + 0.3105, + 0.3121, + 0.2973, + 0.3108, + 0.3057, + 0.3166, + 0.3153, + 0.3094, + 0.3132, + 0.3122, + 0.3134, + 0.3135, + 0.3058, + 0.3089, + 0.314, + 0.3186, + 0.3131, + 0.3114, + 0.3091, + 0.3131, + 0.3117, + 0.3135, + 0.3118, + 0.3125, + 0.3122, + 0.3131, + 0.3126, + 0.3127, + 0.3124, + 0.3104, + 0.3138, + 0.3108, + 0.3122, + 0.3122, + 0.3116, + 0.3116, + 0.312, + 0.3119, + 0.3119 + ], + "train_loss": [ + 2.037675617980957, + 2.0064356870269777, + 2.0028278520202636, + 1.9938254058074951, + 1.9946035711669923, + 1.9902986218643188, + 1.995398818092346, + 1.9927714242553711, + 1.9901552920150758, + 1.9906873265075684, + 1.9907922621154786, + 1.9868914079284667, + 1.9886361977386475, + 1.9898803197860717, + 1.990440476951599, + 1.9894216409683227, + 1.987988814430237, + 1.9897864045715332, + 1.9920248303222656, + 1.9888737732696533, + 1.9888165196990968, + 1.9904184746932982, + 1.9884975939178466, + 1.9870667554473878, + 1.9861058260345459, + 1.9889244424819947, + 1.9914796359252929, + 1.9903430311584474, + 1.9879192444610596, + 1.9876161047744751, + 1.9889435779571534, + 1.9897238473510743, + 1.9861584117889404, + 1.9904350784301759, + 1.9882240353775025, + 1.9892651306152345, + 1.9910669103240968, + 1.9877908187103273, + 1.9896357573699952, + 1.9884877701568604, + 1.9861946019744874, + 1.9889384778213501, + 1.9867235974121094, + 1.988340041885376, + 1.9876386359024047, + 1.9882950396728516, + 1.9882051584625244, + 1.987388691482544, + 1.9916717697143556, + 1.9906426657485963, + 1.9872832880020141, + 1.9891710163116456, + 1.9888770013046264, + 1.9870350061416626, + 1.9877083992767335, + 1.986397237510681, + 1.987246439666748, + 1.9876907180786132, + 1.9877903689575196, + 1.9880539420318604, + 1.9886457526016235, + 1.9865986731719971, + 1.989062392616272, + 1.9858334029388427, + 1.9864335137557982, + 1.986976103363037, + 1.988425277557373, + 1.9880691256713867, + 1.985303945236206, + 1.9883836991882324, + 1.987995620689392, + 1.9860682797241211, + 1.9866519616317748, + 1.9852013191986084, + 1.9850183421325684, + 1.9861118808746339, + 1.9872060985946656, + 1.9859641944122315, + 1.987057370147705, + 1.9865392845916747, + 1.9851618747711182, + 1.9844412656402588, + 1.986386742553711, + 1.9863465041351318, + 1.9827465126037598, + 1.9845260301208496, + 1.9861502397155761, + 1.986382713623047, + 1.9849865955352783, + 1.986821766090393, + 1.986619790725708, + 1.9852573208236695, + 1.987090570602417, + 1.9849267038726806, + 1.985615106163025, + 1.9835766082763673, + 1.9838462826538086, + 1.9850005253601075, + 1.986313782081604, + 1.9859741217041016 + ], + "gamma": [ + [ + 1, + 0.08253364491974935 + ], + [ + 2, + 0.08030614303424954 + ], + [ + 3, + 0.07973816274898127 + ], + [ + 4, + 0.08138106123078614 + ], + [ + 5, + 0.07910246076062322 + ], + [ + 10, + 0.08214855077676475 + ], + [ + 15, + 0.08803309267386794 + ], + [ + 20, + 0.09171900944784284 + ], + [ + 25, + 0.0934448060579598 + ], + [ + 30, + 0.09441993362270296 + ], + [ + 35, + 0.09620177000761032 + ], + [ + 40, + 0.09739782591350377 + ], + [ + 45, + 0.0992744923569262 + ], + [ + 50, + 0.09916113782674074 + ], + [ + 55, + 0.10024731536395848 + ], + [ + 60, + 0.10015025967732072 + ], + [ + 65, + 0.10074783873278648 + ], + [ + 70, + 0.10073912667576224 + ], + [ + 75, + 0.10122037539258599 + ], + [ + 80, + 0.10102571779862046 + ], + [ + 85, + 0.10127486119745299 + ], + [ + 90, + 0.10134081763681024 + ], + [ + 95, + 0.1013328933622688 + ], + [ + 100, + 0.10132231784518808 + ] + ], + "rho": [ + [ + 1, + 0.025695246877148747 + ], + [ + 2, + 0.04557160963304341 + ], + [ + 3, + 0.021262050315272063 + ], + [ + 4, + 0.010289260419085622 + ], + [ + 5, + 0.02755167754366994 + ], + [ + 10, + -0.007250833325088024 + ], + [ + 15, + 0.013553531607612967 + ], + [ + 20, + 0.003041430376470089 + ], + [ + 25, + 0.008854477549903095 + ], + [ + 30, + 0.0012795617803931236 + ], + [ + 35, + 0.0063968379981815815 + ], + [ + 40, + -0.0017520298715680838 + ], + [ + 45, + 0.005261762998998165 + ], + [ + 50, + 0.00488230912014842 + ], + [ + 55, + 0.0046589490957558155 + ], + [ + 60, + -0.009344345889985561 + ], + [ + 65, + 0.009587313048541546 + ], + [ + 70, + 0.00649524899199605 + ], + [ + 75, + 0.001415157224982977 + ], + [ + 80, + -0.0165848545730114 + ], + [ + 85, + 0.005657955072820187 + ], + [ + 90, + 0.014005240052938461 + ], + [ + 95, + 0.0036805709823966026 + ], + [ + 100, + 0.00399240106344223 + ] + ], + "credit_mode": [ + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa" + ] + }, + "Vec_only_from_0": { + "test_acc": [ + 0.1556, + 0.1638, + 0.1119, + 0.1485, + 0.1354, + 0.1438, + 0.1209, + 0.152, + 0.1412, + 0.1352, + 0.1356, + 0.1413, + 0.1424, + 0.1364, + 0.1452, + 0.1279, + 0.1498, + 0.1346, + 0.1433, + 0.1509, + 0.1475, + 0.1471, + 0.1521, + 0.155, + 0.1353, + 0.1206, + 0.1427, + 0.1362, + 0.1539, + 0.1545, + 0.1496, + 0.1529, + 0.1365, + 0.1513, + 0.1506, + 0.1547, + 0.1551, + 0.1521, + 0.1429, + 0.1341, + 0.1495, + 0.152, + 0.1403, + 0.1452, + 0.1517, + 0.1453, + 0.1492, + 0.1348, + 0.1489, + 0.1507, + 0.1567, + 0.1507, + 0.1559, + 0.1559, + 0.1557, + 0.1603, + 0.155, + 0.1538, + 0.1569, + 0.157, + 0.1555, + 0.1541, + 0.1508, + 0.1497, + 0.1607, + 0.1503, + 0.1556, + 0.1553, + 0.1482, + 0.1581, + 0.1541, + 0.1509, + 0.1548, + 0.1516, + 0.1538, + 0.1557, + 0.1575, + 0.1539, + 0.1544, + 0.1546, + 0.1533, + 0.1571, + 0.1573, + 0.1552, + 0.1555, + 0.1552, + 0.1562, + 0.1531, + 0.1545, + 0.1564, + 0.1554, + 0.1552, + 0.1551, + 0.1539, + 0.1552, + 0.154, + 0.1536, + 0.1539, + 0.1539, + 0.1538 + ], + "train_loss": [ + 2.2607952543640137, + 2.292783719100952, + 2.287668216705322, + 2.2807941083526613, + 2.286093077545166, + 2.2815568644714355, + 2.280725185470581, + 2.280055054244995, + 2.2787086389160156, + 2.2795758988952635, + 2.278482421798706, + 2.279569065704346, + 2.2803222184753418, + 2.280616189727783, + 2.278688010406494, + 2.277662957763672, + 2.2753771209716795, + 2.273494477767944, + 2.274206059112549, + 2.2714648165130615, + 2.2712157353210447, + 2.2711441577911375, + 2.2707051990509033, + 2.2691120259094237, + 2.268804801635742, + 2.268515103683472, + 2.269152431793213, + 2.2689581163024903, + 2.2694105588531492, + 2.2676633386230467, + 2.266967338180542, + 2.266465633544922, + 2.2668006744384765, + 2.2665466984558105, + 2.26613944229126, + 2.26567068901062, + 2.265027080993652, + 2.2640279596710204, + 2.2635817875671385, + 2.264191181716919, + 2.26260107673645, + 2.2629181452941896, + 2.26260962852478, + 2.2613576414489747, + 2.2624890808868408, + 2.2620941619110106, + 2.2606386140441894, + 2.2620151769256593, + 2.263205107269287, + 2.262801318206787, + 2.262505074005127, + 2.2627359703826904, + 2.262208557510376, + 2.262871209640503, + 2.2617874829101563, + 2.2624518565368654, + 2.26157338142395, + 2.262131029815674, + 2.2620470150756837, + 2.262693808517456, + 2.2631860585021975, + 2.2618122407531738, + 2.262384552078247, + 2.263021558837891, + 2.262093891067505, + 2.262812458190918, + 2.261425892791748, + 2.261688832015991, + 2.261387883453369, + 2.260421074676514, + 2.2608421544647217, + 2.260393793334961, + 2.260202441253662, + 2.2613094384765624, + 2.2602577527618406, + 2.2590432794189454, + 2.2594834625244142, + 2.259625990142822, + 2.259765885620117, + 2.2596383428192137, + 2.259389783782959, + 2.2588469641113282, + 2.25830569770813, + 2.2585101136779784, + 2.258915050201416, + 2.2586245221710204, + 2.2585051374816896, + 2.2587241944885252, + 2.25938269821167, + 2.257933346710205, + 2.257919548187256, + 2.257392307128906, + 2.2575006678771974, + 2.257852543411255, + 2.2582048503875733, + 2.258492467803955, + 2.258143528137207, + 2.2576286277770996, + 2.2584652642059324, + 2.258263222732544 + ], + "gamma": [ + [ + 1, + 0.046906414441764355 + ], + [ + 2, + 0.03673951420933008 + ], + [ + 3, + 0.026665887096896768 + ], + [ + 4, + 0.026283789076842368 + ], + [ + 5, + 0.018021107651293278 + ], + [ + 10, + 0.002868741168640554 + ], + [ + 15, + -0.007039564468868775 + ], + [ + 20, + -0.0028080744268663693 + ], + [ + 25, + -0.003981242459872192 + ], + [ + 30, + 0.0015802685657035909 + ], + [ + 35, + 0.0003386319258424919 + ], + [ + 40, + -0.009376191777846543 + ], + [ + 45, + -0.0011508311843044794 + ], + [ + 50, + -0.00452680832495389 + ], + [ + 55, + -0.004038146056700498 + ], + [ + 60, + -0.0011963492534050602 + ], + [ + 65, + 0.00027990929083898664 + ], + [ + 70, + 0.0019741664156072147 + ], + [ + 75, + -0.0008259685328084743 + ], + [ + 80, + 0.001342559138265642 + ], + [ + 85, + -0.0028034689235028054 + ], + [ + 90, + -0.0010258389593218453 + ], + [ + 95, + -0.0012015482668630284 + ], + [ + 100, + -0.0020375673921080306 + ] + ], + "rho": [ + [ + 1, + 0.009520432911813259 + ], + [ + 2, + 0.014110148418694735 + ], + [ + 3, + 0.009610667824745178 + ], + [ + 4, + 0.02536026295274496 + ], + [ + 5, + -0.017238461412489414 + ], + [ + 10, + -0.0013404882047325373 + ], + [ + 15, + 0.010826407931745052 + ], + [ + 20, + -0.004145572893321514 + ], + [ + 25, + 0.0030982745811343193 + ], + [ + 30, + 0.0023843322414904833 + ], + [ + 35, + -0.005288322921842337 + ], + [ + 40, + -0.005878874100744724 + ], + [ + 45, + 0.011015256866812706 + ], + [ + 50, + 0.005903104320168495 + ], + [ + 55, + 0.006925858557224274 + ], + [ + 60, + -0.005350230261683464 + ], + [ + 65, + 0.006404533050954342 + ], + [ + 70, + -0.00387337408028543 + ], + [ + 75, + -0.00044656783575192094 + ], + [ + 80, + -0.009343216195702553 + ], + [ + 85, + 0.005054101347923279 + ], + [ + 90, + -0.0021174014545977116 + ], + [ + 95, + 0.0037775260861963034 + ], + [ + 100, + 0.0032800459302961826 + ] + ], + "credit_mode": [ + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec" + ] + }, + "Vec_early_then_DFA_T5": { + "test_acc": [ + 0.1556, + 0.1638, + 0.1119, + 0.1485, + 0.1354, + 0.1214, + 0.1205, + 0.1535, + 0.1686, + 0.1877, + 0.1704, + 0.1769, + 0.1911, + 0.1952, + 0.198, + 0.1859, + 0.2052, + 0.2103, + 0.2075, + 0.2125, + 0.2189, + 0.2024, + 0.2003, + 0.2197, + 0.1998, + 0.1864, + 0.2136, + 0.2102, + 0.2157, + 0.2374, + 0.2452, + 0.2368, + 0.2194, + 0.2425, + 0.2507, + 0.2453, + 0.2512, + 0.2461, + 0.2584, + 0.2554, + 0.2478, + 0.258, + 0.2541, + 0.2541, + 0.2588, + 0.2494, + 0.2579, + 0.2531, + 0.2605, + 0.2578, + 0.2635, + 0.2553, + 0.261, + 0.2474, + 0.2636, + 0.2473, + 0.26, + 0.2572, + 0.2598, + 0.2613, + 0.2633, + 0.2559, + 0.2607, + 0.2596, + 0.2636, + 0.2628, + 0.2584, + 0.2677, + 0.264, + 0.2628, + 0.2622, + 0.2653, + 0.2641, + 0.2644, + 0.2609, + 0.2621, + 0.2615, + 0.2662, + 0.2644, + 0.2623, + 0.2634, + 0.262, + 0.2616, + 0.2615, + 0.2645, + 0.2655, + 0.2677, + 0.2656, + 0.2638, + 0.2643, + 0.2647, + 0.2649, + 0.2656, + 0.2657, + 0.2654, + 0.2659, + 0.2657, + 0.2657, + 0.2659, + 0.2659 + ], + "train_loss": [ + 2.2607952543640137, + 2.292783719100952, + 2.287668216705322, + 2.2807941083526613, + 2.286093077545166, + 2.2836004988861083, + 2.2862866271209716, + 2.285244619216919, + 2.2609054973602296, + 2.206937854614258, + 2.180389342651367, + 2.1698142209625244, + 2.160961472320557, + 2.150679744720459, + 2.141586039047241, + 2.13259642868042, + 2.121593624725342, + 2.1139394929504394, + 2.109728126373291, + 2.1014424311065674, + 2.0961972291564943, + 2.095888472290039, + 2.0923152655792236, + 2.090117413330078, + 2.087621213684082, + 2.0879313607025147, + 2.0874180991363525, + 2.085029631729126, + 2.080900169067383, + 2.077969464111328, + 2.0741229208374024, + 2.0692056820678713, + 2.065237929840088, + 2.064335147857666, + 2.061286995391846, + 2.0591921871185304, + 2.0578114111328123, + 2.0548733700561526, + 2.0540283696746826, + 2.054108468093872, + 2.050538212890625, + 2.0520819710922242, + 2.0498473474502563, + 2.050922540855408, + 2.049247169189453, + 2.049625509490967, + 2.049577032775879, + 2.048055863113403, + 2.0509523274993895, + 2.0501847734069822, + 2.0481216834259035, + 2.048765834655762, + 2.0488928285217285, + 2.0471814106750488, + 2.0469470857238767, + 2.0462841304016113, + 2.046988398284912, + 2.046081030883789, + 2.0476224256134032, + 2.0474428226470947, + 2.047055297241211, + 2.0454717302703855, + 2.046940880889893, + 2.0451609346771242, + 2.044703078651428, + 2.045888609390259, + 2.0472245388793944, + 2.046105572471619, + 2.044832556915283, + 2.0462215520477294, + 2.0456733382415773, + 2.0438159730529786, + 2.0452309396362303, + 2.043187570877075, + 2.0440224797821043, + 2.043861737976074, + 2.0452261489105226, + 2.0447871438980103, + 2.045407330856323, + 2.0445297634887694, + 2.043699400558472, + 2.0425771548461915, + 2.0439907969665527, + 2.0436773110198976, + 2.0419052614593505, + 2.0427304915618896, + 2.0440841690826415, + 2.0441862660217285, + 2.043128272857666, + 2.0440053569030763, + 2.0435659717559815, + 2.0433614556884767, + 2.0450315365219116, + 2.042842643661499, + 2.043907892150879, + 2.0425101622772215, + 2.0409409938049317, + 2.0435114336395266, + 2.0446753370666504, + 2.044158511199951 + ], + "gamma": [ + [ + 1, + 0.046906414441764355 + ], + [ + 2, + 0.03673951420933008 + ], + [ + 3, + 0.026665887096896768 + ], + [ + 4, + 0.026283789076842368 + ], + [ + 5, + 0.018021107651293278 + ], + [ + 10, + 0.01149182883091271 + ], + [ + 15, + 0.02298548154067248 + ], + [ + 20, + 0.03039000474382192 + ], + [ + 25, + 0.03801577043486759 + ], + [ + 30, + 0.046141690749209374 + ], + [ + 35, + 0.05301836773287505 + ], + [ + 40, + 0.05715382259222679 + ], + [ + 45, + 0.05773878988111392 + ], + [ + 50, + 0.05790983900078572 + ], + [ + 55, + 0.05870011501247063 + ], + [ + 60, + 0.05877381522441283 + ], + [ + 65, + 0.05932015733560547 + ], + [ + 70, + 0.059057099861092865 + ], + [ + 75, + 0.059662707601091824 + ], + [ + 80, + 0.0595702260179678 + ], + [ + 85, + 0.05982493385090493 + ], + [ + 90, + 0.05967272960697301 + ], + [ + 95, + 0.05974454994429834 + ], + [ + 100, + 0.0597556660650298 + ] + ], + "rho": [ + [ + 1, + 0.009520432911813259 + ], + [ + 2, + 0.014110148418694735 + ], + [ + 3, + 0.009610667824745178 + ], + [ + 4, + 0.02536026295274496 + ], + [ + 5, + -0.017238461412489414 + ], + [ + 10, + 0.00037904561031609774 + ], + [ + 15, + 0.00601019780151546 + ], + [ + 20, + -0.010678242426365614 + ], + [ + 25, + -0.001985238865017891 + ], + [ + 30, + 0.0008612943347543478 + ], + [ + 35, + -0.004164013545960188 + ], + [ + 40, + 0.0025230315513908863 + ], + [ + 45, + -0.012162351980805397 + ], + [ + 50, + 0.005844608414918184 + ], + [ + 55, + 0.003095341846346855 + ], + [ + 60, + -0.002123912563547492 + ], + [ + 65, + -0.006803316529840231 + ], + [ + 70, + 0.014365645125508308 + ], + [ + 75, + 0.01490132324397564 + ], + [ + 80, + -0.007389421574771404 + ], + [ + 85, + -0.0018105965573340654 + ], + [ + 90, + -0.00546201691031456 + ], + [ + 95, + 0.00042750255670398474 + ], + [ + 100, + -0.0037207347340881824 + ] + ], + "credit_mode": [ + "vec", + "vec", + "vec", + "vec", + "vec", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa" + ] + }, + "DFA_then_Vec_T20": { + "test_acc": [ + 0.295, + 0.3008, + 0.2999, + 0.3036, + 0.2969, + 0.2926, + 0.297, + 0.2885, + 0.3032, + 0.305, + 0.2875, + 0.2933, + 0.3094, + 0.3185, + 0.3048, + 0.3115, + 0.3062, + 0.3146, + 0.316, + 0.3075, + 0.2803, + 0.2917, + 0.2675, + 0.2394, + 0.226, + 0.2063, + 0.2114, + 0.1997, + 0.1856, + 0.191, + 0.1851, + 0.1915, + 0.1521, + 0.1629, + 0.168, + 0.1427, + 0.1524, + 0.1662, + 0.1455, + 0.1507, + 0.1395, + 0.137, + 0.1361, + 0.1261, + 0.1285, + 0.1463, + 0.1479, + 0.132, + 0.1411, + 0.1191, + 0.1512, + 0.1275, + 0.1285, + 0.1329, + 0.1374, + 0.1216, + 0.1379, + 0.1401, + 0.1329, + 0.1377, + 0.1391, + 0.1242, + 0.1266, + 0.1227, + 0.1263, + 0.1356, + 0.1279, + 0.1338, + 0.138, + 0.1367, + 0.1305, + 0.1318, + 0.1333, + 0.1303, + 0.1144, + 0.1324, + 0.1209, + 0.125, + 0.1282, + 0.1338, + 0.1231, + 0.1127, + 0.1114, + 0.113, + 0.1203, + 0.1327, + 0.1261, + 0.122, + 0.1236, + 0.1285, + 0.1322, + 0.1196, + 0.1334, + 0.1232, + 0.1299, + 0.1242, + 0.1263, + 0.1279, + 0.1277, + 0.1287 + ], + "train_loss": [ + 2.037675617980957, + 2.0064356870269777, + 2.0028278520202636, + 1.9938254058074951, + 1.9946035711669923, + 1.9902986218643188, + 1.995398818092346, + 1.9927714242553711, + 1.9901552920150758, + 1.9906873265075684, + 1.9907922621154786, + 1.9868914079284667, + 1.9886361977386475, + 1.9898803197860717, + 1.990440476951599, + 1.9894216409683227, + 1.987988814430237, + 1.9897864045715332, + 1.9920248303222656, + 1.9888737732696533, + 1.9968967604064942, + 2.0292881615448, + 2.0572906255340575, + 2.077139948272705, + 2.0960366818237306, + 2.114029185333252, + 2.131741167678833, + 2.1515163647460938, + 2.176086215057373, + 2.1996909393310546, + 2.217218240814209, + 2.23117594909668, + 2.238064839477539, + 2.249375128707886, + 2.2556267765808107, + 2.26151417388916, + 2.2651724644470215, + 2.265959970703125, + 2.27016633972168, + 2.2720786261749266, + 2.2715141209411622, + 2.274042503738403, + 2.2748033888244628, + 2.2756617915344237, + 2.2777460805511476, + 2.278391381225586, + 2.278936449432373, + 2.279348678741455, + 2.2798245948028564, + 2.2807802611541748, + 2.2792558080291747, + 2.280216985397339, + 2.2800197692108153, + 2.2809994650268557, + 2.278570050125122, + 2.280403848114014, + 2.2789685863494875, + 2.2798360344696045, + 2.2798763256835937, + 2.281446952972412, + 2.2817236529541014, + 2.280389738922119, + 2.281321027832031, + 2.2819569556427, + 2.282185596847534, + 2.282026661605835, + 2.281688220977783, + 2.2820052515411375, + 2.2816655310058596, + 2.2814247926330564, + 2.280900322418213, + 2.2797810842132566, + 2.2795222138214113, + 2.2794141696166994, + 2.2806855924987794, + 2.278733377609253, + 2.2787368045043945, + 2.279600267791748, + 2.2789700255584715, + 2.278726199417114, + 2.278205829925537, + 2.279039300994873, + 2.278037849807739, + 2.277773072967529, + 2.2775722401428222, + 2.2774807459259034, + 2.2776698320007323, + 2.2777703384399413, + 2.2781166757202147, + 2.2771295314025877, + 2.277872585296631, + 2.2769374592590332, + 2.2766968826293947, + 2.2768497592163084, + 2.2770231059265136, + 2.277113390045166, + 2.277193347091675, + 2.277010828704834, + 2.2768144338989256, + 2.2769637632751465 + ], + "gamma": [ + [ + 1, + 0.08253364491974935 + ], + [ + 2, + 0.08030614303424954 + ], + [ + 3, + 0.07973816274898127 + ], + [ + 4, + 0.08138106123078614 + ], + [ + 5, + 0.07910246076062322 + ], + [ + 10, + 0.08214855077676475 + ], + [ + 15, + 0.08803309267386794 + ], + [ + 20, + 0.09171900944784284 + ], + [ + 25, + 0.0009018457494676113 + ], + [ + 30, + -0.00458292686380446 + ], + [ + 35, + -0.0025702748098410666 + ], + [ + 40, + 0.0004998000513296574 + ], + [ + 45, + 0.0005651051906170323 + ], + [ + 50, + 0.0014650520424766 + ], + [ + 55, + 0.0009007407788885757 + ], + [ + 60, + -0.0015334555755543988 + ], + [ + 65, + 0.0011901014040631708 + ], + [ + 70, + -0.00016616168431937695 + ], + [ + 75, + -0.0011160390986333368 + ], + [ + 80, + -0.00010166734682570677 + ], + [ + 85, + -0.0058146035589743406 + ], + [ + 90, + -0.0026303481754439417 + ], + [ + 95, + 0.0007478901497961488 + ], + [ + 100, + 9.711093844089191e-05 + ] + ], + "rho": [ + [ + 1, + 0.025695246877148747 + ], + [ + 2, + 0.04557160963304341 + ], + [ + 3, + 0.021262050315272063 + ], + [ + 4, + 0.010289260419085622 + ], + [ + 5, + 0.02755167754366994 + ], + [ + 10, + -0.007250833325088024 + ], + [ + 15, + 0.008991335984319448 + ], + [ + 20, + 0.0010940518695861101 + ], + [ + 25, + -0.002270966302603483 + ], + [ + 30, + -0.002854343270882964 + ], + [ + 35, + -0.010588094592094421 + ], + [ + 40, + -0.002963454695418477 + ], + [ + 45, + 0.0015342015540227294 + ], + [ + 50, + 0.006793119478970766 + ], + [ + 55, + -0.010497457347810268 + ], + [ + 60, + -0.01288906205445528 + ], + [ + 65, + -0.0011845249682664871 + ], + [ + 70, + 0.009265268221497536 + ], + [ + 75, + 0.0060013351030647755 + ], + [ + 80, + -0.0006598809268325567 + ], + [ + 85, + -0.004816773347556591 + ], + [ + 90, + 0.015165997669100761 + ], + [ + 95, + -0.003314492292702198 + ], + [ + 100, + -0.01596011593937874 + ] + ], + "credit_mode": [ + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "dfa", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec", + "vec" + ] + } +} \ No newline at end of file diff --git a/results/snapshot_evolution_v2/run_s123.log b/results/snapshot_evolution_v2/run_s123.log new file mode 100644 index 0000000..c95da11 --- /dev/null +++ b/results/snapshot_evolution_v2/run_s123.log @@ -0,0 +1,210 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=123 +eval buffer: torch.Size([1024, 3072]) + +=== BP training === + [BP] Ep 0: ||h||_med=[8.690464973449707, 8.719978332519531, 8.73093318939209, 8.75937271118164, 8.790542602539062] ||g||_med=[0.0009977436857298017, 0.000992251792922616, 0.0009848480112850666, 0.0009761073160916567, 0.0009735578205436468] acc=0.0957 + [BP] Ep 1: ||h_L||=9.978e+01 ||g_2||=4.975e-05 acc=0.3965 + [BP] Ep 2: ||h_L||=1.189e+02 ||g_2||=4.264e-05 acc=0.4541 + [BP] Ep 3: ||h_L||=1.329e+02 ||g_2||=4.065e-05 acc=0.4814 + [BP] Ep 4: ||h_L||=1.422e+02 ||g_2||=4.144e-05 acc=0.4971 + [BP] Ep 5: ||h_L||=1.551e+02 ||g_2||=3.945e-05 acc=0.5078 + [BP] Ep 6: ||h_L||=1.671e+02 ||g_2||=3.917e-05 acc=0.5254 + [BP] Ep 7: ||h_L||=1.775e+02 ||g_2||=3.777e-05 acc=0.5156 + [BP] Ep 8: ||h_L||=1.825e+02 ||g_2||=3.695e-05 acc=0.5488 + [BP] Ep 9: ||h_L||=1.888e+02 ||g_2||=3.632e-05 acc=0.5430 + [BP] Ep 10: ||h_L||=1.954e+02 ||g_2||=3.601e-05 acc=0.5449 + [BP] Ep 11: ||h_L||=2.015e+02 ||g_2||=3.606e-05 acc=0.5557 + [BP] Ep 12: ||h_L||=2.081e+02 ||g_2||=3.473e-05 acc=0.5469 + [BP] Ep 13: ||h_L||=2.115e+02 ||g_2||=3.705e-05 acc=0.5332 + [BP] Ep 14: ||h_L||=2.165e+02 ||g_2||=3.531e-05 acc=0.5596 + [BP] Ep 15: ||h_L||=2.242e+02 ||g_2||=3.455e-05 acc=0.5615 + [BP] Ep 16: ||h_L||=2.239e+02 ||g_2||=3.574e-05 acc=0.5479 + [BP] Ep 17: ||h_L||=2.286e+02 ||g_2||=3.507e-05 acc=0.5498 + [BP] Ep 18: ||h_L||=2.338e+02 ||g_2||=3.669e-05 acc=0.5596 + [BP] Ep 19: ||h_L||=2.371e+02 ||g_2||=3.521e-05 acc=0.5605 + [BP] Ep 20: ||h_L||=2.396e+02 ||g_2||=3.595e-05 acc=0.5605 + [BP] Ep 21: ||h_L||=2.379e+02 ||g_2||=3.605e-05 acc=0.5781 + [BP] Ep 22: ||h_L||=2.430e+02 ||g_2||=3.571e-05 acc=0.5713 + [BP] Ep 23: ||h_L||=2.449e+02 ||g_2||=3.564e-05 acc=0.5586 + [BP] Ep 24: ||h_L||=2.481e+02 ||g_2||=3.683e-05 acc=0.5732 + [BP] Ep 25: ||h_L||=2.495e+02 ||g_2||=3.712e-05 acc=0.5771 + [BP] Ep 26: ||h_L||=2.474e+02 ||g_2||=3.760e-05 acc=0.5576 + [BP] Ep 27: ||h_L||=2.503e+02 ||g_2||=3.739e-05 acc=0.5635 + [BP] Ep 28: ||h_L||=2.517e+02 ||g_2||=3.695e-05 acc=0.5820 + [BP] Ep 29: ||h_L||=2.538e+02 ||g_2||=3.717e-05 acc=0.5771 + [BP] Ep 30: ||h_L||=2.501e+02 ||g_2||=3.752e-05 acc=0.5859 + [BP] Ep 31: ||h_L||=2.547e+02 ||g_2||=3.807e-05 acc=0.5850 + [BP] Ep 32: ||h_L||=2.542e+02 ||g_2||=3.772e-05 acc=0.5781 + [BP] Ep 33: ||h_L||=2.557e+02 ||g_2||=3.840e-05 acc=0.5713 + [BP] Ep 34: ||h_L||=2.555e+02 ||g_2||=3.730e-05 acc=0.5840 + [BP] Ep 35: ||h_L||=2.532e+02 ||g_2||=3.882e-05 acc=0.5986 + [BP] Ep 36: ||h_L||=2.578e+02 ||g_2||=3.771e-05 acc=0.5938 + [BP] Ep 37: ||h_L||=2.531e+02 ||g_2||=3.926e-05 acc=0.5869 + [BP] Ep 38: ||h_L||=2.559e+02 ||g_2||=3.848e-05 acc=0.5918 + [BP] Ep 39: ||h_L||=2.531e+02 ||g_2||=3.982e-05 acc=0.5762 + [BP] Ep 40: ||h_L||=2.516e+02 ||g_2||=3.895e-05 acc=0.5967 + [BP] Ep 41: ||h_L||=2.502e+02 ||g_2||=4.041e-05 acc=0.5967 + [BP] Ep 42: ||h_L||=2.541e+02 ||g_2||=4.035e-05 acc=0.5830 + [BP] Ep 43: ||h_L||=2.494e+02 ||g_2||=4.104e-05 acc=0.5830 + [BP] Ep 44: ||h_L||=2.519e+02 ||g_2||=4.092e-05 acc=0.5957 + [BP] Ep 45: ||h_L||=2.514e+02 ||g_2||=4.053e-05 acc=0.5732 + [BP] Ep 46: ||h_L||=2.462e+02 ||g_2||=4.221e-05 acc=0.6006 + [BP] Ep 47: ||h_L||=2.463e+02 ||g_2||=4.183e-05 acc=0.5996 + [BP] Ep 48: ||h_L||=2.455e+02 ||g_2||=4.155e-05 acc=0.6123 + [BP] Ep 49: ||h_L||=2.429e+02 ||g_2||=4.260e-05 acc=0.6006 + [BP] Ep 50: ||h_L||=2.424e+02 ||g_2||=4.242e-05 acc=0.5996 + [BP] Ep 51: ||h_L||=2.412e+02 ||g_2||=4.383e-05 acc=0.6104 + [BP] Ep 52: ||h_L||=2.402e+02 ||g_2||=4.466e-05 acc=0.6143 + [BP] Ep 53: ||h_L||=2.413e+02 ||g_2||=4.137e-05 acc=0.6152 + [BP] Ep 54: ||h_L||=2.388e+02 ||g_2||=4.456e-05 acc=0.6045 + [BP] Ep 55: ||h_L||=2.360e+02 ||g_2||=4.567e-05 acc=0.6025 + [BP] Ep 56: ||h_L||=2.356e+02 ||g_2||=4.226e-05 acc=0.6016 + [BP] Ep 57: ||h_L||=2.325e+02 ||g_2||=4.733e-05 acc=0.6016 + [BP] Ep 58: ||h_L||=2.322e+02 ||g_2||=4.771e-05 acc=0.6064 + [BP] Ep 59: ||h_L||=2.294e+02 ||g_2||=4.590e-05 acc=0.6143 + [BP] Ep 60: ||h_L||=2.299e+02 ||g_2||=4.810e-05 acc=0.6094 + [BP] Ep 61: ||h_L||=2.278e+02 ||g_2||=4.667e-05 acc=0.6045 + [BP] Ep 62: ||h_L||=2.248e+02 ||g_2||=4.761e-05 acc=0.6250 + [BP] Ep 63: ||h_L||=2.245e+02 ||g_2||=4.977e-05 acc=0.6162 + [BP] Ep 64: ||h_L||=2.243e+02 ||g_2||=4.972e-05 acc=0.6172 + [BP] Ep 65: ||h_L||=2.235e+02 ||g_2||=5.078e-05 acc=0.6113 + [BP] Ep 66: ||h_L||=2.205e+02 ||g_2||=4.961e-05 acc=0.6152 + [BP] Ep 67: ||h_L||=2.206e+02 ||g_2||=5.191e-05 acc=0.6104 + [BP] Ep 68: ||h_L||=2.189e+02 ||g_2||=5.423e-05 acc=0.6201 + [BP] Ep 69: ||h_L||=2.179e+02 ||g_2||=5.145e-05 acc=0.6152 + [BP] Ep 70: ||h_L||=2.163e+02 ||g_2||=5.319e-05 acc=0.6240 + [BP] Ep 71: ||h_L||=2.147e+02 ||g_2||=5.234e-05 acc=0.6094 + [BP] Ep 72: ||h_L||=2.142e+02 ||g_2||=5.207e-05 acc=0.6152 + [BP] Ep 73: ||h_L||=2.134e+02 ||g_2||=5.509e-05 acc=0.6152 + [BP] Ep 74: ||h_L||=2.122e+02 ||g_2||=5.333e-05 acc=0.6240 + [BP] Ep 75: ||h_L||=2.118e+02 ||g_2||=5.394e-05 acc=0.6143 + [BP] Ep 76: ||h_L||=2.104e+02 ||g_2||=5.282e-05 acc=0.6152 + [BP] Ep 77: ||h_L||=2.102e+02 ||g_2||=5.367e-05 acc=0.6182 + [BP] Ep 78: ||h_L||=2.086e+02 ||g_2||=5.341e-05 acc=0.6152 + [BP] Ep 79: ||h_L||=2.073e+02 ||g_2||=5.365e-05 acc=0.6113 + [BP] Ep 80: ||h_L||=2.062e+02 ||g_2||=5.509e-05 acc=0.6250 + [BP] Ep 81: ||h_L||=2.058e+02 ||g_2||=5.582e-05 acc=0.6221 + [BP] Ep 82: ||h_L||=2.049e+02 ||g_2||=5.464e-05 acc=0.6211 + [BP] Ep 83: ||h_L||=2.050e+02 ||g_2||=5.509e-05 acc=0.6143 + [BP] Ep 84: ||h_L||=2.043e+02 ||g_2||=5.509e-05 acc=0.6172 + [BP] Ep 85: ||h_L||=2.038e+02 ||g_2||=5.545e-05 acc=0.6191 + [BP] Ep 86: ||h_L||=2.032e+02 ||g_2||=5.440e-05 acc=0.6182 + [BP] Ep 87: ||h_L||=2.028e+02 ||g_2||=5.385e-05 acc=0.6221 + [BP] Ep 88: ||h_L||=2.031e+02 ||g_2||=5.425e-05 acc=0.6133 + [BP] Ep 89: ||h_L||=2.028e+02 ||g_2||=5.523e-05 acc=0.6162 + [BP] Ep 90: ||h_L||=2.022e+02 ||g_2||=5.593e-05 acc=0.6143 + [BP] Ep 91: ||h_L||=2.018e+02 ||g_2||=5.575e-05 acc=0.6191 + [BP] Ep 92: ||h_L||=2.019e+02 ||g_2||=5.540e-05 acc=0.6260 + [BP] Ep 93: ||h_L||=2.017e+02 ||g_2||=5.625e-05 acc=0.6211 + [BP] Ep 94: ||h_L||=2.018e+02 ||g_2||=5.597e-05 acc=0.6191 + [BP] Ep 95: ||h_L||=2.015e+02 ||g_2||=5.523e-05 acc=0.6201 + [BP] Ep 96: ||h_L||=2.015e+02 ||g_2||=5.587e-05 acc=0.6201 + [BP] Ep 97: ||h_L||=2.013e+02 ||g_2||=5.605e-05 acc=0.6191 + [BP] Ep 98: ||h_L||=2.013e+02 ||g_2||=5.599e-05 acc=0.6182 + [BP] Ep 99: ||h_L||=2.013e+02 ||g_2||=5.587e-05 acc=0.6182 + [BP] Ep 100: ||h_L||=2.013e+02 ||g_2||=5.585e-05 acc=0.6182 + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.690464973449707, 8.719978332519531, 8.73093318939209, 8.75937271118164, 8.790542602539062] ||g||_med=[0.0009977436857298017, 0.000992251792922616, 0.0009848480112850666, 0.0009761073160916567, 0.0009735578205436468] acc=0.0957 + [DFA] Ep 1: ||h_L||=6.963e+03 ||g_2||=1.315e-06 acc=0.3037 gamma_dfa=0.1066 + [DFA] Ep 2: ||h_L||=4.538e+04 ||g_2||=2.744e-07 acc=0.2930 gamma_dfa=0.1079 + [DFA] Ep 3: ||h_L||=1.244e+05 ||g_2||=1.145e-07 acc=0.3184 gamma_dfa=0.1085 + [DFA] Ep 4: ||h_L||=2.575e+05 ||g_2||=6.308e-08 acc=0.3174 gamma_dfa=0.1099 + [DFA] Ep 5: ||h_L||=4.700e+05 ||g_2||=3.892e-08 acc=0.3018 gamma_dfa=0.1084 + [DFA] Ep 6: ||h_L||=7.631e+05 ||g_2||=2.684e-08 acc=0.3096 gamma_dfa=0.1113 + [DFA] Ep 7: ||h_L||=1.163e+06 ||g_2||=1.897e-08 acc=0.3076 gamma_dfa=0.1105 + [DFA] Ep 8: ||h_L||=1.694e+06 ||g_2||=1.405e-08 acc=0.2979 gamma_dfa=0.1125 + [DFA] Ep 9: ||h_L||=2.356e+06 ||g_2||=1.107e-08 acc=0.3008 gamma_dfa=0.1132 + [DFA] Ep 10: ||h_L||=3.180e+06 ||g_2||=8.519e-09 acc=0.3086 gamma_dfa=0.1150 + [DFA] Ep 11: ||h_L||=4.215e+06 ||g_2||=7.026e-09 acc=0.3086 gamma_dfa=0.1165 + [DFA] Ep 12: ||h_L||=5.347e+06 ||g_2||=5.839e-09 acc=0.3047 gamma_dfa=0.1147 + [DFA] Ep 13: ||h_L||=6.688e+06 ||g_2||=4.985e-09 acc=0.2910 gamma_dfa=0.1138 + [DFA] Ep 14: ||h_L||=8.171e+06 ||g_2||=4.288e-09 acc=0.3086 gamma_dfa=0.1140 + [DFA] Ep 15: ||h_L||=9.891e+06 ||g_2||=3.811e-09 acc=0.3193 gamma_dfa=0.1132 + [DFA] Ep 16: ||h_L||=1.192e+07 ||g_2||=3.389e-09 acc=0.3066 gamma_dfa=0.1128 + [DFA] Ep 17: ||h_L||=1.402e+07 ||g_2||=3.017e-09 acc=0.3203 gamma_dfa=0.1126 + [DFA] Ep 18: ||h_L||=1.638e+07 ||g_2||=2.734e-09 acc=0.3154 gamma_dfa=0.1125 + [DFA] Ep 19: ||h_L||=1.904e+07 ||g_2||=2.466e-09 acc=0.3125 gamma_dfa=0.1116 + [DFA] Ep 20: ||h_L||=2.215e+07 ||g_2||=2.232e-09 acc=0.3096 gamma_dfa=0.1132 + [DFA] Ep 21: ||h_L||=2.519e+07 ||g_2||=2.051e-09 acc=0.3105 gamma_dfa=0.1127 + [DFA] Ep 22: ||h_L||=2.868e+07 ||g_2||=1.908e-09 acc=0.3105 gamma_dfa=0.1127 + [DFA] Ep 23: ||h_L||=3.257e+07 ||g_2||=1.751e-09 acc=0.3115 gamma_dfa=0.1119 + [DFA] Ep 24: ||h_L||=3.662e+07 ||g_2||=1.659e-09 acc=0.2979 gamma_dfa=0.1130 + [DFA] Ep 25: ||h_L||=4.115e+07 ||g_2||=1.500e-09 acc=0.2988 gamma_dfa=0.1120 + [DFA] Ep 26: ||h_L||=4.573e+07 ||g_2||=1.410e-09 acc=0.3115 gamma_dfa=0.1125 + [DFA] Ep 27: ||h_L||=5.048e+07 ||g_2||=1.332e-09 acc=0.2979 gamma_dfa=0.1115 + [DFA] Ep 28: ||h_L||=5.555e+07 ||g_2||=1.238e-09 acc=0.3193 gamma_dfa=0.1129 + [DFA] Ep 29: ||h_L||=6.069e+07 ||g_2||=1.189e-09 acc=0.3115 gamma_dfa=0.1119 + [DFA] Ep 30: ||h_L||=6.627e+07 ||g_2||=1.112e-09 acc=0.3125 gamma_dfa=0.1132 + [DFA] Ep 31: ||h_L||=7.196e+07 ||g_2||=1.059e-09 acc=0.3164 gamma_dfa=0.1123 + [DFA] Ep 32: ||h_L||=7.798e+07 ||g_2||=1.019e-09 acc=0.3145 gamma_dfa=0.1149 + [DFA] Ep 33: ||h_L||=8.452e+07 ||g_2||=9.572e-10 acc=0.3125 gamma_dfa=0.1125 + [DFA] Ep 34: ||h_L||=9.103e+07 ||g_2||=9.307e-10 acc=0.3125 gamma_dfa=0.1113 + [DFA] Ep 35: ||h_L||=9.773e+07 ||g_2||=8.747e-10 acc=0.3145 gamma_dfa=0.1136 + [DFA] Ep 36: ||h_L||=1.044e+08 ||g_2||=8.507e-10 acc=0.3291 gamma_dfa=0.1130 + [DFA] Ep 37: ||h_L||=1.115e+08 ||g_2||=8.077e-10 acc=0.3223 gamma_dfa=0.1129 + [DFA] Ep 38: ||h_L||=1.189e+08 ||g_2||=7.702e-10 acc=0.3047 gamma_dfa=0.1119 + [DFA] Ep 39: ||h_L||=1.265e+08 ||g_2||=7.407e-10 acc=0.3076 gamma_dfa=0.1119 + [DFA] Ep 40: ||h_L||=1.339e+08 ||g_2||=7.212e-10 acc=0.3291 gamma_dfa=0.1127 + [DFA] Ep 41: ||h_L||=1.419e+08 ||g_2||=7.015e-10 acc=0.3135 gamma_dfa=0.1130 + [DFA] Ep 42: ||h_L||=1.489e+08 ||g_2||=6.850e-10 acc=0.3145 gamma_dfa=0.1141 + [DFA] Ep 43: ||h_L||=1.566e+08 ||g_2||=6.554e-10 acc=0.3037 gamma_dfa=0.1121 + [DFA] Ep 44: ||h_L||=1.642e+08 ||g_2||=6.278e-10 acc=0.3174 gamma_dfa=0.1122 + [DFA] Ep 45: ||h_L||=1.716e+08 ||g_2||=6.384e-10 acc=0.3135 gamma_dfa=0.1135 + [DFA] Ep 46: ||h_L||=1.797e+08 ||g_2||=6.071e-10 acc=0.3213 gamma_dfa=0.1132 + [DFA] Ep 47: ||h_L||=1.878e+08 ||g_2||=5.891e-10 acc=0.3193 gamma_dfa=0.1123 + [DFA] Ep 48: ||h_L||=1.953e+08 ||g_2||=5.688e-10 acc=0.3252 gamma_dfa=0.1129 + [DFA] Ep 49: ||h_L||=2.031e+08 ||g_2||=5.532e-10 acc=0.3125 gamma_dfa=0.1124 + [DFA] Ep 50: ||h_L||=2.104e+08 ||g_2||=5.600e-10 acc=0.3301 gamma_dfa=0.1123 + [DFA] Ep 51: ||h_L||=2.182e+08 ||g_2||=5.298e-10 acc=0.3281 gamma_dfa=0.1118 + [DFA] Ep 52: ||h_L||=2.259e+08 ||g_2||=5.174e-10 acc=0.3301 gamma_dfa=0.1122 + [DFA] Ep 53: ||h_L||=2.336e+08 ||g_2||=5.160e-10 acc=0.3145 gamma_dfa=0.1123 + [DFA] Ep 54: ||h_L||=2.410e+08 ||g_2||=4.967e-10 acc=0.3320 gamma_dfa=0.1130 + [DFA] Ep 55: ||h_L||=2.485e+08 ||g_2||=4.874e-10 acc=0.3135 gamma_dfa=0.1126 + [DFA] Ep 56: ||h_L||=2.558e+08 ||g_2||=4.891e-10 acc=0.3145 gamma_dfa=0.1122 + [DFA] Ep 57: ||h_L||=2.627e+08 ||g_2||=4.827e-10 acc=0.3086 gamma_dfa=0.1129 + [DFA] Ep 58: ||h_L||=2.695e+08 ||g_2||=4.729e-10 acc=0.3301 gamma_dfa=0.1125 + [DFA] Ep 59: ||h_L||=2.762e+08 ||g_2||=4.574e-10 acc=0.3184 gamma_dfa=0.1127 + [DFA] Ep 60: ||h_L||=2.830e+08 ||g_2||=4.554e-10 acc=0.3125 gamma_dfa=0.1119 + [DFA] Ep 61: ||h_L||=2.893e+08 ||g_2||=4.464e-10 acc=0.3281 gamma_dfa=0.1126 + [DFA] Ep 62: ||h_L||=2.955e+08 ||g_2||=4.414e-10 acc=0.3145 gamma_dfa=0.1131 + [DFA] Ep 63: ||h_L||=3.015e+08 ||g_2||=4.405e-10 acc=0.3096 gamma_dfa=0.1133 + [DFA] Ep 64: ||h_L||=3.073e+08 ||g_2||=4.325e-10 acc=0.3125 gamma_dfa=0.1122 + [DFA] Ep 65: ||h_L||=3.130e+08 ||g_2||=4.353e-10 acc=0.3096 gamma_dfa=0.1132 + [DFA] Ep 66: ||h_L||=3.181e+08 ||g_2||=4.252e-10 acc=0.3164 gamma_dfa=0.1139 + [DFA] Ep 67: ||h_L||=3.232e+08 ||g_2||=4.156e-10 acc=0.3252 gamma_dfa=0.1130 + [DFA] Ep 68: ||h_L||=3.281e+08 ||g_2||=4.153e-10 acc=0.3223 gamma_dfa=0.1126 + [DFA] Ep 69: ||h_L||=3.328e+08 ||g_2||=4.167e-10 acc=0.3135 gamma_dfa=0.1135 + [DFA] Ep 70: ||h_L||=3.372e+08 ||g_2||=4.081e-10 acc=0.3115 gamma_dfa=0.1126 + [DFA] Ep 71: ||h_L||=3.416e+08 ||g_2||=4.053e-10 acc=0.3291 gamma_dfa=0.1126 + [DFA] Ep 72: ||h_L||=3.459e+08 ||g_2||=4.016e-10 acc=0.3096 gamma_dfa=0.1123 + [DFA] Ep 73: ||h_L||=3.497e+08 ||g_2||=3.978e-10 acc=0.3271 gamma_dfa=0.1132 + [DFA] Ep 74: ||h_L||=3.534e+08 ||g_2||=3.977e-10 acc=0.3057 gamma_dfa=0.1133 + [DFA] Ep 75: ||h_L||=3.566e+08 ||g_2||=3.958e-10 acc=0.3164 gamma_dfa=0.1127 + [DFA] Ep 76: ||h_L||=3.599e+08 ||g_2||=3.876e-10 acc=0.3242 gamma_dfa=0.1130 + [DFA] Ep 77: ||h_L||=3.629e+08 ||g_2||=3.873e-10 acc=0.3203 gamma_dfa=0.1131 + [DFA] Ep 78: ||h_L||=3.655e+08 ||g_2||=3.905e-10 acc=0.3145 gamma_dfa=0.1124 + [DFA] Ep 79: ||h_L||=3.682e+08 ||g_2||=3.866e-10 acc=0.3223 gamma_dfa=0.1131 + [DFA] Ep 80: ||h_L||=3.704e+08 ||g_2||=3.851e-10 acc=0.3252 gamma_dfa=0.1127 + [DFA] Ep 81: ||h_L||=3.724e+08 ||g_2||=3.836e-10 acc=0.3193 gamma_dfa=0.1128 + [DFA] Ep 82: ||h_L||=3.744e+08 ||g_2||=3.824e-10 acc=0.3262 gamma_dfa=0.1131 + [DFA] Ep 83: ||h_L||=3.761e+08 ||g_2||=3.835e-10 acc=0.3213 gamma_dfa=0.1129 + [DFA] Ep 84: ||h_L||=3.776e+08 ||g_2||=3.808e-10 acc=0.3184 gamma_dfa=0.1127 + [DFA] Ep 85: ||h_L||=3.790e+08 ||g_2||=3.804e-10 acc=0.3281 gamma_dfa=0.1129 + [DFA] Ep 86: ||h_L||=3.802e+08 ||g_2||=3.807e-10 acc=0.3154 gamma_dfa=0.1129 + [DFA] Ep 87: ||h_L||=3.812e+08 ||g_2||=3.793e-10 acc=0.3223 gamma_dfa=0.1128 + [DFA] Ep 88: ||h_L||=3.822e+08 ||g_2||=3.791e-10 acc=0.3184 gamma_dfa=0.1127 + [DFA] Ep 89: ||h_L||=3.830e+08 ||g_2||=3.775e-10 acc=0.3184 gamma_dfa=0.1129 + [DFA] Ep 90: ||h_L||=3.836e+08 ||g_2||=3.760e-10 acc=0.3262 gamma_dfa=0.1129 + [DFA] Ep 91: ||h_L||=3.841e+08 ||g_2||=3.769e-10 acc=0.3223 gamma_dfa=0.1128 + [DFA] Ep 92: ||h_L||=3.846e+08 ||g_2||=3.753e-10 acc=0.3184 gamma_dfa=0.1129 + [DFA] Ep 93: ||h_L||=3.849e+08 ||g_2||=3.765e-10 acc=0.3223 gamma_dfa=0.1129 + [DFA] Ep 94: ||h_L||=3.852e+08 ||g_2||=3.751e-10 acc=0.3184 gamma_dfa=0.1128 + [DFA] Ep 95: ||h_L||=3.854e+08 ||g_2||=3.753e-10 acc=0.3242 gamma_dfa=0.1129 + [DFA] Ep 96: ||h_L||=3.855e+08 ||g_2||=3.759e-10 acc=0.3203 gamma_dfa=0.1129 + [DFA] Ep 97: ||h_L||=3.856e+08 ||g_2||=3.758e-10 acc=0.3213 gamma_dfa=0.1129 + [DFA] Ep 98: ||h_L||=3.856e+08 ||g_2||=3.755e-10 acc=0.3203 gamma_dfa=0.1128 + [DFA] Ep 99: ||h_L||=3.857e+08 ||g_2||=3.755e-10 acc=0.3203 gamma_dfa=0.1128 + [DFA] Ep 100: ||h_L||=3.857e+08 ||g_2||=3.755e-10 acc=0.3203 gamma_dfa=0.1128 + +Saved results/snapshot_evolution_v2/snapshot_evolution_s123.json diff --git a/results/snapshot_evolution_v2/run_s42.log b/results/snapshot_evolution_v2/run_s42.log new file mode 100644 index 0000000..c764a8a --- /dev/null +++ b/results/snapshot_evolution_v2/run_s42.log @@ -0,0 +1,210 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=42 +eval buffer: torch.Size([1024, 3072]) + +=== BP training === + [BP] Ep 0: ||h||_med=[8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652] ||g||_med=[0.0010068593546748161, 0.000997236929833889, 0.0009934091940522194, 0.0009870644425973296, 0.0009829498594626784] acc=0.1152 + [BP] Ep 1: ||h_L||=9.381e+01 ||g_2||=5.500e-05 acc=0.3799 + [BP] Ep 2: ||h_L||=1.127e+02 ||g_2||=4.286e-05 acc=0.4541 + [BP] Ep 3: ||h_L||=1.245e+02 ||g_2||=4.270e-05 acc=0.4697 + [BP] Ep 4: ||h_L||=1.381e+02 ||g_2||=3.917e-05 acc=0.5039 + [BP] Ep 5: ||h_L||=1.489e+02 ||g_2||=3.916e-05 acc=0.4980 + [BP] Ep 6: ||h_L||=1.566e+02 ||g_2||=3.970e-05 acc=0.5234 + [BP] Ep 7: ||h_L||=1.659e+02 ||g_2||=3.728e-05 acc=0.5283 + [BP] Ep 8: ||h_L||=1.769e+02 ||g_2||=3.801e-05 acc=0.5410 + [BP] Ep 9: ||h_L||=1.814e+02 ||g_2||=3.649e-05 acc=0.5479 + [BP] Ep 10: ||h_L||=1.932e+02 ||g_2||=3.432e-05 acc=0.5664 + [BP] Ep 11: ||h_L||=1.958e+02 ||g_2||=3.381e-05 acc=0.5605 + [BP] Ep 12: ||h_L||=2.009e+02 ||g_2||=3.576e-05 acc=0.5459 + [BP] Ep 13: ||h_L||=2.073e+02 ||g_2||=3.389e-05 acc=0.5664 + [BP] Ep 14: ||h_L||=2.116e+02 ||g_2||=3.384e-05 acc=0.5664 + [BP] Ep 15: ||h_L||=2.138e+02 ||g_2||=3.492e-05 acc=0.5645 + [BP] Ep 16: ||h_L||=2.191e+02 ||g_2||=3.474e-05 acc=0.5742 + [BP] Ep 17: ||h_L||=2.209e+02 ||g_2||=3.491e-05 acc=0.5605 + [BP] Ep 18: ||h_L||=2.229e+02 ||g_2||=3.655e-05 acc=0.5557 + [BP] Ep 19: ||h_L||=2.255e+02 ||g_2||=3.763e-05 acc=0.5576 + [BP] Ep 20: ||h_L||=2.298e+02 ||g_2||=3.622e-05 acc=0.5635 + [BP] Ep 21: ||h_L||=2.360e+02 ||g_2||=3.521e-05 acc=0.5762 + [BP] Ep 22: ||h_L||=2.371e+02 ||g_2||=3.405e-05 acc=0.5879 + [BP] Ep 23: ||h_L||=2.383e+02 ||g_2||=3.356e-05 acc=0.5732 + [BP] Ep 24: ||h_L||=2.395e+02 ||g_2||=3.540e-05 acc=0.5723 + [BP] Ep 25: ||h_L||=2.381e+02 ||g_2||=3.570e-05 acc=0.5703 + [BP] Ep 26: ||h_L||=2.415e+02 ||g_2||=3.454e-05 acc=0.5791 + [BP] Ep 27: ||h_L||=2.422e+02 ||g_2||=3.610e-05 acc=0.5859 + [BP] Ep 28: ||h_L||=2.482e+02 ||g_2||=3.596e-05 acc=0.5811 + [BP] Ep 29: ||h_L||=2.454e+02 ||g_2||=3.742e-05 acc=0.5889 + [BP] Ep 30: ||h_L||=2.486e+02 ||g_2||=3.551e-05 acc=0.5742 + [BP] Ep 31: ||h_L||=2.451e+02 ||g_2||=3.772e-05 acc=0.5723 + [BP] Ep 32: ||h_L||=2.486e+02 ||g_2||=3.777e-05 acc=0.5762 + [BP] Ep 33: ||h_L||=2.471e+02 ||g_2||=3.571e-05 acc=0.5947 + [BP] Ep 34: ||h_L||=2.466e+02 ||g_2||=3.732e-05 acc=0.5996 + [BP] Ep 35: ||h_L||=2.483e+02 ||g_2||=3.716e-05 acc=0.5830 + [BP] Ep 36: ||h_L||=2.487e+02 ||g_2||=3.804e-05 acc=0.5820 + [BP] Ep 37: ||h_L||=2.517e+02 ||g_2||=3.812e-05 acc=0.5850 + [BP] Ep 38: ||h_L||=2.503e+02 ||g_2||=3.821e-05 acc=0.5938 + [BP] Ep 39: ||h_L||=2.469e+02 ||g_2||=3.820e-05 acc=0.5898 + [BP] Ep 40: ||h_L||=2.493e+02 ||g_2||=3.795e-05 acc=0.5918 + [BP] Ep 41: ||h_L||=2.472e+02 ||g_2||=3.859e-05 acc=0.5889 + [BP] Ep 42: ||h_L||=2.489e+02 ||g_2||=4.015e-05 acc=0.5898 + [BP] Ep 43: ||h_L||=2.455e+02 ||g_2||=3.909e-05 acc=0.5986 + [BP] Ep 44: ||h_L||=2.441e+02 ||g_2||=4.048e-05 acc=0.6025 + [BP] Ep 45: ||h_L||=2.469e+02 ||g_2||=3.789e-05 acc=0.6113 + [BP] Ep 46: ||h_L||=2.438e+02 ||g_2||=4.078e-05 acc=0.5947 + [BP] Ep 47: ||h_L||=2.418e+02 ||g_2||=4.107e-05 acc=0.6064 + [BP] Ep 48: ||h_L||=2.448e+02 ||g_2||=4.023e-05 acc=0.6025 + [BP] Ep 49: ||h_L||=2.422e+02 ||g_2||=4.135e-05 acc=0.5938 + [BP] Ep 50: ||h_L||=2.404e+02 ||g_2||=4.054e-05 acc=0.5938 + [BP] Ep 51: ||h_L||=2.403e+02 ||g_2||=4.141e-05 acc=0.6055 + [BP] Ep 52: ||h_L||=2.374e+02 ||g_2||=4.512e-05 acc=0.6035 + [BP] Ep 53: ||h_L||=2.367e+02 ||g_2||=4.363e-05 acc=0.5977 + [BP] Ep 54: ||h_L||=2.351e+02 ||g_2||=4.296e-05 acc=0.6172 + [BP] Ep 55: ||h_L||=2.323e+02 ||g_2||=4.397e-05 acc=0.6006 + [BP] Ep 56: ||h_L||=2.336e+02 ||g_2||=4.373e-05 acc=0.6113 + [BP] Ep 57: ||h_L||=2.309e+02 ||g_2||=4.451e-05 acc=0.6143 + [BP] Ep 58: ||h_L||=2.279e+02 ||g_2||=4.527e-05 acc=0.6113 + [BP] Ep 59: ||h_L||=2.295e+02 ||g_2||=4.667e-05 acc=0.5928 + [BP] Ep 60: ||h_L||=2.257e+02 ||g_2||=4.720e-05 acc=0.6094 + [BP] Ep 61: ||h_L||=2.266e+02 ||g_2||=4.760e-05 acc=0.6045 + [BP] Ep 62: ||h_L||=2.230e+02 ||g_2||=4.822e-05 acc=0.6035 + [BP] Ep 63: ||h_L||=2.228e+02 ||g_2||=4.939e-05 acc=0.6094 + [BP] Ep 64: ||h_L||=2.222e+02 ||g_2||=4.937e-05 acc=0.5986 + [BP] Ep 65: ||h_L||=2.203e+02 ||g_2||=4.871e-05 acc=0.6123 + [BP] Ep 66: ||h_L||=2.196e+02 ||g_2||=5.067e-05 acc=0.6113 + [BP] Ep 67: ||h_L||=2.173e+02 ||g_2||=5.006e-05 acc=0.5898 + [BP] Ep 68: ||h_L||=2.179e+02 ||g_2||=4.987e-05 acc=0.6084 + [BP] Ep 69: ||h_L||=2.160e+02 ||g_2||=5.053e-05 acc=0.6152 + [BP] Ep 70: ||h_L||=2.133e+02 ||g_2||=5.005e-05 acc=0.6074 + [BP] Ep 71: ||h_L||=2.140e+02 ||g_2||=5.274e-05 acc=0.6113 + [BP] Ep 72: ||h_L||=2.128e+02 ||g_2||=5.268e-05 acc=0.6094 + [BP] Ep 73: ||h_L||=2.124e+02 ||g_2||=5.362e-05 acc=0.6113 + [BP] Ep 74: ||h_L||=2.106e+02 ||g_2||=5.307e-05 acc=0.6074 + [BP] Ep 75: ||h_L||=2.098e+02 ||g_2||=5.283e-05 acc=0.6201 + [BP] Ep 76: ||h_L||=2.092e+02 ||g_2||=5.413e-05 acc=0.6094 + [BP] Ep 77: ||h_L||=2.082e+02 ||g_2||=5.412e-05 acc=0.6143 + [BP] Ep 78: ||h_L||=2.077e+02 ||g_2||=5.385e-05 acc=0.6152 + [BP] Ep 79: ||h_L||=2.068e+02 ||g_2||=5.596e-05 acc=0.5996 + [BP] Ep 80: ||h_L||=2.056e+02 ||g_2||=5.548e-05 acc=0.6094 + [BP] Ep 81: ||h_L||=2.050e+02 ||g_2||=5.472e-05 acc=0.6104 + [BP] Ep 82: ||h_L||=2.042e+02 ||g_2||=5.538e-05 acc=0.6201 + [BP] Ep 83: ||h_L||=2.034e+02 ||g_2||=5.665e-05 acc=0.6035 + [BP] Ep 84: ||h_L||=2.034e+02 ||g_2||=5.529e-05 acc=0.6104 + [BP] Ep 85: ||h_L||=2.027e+02 ||g_2||=5.481e-05 acc=0.6152 + [BP] Ep 86: ||h_L||=2.026e+02 ||g_2||=5.497e-05 acc=0.6104 + [BP] Ep 87: ||h_L||=2.024e+02 ||g_2||=5.641e-05 acc=0.6084 + [BP] Ep 88: ||h_L||=2.023e+02 ||g_2||=5.639e-05 acc=0.6113 + [BP] Ep 89: ||h_L||=2.021e+02 ||g_2||=5.677e-05 acc=0.6084 + [BP] Ep 90: ||h_L||=2.022e+02 ||g_2||=5.742e-05 acc=0.6035 + [BP] Ep 91: ||h_L||=2.019e+02 ||g_2||=5.576e-05 acc=0.6113 + [BP] Ep 92: ||h_L||=2.015e+02 ||g_2||=5.681e-05 acc=0.6016 + [BP] Ep 93: ||h_L||=2.012e+02 ||g_2||=5.702e-05 acc=0.6104 + [BP] Ep 94: ||h_L||=2.011e+02 ||g_2||=5.615e-05 acc=0.6123 + [BP] Ep 95: ||h_L||=2.010e+02 ||g_2||=5.590e-05 acc=0.6084 + [BP] Ep 96: ||h_L||=2.010e+02 ||g_2||=5.641e-05 acc=0.6074 + [BP] Ep 97: ||h_L||=2.009e+02 ||g_2||=5.674e-05 acc=0.6094 + [BP] Ep 98: ||h_L||=2.009e+02 ||g_2||=5.674e-05 acc=0.6084 + [BP] Ep 99: ||h_L||=2.009e+02 ||g_2||=5.668e-05 acc=0.6094 + [BP] Ep 100: ||h_L||=2.009e+02 ||g_2||=5.669e-05 acc=0.6094 + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652] ||g||_med=[0.0010068593546748161, 0.000997236929833889, 0.0009934091940522194, 0.0009870644425973296, 0.0009829498594626784] acc=0.1152 + [DFA] Ep 1: ||h_L||=7.304e+03 ||g_2||=1.375e-06 acc=0.3105 gamma_dfa=0.0899 + [DFA] Ep 2: ||h_L||=3.776e+04 ||g_2||=3.111e-07 acc=0.2881 gamma_dfa=0.0858 + [DFA] Ep 3: ||h_L||=1.046e+05 ||g_2||=1.275e-07 acc=0.3018 gamma_dfa=0.0863 + [DFA] Ep 4: ||h_L||=2.235e+05 ||g_2||=6.730e-08 acc=0.3076 gamma_dfa=0.0886 + [DFA] Ep 5: ||h_L||=4.042e+05 ||g_2||=4.211e-08 acc=0.3281 gamma_dfa=0.0876 + [DFA] Ep 6: ||h_L||=6.774e+05 ||g_2||=2.808e-08 acc=0.2920 gamma_dfa=0.0842 + [DFA] Ep 7: ||h_L||=1.027e+06 ||g_2||=2.087e-08 acc=0.2920 gamma_dfa=0.0859 + [DFA] Ep 8: ||h_L||=1.513e+06 ||g_2||=1.577e-08 acc=0.3066 gamma_dfa=0.0852 + [DFA] Ep 9: ||h_L||=2.150e+06 ||g_2||=1.248e-08 acc=0.3184 gamma_dfa=0.0876 + [DFA] Ep 10: ||h_L||=2.934e+06 ||g_2||=1.044e-08 acc=0.3037 gamma_dfa=0.0876 + [DFA] Ep 11: ||h_L||=3.849e+06 ||g_2||=8.960e-09 acc=0.3018 gamma_dfa=0.0892 + [DFA] Ep 12: ||h_L||=4.946e+06 ||g_2||=7.846e-09 acc=0.2871 gamma_dfa=0.0921 + [DFA] Ep 13: ||h_L||=6.325e+06 ||g_2||=6.816e-09 acc=0.2900 gamma_dfa=0.0919 + [DFA] Ep 14: ||h_L||=7.941e+06 ||g_2||=5.938e-09 acc=0.2979 gamma_dfa=0.0949 + [DFA] Ep 15: ||h_L||=9.822e+06 ||g_2||=5.388e-09 acc=0.2852 gamma_dfa=0.0958 + [DFA] Ep 16: ||h_L||=1.202e+07 ||g_2||=4.830e-09 acc=0.2979 gamma_dfa=0.0975 + [DFA] Ep 17: ||h_L||=1.430e+07 ||g_2||=4.410e-09 acc=0.3115 gamma_dfa=0.0999 + [DFA] Ep 18: ||h_L||=1.700e+07 ||g_2||=4.013e-09 acc=0.2969 gamma_dfa=0.0988 + [DFA] Ep 19: ||h_L||=2.002e+07 ||g_2||=3.688e-09 acc=0.2949 gamma_dfa=0.1002 + [DFA] Ep 20: ||h_L||=2.311e+07 ||g_2||=3.374e-09 acc=0.3086 gamma_dfa=0.1007 + [DFA] Ep 21: ||h_L||=2.656e+07 ||g_2||=3.083e-09 acc=0.3154 gamma_dfa=0.1018 + [DFA] Ep 22: ||h_L||=3.043e+07 ||g_2||=2.851e-09 acc=0.3096 gamma_dfa=0.1025 + [DFA] Ep 23: ||h_L||=3.467e+07 ||g_2||=2.638e-09 acc=0.3086 gamma_dfa=0.1020 + [DFA] Ep 24: ||h_L||=3.916e+07 ||g_2||=2.428e-09 acc=0.3008 gamma_dfa=0.1046 + [DFA] Ep 25: ||h_L||=4.389e+07 ||g_2||=2.233e-09 acc=0.3232 gamma_dfa=0.1029 + [DFA] Ep 26: ||h_L||=4.919e+07 ||g_2||=2.056e-09 acc=0.3037 gamma_dfa=0.1025 + [DFA] Ep 27: ||h_L||=5.469e+07 ||g_2||=1.928e-09 acc=0.3105 gamma_dfa=0.1034 + [DFA] Ep 28: ||h_L||=6.011e+07 ||g_2||=1.815e-09 acc=0.3027 gamma_dfa=0.1046 + [DFA] Ep 29: ||h_L||=6.573e+07 ||g_2||=1.725e-09 acc=0.3262 gamma_dfa=0.1051 + [DFA] Ep 30: ||h_L||=7.193e+07 ||g_2||=1.626e-09 acc=0.3018 gamma_dfa=0.1059 + [DFA] Ep 31: ||h_L||=7.819e+07 ||g_2||=1.523e-09 acc=0.3213 gamma_dfa=0.1048 + [DFA] Ep 32: ||h_L||=8.508e+07 ||g_2||=1.429e-09 acc=0.3086 gamma_dfa=0.1060 + [DFA] Ep 33: ||h_L||=9.217e+07 ||g_2||=1.367e-09 acc=0.3115 gamma_dfa=0.1053 + [DFA] Ep 34: ||h_L||=9.964e+07 ||g_2||=1.290e-09 acc=0.3008 gamma_dfa=0.1059 + [DFA] Ep 35: ||h_L||=1.069e+08 ||g_2||=1.223e-09 acc=0.3252 gamma_dfa=0.1062 + [DFA] Ep 36: ||h_L||=1.145e+08 ||g_2||=1.168e-09 acc=0.2998 gamma_dfa=0.1048 + [DFA] Ep 37: ||h_L||=1.224e+08 ||g_2||=1.128e-09 acc=0.3027 gamma_dfa=0.1052 + [DFA] Ep 38: ||h_L||=1.306e+08 ||g_2||=1.069e-09 acc=0.3193 gamma_dfa=0.1057 + [DFA] Ep 39: ||h_L||=1.385e+08 ||g_2||=1.027e-09 acc=0.3027 gamma_dfa=0.1056 + [DFA] Ep 40: ||h_L||=1.470e+08 ||g_2||=9.871e-10 acc=0.3184 gamma_dfa=0.1058 + [DFA] Ep 41: ||h_L||=1.555e+08 ||g_2||=9.513e-10 acc=0.3145 gamma_dfa=0.1057 + [DFA] Ep 42: ||h_L||=1.640e+08 ||g_2||=9.198e-10 acc=0.3057 gamma_dfa=0.1057 + [DFA] Ep 43: ||h_L||=1.727e+08 ||g_2||=8.925e-10 acc=0.3115 gamma_dfa=0.1065 + [DFA] Ep 44: ||h_L||=1.813e+08 ||g_2||=8.598e-10 acc=0.2939 gamma_dfa=0.1057 + [DFA] Ep 45: ||h_L||=1.903e+08 ||g_2||=8.300e-10 acc=0.3037 gamma_dfa=0.1056 + [DFA] Ep 46: ||h_L||=1.990e+08 ||g_2||=8.036e-10 acc=0.3115 gamma_dfa=0.1062 + [DFA] Ep 47: ||h_L||=2.081e+08 ||g_2||=7.852e-10 acc=0.3008 gamma_dfa=0.1059 + [DFA] Ep 48: ||h_L||=2.167e+08 ||g_2||=7.675e-10 acc=0.3037 gamma_dfa=0.1058 + [DFA] Ep 49: ||h_L||=2.257e+08 ||g_2||=7.444e-10 acc=0.3057 gamma_dfa=0.1067 + [DFA] Ep 50: ||h_L||=2.352e+08 ||g_2||=7.281e-10 acc=0.3076 gamma_dfa=0.1065 + [DFA] Ep 51: ||h_L||=2.442e+08 ||g_2||=7.057e-10 acc=0.3145 gamma_dfa=0.1064 + [DFA] Ep 52: ||h_L||=2.533e+08 ||g_2||=6.872e-10 acc=0.3125 gamma_dfa=0.1063 + [DFA] Ep 53: ||h_L||=2.617e+08 ||g_2||=6.789e-10 acc=0.3105 gamma_dfa=0.1070 + [DFA] Ep 54: ||h_L||=2.702e+08 ||g_2||=6.633e-10 acc=0.2998 gamma_dfa=0.1055 + [DFA] Ep 55: ||h_L||=2.789e+08 ||g_2||=6.521e-10 acc=0.2949 gamma_dfa=0.1067 + [DFA] Ep 56: ||h_L||=2.873e+08 ||g_2||=6.409e-10 acc=0.3076 gamma_dfa=0.1073 + [DFA] Ep 57: ||h_L||=2.952e+08 ||g_2||=6.233e-10 acc=0.3096 gamma_dfa=0.1072 + [DFA] Ep 58: ||h_L||=3.031e+08 ||g_2||=6.182e-10 acc=0.3027 gamma_dfa=0.1066 + [DFA] Ep 59: ||h_L||=3.109e+08 ||g_2||=6.106e-10 acc=0.3027 gamma_dfa=0.1067 + [DFA] Ep 60: ||h_L||=3.188e+08 ||g_2||=5.949e-10 acc=0.3145 gamma_dfa=0.1071 + [DFA] Ep 61: ||h_L||=3.262e+08 ||g_2||=5.864e-10 acc=0.3164 gamma_dfa=0.1067 + [DFA] Ep 62: ||h_L||=3.332e+08 ||g_2||=5.788e-10 acc=0.3105 gamma_dfa=0.1066 + [DFA] Ep 63: ||h_L||=3.400e+08 ||g_2||=5.673e-10 acc=0.3154 gamma_dfa=0.1068 + [DFA] Ep 64: ||h_L||=3.464e+08 ||g_2||=5.629e-10 acc=0.3115 gamma_dfa=0.1065 + [DFA] Ep 65: ||h_L||=3.534e+08 ||g_2||=5.576e-10 acc=0.3154 gamma_dfa=0.1068 + [DFA] Ep 66: ||h_L||=3.598e+08 ||g_2||=5.556e-10 acc=0.3125 gamma_dfa=0.1067 + [DFA] Ep 67: ||h_L||=3.659e+08 ||g_2||=5.460e-10 acc=0.3047 gamma_dfa=0.1065 + [DFA] Ep 68: ||h_L||=3.718e+08 ||g_2||=5.413e-10 acc=0.2988 gamma_dfa=0.1065 + [DFA] Ep 69: ||h_L||=3.776e+08 ||g_2||=5.308e-10 acc=0.3105 gamma_dfa=0.1071 + [DFA] Ep 70: ||h_L||=3.828e+08 ||g_2||=5.315e-10 acc=0.3076 gamma_dfa=0.1070 + [DFA] Ep 71: ||h_L||=3.877e+08 ||g_2||=5.271e-10 acc=0.3145 gamma_dfa=0.1069 + [DFA] Ep 72: ||h_L||=3.923e+08 ||g_2||=5.266e-10 acc=0.2998 gamma_dfa=0.1065 + [DFA] Ep 73: ||h_L||=3.969e+08 ||g_2||=5.205e-10 acc=0.3018 gamma_dfa=0.1070 + [DFA] Ep 74: ||h_L||=4.011e+08 ||g_2||=5.160e-10 acc=0.3076 gamma_dfa=0.1066 + [DFA] Ep 75: ||h_L||=4.053e+08 ||g_2||=5.108e-10 acc=0.3096 gamma_dfa=0.1070 + [DFA] Ep 76: ||h_L||=4.091e+08 ||g_2||=5.070e-10 acc=0.3193 gamma_dfa=0.1070 + [DFA] Ep 77: ||h_L||=4.125e+08 ||g_2||=5.052e-10 acc=0.3076 gamma_dfa=0.1069 + [DFA] Ep 78: ||h_L||=4.158e+08 ||g_2||=5.040e-10 acc=0.3066 gamma_dfa=0.1070 + [DFA] Ep 79: ||h_L||=4.187e+08 ||g_2||=5.055e-10 acc=0.3018 gamma_dfa=0.1068 + [DFA] Ep 80: ||h_L||=4.214e+08 ||g_2||=4.991e-10 acc=0.3105 gamma_dfa=0.1069 + [DFA] Ep 81: ||h_L||=4.237e+08 ||g_2||=4.971e-10 acc=0.3076 gamma_dfa=0.1070 + [DFA] Ep 82: ||h_L||=4.259e+08 ||g_2||=4.927e-10 acc=0.3057 gamma_dfa=0.1070 + [DFA] Ep 83: ||h_L||=4.278e+08 ||g_2||=4.936e-10 acc=0.3047 gamma_dfa=0.1069 + [DFA] Ep 84: ||h_L||=4.297e+08 ||g_2||=4.920e-10 acc=0.3076 gamma_dfa=0.1069 + [DFA] Ep 85: ||h_L||=4.313e+08 ||g_2||=4.936e-10 acc=0.3057 gamma_dfa=0.1069 + [DFA] Ep 86: ||h_L||=4.328e+08 ||g_2||=4.903e-10 acc=0.3145 gamma_dfa=0.1068 + [DFA] Ep 87: ||h_L||=4.341e+08 ||g_2||=4.904e-10 acc=0.3086 gamma_dfa=0.1068 + [DFA] Ep 88: ||h_L||=4.351e+08 ||g_2||=4.894e-10 acc=0.3115 gamma_dfa=0.1069 + [DFA] Ep 89: ||h_L||=4.361e+08 ||g_2||=4.855e-10 acc=0.3135 gamma_dfa=0.1070 + [DFA] Ep 90: ||h_L||=4.369e+08 ||g_2||=4.873e-10 acc=0.3096 gamma_dfa=0.1069 + [DFA] Ep 91: ||h_L||=4.375e+08 ||g_2||=4.876e-10 acc=0.3066 gamma_dfa=0.1069 + [DFA] Ep 92: ||h_L||=4.380e+08 ||g_2||=4.862e-10 acc=0.3086 gamma_dfa=0.1068 + [DFA] Ep 93: ||h_L||=4.385e+08 ||g_2||=4.860e-10 acc=0.3096 gamma_dfa=0.1069 + [DFA] Ep 94: ||h_L||=4.388e+08 ||g_2||=4.854e-10 acc=0.3076 gamma_dfa=0.1069 + [DFA] Ep 95: ||h_L||=4.390e+08 ||g_2||=4.861e-10 acc=0.3086 gamma_dfa=0.1069 + [DFA] Ep 96: ||h_L||=4.392e+08 ||g_2||=4.863e-10 acc=0.3066 gamma_dfa=0.1069 + [DFA] Ep 97: ||h_L||=4.393e+08 ||g_2||=4.859e-10 acc=0.3096 gamma_dfa=0.1069 + [DFA] Ep 98: ||h_L||=4.394e+08 ||g_2||=4.857e-10 acc=0.3066 gamma_dfa=0.1069 + [DFA] Ep 99: ||h_L||=4.394e+08 ||g_2||=4.857e-10 acc=0.3076 gamma_dfa=0.1069 + [DFA] Ep 100: ||h_L||=4.394e+08 ||g_2||=4.857e-10 acc=0.3076 gamma_dfa=0.1069 + +Saved results/snapshot_evolution_v2/snapshot_evolution_s42.json diff --git a/results/snapshot_evolution_v2/run_s456.log b/results/snapshot_evolution_v2/run_s456.log new file mode 100644 index 0000000..4ccb115 --- /dev/null +++ b/results/snapshot_evolution_v2/run_s456.log @@ -0,0 +1,210 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=456 +eval buffer: torch.Size([1024, 3072]) + +=== BP training === + [BP] Ep 0: ||h||_med=[8.696551322937012, 8.737784385681152, 8.813130378723145, 8.844642639160156, 8.889528274536133] ||g||_med=[0.0010079912608489394, 0.0010035138111561537, 0.0009970925748348236, 0.0009936393471434712, 0.000986678060144186] acc=0.0928 + [BP] Ep 1: ||h_L||=9.917e+01 ||g_2||=5.310e-05 acc=0.4004 + [BP] Ep 2: ||h_L||=1.152e+02 ||g_2||=4.300e-05 acc=0.4600 + [BP] Ep 3: ||h_L||=1.251e+02 ||g_2||=4.203e-05 acc=0.4932 + [BP] Ep 4: ||h_L||=1.367e+02 ||g_2||=4.196e-05 acc=0.4902 + [BP] Ep 5: ||h_L||=1.479e+02 ||g_2||=3.941e-05 acc=0.5039 + [BP] Ep 6: ||h_L||=1.583e+02 ||g_2||=3.835e-05 acc=0.5166 + [BP] Ep 7: ||h_L||=1.656e+02 ||g_2||=3.787e-05 acc=0.5283 + [BP] Ep 8: ||h_L||=1.764e+02 ||g_2||=3.733e-05 acc=0.5293 + [BP] Ep 9: ||h_L||=1.842e+02 ||g_2||=3.600e-05 acc=0.5391 + [BP] Ep 10: ||h_L||=1.915e+02 ||g_2||=3.614e-05 acc=0.5537 + [BP] Ep 11: ||h_L||=1.981e+02 ||g_2||=3.464e-05 acc=0.5449 + [BP] Ep 12: ||h_L||=2.000e+02 ||g_2||=3.492e-05 acc=0.5439 + [BP] Ep 13: ||h_L||=2.067e+02 ||g_2||=3.524e-05 acc=0.5518 + [BP] Ep 14: ||h_L||=2.096e+02 ||g_2||=3.480e-05 acc=0.5479 + [BP] Ep 15: ||h_L||=2.130e+02 ||g_2||=3.509e-05 acc=0.5693 + [BP] Ep 16: ||h_L||=2.143e+02 ||g_2||=3.710e-05 acc=0.5508 + [BP] Ep 17: ||h_L||=2.198e+02 ||g_2||=3.612e-05 acc=0.5840 + [BP] Ep 18: ||h_L||=2.220e+02 ||g_2||=3.491e-05 acc=0.5752 + [BP] Ep 19: ||h_L||=2.260e+02 ||g_2||=3.519e-05 acc=0.5674 + [BP] Ep 20: ||h_L||=2.310e+02 ||g_2||=3.526e-05 acc=0.5664 + [BP] Ep 21: ||h_L||=2.293e+02 ||g_2||=3.503e-05 acc=0.5957 + [BP] Ep 22: ||h_L||=2.355e+02 ||g_2||=3.525e-05 acc=0.5762 + [BP] Ep 23: ||h_L||=2.381e+02 ||g_2||=3.591e-05 acc=0.5684 + [BP] Ep 24: ||h_L||=2.411e+02 ||g_2||=3.563e-05 acc=0.5889 + [BP] Ep 25: ||h_L||=2.405e+02 ||g_2||=3.554e-05 acc=0.5820 + [BP] Ep 26: ||h_L||=2.425e+02 ||g_2||=3.670e-05 acc=0.6025 + [BP] Ep 27: ||h_L||=2.436e+02 ||g_2||=3.618e-05 acc=0.5762 + [BP] Ep 28: ||h_L||=2.474e+02 ||g_2||=3.597e-05 acc=0.5879 + [BP] Ep 29: ||h_L||=2.489e+02 ||g_2||=3.712e-05 acc=0.5938 + [BP] Ep 30: ||h_L||=2.480e+02 ||g_2||=3.656e-05 acc=0.5889 + [BP] Ep 31: ||h_L||=2.501e+02 ||g_2||=3.727e-05 acc=0.5674 + [BP] Ep 32: ||h_L||=2.484e+02 ||g_2||=3.738e-05 acc=0.5986 + [BP] Ep 33: ||h_L||=2.528e+02 ||g_2||=3.573e-05 acc=0.5898 + [BP] Ep 34: ||h_L||=2.496e+02 ||g_2||=3.846e-05 acc=0.5928 + [BP] Ep 35: ||h_L||=2.481e+02 ||g_2||=3.687e-05 acc=0.6152 + [BP] Ep 36: ||h_L||=2.507e+02 ||g_2||=3.670e-05 acc=0.6016 + [BP] Ep 37: ||h_L||=2.485e+02 ||g_2||=3.572e-05 acc=0.5996 + [BP] Ep 38: ||h_L||=2.492e+02 ||g_2||=3.780e-05 acc=0.5908 + [BP] Ep 39: ||h_L||=2.507e+02 ||g_2||=3.791e-05 acc=0.6152 + [BP] Ep 40: ||h_L||=2.484e+02 ||g_2||=3.952e-05 acc=0.6104 + [BP] Ep 41: ||h_L||=2.478e+02 ||g_2||=3.848e-05 acc=0.6084 + [BP] Ep 42: ||h_L||=2.470e+02 ||g_2||=3.780e-05 acc=0.6143 + [BP] Ep 43: ||h_L||=2.466e+02 ||g_2||=3.813e-05 acc=0.6211 + [BP] Ep 44: ||h_L||=2.432e+02 ||g_2||=3.922e-05 acc=0.6182 + [BP] Ep 45: ||h_L||=2.431e+02 ||g_2||=4.048e-05 acc=0.6133 + [BP] Ep 46: ||h_L||=2.431e+02 ||g_2||=3.831e-05 acc=0.6113 + [BP] Ep 47: ||h_L||=2.413e+02 ||g_2||=4.016e-05 acc=0.6133 + [BP] Ep 48: ||h_L||=2.407e+02 ||g_2||=3.886e-05 acc=0.6162 + [BP] Ep 49: ||h_L||=2.395e+02 ||g_2||=4.190e-05 acc=0.6104 + [BP] Ep 50: ||h_L||=2.385e+02 ||g_2||=4.175e-05 acc=0.6152 + [BP] Ep 51: ||h_L||=2.367e+02 ||g_2||=4.073e-05 acc=0.6191 + [BP] Ep 52: ||h_L||=2.373e+02 ||g_2||=4.066e-05 acc=0.6172 + [BP] Ep 53: ||h_L||=2.351e+02 ||g_2||=4.393e-05 acc=0.6104 + [BP] Ep 54: ||h_L||=2.338e+02 ||g_2||=4.099e-05 acc=0.6230 + [BP] Ep 55: ||h_L||=2.329e+02 ||g_2||=4.365e-05 acc=0.6270 + [BP] Ep 56: ||h_L||=2.333e+02 ||g_2||=4.267e-05 acc=0.6309 + [BP] Ep 57: ||h_L||=2.305e+02 ||g_2||=4.151e-05 acc=0.6309 + [BP] Ep 58: ||h_L||=2.282e+02 ||g_2||=4.239e-05 acc=0.6416 + [BP] Ep 59: ||h_L||=2.257e+02 ||g_2||=4.316e-05 acc=0.6279 + [BP] Ep 60: ||h_L||=2.256e+02 ||g_2||=4.490e-05 acc=0.6240 + [BP] Ep 61: ||h_L||=2.244e+02 ||g_2||=4.582e-05 acc=0.6289 + [BP] Ep 62: ||h_L||=2.224e+02 ||g_2||=4.648e-05 acc=0.6270 + [BP] Ep 63: ||h_L||=2.206e+02 ||g_2||=4.636e-05 acc=0.6211 + [BP] Ep 64: ||h_L||=2.205e+02 ||g_2||=4.671e-05 acc=0.6250 + [BP] Ep 65: ||h_L||=2.196e+02 ||g_2||=4.449e-05 acc=0.6270 + [BP] Ep 66: ||h_L||=2.172e+02 ||g_2||=4.745e-05 acc=0.6377 + [BP] Ep 67: ||h_L||=2.152e+02 ||g_2||=4.708e-05 acc=0.6367 + [BP] Ep 68: ||h_L||=2.151e+02 ||g_2||=4.813e-05 acc=0.6289 + [BP] Ep 69: ||h_L||=2.136e+02 ||g_2||=4.880e-05 acc=0.6328 + [BP] Ep 70: ||h_L||=2.124e+02 ||g_2||=4.823e-05 acc=0.6270 + [BP] Ep 71: ||h_L||=2.107e+02 ||g_2||=4.963e-05 acc=0.6230 + [BP] Ep 72: ||h_L||=2.113e+02 ||g_2||=4.797e-05 acc=0.6133 + [BP] Ep 73: ||h_L||=2.090e+02 ||g_2||=4.736e-05 acc=0.6318 + [BP] Ep 74: ||h_L||=2.096e+02 ||g_2||=4.832e-05 acc=0.6270 + [BP] Ep 75: ||h_L||=2.081e+02 ||g_2||=4.982e-05 acc=0.6240 + [BP] Ep 76: ||h_L||=2.075e+02 ||g_2||=4.877e-05 acc=0.6260 + [BP] Ep 77: ||h_L||=2.060e+02 ||g_2||=4.900e-05 acc=0.6221 + [BP] Ep 78: ||h_L||=2.052e+02 ||g_2||=4.906e-05 acc=0.6279 + [BP] Ep 79: ||h_L||=2.050e+02 ||g_2||=5.181e-05 acc=0.6211 + [BP] Ep 80: ||h_L||=2.045e+02 ||g_2||=4.986e-05 acc=0.6260 + [BP] Ep 81: ||h_L||=2.039e+02 ||g_2||=5.293e-05 acc=0.6289 + [BP] Ep 82: ||h_L||=2.032e+02 ||g_2||=5.169e-05 acc=0.6191 + [BP] Ep 83: ||h_L||=2.025e+02 ||g_2||=5.152e-05 acc=0.6260 + [BP] Ep 84: ||h_L||=2.019e+02 ||g_2||=5.158e-05 acc=0.6250 + [BP] Ep 85: ||h_L||=2.018e+02 ||g_2||=5.156e-05 acc=0.6250 + [BP] Ep 86: ||h_L||=2.015e+02 ||g_2||=5.196e-05 acc=0.6309 + [BP] Ep 87: ||h_L||=2.015e+02 ||g_2||=5.104e-05 acc=0.6289 + [BP] Ep 88: ||h_L||=2.017e+02 ||g_2||=5.253e-05 acc=0.6270 + [BP] Ep 89: ||h_L||=2.011e+02 ||g_2||=5.326e-05 acc=0.6299 + [BP] Ep 90: ||h_L||=2.005e+02 ||g_2||=5.368e-05 acc=0.6279 + [BP] Ep 91: ||h_L||=2.000e+02 ||g_2||=5.282e-05 acc=0.6289 + [BP] Ep 92: ||h_L||=1.999e+02 ||g_2||=5.349e-05 acc=0.6270 + [BP] Ep 93: ||h_L||=1.998e+02 ||g_2||=5.212e-05 acc=0.6289 + [BP] Ep 94: ||h_L||=1.993e+02 ||g_2||=5.377e-05 acc=0.6299 + [BP] Ep 95: ||h_L||=1.994e+02 ||g_2||=5.352e-05 acc=0.6309 + [BP] Ep 96: ||h_L||=1.994e+02 ||g_2||=5.367e-05 acc=0.6289 + [BP] Ep 97: ||h_L||=1.994e+02 ||g_2||=5.366e-05 acc=0.6289 + [BP] Ep 98: ||h_L||=1.993e+02 ||g_2||=5.374e-05 acc=0.6289 + [BP] Ep 99: ||h_L||=1.994e+02 ||g_2||=5.385e-05 acc=0.6289 + [BP] Ep 100: ||h_L||=1.994e+02 ||g_2||=5.381e-05 acc=0.6279 + +=== DFA training === + [DFA] Ep 0: ||h||_med=[8.696551322937012, 8.737784385681152, 8.813130378723145, 8.844642639160156, 8.889528274536133] ||g||_med=[0.0010079912608489394, 0.0010035138111561537, 0.0009970925748348236, 0.0009936393471434712, 0.000986678060144186] acc=0.0928 + [DFA] Ep 1: ||h_L||=1.347e+04 ||g_2||=7.784e-07 acc=0.2861 gamma_dfa=0.1029 + [DFA] Ep 2: ||h_L||=7.387e+04 ||g_2||=1.706e-07 acc=0.2988 gamma_dfa=0.0959 + [DFA] Ep 3: ||h_L||=2.014e+05 ||g_2||=7.528e-08 acc=0.2900 gamma_dfa=0.0944 + [DFA] Ep 4: ||h_L||=4.167e+05 ||g_2||=4.114e-08 acc=0.2988 gamma_dfa=0.0917 + [DFA] Ep 5: ||h_L||=7.642e+05 ||g_2||=2.491e-08 acc=0.2900 gamma_dfa=0.0899 + [DFA] Ep 6: ||h_L||=1.235e+06 ||g_2||=1.726e-08 acc=0.3057 gamma_dfa=0.0875 + [DFA] Ep 7: ||h_L||=1.913e+06 ||g_2||=1.233e-08 acc=0.2920 gamma_dfa=0.0888 + [DFA] Ep 8: ||h_L||=2.850e+06 ||g_2||=9.213e-09 acc=0.3115 gamma_dfa=0.0877 + [DFA] Ep 9: ||h_L||=4.005e+06 ||g_2||=7.223e-09 acc=0.2900 gamma_dfa=0.0894 + [DFA] Ep 10: ||h_L||=5.501e+06 ||g_2||=5.828e-09 acc=0.2979 gamma_dfa=0.0913 + [DFA] Ep 11: ||h_L||=7.181e+06 ||g_2||=4.814e-09 acc=0.2822 gamma_dfa=0.0899 + [DFA] Ep 12: ||h_L||=9.249e+06 ||g_2||=4.032e-09 acc=0.2998 gamma_dfa=0.0917 + [DFA] Ep 13: ||h_L||=1.180e+07 ||g_2||=3.444e-09 acc=0.3135 gamma_dfa=0.0932 + [DFA] Ep 14: ||h_L||=1.461e+07 ||g_2||=3.012e-09 acc=0.2861 gamma_dfa=0.0934 + [DFA] Ep 15: ||h_L||=1.793e+07 ||g_2||=2.598e-09 acc=0.2979 gamma_dfa=0.0936 + [DFA] Ep 16: ||h_L||=2.168e+07 ||g_2||=2.271e-09 acc=0.3086 gamma_dfa=0.0933 + [DFA] Ep 17: ||h_L||=2.591e+07 ||g_2||=2.026e-09 acc=0.2969 gamma_dfa=0.0945 + [DFA] Ep 18: ||h_L||=3.070e+07 ||g_2||=1.802e-09 acc=0.3086 gamma_dfa=0.0939 + [DFA] Ep 19: ||h_L||=3.588e+07 ||g_2||=1.638e-09 acc=0.3027 gamma_dfa=0.0952 + [DFA] Ep 20: ||h_L||=4.144e+07 ||g_2||=1.484e-09 acc=0.2959 gamma_dfa=0.0941 + [DFA] Ep 21: ||h_L||=4.772e+07 ||g_2||=1.368e-09 acc=0.2959 gamma_dfa=0.0949 + [DFA] Ep 22: ||h_L||=5.457e+07 ||g_2||=1.246e-09 acc=0.2900 gamma_dfa=0.0948 + [DFA] Ep 23: ||h_L||=6.201e+07 ||g_2||=1.159e-09 acc=0.2939 gamma_dfa=0.0947 + [DFA] Ep 24: ||h_L||=6.970e+07 ||g_2||=1.067e-09 acc=0.2969 gamma_dfa=0.0951 + [DFA] Ep 25: ||h_L||=7.780e+07 ||g_2||=9.980e-10 acc=0.2861 gamma_dfa=0.0948 + [DFA] Ep 26: ||h_L||=8.627e+07 ||g_2||=9.362e-10 acc=0.2979 gamma_dfa=0.0951 + [DFA] Ep 27: ||h_L||=9.569e+07 ||g_2||=8.744e-10 acc=0.2842 gamma_dfa=0.0955 + [DFA] Ep 28: ||h_L||=1.058e+08 ||g_2||=8.262e-10 acc=0.2891 gamma_dfa=0.0953 + [DFA] Ep 29: ||h_L||=1.159e+08 ||g_2||=7.846e-10 acc=0.2920 gamma_dfa=0.0960 + [DFA] Ep 30: ||h_L||=1.267e+08 ||g_2||=7.353e-10 acc=0.2959 gamma_dfa=0.0951 + [DFA] Ep 31: ||h_L||=1.380e+08 ||g_2||=6.977e-10 acc=0.3086 gamma_dfa=0.0952 + [DFA] Ep 32: ||h_L||=1.493e+08 ||g_2||=6.666e-10 acc=0.2949 gamma_dfa=0.0953 + [DFA] Ep 33: ||h_L||=1.617e+08 ||g_2||=6.391e-10 acc=0.2881 gamma_dfa=0.0947 + [DFA] Ep 34: ||h_L||=1.738e+08 ||g_2||=6.205e-10 acc=0.2822 gamma_dfa=0.0956 + [DFA] Ep 35: ||h_L||=1.866e+08 ||g_2||=5.893e-10 acc=0.2988 gamma_dfa=0.0959 + [DFA] Ep 36: ||h_L||=1.990e+08 ||g_2||=5.731e-10 acc=0.2949 gamma_dfa=0.0956 + [DFA] Ep 37: ||h_L||=2.125e+08 ||g_2||=5.475e-10 acc=0.3027 gamma_dfa=0.0953 + [DFA] Ep 38: ||h_L||=2.263e+08 ||g_2||=5.326e-10 acc=0.2891 gamma_dfa=0.0949 + [DFA] Ep 39: ||h_L||=2.401e+08 ||g_2||=5.206e-10 acc=0.3027 gamma_dfa=0.0958 + [DFA] Ep 40: ||h_L||=2.549e+08 ||g_2||=4.933e-10 acc=0.2959 gamma_dfa=0.0952 + [DFA] Ep 41: ||h_L||=2.702e+08 ||g_2||=4.775e-10 acc=0.3086 gamma_dfa=0.0962 + [DFA] Ep 42: ||h_L||=2.844e+08 ||g_2||=4.679e-10 acc=0.2871 gamma_dfa=0.0957 + [DFA] Ep 43: ||h_L||=2.990e+08 ||g_2||=4.493e-10 acc=0.3066 gamma_dfa=0.0961 + [DFA] Ep 44: ||h_L||=3.144e+08 ||g_2||=4.412e-10 acc=0.2900 gamma_dfa=0.0955 + [DFA] Ep 45: ||h_L||=3.282e+08 ||g_2||=4.348e-10 acc=0.2998 gamma_dfa=0.0961 + [DFA] Ep 46: ||h_L||=3.423e+08 ||g_2||=4.229e-10 acc=0.3018 gamma_dfa=0.0956 + [DFA] Ep 47: ||h_L||=3.566e+08 ||g_2||=4.139e-10 acc=0.2969 gamma_dfa=0.0957 + [DFA] Ep 48: ||h_L||=3.713e+08 ||g_2||=4.000e-10 acc=0.3027 gamma_dfa=0.0961 + [DFA] Ep 49: ||h_L||=3.859e+08 ||g_2||=3.904e-10 acc=0.3105 gamma_dfa=0.0957 + [DFA] Ep 50: ||h_L||=4.007e+08 ||g_2||=3.812e-10 acc=0.3008 gamma_dfa=0.0961 + [DFA] Ep 51: ||h_L||=4.150e+08 ||g_2||=3.752e-10 acc=0.3047 gamma_dfa=0.0957 + [DFA] Ep 52: ||h_L||=4.302e+08 ||g_2||=3.718e-10 acc=0.2910 gamma_dfa=0.0954 + [DFA] Ep 53: ||h_L||=4.447e+08 ||g_2||=3.651e-10 acc=0.2881 gamma_dfa=0.0957 + [DFA] Ep 54: ||h_L||=4.586e+08 ||g_2||=3.605e-10 acc=0.2998 gamma_dfa=0.0961 + [DFA] Ep 55: ||h_L||=4.722e+08 ||g_2||=3.467e-10 acc=0.3018 gamma_dfa=0.0963 + [DFA] Ep 56: ||h_L||=4.857e+08 ||g_2||=3.460e-10 acc=0.3047 gamma_dfa=0.0954 + [DFA] Ep 57: ||h_L||=4.994e+08 ||g_2||=3.379e-10 acc=0.2949 gamma_dfa=0.0962 + [DFA] Ep 58: ||h_L||=5.127e+08 ||g_2||=3.307e-10 acc=0.3018 gamma_dfa=0.0962 + [DFA] Ep 59: ||h_L||=5.255e+08 ||g_2||=3.281e-10 acc=0.3008 gamma_dfa=0.0960 + [DFA] Ep 60: ||h_L||=5.379e+08 ||g_2||=3.225e-10 acc=0.2988 gamma_dfa=0.0961 + [DFA] Ep 61: ||h_L||=5.493e+08 ||g_2||=3.184e-10 acc=0.3047 gamma_dfa=0.0962 + [DFA] Ep 62: ||h_L||=5.612e+08 ||g_2||=3.170e-10 acc=0.3027 gamma_dfa=0.0955 + [DFA] Ep 63: ||h_L||=5.725e+08 ||g_2||=3.109e-10 acc=0.2939 gamma_dfa=0.0960 + [DFA] Ep 64: ||h_L||=5.833e+08 ||g_2||=3.055e-10 acc=0.3076 gamma_dfa=0.0956 + [DFA] Ep 65: ||h_L||=5.946e+08 ||g_2||=3.044e-10 acc=0.2979 gamma_dfa=0.0959 + [DFA] Ep 66: ||h_L||=6.045e+08 ||g_2||=2.993e-10 acc=0.3008 gamma_dfa=0.0963 + [DFA] Ep 67: ||h_L||=6.137e+08 ||g_2||=2.988e-10 acc=0.3105 gamma_dfa=0.0961 + [DFA] Ep 68: ||h_L||=6.227e+08 ||g_2||=2.978e-10 acc=0.2939 gamma_dfa=0.0962 + [DFA] Ep 69: ||h_L||=6.309e+08 ||g_2||=2.942e-10 acc=0.2979 gamma_dfa=0.0964 + [DFA] Ep 70: ||h_L||=6.393e+08 ||g_2||=2.940e-10 acc=0.2930 gamma_dfa=0.0964 + [DFA] Ep 71: ||h_L||=6.472e+08 ||g_2||=2.872e-10 acc=0.3018 gamma_dfa=0.0963 + [DFA] Ep 72: ||h_L||=6.547e+08 ||g_2||=2.899e-10 acc=0.2959 gamma_dfa=0.0961 + [DFA] Ep 73: ||h_L||=6.618e+08 ||g_2||=2.843e-10 acc=0.2959 gamma_dfa=0.0962 + [DFA] Ep 74: ||h_L||=6.688e+08 ||g_2||=2.825e-10 acc=0.2998 gamma_dfa=0.0962 + [DFA] Ep 75: ||h_L||=6.755e+08 ||g_2||=2.794e-10 acc=0.3066 gamma_dfa=0.0963 + [DFA] Ep 76: ||h_L||=6.812e+08 ||g_2||=2.790e-10 acc=0.2959 gamma_dfa=0.0962 + [DFA] Ep 77: ||h_L||=6.867e+08 ||g_2||=2.792e-10 acc=0.3066 gamma_dfa=0.0958 + [DFA] Ep 78: ||h_L||=6.919e+08 ||g_2||=2.797e-10 acc=0.2988 gamma_dfa=0.0960 + [DFA] Ep 79: ||h_L||=6.969e+08 ||g_2||=2.750e-10 acc=0.3037 gamma_dfa=0.0959 + [DFA] Ep 80: ||h_L||=7.010e+08 ||g_2||=2.738e-10 acc=0.3066 gamma_dfa=0.0961 + [DFA] Ep 81: ||h_L||=7.049e+08 ||g_2||=2.723e-10 acc=0.3008 gamma_dfa=0.0961 + [DFA] Ep 82: ||h_L||=7.085e+08 ||g_2||=2.722e-10 acc=0.3018 gamma_dfa=0.0960 + [DFA] Ep 83: ||h_L||=7.118e+08 ||g_2||=2.707e-10 acc=0.3018 gamma_dfa=0.0962 + [DFA] Ep 84: ||h_L||=7.148e+08 ||g_2||=2.702e-10 acc=0.3027 gamma_dfa=0.0962 + [DFA] Ep 85: ||h_L||=7.174e+08 ||g_2||=2.683e-10 acc=0.3096 gamma_dfa=0.0961 + [DFA] Ep 86: ||h_L||=7.197e+08 ||g_2||=2.699e-10 acc=0.2969 gamma_dfa=0.0962 + [DFA] Ep 87: ||h_L||=7.218e+08 ||g_2||=2.699e-10 acc=0.2998 gamma_dfa=0.0960 + [DFA] Ep 88: ||h_L||=7.235e+08 ||g_2||=2.703e-10 acc=0.2979 gamma_dfa=0.0960 + [DFA] Ep 89: ||h_L||=7.250e+08 ||g_2||=2.679e-10 acc=0.3018 gamma_dfa=0.0962 + [DFA] Ep 90: ||h_L||=7.262e+08 ||g_2||=2.680e-10 acc=0.2998 gamma_dfa=0.0960 + [DFA] Ep 91: ||h_L||=7.273e+08 ||g_2||=2.691e-10 acc=0.2969 gamma_dfa=0.0960 + [DFA] Ep 92: ||h_L||=7.281e+08 ||g_2||=2.671e-10 acc=0.3018 gamma_dfa=0.0961 + [DFA] Ep 93: ||h_L||=7.288e+08 ||g_2||=2.677e-10 acc=0.3008 gamma_dfa=0.0961 + [DFA] Ep 94: ||h_L||=7.293e+08 ||g_2||=2.685e-10 acc=0.2979 gamma_dfa=0.0961 + [DFA] Ep 95: ||h_L||=7.297e+08 ||g_2||=2.670e-10 acc=0.2998 gamma_dfa=0.0961 + [DFA] Ep 96: ||h_L||=7.299e+08 ||g_2||=2.674e-10 acc=0.2998 gamma_dfa=0.0961 + [DFA] Ep 97: ||h_L||=7.300e+08 ||g_2||=2.671e-10 acc=0.2988 gamma_dfa=0.0961 + [DFA] Ep 98: ||h_L||=7.301e+08 ||g_2||=2.672e-10 acc=0.2998 gamma_dfa=0.0961 + [DFA] Ep 99: ||h_L||=7.302e+08 ||g_2||=2.671e-10 acc=0.2998 gamma_dfa=0.0961 + [DFA] Ep 100: ||h_L||=7.302e+08 ||g_2||=2.672e-10 acc=0.2998 gamma_dfa=0.0961 + +Saved results/snapshot_evolution_v2/snapshot_evolution_s456.json diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s123.json b/results/snapshot_evolution_v2/snapshot_evolution_s123.json new file mode 100644 index 0000000..4ccefc8 --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_evolution_s123.json @@ -0,0 +1,5473 @@ +{ + "config": { + "output_dir": "results/snapshot_evolution_v2", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256, + "log_every": 1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009977436857298017, + 0.000992251792922616, + 0.0009848480112850666, + 0.0009761073160916567, + 0.0009735578205436468 + ], + "bp_grad_norms_F": [ + 0.035340383648872375, + 0.03499162197113037, + 0.03454425558447838, + 0.034113530069589615, + 0.033874060958623886 + ], + "gamma_dfa": NaN, + "acc_eval": 0.095703125, + "loss_eval": 2.486203908920288, + "epoch": 0 + }, + { + "hidden_norms": [ + 78.8471908569336, + 81.27874755859375, + 85.74082946777344, + 93.0085678100586, + 99.78337860107422 + ], + "bp_grad_norms_per_sample_med": [ + 5.44870927114971e-05, + 5.06363830936607e-05, + 4.9749945901567116e-05, + 5.010423774365336e-05, + 5.131187572260387e-05 + ], + "bp_grad_norms_F": [ + 0.0025542855728417635, + 0.0021727080456912518, + 0.002010831143707037, + 0.0019116367911919951, + 0.0019338354468345642 + ], + "gamma_dfa": NaN, + "acc_eval": 0.396484375, + "loss_eval": 1.6637382507324219, + "epoch": 1 + }, + { + "hidden_norms": [ + 94.79721069335938, + 98.6406021118164, + 103.38369750976562, + 111.4940185546875, + 118.88549041748047 + ], + "bp_grad_norms_per_sample_med": [ + 4.842087219003588e-05, + 4.405825529829599e-05, + 4.263824666850269e-05, + 4.2027873860206455e-05, + 4.283937960281037e-05 + ], + "bp_grad_norms_F": [ + 0.0020658739376813173, + 0.001806268934160471, + 0.001665781601332128, + 0.0015872427029535174, + 0.0015909546054899693 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4541015625, + "loss_eval": 1.5350896120071411, + "epoch": 2 + }, + { + "hidden_norms": [ + 112.59109497070312, + 116.00851440429688, + 118.50328063964844, + 125.58804321289062, + 132.86842346191406 + ], + "bp_grad_norms_per_sample_med": [ + 4.3564141378737986e-05, + 4.136884308536537e-05, + 4.064830864081159e-05, + 3.9523682062281296e-05, + 3.8838741602376103e-05 + ], + "bp_grad_norms_F": [ + 0.00200729351490736, + 0.001785867614671588, + 0.0016562910750508308, + 0.0015452943043783307, + 0.0015010037459433079 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4814453125, + "loss_eval": 1.449176549911499, + "epoch": 3 + }, + { + "hidden_norms": [ + 124.81511688232422, + 128.57049560546875, + 129.71421813964844, + 136.4766387939453, + 142.1854705810547 + ], + "bp_grad_norms_per_sample_med": [ + 4.382780389278196e-05, + 4.2459021642571315e-05, + 4.143684418522753e-05, + 4.0614067984279245e-05, + 3.921420648111962e-05 + ], + "bp_grad_norms_F": [ + 0.0018197334138676524, + 0.0016814853297546506, + 0.0015934663824737072, + 0.0015063106548041105, + 0.0014485444407910109 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4970703125, + "loss_eval": 1.4218697547912598, + "epoch": 4 + }, + { + "hidden_norms": [ + 138.24440002441406, + 140.13018798828125, + 141.3839874267578, + 147.2488555908203, + 155.097412109375 + ], + "bp_grad_norms_per_sample_med": [ + 4.045376044814475e-05, + 4.011149940197356e-05, + 3.9452468627132475e-05, + 3.831404319498688e-05, + 3.721412576851435e-05 + ], + "bp_grad_norms_F": [ + 0.0017204430187121034, + 0.0016258049290627241, + 0.001551075023598969, + 0.0014644934562966228, + 0.0013933938462287188 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5078125, + "loss_eval": 1.3836241960525513, + "epoch": 5 + }, + { + "hidden_norms": [ + 152.11605834960938, + 153.1806182861328, + 153.2488555908203, + 159.2217559814453, + 167.07318115234375 + ], + "bp_grad_norms_per_sample_med": [ + 3.981084591941908e-05, + 3.969454701291397e-05, + 3.9165588532341644e-05, + 3.808845940511674e-05, + 3.58163051714655e-05 + ], + "bp_grad_norms_F": [ + 0.0017226944910362363, + 0.001611364888958633, + 0.0015574879944324493, + 0.001471089432016015, + 0.001374671934172511 + ], + "gamma_dfa": NaN, + "acc_eval": 0.525390625, + "loss_eval": 1.372281551361084, + "epoch": 6 + }, + { + "hidden_norms": [ + 161.75347900390625, + 163.58787536621094, + 163.35731506347656, + 170.1693115234375, + 177.47879028320312 + ], + "bp_grad_norms_per_sample_med": [ + 3.749227471416816e-05, + 3.707691575982608e-05, + 3.776738958549686e-05, + 3.692766040330753e-05, + 3.5146917070960626e-05 + ], + "bp_grad_norms_F": [ + 0.0016339722787961364, + 0.00156014587264508, + 0.0015048144850879908, + 0.00141648028511554, + 0.0013256004313006997 + ], + "gamma_dfa": NaN, + "acc_eval": 0.515625, + "loss_eval": 1.345876693725586, + "epoch": 7 + }, + { + "hidden_norms": [ + 171.66441345214844, + 171.10499572753906, + 169.24270629882812, + 175.52674865722656, + 182.4739990234375 + ], + "bp_grad_norms_per_sample_med": [ + 3.675510379252955e-05, + 3.6888646718580276e-05, + 3.695035775308497e-05, + 3.644685784820467e-05, + 3.359343099873513e-05 + ], + "bp_grad_norms_F": [ + 0.0016642085975036025, + 0.0015915494877845049, + 0.0015412021894007921, + 0.0014428672147914767, + 0.0013226643204689026 + ], + "gamma_dfa": NaN, + "acc_eval": 0.548828125, + "loss_eval": 1.323807954788208, + "epoch": 8 + }, + { + "hidden_norms": [ + 177.58766174316406, + 178.5358123779297, + 176.316650390625, + 182.18365478515625, + 188.81033325195312 + ], + "bp_grad_norms_per_sample_med": [ + 3.550657493178733e-05, + 3.561190533218905e-05, + 3.632329753600061e-05, + 3.5655833926284686e-05, + 3.342977652209811e-05 + ], + "bp_grad_norms_F": [ + 0.0016174933407455683, + 0.0015753052430227399, + 0.0015375673538073897, + 0.001461501931771636, + 0.0013270385097712278 + ], + "gamma_dfa": NaN, + "acc_eval": 0.54296875, + "loss_eval": 1.323765754699707, + "epoch": 9 + }, + { + "hidden_norms": [ + 186.0078125, + 185.2810821533203, + 182.9329833984375, + 188.10736083984375, + 195.3680877685547 + ], + "bp_grad_norms_per_sample_med": [ + 3.5615968954516575e-05, + 3.5252433008281514e-05, + 3.600740819820203e-05, + 3.5232467780588195e-05, + 3.2765579817350954e-05 + ], + "bp_grad_norms_F": [ + 0.0015362550038844347, + 0.001510681351646781, + 0.0014847773127257824, + 0.0014146054163575172, + 0.00128385319840163 + ], + "gamma_dfa": NaN, + "acc_eval": 0.544921875, + "loss_eval": 1.2933119535446167, + "epoch": 10 + }, + { + "hidden_norms": [ + 193.46343994140625, + 194.1528778076172, + 190.9546661376953, + 196.03440856933594, + 201.5336151123047 + ], + "bp_grad_norms_per_sample_med": [ + 3.449141877354123e-05, + 3.581260534701869e-05, + 3.6061541322851554e-05, + 3.5576940717874095e-05, + 3.29486902046483e-05 + ], + "bp_grad_norms_F": [ + 0.0015161881456151605, + 0.0014996343525126576, + 0.001473701442591846, + 0.0013998147333040833, + 0.0012604170478880405 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5556640625, + "loss_eval": 1.2653318643569946, + "epoch": 11 + }, + { + "hidden_norms": [ + 200.17047119140625, + 198.5863037109375, + 196.08795166015625, + 200.61297607421875, + 208.13084411621094 + ], + "bp_grad_norms_per_sample_med": [ + 3.377814937266521e-05, + 3.471539093879983e-05, + 3.4731467167148367e-05, + 3.4925535146612674e-05, + 3.2187374017667025e-05 + ], + "bp_grad_norms_F": [ + 0.0014635181287303567, + 0.0014519579708576202, + 0.001435206620953977, + 0.0013784168986603618, + 0.0012511539971455932 + ], + "gamma_dfa": NaN, + "acc_eval": 0.546875, + "loss_eval": 1.2704923152923584, + "epoch": 12 + }, + { + "hidden_norms": [ + 203.8260955810547, + 203.86688232421875, + 200.01004028320312, + 204.2325439453125, + 211.52891540527344 + ], + "bp_grad_norms_per_sample_med": [ + 3.5213015507906675e-05, + 3.635779648902826e-05, + 3.70470697816927e-05, + 3.6254354199627414e-05, + 3.324731005704962e-05 + ], + "bp_grad_norms_F": [ + 0.0014951277989894152, + 0.0014758999459445477, + 0.0014606777112931013, + 0.0014066072180867195, + 0.0012636061292141676 + ], + "gamma_dfa": NaN, + "acc_eval": 0.533203125, + "loss_eval": 1.2718024253845215, + "epoch": 13 + }, + { + "hidden_norms": [ + 211.8421630859375, + 209.4982147216797, + 206.025634765625, + 210.11019897460938, + 216.48568725585938 + ], + "bp_grad_norms_per_sample_med": [ + 3.425328395678662e-05, + 3.4357526601525024e-05, + 3.5312823456479236e-05, + 3.490734161459841e-05, + 3.1354313250631094e-05 + ], + "bp_grad_norms_F": [ + 0.0015326166758313775, + 0.0015238082269206643, + 0.0015112065011635423, + 0.0014346316456794739, + 0.0012716582277789712 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5595703125, + "loss_eval": 1.2611415386199951, + "epoch": 14 + }, + { + "hidden_norms": [ + 220.0836639404297, + 218.3101806640625, + 212.22019958496094, + 216.97576904296875, + 224.16114807128906 + ], + "bp_grad_norms_per_sample_med": [ + 3.320865289424546e-05, + 3.393836959730834e-05, + 3.4554454032331705e-05, + 3.380324415047653e-05, + 3.0850649636704475e-05 + ], + "bp_grad_norms_F": [ + 0.0015296684578061104, + 0.0015227487310767174, + 0.0015054721152409911, + 0.0014223494799807668, + 0.0012559365713968873 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5615234375, + "loss_eval": 1.2511423826217651, + "epoch": 15 + }, + { + "hidden_norms": [ + 223.3075714111328, + 219.4958953857422, + 213.75701904296875, + 219.41580200195312, + 223.92572021484375 + ], + "bp_grad_norms_per_sample_med": [ + 3.406661926419474e-05, + 3.485638080746867e-05, + 3.5736342397285625e-05, + 3.5617544199340045e-05, + 3.142367859254591e-05 + ], + "bp_grad_norms_F": [ + 0.001539028249680996, + 0.0015256714541465044, + 0.0015207449905574322, + 0.001449243980459869, + 0.0012804584112018347 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5478515625, + "loss_eval": 1.2619048357009888, + "epoch": 16 + }, + { + "hidden_norms": [ + 229.43417358398438, + 224.83290100097656, + 218.015869140625, + 221.56915283203125, + 228.59274291992188 + ], + "bp_grad_norms_per_sample_med": [ + 3.325551369925961e-05, + 3.411810757825151e-05, + 3.506721623125486e-05, + 3.451627344475128e-05, + 3.0976541893323883e-05 + ], + "bp_grad_norms_F": [ + 0.001564670237712562, + 0.0015591747360303998, + 0.0015565806534141302, + 0.001464744214899838, + 0.0012746548745781183 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5498046875, + "loss_eval": 1.2594949007034302, + "epoch": 17 + }, + { + "hidden_norms": [ + 233.65724182128906, + 228.65892028808594, + 223.14169311523438, + 227.2765350341797, + 233.75588989257812 + ], + "bp_grad_norms_per_sample_med": [ + 3.4493146813474596e-05, + 3.510132592055015e-05, + 3.669387297122739e-05, + 3.577200186555274e-05, + 3.192189251421951e-05 + ], + "bp_grad_norms_F": [ + 0.0015125939389690757, + 0.0015123466728255153, + 0.0015171029372140765, + 0.0014489478198811412, + 0.001258584321476519 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5595703125, + "loss_eval": 1.2556639909744263, + "epoch": 18 + }, + { + "hidden_norms": [ + 237.43548583984375, + 232.39987182617188, + 227.10951232910156, + 230.72291564941406, + 237.13616943359375 + ], + "bp_grad_norms_per_sample_med": [ + 3.340727198519744e-05, + 3.450348594924435e-05, + 3.5213739465689287e-05, + 3.445050970185548e-05, + 3.137766179861501e-05 + ], + "bp_grad_norms_F": [ + 0.0015336342621594667, + 0.0015343877021223307, + 0.0015299322549253702, + 0.0014644783223047853, + 0.0012699750950559974 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.2415752410888672, + "epoch": 19 + }, + { + "hidden_norms": [ + 240.3662109375, + 235.49240112304688, + 227.54061889648438, + 233.16600036621094, + 239.60838317871094 + ], + "bp_grad_norms_per_sample_med": [ + 3.387282777111977e-05, + 3.518611265462823e-05, + 3.594699956011027e-05, + 3.514933632686734e-05, + 3.159138941555284e-05 + ], + "bp_grad_norms_F": [ + 0.0015161214396357536, + 0.0015244479291141033, + 0.0015337818767875433, + 0.0014538948889821768, + 0.0012562318006530404 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.2436577081680298, + "epoch": 20 + }, + { + "hidden_norms": [ + 246.6840057373047, + 239.0929412841797, + 228.7230682373047, + 233.1182403564453, + 237.92440795898438 + ], + "bp_grad_norms_per_sample_med": [ + 3.365568773006089e-05, + 3.4782005968736485e-05, + 3.604988887673244e-05, + 3.48928188032005e-05, + 3.140935586998239e-05 + ], + "bp_grad_norms_F": [ + 0.0015826384769752622, + 0.0015907500637695193, + 0.0016004826175048947, + 0.0015078946016728878, + 0.0012762312544509768 + ], + "gamma_dfa": NaN, + "acc_eval": 0.578125, + "loss_eval": 1.2292213439941406, + "epoch": 21 + }, + { + "hidden_norms": [ + 248.95265197753906, + 241.59408569335938, + 233.2073211669922, + 236.39898681640625, + 243.02566528320312 + ], + "bp_grad_norms_per_sample_med": [ + 3.3556283597135916e-05, + 3.463738539721817e-05, + 3.5712662793230265e-05, + 3.4992117434740067e-05, + 3.1405961635755375e-05 + ], + "bp_grad_norms_F": [ + 0.0015417077811434865, + 0.0015624086372554302, + 0.00158181122969836, + 0.0014982762513682246, + 0.001269534695893526 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5712890625, + "loss_eval": 1.201985239982605, + "epoch": 22 + }, + { + "hidden_norms": [ + 250.6766815185547, + 243.67706298828125, + 236.90567016601562, + 240.1038360595703, + 244.89207458496094 + ], + "bp_grad_norms_per_sample_med": [ + 3.3543499739607796e-05, + 3.4865890484070405e-05, + 3.564134021871723e-05, + 3.4787921322276816e-05, + 3.112335252808407e-05 + ], + "bp_grad_norms_F": [ + 0.0015237597981467843, + 0.0015382410492748022, + 0.0015483599854633212, + 0.0014793339651077986, + 0.0012637422187253833 + ], + "gamma_dfa": NaN, + "acc_eval": 0.55859375, + "loss_eval": 1.2245514392852783, + "epoch": 23 + }, + { + "hidden_norms": [ + 256.1240539550781, + 248.83609008789062, + 240.2549285888672, + 243.1914825439453, + 248.11964416503906 + ], + "bp_grad_norms_per_sample_med": [ + 3.322990596643649e-05, + 3.523347186273895e-05, + 3.6828067095484585e-05, + 3.5215769457863644e-05, + 3.133456266368739e-05 + ], + "bp_grad_norms_F": [ + 0.0015543467598035932, + 0.0015818241517990828, + 0.0015992531552910805, + 0.001527936663478613, + 0.0012819069670513272 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5732421875, + "loss_eval": 1.2261133193969727, + "epoch": 24 + }, + { + "hidden_norms": [ + 256.9990234375, + 248.78497314453125, + 239.55239868164062, + 243.13818359375, + 249.48153686523438 + ], + "bp_grad_norms_per_sample_med": [ + 3.39320904458873e-05, + 3.600086711230688e-05, + 3.7119287298992276e-05, + 3.6292254662839696e-05, + 3.193991506122984e-05 + ], + "bp_grad_norms_F": [ + 0.0015332578914240003, + 0.00156042305752635, + 0.001574728754349053, + 0.0015015782555565238, + 0.0012670031283050776 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5771484375, + "loss_eval": 1.2080682516098022, + "epoch": 25 + }, + { + "hidden_norms": [ + 260.4493103027344, + 251.83595275878906, + 240.95025634765625, + 242.58055114746094, + 247.42816162109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.4877586585935205e-05, + 3.68267938029021e-05, + 3.760240360861644e-05, + 3.5770553949987516e-05, + 3.202233710908331e-05 + ], + "bp_grad_norms_F": [ + 0.0016203002305701375, + 0.0016500651836395264, + 0.0016584799159318209, + 0.0015617734752595425, + 0.00129653827752918 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5576171875, + "loss_eval": 1.2154628038406372, + "epoch": 26 + }, + { + "hidden_norms": [ + 263.1241760253906, + 253.4596405029297, + 243.6095733642578, + 245.4304656982422, + 250.32362365722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.480416853562929e-05, + 3.640647264546715e-05, + 3.738802479347214e-05, + 3.5808730899589136e-05, + 3.25721557601355e-05 + ], + "bp_grad_norms_F": [ + 0.0015986696816980839, + 0.0016261462587863207, + 0.0016554947942495346, + 0.0015633245930075645, + 0.0013003128115087748 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5634765625, + "loss_eval": 1.2160842418670654, + "epoch": 27 + }, + { + "hidden_norms": [ + 266.5273132324219, + 256.0182189941406, + 245.50253295898438, + 246.18280029296875, + 251.716064453125 + ], + "bp_grad_norms_per_sample_med": [ + 3.359848051331937e-05, + 3.572113564587198e-05, + 3.695064515341073e-05, + 3.506165376165882e-05, + 3.114769424428232e-05 + ], + "bp_grad_norms_F": [ + 0.0016088238917291164, + 0.0016375494888052344, + 0.0016567507991567254, + 0.0015764845302328467, + 0.001285399659536779 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58203125, + "loss_eval": 1.2021496295928955, + "epoch": 28 + }, + { + "hidden_norms": [ + 267.4769592285156, + 258.21368408203125, + 248.0418701171875, + 248.66949462890625, + 253.77452087402344 + ], + "bp_grad_norms_per_sample_med": [ + 3.400501736905426e-05, + 3.611011925386265e-05, + 3.7168374547036365e-05, + 3.569516775314696e-05, + 3.031879896298051e-05 + ], + "bp_grad_norms_F": [ + 0.0015880028950050473, + 0.0016197538934648037, + 0.001652923645451665, + 0.0015723761171102524, + 0.00128253607545048 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5771484375, + "loss_eval": 1.2029783725738525, + "epoch": 29 + }, + { + "hidden_norms": [ + 268.6047668457031, + 256.4200744628906, + 246.27796936035156, + 246.51229858398438, + 250.08482360839844 + ], + "bp_grad_norms_per_sample_med": [ + 3.425245813559741e-05, + 3.6405861465027556e-05, + 3.752295742742717e-05, + 3.6318160709924996e-05, + 3.103434937656857e-05 + ], + "bp_grad_norms_F": [ + 0.0017358324257656932, + 0.0017647893400862813, + 0.0017767423996701837, + 0.0016745994798839092, + 0.0013456137385219336 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5859375, + "loss_eval": 1.2118260860443115, + "epoch": 30 + }, + { + "hidden_norms": [ + 270.9348449707031, + 260.40045166015625, + 250.72512817382812, + 251.9379425048828, + 254.6614227294922 + ], + "bp_grad_norms_per_sample_med": [ + 3.491883762762882e-05, + 3.647417179308832e-05, + 3.8068057619966567e-05, + 3.653564635897055e-05, + 3.172537253703922e-05 + ], + "bp_grad_norms_F": [ + 0.0015994011191651225, + 0.0016339519061148167, + 0.0016624036943539977, + 0.0015806201845407486, + 0.0013034256407991052 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5849609375, + "loss_eval": 1.1830923557281494, + "epoch": 31 + }, + { + "hidden_norms": [ + 274.6016845703125, + 262.9326477050781, + 250.766357421875, + 252.1786346435547, + 254.2251739501953 + ], + "bp_grad_norms_per_sample_med": [ + 3.4794014936778694e-05, + 3.6746245314134285e-05, + 3.771794217755087e-05, + 3.6664638173533604e-05, + 3.1814517569728196e-05 + ], + "bp_grad_norms_F": [ + 0.0016584239201620221, + 0.0016917918110266328, + 0.001726189162582159, + 0.0016276866663247347, + 0.0013194811763241887 + ], + "gamma_dfa": NaN, + "acc_eval": 0.578125, + "loss_eval": 1.1851024627685547, + "epoch": 32 + }, + { + "hidden_norms": [ + 273.59783935546875, + 261.92218017578125, + 250.27320861816406, + 251.19146728515625, + 255.70233154296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.505383210722357e-05, + 3.6710382119053975e-05, + 3.839766577584669e-05, + 3.708387885126285e-05, + 3.1251351174432784e-05 + ], + "bp_grad_norms_F": [ + 0.0016781548038125038, + 0.0017169808270409703, + 0.0017399545758962631, + 0.0016386040952056646, + 0.0013246783055365086 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5712890625, + "loss_eval": 1.1789460182189941, + "epoch": 33 + }, + { + "hidden_norms": [ + 274.9112854003906, + 262.3539123535156, + 251.67474365234375, + 253.08824157714844, + 255.4647979736328 + ], + "bp_grad_norms_per_sample_med": [ + 3.4545508242445067e-05, + 3.622366421041079e-05, + 3.7300182157196105e-05, + 3.594972440623678e-05, + 3.1557658076053485e-05 + ], + "bp_grad_norms_F": [ + 0.001666227588430047, + 0.0016955926548689604, + 0.0017251977697014809, + 0.0016294753877446055, + 0.001327820005826652 + ], + "gamma_dfa": NaN, + "acc_eval": 0.583984375, + "loss_eval": 1.1757192611694336, + "epoch": 34 + }, + { + "hidden_norms": [ + 273.9092712402344, + 261.26507568359375, + 250.60923767089844, + 250.5943145751953, + 253.19862365722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.532320988597348e-05, + 3.7557252653641626e-05, + 3.882365126628429e-05, + 3.676790583995171e-05, + 3.2376574381487444e-05 + ], + "bp_grad_norms_F": [ + 0.001686039031483233, + 0.0017200085567310452, + 0.0017563666915521026, + 0.0016565105179324746, + 0.0013397492002695799 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1719229221343994, + "epoch": 35 + }, + { + "hidden_norms": [ + 275.9344177246094, + 265.1002502441406, + 253.2598114013672, + 253.86024475097656, + 257.8154296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.419027416384779e-05, + 3.54782423528377e-05, + 3.770734474528581e-05, + 3.707608630065806e-05, + 3.1706651498097926e-05 + ], + "bp_grad_norms_F": [ + 0.0016564616234973073, + 0.001694328966550529, + 0.001729298266582191, + 0.0016409243689849973, + 0.0013242866843938828 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.169456958770752, + "epoch": 36 + }, + { + "hidden_norms": [ + 277.0843200683594, + 263.2900390625, + 250.48553466796875, + 251.51341247558594, + 253.14413452148438 + ], + "bp_grad_norms_per_sample_med": [ + 3.5850312997354195e-05, + 3.7839381548110396e-05, + 3.925598502974026e-05, + 3.7184508983045816e-05, + 3.174091762048192e-05 + ], + "bp_grad_norms_F": [ + 0.0017717990558594465, + 0.0018099851440638304, + 0.0018417692044749856, + 0.0017209915677085519, + 0.0013732420047745109 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5869140625, + "loss_eval": 1.1764099597930908, + "epoch": 37 + }, + { + "hidden_norms": [ + 280.2084655761719, + 265.3043518066406, + 254.26673889160156, + 253.3932342529297, + 255.91488647460938 + ], + "bp_grad_norms_per_sample_med": [ + 3.4716471418505535e-05, + 3.675218249554746e-05, + 3.84828781534452e-05, + 3.653839303296991e-05, + 3.1539821065962315e-05 + ], + "bp_grad_norms_F": [ + 0.00171388138551265, + 0.0017648075008764863, + 0.00180675252340734, + 0.0016973463352769613, + 0.0013539392966777086 + ], + "gamma_dfa": NaN, + "acc_eval": 0.591796875, + "loss_eval": 1.1670037508010864, + "epoch": 38 + }, + { + "hidden_norms": [ + 278.0702209472656, + 264.4510498046875, + 250.75350952148438, + 248.73284912109375, + 253.1072540283203 + ], + "bp_grad_norms_per_sample_med": [ + 3.694290717248805e-05, + 3.843691956717521e-05, + 3.982238922617398e-05, + 3.8299614971037954e-05, + 3.253731847507879e-05 + ], + "bp_grad_norms_F": [ + 0.0017997974064201117, + 0.0018521619495004416, + 0.0018853276269510388, + 0.001754313474521041, + 0.0013789198128506541 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.168372631072998, + "epoch": 39 + }, + { + "hidden_norms": [ + 279.5745849609375, + 265.3549499511719, + 252.89109802246094, + 250.0029296875, + 251.57737731933594 + ], + "bp_grad_norms_per_sample_med": [ + 3.5274497349746525e-05, + 3.741122054634616e-05, + 3.8946731365285814e-05, + 3.7627731217071414e-05, + 3.1920495530357584e-05 + ], + "bp_grad_norms_F": [ + 0.0017959685064852238, + 0.0018515808042138815, + 0.001886399113573134, + 0.0017732164124026895, + 0.001389715587720275 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5966796875, + "loss_eval": 1.1735193729400635, + "epoch": 40 + }, + { + "hidden_norms": [ + 280.56402587890625, + 265.1068115234375, + 251.912353515625, + 248.08627319335938, + 250.21177673339844 + ], + "bp_grad_norms_per_sample_med": [ + 3.672741513582878e-05, + 3.8823065551696345e-05, + 4.041267675347626e-05, + 3.835778989014216e-05, + 3.2424144592368975e-05 + ], + "bp_grad_norms_F": [ + 0.0018404219299554825, + 0.0018969813827425241, + 0.0019448500825092196, + 0.0018052044324576855, + 0.0014045372372493148 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5966796875, + "loss_eval": 1.163725733757019, + "epoch": 41 + }, + { + "hidden_norms": [ + 281.2812194824219, + 266.5726623535156, + 253.18124389648438, + 252.3292694091797, + 254.1314697265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.6245146475266665e-05, + 3.849809218081646e-05, + 4.034954326925799e-05, + 3.857027695630677e-05, + 3.267046849941835e-05 + ], + "bp_grad_norms_F": [ + 0.0018043599557131529, + 0.0018654613522812724, + 0.0018976799910888076, + 0.0017763315699994564, + 0.0013986497651785612 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5830078125, + "loss_eval": 1.172363519668579, + "epoch": 42 + }, + { + "hidden_norms": [ + 278.3638916015625, + 264.4734802246094, + 250.60198974609375, + 248.59568786621094, + 249.39353942871094 + ], + "bp_grad_norms_per_sample_med": [ + 3.7236037314869463e-05, + 3.946686410927214e-05, + 4.103714309167117e-05, + 3.970286707044579e-05, + 3.281752287875861e-05 + ], + "bp_grad_norms_F": [ + 0.0018646781099960208, + 0.0019272645004093647, + 0.0019672266207635403, + 0.001839098404161632, + 0.0014395405305549502 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5830078125, + "loss_eval": 1.1776624917984009, + "epoch": 43 + }, + { + "hidden_norms": [ + 280.8514099121094, + 269.1718444824219, + 253.03790283203125, + 251.60220336914062, + 251.88168334960938 + ], + "bp_grad_norms_per_sample_med": [ + 3.689880759338848e-05, + 3.937961082556285e-05, + 4.092283779755235e-05, + 3.866894985549152e-05, + 3.262344398535788e-05 + ], + "bp_grad_norms_F": [ + 0.0018725661793723702, + 0.0019201217219233513, + 0.0019532060250639915, + 0.0018317755311727524, + 0.001439971849322319 + ], + "gamma_dfa": NaN, + "acc_eval": 0.595703125, + "loss_eval": 1.1693906784057617, + "epoch": 44 + }, + { + "hidden_norms": [ + 280.3335266113281, + 263.89471435546875, + 253.01638793945312, + 250.5576171875, + 251.4005889892578 + ], + "bp_grad_norms_per_sample_med": [ + 3.6666475352831185e-05, + 3.875952461385168e-05, + 4.0531358536100015e-05, + 3.9068203477654606e-05, + 3.450641088420525e-05 + ], + "bp_grad_norms_F": [ + 0.0018578553572297096, + 0.0019184533739462495, + 0.001965942559763789, + 0.0018550093518570065, + 0.0014542803401127458 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5732421875, + "loss_eval": 1.1839377880096436, + "epoch": 45 + }, + { + "hidden_norms": [ + 280.3553771972656, + 263.3617248535156, + 248.94859313964844, + 246.9832000732422, + 246.24644470214844 + ], + "bp_grad_norms_per_sample_med": [ + 3.8412734284065664e-05, + 4.001844354206696e-05, + 4.220755727146752e-05, + 4.0393635572399944e-05, + 3.391467180335894e-05 + ], + "bp_grad_norms_F": [ + 0.001917686895467341, + 0.0019766101613640785, + 0.0020170181524008512, + 0.0018900329014286399, + 0.001476101577281952 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6005859375, + "loss_eval": 1.1689397096633911, + "epoch": 46 + }, + { + "hidden_norms": [ + 278.8861389160156, + 263.3866882324219, + 249.24301147460938, + 246.43963623046875, + 246.34503173828125 + ], + "bp_grad_norms_per_sample_med": [ + 3.77853139070794e-05, + 4.044857996632345e-05, + 4.182702468824573e-05, + 4.050548523082398e-05, + 3.3606509532546625e-05 + ], + "bp_grad_norms_F": [ + 0.0019284948939457536, + 0.001992136472836137, + 0.0020461773965507746, + 0.001900508883409202, + 0.001466717105358839 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.1585946083068848, + "epoch": 47 + }, + { + "hidden_norms": [ + 279.963623046875, + 263.52496337890625, + 249.6890869140625, + 245.60646057128906, + 245.52540588378906 + ], + "bp_grad_norms_per_sample_med": [ + 3.724947964656167e-05, + 3.964625648222864e-05, + 4.1545175918145105e-05, + 3.953047780669294e-05, + 3.275729977758601e-05 + ], + "bp_grad_norms_F": [ + 0.0019616533536463976, + 0.002027863636612892, + 0.0020759752951562405, + 0.0019283785950392485, + 0.001484199776314199 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6123046875, + "loss_eval": 1.157920002937317, + "epoch": 48 + }, + { + "hidden_norms": [ + 279.7983093261719, + 263.42352294921875, + 247.6257781982422, + 244.5139923095703, + 242.93429565429688 + ], + "bp_grad_norms_per_sample_med": [ + 3.738125451491214e-05, + 4.007351162726991e-05, + 4.2600284359650686e-05, + 4.0704209823161364e-05, + 3.302833283669315e-05 + ], + "bp_grad_norms_F": [ + 0.001973477192223072, + 0.002032764023169875, + 0.0020790304988622665, + 0.0019371822709217668, + 0.0014914683997631073 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6005859375, + "loss_eval": 1.1545627117156982, + "epoch": 49 + }, + { + "hidden_norms": [ + 278.16461181640625, + 259.95208740234375, + 246.212890625, + 243.02810668945312, + 242.42227172851562 + ], + "bp_grad_norms_per_sample_med": [ + 3.896220732713118e-05, + 4.0713552152737975e-05, + 4.242185241309926e-05, + 4.1096616769209504e-05, + 3.4584638342494145e-05 + ], + "bp_grad_norms_F": [ + 0.0020273446571081877, + 0.0020888603758066893, + 0.0021337512880563736, + 0.0019914479926228523, + 0.0015125740319490433 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.1588966846466064, + "epoch": 50 + }, + { + "hidden_norms": [ + 278.74609375, + 259.810302734375, + 244.75640869140625, + 241.40191650390625, + 241.2429962158203 + ], + "bp_grad_norms_per_sample_med": [ + 4.005424489150755e-05, + 4.289989738026634e-05, + 4.383309351396747e-05, + 4.207885649520904e-05, + 3.527112494339235e-05 + ], + "bp_grad_norms_F": [ + 0.002059010788798332, + 0.002119551645591855, + 0.002172222128137946, + 0.0020189452916383743, + 0.0015335450880229473 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1555505990982056, + "epoch": 51 + }, + { + "hidden_norms": [ + 277.6565246582031, + 262.0436096191406, + 246.2357635498047, + 241.67991638183594, + 240.23500061035156 + ], + "bp_grad_norms_per_sample_med": [ + 4.1031005821423605e-05, + 4.313238605391234e-05, + 4.465782694751397e-05, + 4.2896612285403535e-05, + 3.4334370866417885e-05 + ], + "bp_grad_norms_F": [ + 0.002025892725214362, + 0.0020990471821278334, + 0.0021509609650820494, + 0.002011507283896208, + 0.0015318752266466618 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1416809558868408, + "epoch": 52 + }, + { + "hidden_norms": [ + 277.4100646972656, + 260.2519836425781, + 245.48947143554688, + 242.5662384033203, + 241.2648162841797 + ], + "bp_grad_norms_per_sample_med": [ + 3.732202821993269e-05, + 3.9125570765463635e-05, + 4.136607458349317e-05, + 3.977569213020615e-05, + 3.3676675229799e-05 + ], + "bp_grad_norms_F": [ + 0.002009452786296606, + 0.002076543401926756, + 0.002131648361682892, + 0.00199576816521585, + 0.0015338497469201684 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.143639087677002, + "epoch": 53 + }, + { + "hidden_norms": [ + 277.3269348144531, + 259.49072265625, + 243.7945098876953, + 240.342041015625, + 238.76239013671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.978172389906831e-05, + 4.20100441260729e-05, + 4.455841553863138e-05, + 4.2333795136073604e-05, + 3.435015969444066e-05 + ], + "bp_grad_norms_F": [ + 0.0020786102395504713, + 0.0021364488638937473, + 0.0021890606731176376, + 0.0020492339972406626, + 0.0015625122468918562 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6044921875, + "loss_eval": 1.1515132188796997, + "epoch": 54 + }, + { + "hidden_norms": [ + 276.1414489746094, + 257.6651306152344, + 242.12867736816406, + 238.3046875, + 235.9711151123047 + ], + "bp_grad_norms_per_sample_med": [ + 4.158447700319812e-05, + 4.40051153418608e-05, + 4.566523784887977e-05, + 4.3018761061830446e-05, + 3.456107515376061e-05 + ], + "bp_grad_norms_F": [ + 0.0021895321551710367, + 0.0022726275492459536, + 0.00232017133384943, + 0.002137792995199561, + 0.0015979791060090065 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.148828148841858, + "epoch": 55 + }, + { + "hidden_norms": [ + 276.29547119140625, + 257.9006652832031, + 242.25363159179688, + 237.8865966796875, + 235.57620239257812 + ], + "bp_grad_norms_per_sample_med": [ + 3.9041460695443675e-05, + 4.0436327253701165e-05, + 4.2260016925865784e-05, + 4.071593502885662e-05, + 3.461613232502714e-05 + ], + "bp_grad_norms_F": [ + 0.0021726686973124743, + 0.002256714040413499, + 0.0023172625806182623, + 0.0021478317212313414, + 0.0016112272860482335 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.165194034576416, + "epoch": 56 + }, + { + "hidden_norms": [ + 274.73480224609375, + 257.3844909667969, + 239.9276580810547, + 236.4628448486328, + 232.49490356445312 + ], + "bp_grad_norms_per_sample_med": [ + 4.182914926786907e-05, + 4.482160511543043e-05, + 4.732825618702918e-05, + 4.5475029764929786e-05, + 3.673886021715589e-05 + ], + "bp_grad_norms_F": [ + 0.002222857205197215, + 0.0022976247128099203, + 0.002366685541346669, + 0.002194431144744158, + 0.0016426561633124948 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.150635004043579, + "epoch": 57 + }, + { + "hidden_norms": [ + 273.9837341308594, + 255.2301025390625, + 239.6470184326172, + 235.07806396484375, + 232.15016174316406 + ], + "bp_grad_norms_per_sample_med": [ + 4.28417552029714e-05, + 4.5315191528061405e-05, + 4.770928717334755e-05, + 4.653819996747188e-05, + 3.727963485289365e-05 + ], + "bp_grad_norms_F": [ + 0.002205377910286188, + 0.00228099524974823, + 0.002334901597350836, + 0.0021908036433160305, + 0.001635397202335298 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6064453125, + "loss_eval": 1.150489330291748, + "epoch": 58 + }, + { + "hidden_norms": [ + 273.4665222167969, + 255.21783447265625, + 238.12306213378906, + 232.99537658691406, + 229.35629272460938 + ], + "bp_grad_norms_per_sample_med": [ + 4.174295099801384e-05, + 4.412833004607819e-05, + 4.589854142977856e-05, + 4.366271969047375e-05, + 3.4910473914351314e-05 + ], + "bp_grad_norms_F": [ + 0.0022425123024731874, + 0.002337042009457946, + 0.0024111224338412285, + 0.002237174427136779, + 0.0016597777139395475 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1445674896240234, + "epoch": 59 + }, + { + "hidden_norms": [ + 272.8526306152344, + 254.31373596191406, + 238.0008087158203, + 233.6641082763672, + 229.88113403320312 + ], + "bp_grad_norms_per_sample_med": [ + 4.274978709872812e-05, + 4.589447416947223e-05, + 4.8100573621923104e-05, + 4.519677167991176e-05, + 3.628300692071207e-05 + ], + "bp_grad_norms_F": [ + 0.0022435274440795183, + 0.0023362115025520325, + 0.0024012199137359858, + 0.00223422609269619, + 0.0016617706278339028 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1417796611785889, + "epoch": 60 + }, + { + "hidden_norms": [ + 272.5745849609375, + 253.39877319335938, + 236.8953094482422, + 231.5461883544922, + 227.8491668701172 + ], + "bp_grad_norms_per_sample_med": [ + 4.257826367393136e-05, + 4.485245153773576e-05, + 4.667421308113262e-05, + 4.5228414819575846e-05, + 3.560770346666686e-05 + ], + "bp_grad_norms_F": [ + 0.0022986247204244137, + 0.002396916039288044, + 0.0024696297477930784, + 0.0022973858285695314, + 0.0016907128738239408 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6044921875, + "loss_eval": 1.1428865194320679, + "epoch": 61 + }, + { + "hidden_norms": [ + 269.6819763183594, + 250.9730682373047, + 234.21188354492188, + 228.83775329589844, + 224.82958984375 + ], + "bp_grad_norms_per_sample_med": [ + 4.29281426477246e-05, + 4.5681605115532875e-05, + 4.7611269110348076e-05, + 4.553339022095315e-05, + 3.683664544951171e-05 + ], + "bp_grad_norms_F": [ + 0.0023400019854307175, + 0.002444769022986293, + 0.0025141045916825533, + 0.002344615990296006, + 0.0017126062884926796 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1239444017410278, + "epoch": 62 + }, + { + "hidden_norms": [ + 269.7929992675781, + 250.5220947265625, + 233.3997802734375, + 228.2130584716797, + 224.5063018798828 + ], + "bp_grad_norms_per_sample_med": [ + 4.4715372496284544e-05, + 4.6482971811201423e-05, + 4.9765483709052205e-05, + 4.759176226798445e-05, + 3.8208585465326905e-05 + ], + "bp_grad_norms_F": [ + 0.0023639060091227293, + 0.002476333873346448, + 0.0025423571933060884, + 0.00236364989541471, + 0.0017294714925810695 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6162109375, + "loss_eval": 1.1502506732940674, + "epoch": 63 + }, + { + "hidden_norms": [ + 269.24493408203125, + 251.6195831298828, + 234.21717834472656, + 228.9242401123047, + 224.33628845214844 + ], + "bp_grad_norms_per_sample_med": [ + 4.4276617700234056e-05, + 4.620026084012352e-05, + 4.972432361682877e-05, + 4.657481986214407e-05, + 3.729217132786289e-05 + ], + "bp_grad_norms_F": [ + 0.0023896305356174707, + 0.002498477231711149, + 0.0025652945041656494, + 0.002390124835073948, + 0.0017562232678756118 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.146531581878662, + "epoch": 64 + }, + { + "hidden_norms": [ + 268.0794982910156, + 250.7041778564453, + 233.16966247558594, + 227.9508056640625, + 223.48045349121094 + ], + "bp_grad_norms_per_sample_med": [ + 4.518003697739914e-05, + 4.807085497304797e-05, + 5.077984678791836e-05, + 4.9026388296624646e-05, + 3.8487425626954064e-05 + ], + "bp_grad_norms_F": [ + 0.0023859951179474592, + 0.002494273241609335, + 0.0025624327827244997, + 0.0023940331302583218, + 0.0017616016557440162 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1454447507858276, + "epoch": 65 + }, + { + "hidden_norms": [ + 267.8343811035156, + 247.6757049560547, + 231.40367126464844, + 225.93670654296875, + 220.4804229736328 + ], + "bp_grad_norms_per_sample_med": [ + 4.405072468216531e-05, + 4.688911576522514e-05, + 4.961229205946438e-05, + 4.743603858514689e-05, + 3.724359339685179e-05 + ], + "bp_grad_norms_F": [ + 0.002465154742822051, + 0.0025785581674426794, + 0.002648484194651246, + 0.0024633395951241255, + 0.0017954027280211449 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.165484070777893, + "epoch": 66 + }, + { + "hidden_norms": [ + 267.8901062011719, + 248.67857360839844, + 231.63746643066406, + 225.49383544921875, + 220.6399383544922 + ], + "bp_grad_norms_per_sample_med": [ + 4.755932604894042e-05, + 4.9960097385337576e-05, + 5.191187665332109e-05, + 4.949339563609101e-05, + 3.946756987716071e-05 + ], + "bp_grad_norms_F": [ + 0.0024303828831762075, + 0.0025356977712363005, + 0.002610789379104972, + 0.00243638688698411, + 0.0017875435296446085 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1472151279449463, + "epoch": 67 + }, + { + "hidden_norms": [ + 267.3486022949219, + 247.69305419921875, + 229.9873504638672, + 223.6610870361328, + 218.91578674316406 + ], + "bp_grad_norms_per_sample_med": [ + 4.743155659525655e-05, + 5.06583419337403e-05, + 5.422766844276339e-05, + 5.0596820074133575e-05, + 3.959470632253215e-05 + ], + "bp_grad_norms_F": [ + 0.0025001303292810917, + 0.0026160534471273422, + 0.002682509133592248, + 0.002501503797248006, + 0.0018251334549859166 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.157745599746704, + "epoch": 68 + }, + { + "hidden_norms": [ + 266.2055969238281, + 246.88201904296875, + 229.0934295654297, + 223.09255981445312, + 217.90614318847656 + ], + "bp_grad_norms_per_sample_med": [ + 4.6090037358226255e-05, + 4.8821068048710003e-05, + 5.145218892721459e-05, + 4.892798824585043e-05, + 3.874724279739894e-05 + ], + "bp_grad_norms_F": [ + 0.002517222659662366, + 0.00262960116378963, + 0.002704967511817813, + 0.002524228999391198, + 0.0018283555982634425 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1513168811798096, + "epoch": 69 + }, + { + "hidden_norms": [ + 263.8387451171875, + 244.32431030273438, + 227.78903198242188, + 222.13900756835938, + 216.27389526367188 + ], + "bp_grad_norms_per_sample_med": [ + 4.680602069129236e-05, + 5.040669202571735e-05, + 5.318928378983401e-05, + 4.9446778575656936e-05, + 3.913935870514251e-05 + ], + "bp_grad_norms_F": [ + 0.0025120435748249292, + 0.0026304670609533787, + 0.0027123456820845604, + 0.002537800231948495, + 0.001847997889854014 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.1497204303741455, + "epoch": 70 + }, + { + "hidden_norms": [ + 263.52716064453125, + 243.21226501464844, + 226.427001953125, + 220.67845153808594, + 214.70176696777344 + ], + "bp_grad_norms_per_sample_med": [ + 4.6976576413726434e-05, + 5.0085352995665744e-05, + 5.2343326387926936e-05, + 4.9784572183853015e-05, + 4.0186921978602186e-05 + ], + "bp_grad_norms_F": [ + 0.0026124012656509876, + 0.0027241536881774664, + 0.002797869499772787, + 0.002603790955618024, + 0.0018792233895510435 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.153285026550293, + "epoch": 71 + }, + { + "hidden_norms": [ + 264.0121765136719, + 243.2773895263672, + 226.7365264892578, + 220.29107666015625, + 214.1591339111328 + ], + "bp_grad_norms_per_sample_med": [ + 4.6254041080828756e-05, + 4.949727008352056e-05, + 5.206605055718683e-05, + 5.012763722334057e-05, + 3.8815273001091555e-05 + ], + "bp_grad_norms_F": [ + 0.0026143237482756376, + 0.0027275518514215946, + 0.0028062777128070593, + 0.002607470378279686, + 0.0018867084290832281 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1514866352081299, + "epoch": 72 + }, + { + "hidden_norms": [ + 263.4013671875, + 243.0095672607422, + 225.4296112060547, + 219.55067443847656, + 213.40794372558594 + ], + "bp_grad_norms_per_sample_med": [ + 4.8506815801374614e-05, + 5.151949153514579e-05, + 5.5085791245801374e-05, + 5.175785190658644e-05, + 4.0316641388926655e-05 + ], + "bp_grad_norms_F": [ + 0.002606831956654787, + 0.002728143008425832, + 0.0028109808918088675, + 0.0026184367015957832, + 0.0018970600795000792 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1346663236618042, + "epoch": 73 + }, + { + "hidden_norms": [ + 262.27703857421875, + 242.7241668701172, + 224.5229949951172, + 218.4025115966797, + 212.19247436523438 + ], + "bp_grad_norms_per_sample_med": [ + 4.704251477960497e-05, + 5.0965834816452116e-05, + 5.3327348723541945e-05, + 5.0449500122340396e-05, + 4.0479797462467104e-05 + ], + "bp_grad_norms_F": [ + 0.0026277368888258934, + 0.0027542279567569494, + 0.00283243996091187, + 0.00264621595852077, + 0.0019058829639106989 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.137591004371643, + "epoch": 74 + }, + { + "hidden_norms": [ + 262.1747131347656, + 241.88607788085938, + 224.1046142578125, + 217.9982147216797, + 211.7519989013672 + ], + "bp_grad_norms_per_sample_med": [ + 4.847371383220889e-05, + 5.121564754517749e-05, + 5.3943567763781175e-05, + 5.087414683657698e-05, + 4.037184771732427e-05 + ], + "bp_grad_norms_F": [ + 0.0026811074931174517, + 0.002809705911204219, + 0.002887698821723461, + 0.002692745067179203, + 0.0019356919219717383 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1538643836975098, + "epoch": 75 + }, + { + "hidden_norms": [ + 261.7838439941406, + 239.75706481933594, + 222.1133575439453, + 216.12124633789062, + 210.44593811035156 + ], + "bp_grad_norms_per_sample_med": [ + 4.8369467549491674e-05, + 5.07068180013448e-05, + 5.281560879666358e-05, + 5.086012970423326e-05, + 4.062180232722312e-05 + ], + "bp_grad_norms_F": [ + 0.0027064597234129906, + 0.0028339733835309744, + 0.0029109998140484095, + 0.002717787167057395, + 0.0019469966646283865 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1476709842681885, + "epoch": 76 + }, + { + "hidden_norms": [ + 260.708251953125, + 239.65792846679688, + 222.502197265625, + 216.31419372558594, + 210.15716552734375 + ], + "bp_grad_norms_per_sample_med": [ + 4.919906132272445e-05, + 5.164166941540316e-05, + 5.366719051380642e-05, + 5.108323966851458e-05, + 4.000464832643047e-05 + ], + "bp_grad_norms_F": [ + 0.002715736860409379, + 0.0028464714996516705, + 0.0029330456163734198, + 0.0027443754952400923, + 0.001961463363841176 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1511735916137695, + "epoch": 77 + }, + { + "hidden_norms": [ + 260.4088439941406, + 239.9808349609375, + 222.2389373779297, + 215.33692932128906, + 208.58534240722656 + ], + "bp_grad_norms_per_sample_med": [ + 4.8405916459159926e-05, + 5.163977766642347e-05, + 5.34093014721293e-05, + 5.167788185644895e-05, + 4.020798587589525e-05 + ], + "bp_grad_norms_F": [ + 0.0027501434087753296, + 0.0028795108664780855, + 0.0029617082327604294, + 0.002769613405689597, + 0.001984042814001441 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1523363590240479, + "epoch": 78 + }, + { + "hidden_norms": [ + 259.8567199707031, + 238.8525848388672, + 221.2687225341797, + 213.9132537841797, + 207.3290557861328 + ], + "bp_grad_norms_per_sample_med": [ + 4.8219208110822365e-05, + 5.1672555855475366e-05, + 5.364803655538708e-05, + 5.1243885536678135e-05, + 4.079756035935134e-05 + ], + "bp_grad_norms_F": [ + 0.0028046013321727514, + 0.002939376747235656, + 0.0030214993748813868, + 0.002813557395711541, + 0.0019953204318881035 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1514203548431396, + "epoch": 79 + }, + { + "hidden_norms": [ + 259.52423095703125, + 238.27757263183594, + 219.9165802001953, + 213.4214324951172, + 206.20606994628906 + ], + "bp_grad_norms_per_sample_med": [ + 4.8479021643288434e-05, + 5.219021113589406e-05, + 5.5094871640903875e-05, + 5.1899030950153247e-05, + 4.124108454561792e-05 + ], + "bp_grad_norms_F": [ + 0.0028202880639582872, + 0.002952422248199582, + 0.0030410154722630978, + 0.002832787809893489, + 0.0020088190212845802 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1545820236206055, + "epoch": 80 + }, + { + "hidden_norms": [ + 258.1958923339844, + 237.08778381347656, + 219.2870635986328, + 212.87725830078125, + 205.84408569335938 + ], + "bp_grad_norms_per_sample_med": [ + 5.005837374483235e-05, + 5.344217424863018e-05, + 5.582463927567005e-05, + 5.345495083020069e-05, + 4.113194518140517e-05 + ], + "bp_grad_norms_F": [ + 0.0028330644126981497, + 0.002965509658679366, + 0.0030466399621218443, + 0.00284536718390882, + 0.0020232615061104298 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6220703125, + "loss_eval": 1.1552448272705078, + "epoch": 81 + }, + { + "hidden_norms": [ + 258.44268798828125, + 236.90562438964844, + 218.65948486328125, + 212.63186645507812, + 204.90692138671875 + ], + "bp_grad_norms_per_sample_med": [ + 4.896440077573061e-05, + 5.1820486987708136e-05, + 5.4638629080727696e-05, + 5.3578904044115916e-05, + 4.117973367101513e-05 + ], + "bp_grad_norms_F": [ + 0.002839416265487671, + 0.0029778846073895693, + 0.003062452422454953, + 0.002849552081897855, + 0.0020236214622855186 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1515182256698608, + "epoch": 82 + }, + { + "hidden_norms": [ + 258.24615478515625, + 236.87181091308594, + 219.06484985351562, + 213.2528076171875, + 205.03671264648438 + ], + "bp_grad_norms_per_sample_med": [ + 4.8622885515214875e-05, + 5.181535379961133e-05, + 5.509376205736771e-05, + 5.2298331866040826e-05, + 4.074195385328494e-05 + ], + "bp_grad_norms_F": [ + 0.002838765038177371, + 0.00297414674423635, + 0.003058358561247587, + 0.0028491863049566746, + 0.0020313323475420475 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1609394550323486, + "epoch": 83 + }, + { + "hidden_norms": [ + 257.9989929199219, + 236.4859161376953, + 218.73072814941406, + 212.0786895751953, + 204.2919464111328 + ], + "bp_grad_norms_per_sample_med": [ + 5.0208276661578566e-05, + 5.2276191127020866e-05, + 5.509322727448307e-05, + 5.315374437486753e-05, + 4.122377504245378e-05 + ], + "bp_grad_norms_F": [ + 0.0028634185437113047, + 0.0029970910400152206, + 0.0030890253838151693, + 0.002881886437535286, + 0.0020408176351338625 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.1592046022415161, + "epoch": 84 + }, + { + "hidden_norms": [ + 257.24053955078125, + 235.7548065185547, + 217.84329223632812, + 211.033935546875, + 203.8216094970703 + ], + "bp_grad_norms_per_sample_med": [ + 5.0660164561122656e-05, + 5.414208135334775e-05, + 5.5454143875977024e-05, + 5.3000938351033255e-05, + 4.292939411243424e-05 + ], + "bp_grad_norms_F": [ + 0.0028948886319994926, + 0.003031315514817834, + 0.0031204961705952883, + 0.002907233312726021, + 0.0020496752113103867 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1583250761032104, + "epoch": 85 + }, + { + "hidden_norms": [ + 256.78289794921875, + 235.2476348876953, + 217.21603393554688, + 210.80035400390625, + 203.15478515625 + ], + "bp_grad_norms_per_sample_med": [ + 4.9510348617332056e-05, + 5.1982155127916485e-05, + 5.440499808173627e-05, + 5.1704166253330186e-05, + 4.0308059396920726e-05 + ], + "bp_grad_norms_F": [ + 0.0028964560478925705, + 0.0030334230978041887, + 0.0031210912857204676, + 0.002908239373937249, + 0.0020543786231428385 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1597179174423218, + "epoch": 86 + }, + { + "hidden_norms": [ + 256.531982421875, + 235.45941162109375, + 217.1429443359375, + 210.1690673828125, + 202.77899169921875 + ], + "bp_grad_norms_per_sample_med": [ + 4.943124076817185e-05, + 5.149367279955186e-05, + 5.385246913647279e-05, + 5.262702325126156e-05, + 4.104706385987811e-05 + ], + "bp_grad_norms_F": [ + 0.0029305708594620228, + 0.0030687344260513783, + 0.003160761669278145, + 0.002940374892205, + 0.0020649591460824013 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6220703125, + "loss_eval": 1.161116600036621, + "epoch": 87 + }, + { + "hidden_norms": [ + 256.3059387207031, + 235.24874877929688, + 217.37142944335938, + 210.53717041015625, + 203.14259338378906 + ], + "bp_grad_norms_per_sample_med": [ + 4.934536627843045e-05, + 5.2089759265072644e-05, + 5.424721530289389e-05, + 5.292960850056261e-05, + 4.041651845909655e-05 + ], + "bp_grad_norms_F": [ + 0.002913407515734434, + 0.0030489542987197638, + 0.003135726321488619, + 0.002922008978202939, + 0.002062067622318864 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.155902624130249, + "epoch": 88 + }, + { + "hidden_norms": [ + 256.7462463378906, + 235.3153839111328, + 216.87977600097656, + 210.572509765625, + 202.77845764160156 + ], + "bp_grad_norms_per_sample_med": [ + 4.990033630747348e-05, + 5.337029870133847e-05, + 5.522817809833214e-05, + 5.3465773817151785e-05, + 4.164372876402922e-05 + ], + "bp_grad_norms_F": [ + 0.0029192205984145403, + 0.0030557813588529825, + 0.003147577866911888, + 0.0029307191725820303, + 0.0020654413383454084 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6162109375, + "loss_eval": 1.1561503410339355, + "epoch": 89 + }, + { + "hidden_norms": [ + 256.68145751953125, + 234.77310180664062, + 216.7720947265625, + 209.664794921875, + 202.22833251953125 + ], + "bp_grad_norms_per_sample_med": [ + 4.9965801736107096e-05, + 5.341583164408803e-05, + 5.593279274762608e-05, + 5.420796514954418e-05, + 4.210533734294586e-05 + ], + "bp_grad_norms_F": [ + 0.002943370258435607, + 0.00308181531727314, + 0.003169203409925103, + 0.002951863221824169, + 0.0020759364124387503 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1583542823791504, + "epoch": 90 + }, + { + "hidden_norms": [ + 256.4252014160156, + 234.56448364257812, + 216.34176635742188, + 209.5242156982422, + 201.7559356689453 + ], + "bp_grad_norms_per_sample_med": [ + 4.9815931561170146e-05, + 5.2233976020943373e-05, + 5.5747830629115924e-05, + 5.41718618478626e-05, + 4.169955354882404e-05 + ], + "bp_grad_norms_F": [ + 0.0029554881621152163, + 0.0030950764194130898, + 0.0031847492791712284, + 0.0029650654178112745, + 0.002081435639411211 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.159005045890808, + "epoch": 91 + }, + { + "hidden_norms": [ + 256.15167236328125, + 234.47537231445312, + 216.2799072265625, + 209.95578002929688, + 201.94126892089844 + ], + "bp_grad_norms_per_sample_med": [ + 5.007637446396984e-05, + 5.260824036668055e-05, + 5.540058555197902e-05, + 5.322153810993768e-05, + 4.1122035327134654e-05 + ], + "bp_grad_norms_F": [ + 0.002944375155493617, + 0.00308293872512877, + 0.003174267942085862, + 0.0029555640649050474, + 0.0020777545869350433 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.1595215797424316, + "epoch": 92 + }, + { + "hidden_norms": [ + 256.1369934082031, + 234.51614379882812, + 216.30044555664062, + 209.4623565673828, + 201.70799255371094 + ], + "bp_grad_norms_per_sample_med": [ + 5.048588718636893e-05, + 5.3128016588743776e-05, + 5.624579353025183e-05, + 5.411298116086982e-05, + 4.109516885364428e-05 + ], + "bp_grad_norms_F": [ + 0.0029427227564156055, + 0.0030841128900647163, + 0.003178349928930402, + 0.0029583934228867292, + 0.002080487785860896 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1565905809402466, + "epoch": 93 + }, + { + "hidden_norms": [ + 255.9738311767578, + 234.28948974609375, + 216.3280029296875, + 209.589111328125, + 201.76205444335938 + ], + "bp_grad_norms_per_sample_med": [ + 5.070818224339746e-05, + 5.330924614099786e-05, + 5.596653136308305e-05, + 5.407314529293217e-05, + 4.100686783203855e-05 + ], + "bp_grad_norms_F": [ + 0.0029472638852894306, + 0.003088710131123662, + 0.0031828396022319794, + 0.0029631764627993107, + 0.0020829145796597004 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1584088802337646, + "epoch": 94 + }, + { + "hidden_norms": [ + 255.89332580566406, + 234.19253540039062, + 216.33103942871094, + 209.45057678222656, + 201.54258728027344 + ], + "bp_grad_norms_per_sample_med": [ + 5.041498661739752e-05, + 5.279783727019094e-05, + 5.5226330005098134e-05, + 5.407658318290487e-05, + 4.1154507925966755e-05 + ], + "bp_grad_norms_F": [ + 0.002949801040813327, + 0.00309200631454587, + 0.0031869453378021717, + 0.0029658437706530094, + 0.002085147425532341 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.158942699432373, + "epoch": 95 + }, + { + "hidden_norms": [ + 255.63841247558594, + 234.11630249023438, + 216.2378692626953, + 209.49703979492188, + 201.46917724609375 + ], + "bp_grad_norms_per_sample_med": [ + 5.020374737796374e-05, + 5.243354826234281e-05, + 5.587147097685374e-05, + 5.334949673851952e-05, + 4.121083111385815e-05 + ], + "bp_grad_norms_F": [ + 0.002950438065454364, + 0.003093136241659522, + 0.0031878354493528605, + 0.0029664800968021154, + 0.0020843464881181717 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.1582318544387817, + "epoch": 96 + }, + { + "hidden_norms": [ + 255.8027801513672, + 234.07070922851562, + 216.1463623046875, + 209.4476318359375, + 201.27279663085938 + ], + "bp_grad_norms_per_sample_med": [ + 5.0307549827266484e-05, + 5.278814569464885e-05, + 5.604944453807548e-05, + 5.306081584421918e-05, + 4.1182753193425015e-05 + ], + "bp_grad_norms_F": [ + 0.002952505135908723, + 0.003095670836046338, + 0.0031897351145744324, + 0.00296790711581707, + 0.002085329731926322 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.15840482711792, + "epoch": 97 + }, + { + "hidden_norms": [ + 255.60986328125, + 234.11065673828125, + 216.12860107421875, + 209.42921447753906, + 201.28346252441406 + ], + "bp_grad_norms_per_sample_med": [ + 5.0218295655213296e-05, + 5.269264511298388e-05, + 5.5988577514654025e-05, + 5.322946162777953e-05, + 4.136392453801818e-05 + ], + "bp_grad_norms_F": [ + 0.002954497467726469, + 0.003097717184573412, + 0.0031918887980282307, + 0.002969518303871155, + 0.00208606431260705 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1585593223571777, + "epoch": 98 + }, + { + "hidden_norms": [ + 255.57244873046875, + 234.11569213867188, + 216.13626098632812, + 209.40383911132812, + 201.28627014160156 + ], + "bp_grad_norms_per_sample_med": [ + 5.005559796700254e-05, + 5.2759678510483354e-05, + 5.5868193157948554e-05, + 5.3356721764430404e-05, + 4.125368650420569e-05 + ], + "bp_grad_norms_F": [ + 0.0029547216836363077, + 0.00309770368039608, + 0.003191797062754631, + 0.0029695071280002594, + 0.0020862380042672157 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1585021018981934, + "epoch": 99 + }, + { + "hidden_norms": [ + 255.5677947998047, + 234.11875915527344, + 216.1315460205078, + 209.4070281982422, + 201.2687530517578 + ], + "bp_grad_norms_per_sample_med": [ + 5.006368883186951e-05, + 5.279530887492001e-05, + 5.585233884630725e-05, + 5.334027810022235e-05, + 4.123226608498953e-05 + ], + "bp_grad_norms_F": [ + 0.002954971743747592, + 0.0030978918075561523, + 0.003191987983882427, + 0.002969692926853895, + 0.002086336025968194 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1584858894348145, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009977436857298017, + 0.000992251792922616, + 0.0009848480112850666, + 0.0009761073160916567, + 0.0009735578205436468 + ], + "bp_grad_norms_F": [ + 0.035340383648872375, + 0.03499162197113037, + 0.03454425558447838, + 0.034113530069589615, + 0.033874060958623886 + ], + "gamma_dfa": 0.006830460682976991, + "acc_eval": 0.095703125, + "loss_eval": 2.486203908920288, + "epoch": 0 + }, + { + "hidden_norms": [ + 861.2440185546875, + 2373.370849609375, + 4675.99951171875, + 6090.40869140625, + 6962.984375 + ], + "bp_grad_norms_per_sample_med": [ + 2.380779051236459e-06, + 1.3197138741816161e-06, + 1.3154849511920474e-06, + 1.3285966815601569e-06, + 1.3258621720524388e-06 + ], + "bp_grad_norms_F": [ + 0.0001391920231981203, + 6.988063250901178e-05, + 6.874280370539054e-05, + 6.720778765156865e-05, + 6.707101420033723e-05 + ], + "gamma_dfa": 0.10659917898010463, + "acc_eval": 0.3037109375, + "loss_eval": 1.9665180444717407, + "epoch": 1 + }, + { + "hidden_norms": [ + 1679.144775390625, + 8850.173828125, + 31676.23046875, + 40712.2109375, + 45375.55859375 + ], + "bp_grad_norms_per_sample_med": [ + 1.1123192962259054e-06, + 2.7329409135745664e-07, + 2.7436919936008053e-07, + 2.75225175982996e-07, + 2.744452558545163e-07 + ], + "bp_grad_norms_F": [ + 7.363831537077203e-05, + 2.2035641450202093e-05, + 1.9731569409486838e-05, + 1.9022963897441514e-05, + 1.7921549442689866e-05 + ], + "gamma_dfa": 0.10788296448299661, + "acc_eval": 0.29296875, + "loss_eval": 1.972828984260559, + "epoch": 2 + }, + { + "hidden_norms": [ + 2530.16015625, + 21436.486328125, + 88828.296875, + 114079.484375, + 124374.78125 + ], + "bp_grad_norms_per_sample_med": [ + 8.110604312605574e-07, + 1.1556701196013819e-07, + 1.1451407289087001e-07, + 1.1523399479074214e-07, + 1.1543902900257308e-07 + ], + "bp_grad_norms_F": [ + 0.00011594755778787658, + 1.8132053810404614e-05, + 1.1369732419552747e-05, + 8.215727575588971e-06, + 7.219489361887099e-06 + ], + "gamma_dfa": 0.1084698709892109, + "acc_eval": 0.318359375, + "loss_eval": 1.9430747032165527, + "epoch": 3 + }, + { + "hidden_norms": [ + 3363.359375, + 41233.19921875, + 182355.03125, + 240225.46875, + 257539.390625 + ], + "bp_grad_norms_per_sample_med": [ + 6.176944111757621e-07, + 6.474806468759198e-08, + 6.307719502274267e-08, + 6.379124783961743e-08, + 6.374663996666641e-08 + ], + "bp_grad_norms_F": [ + 3.5978406231151894e-05, + 4.323610028222902e-06, + 3.5177260997443227e-06, + 3.4877305097325006e-06, + 3.479522774796351e-06 + ], + "gamma_dfa": 0.10987455540453084, + "acc_eval": 0.3173828125, + "loss_eval": 1.959622859954834, + "epoch": 4 + }, + { + "hidden_norms": [ + 4170.119140625, + 70935.8515625, + 335571.09375, + 441693.5625, + 469995.8125 + ], + "bp_grad_norms_per_sample_med": [ + 4.856212285631045e-07, + 4.0158354863706336e-08, + 3.8916198263905244e-08, + 3.9119736783277403e-08, + 3.916203894505088e-08 + ], + "bp_grad_norms_F": [ + 2.611691706988495e-05, + 2.208936621173052e-06, + 1.6750394706832594e-06, + 1.6634863868603134e-06, + 1.659758027017233e-06 + ], + "gamma_dfa": 0.1083616423420608, + "acc_eval": 0.3017578125, + "loss_eval": 1.932759165763855, + "epoch": 5 + }, + { + "hidden_norms": [ + 5013.92236328125, + 106898.6171875, + 530492.6875, + 719779.5, + 763058.3125 + ], + "bp_grad_norms_per_sample_med": [ + 4.242272950705228e-07, + 2.814423716301917e-08, + 2.683668043346188e-08, + 2.6872848835068908e-08, + 2.6873932412740942e-08 + ], + "bp_grad_norms_F": [ + 2.2560918296221644e-05, + 1.2798993793694535e-06, + 1.0339434766137856e-06, + 1.0326252777304035e-06, + 1.030524344969308e-06 + ], + "gamma_dfa": 0.11125951120629907, + "acc_eval": 0.3095703125, + "loss_eval": 1.9531997442245483, + "epoch": 6 + }, + { + "hidden_norms": [ + 5811.36279296875, + 156264.234375, + 809496.6875, + 1104418.875, + 1163013.625 + ], + "bp_grad_norms_per_sample_med": [ + 3.5694648659045924e-07, + 2.0201103012595922e-08, + 1.89678583950581e-08, + 1.8967025283700423e-08, + 1.8932304612917505e-08 + ], + "bp_grad_norms_F": [ + 1.9050115952268243e-05, + 9.341621307612513e-07, + 6.890153372296481e-07, + 6.891143584653037e-07, + 6.886222649882257e-07 + ], + "gamma_dfa": 0.11049338441807777, + "acc_eval": 0.3076171875, + "loss_eval": 1.9362893104553223, + "epoch": 7 + }, + { + "hidden_norms": [ + 6660.841796875, + 217521.65625, + 1158874.5, + 1615614.625, + 1694436.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.212987280676316e-07, + 1.5324568281016582e-08, + 1.4045938634410504e-08, + 1.4053354924215e-08, + 1.4027999206689401e-08 + ], + "bp_grad_norms_F": [ + 1.7352898794342764e-05, + 6.539408445860317e-07, + 5.044145154897706e-07, + 5.047700142313261e-07, + 5.048477760283276e-07 + ], + "gamma_dfa": 0.11245601065456867, + "acc_eval": 0.2978515625, + "loss_eval": 1.9441646337509155, + "epoch": 8 + }, + { + "hidden_norms": [ + 7480.24169921875, + 295557.40625, + 1585967.0, + 2246827.75, + 2356427.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.889860297727864e-07, + 1.193609300287335e-08, + 1.1067995409064224e-08, + 1.103960478587851e-08, + 1.1055576010221557e-08 + ], + "bp_grad_norms_F": [ + 1.5521236491622403e-05, + 4.5597263920171827e-07, + 3.8742672359148855e-07, + 3.8764648024880444e-07, + 3.877208314406744e-07 + ], + "gamma_dfa": 0.11317481694277376, + "acc_eval": 0.30078125, + "loss_eval": 1.9356626272201538, + "epoch": 9 + }, + { + "hidden_norms": [ + 8273.8408203125, + 388312.4375, + 2104540.5, + 3043837.75, + 3180222.75 + ], + "bp_grad_norms_per_sample_med": [ + 2.619119925384439e-07, + 9.19370091168048e-09, + 8.51864179196582e-09, + 8.482276214749618e-09, + 8.476813917468462e-09 + ], + "bp_grad_norms_F": [ + 1.4210399967851117e-05, + 3.5443522961031704e-07, + 3.0404962103602884e-07, + 3.0431687036980293e-07, + 3.0445681886703824e-07 + ], + "gamma_dfa": 0.11495429277420044, + "acc_eval": 0.30859375, + "loss_eval": 1.936495304107666, + "epoch": 10 + }, + { + "hidden_norms": [ + 9086.7265625, + 501434.3125, + 2767834.0, + 4046107.75, + 4214970.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.471596189934644e-07, + 7.524303846651037e-09, + 7.025830139895106e-09, + 7.019247405537499e-09, + 7.011437208603866e-09 + ], + "bp_grad_norms_F": [ + 1.3406845027930103e-05, + 4.39807990915142e-07, + 2.471441860052437e-07, + 2.474318421263888e-07, + 2.475488827258232e-07 + ], + "gamma_dfa": 0.11651878873817623, + "acc_eval": 0.30859375, + "loss_eval": 1.9542189836502075, + "epoch": 11 + }, + { + "hidden_norms": [ + 9854.2626953125, + 612623.625, + 3485830.25, + 5139234.5, + 5346583.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.3279393701614026e-07, + 6.378383154981293e-09, + 5.839252636974379e-09, + 5.8299334249056756e-09, + 5.825462778830115e-09 + ], + "bp_grad_norms_F": [ + 1.2396733836794738e-05, + 2.516441668376501e-07, + 2.0780194631697668e-07, + 2.0795941679807584e-07, + 2.080748373600727e-07 + ], + "gamma_dfa": 0.11470737145282328, + "acc_eval": 0.3046875, + "loss_eval": 1.9374217987060547, + "epoch": 12 + }, + { + "hidden_norms": [ + 10653.666015625, + 745430.125, + 4325399.0, + 6434218.5, + 6688000.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.1187355514484807e-07, + 5.294193083926757e-09, + 4.98529528769609e-09, + 4.991081326011226e-09, + 4.989251234377434e-09 + ], + "bp_grad_norms_F": [ + 1.1210328011657111e-05, + 2.000140426616781e-07, + 1.7647043648594263e-07, + 1.7654315342952032e-07, + 1.7665543339262513e-07 + ], + "gamma_dfa": 0.11383607180323452, + "acc_eval": 0.291015625, + "loss_eval": 1.9233126640319824, + "epoch": 13 + }, + { + "hidden_norms": [ + 11404.5263671875, + 893037.0625, + 5298411.0, + 7870617.0, + 8170729.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.9957101926593168e-07, + 4.642851436642559e-09, + 4.288450483613815e-09, + 4.285100718703916e-09, + 4.289933297485504e-09 + ], + "bp_grad_norms_F": [ + 1.0866175216506235e-05, + 1.758858729772328e-07, + 1.538420519864303e-07, + 1.5386244456294662e-07, + 1.5397839092656795e-07 + ], + "gamma_dfa": 0.1139617893495597, + "acc_eval": 0.30859375, + "loss_eval": 1.932279109954834, + "epoch": 14 + }, + { + "hidden_norms": [ + 12171.2412109375, + 1062066.875, + 6388639.0, + 9528923.0, + 9891447.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.9334000000981177e-07, + 4.044033108385747e-09, + 3.810601167941741e-09, + 3.801854830953744e-09, + 3.8046659156520946e-09 + ], + "bp_grad_norms_F": [ + 1.0322088201064616e-05, + 1.529211743900305e-07, + 1.350435638869385e-07, + 1.3504063645086717e-07, + 1.3514510044387862e-07 + ], + "gamma_dfa": 0.11320225725648925, + "acc_eval": 0.3193359375, + "loss_eval": 1.921454906463623, + "epoch": 15 + }, + { + "hidden_norms": [ + 12924.974609375, + 1273988.625, + 7574387.5, + 11500420.0, + 11920183.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8497563303299103e-07, + 3.6160896499382034e-09, + 3.388503477808058e-09, + 3.385580482628825e-09, + 3.3854716807724117e-09 + ], + "bp_grad_norms_F": [ + 9.76746559899766e-06, + 1.3485876593222201e-07, + 1.1896084117779537e-07, + 1.1894425000491538e-07, + 1.1903343022368063e-07 + ], + "gamma_dfa": 0.11276883230311796, + "acc_eval": 0.306640625, + "loss_eval": 1.9356281757354736, + "epoch": 16 + }, + { + "hidden_norms": [ + 13632.109375, + 1465148.75, + 8873670.0, + 13535396.0, + 14019399.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7523743167657813e-07, + 3.18161341716916e-09, + 3.0166942277531916e-09, + 3.0173783471809656e-09, + 3.0215525637089513e-09 + ], + "bp_grad_norms_F": [ + 9.427177246834617e-06, + 1.1933295240851294e-07, + 1.0663712401992598e-07, + 1.0661205607220836e-07, + 1.0669979388922002e-07 + ], + "gamma_dfa": 0.11264261469477788, + "acc_eval": 0.3203125, + "loss_eval": 1.926081657409668, + "epoch": 17 + }, + { + "hidden_norms": [ + 14394.1845703125, + 1699121.5, + 10379340.0, + 15814831.0, + 16377349.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6784264289526618e-07, + 2.8936604223872564e-09, + 2.7336535257660444e-09, + 2.7314879247342105e-09, + 2.733708148738856e-09 + ], + "bp_grad_norms_F": [ + 9.04797616385622e-06, + 1.087723191517398e-07, + 9.662341682314946e-08, + 9.658959498892727e-08, + 9.665905764677518e-08 + ], + "gamma_dfa": 0.11253939801827073, + "acc_eval": 0.3154296875, + "loss_eval": 1.922888994216919, + "epoch": 18 + }, + { + "hidden_norms": [ + 15138.509765625, + 1969752.0, + 12071423.0, + 18393228.0, + 19044056.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5837277089758572e-07, + 2.609559235366987e-09, + 2.4664128517315476e-09, + 2.4639881246457662e-09, + 2.4657431652030937e-09 + ], + "bp_grad_norms_F": [ + 8.502225682605058e-06, + 9.664965716638108e-08, + 8.704243725787819e-08, + 8.700892806245974e-08, + 8.707356613513184e-08 + ], + "gamma_dfa": 0.11155363742727786, + "acc_eval": 0.3125, + "loss_eval": 1.9243314266204834, + "epoch": 19 + }, + { + "hidden_norms": [ + 15811.982421875, + 2268261.5, + 13867645.0, + 21375086.0, + 22149420.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5073908343765652e-07, + 2.376487229227564e-09, + 2.2317030445861974e-09, + 2.2317414583028494e-09, + 2.2311954506193388e-09 + ], + "bp_grad_norms_F": [ + 8.195236659958027e-06, + 8.728681422098816e-08, + 7.846901439734211e-08, + 7.84395552955175e-08, + 7.849664029890846e-08 + ], + "gamma_dfa": 0.11315422086045146, + "acc_eval": 0.3095703125, + "loss_eval": 1.924652338027954, + "epoch": 20 + }, + { + "hidden_norms": [ + 16487.935546875, + 2556303.5, + 15702076.0, + 24321856.0, + 25185988.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.443007136003871e-07, + 2.174122659681643e-09, + 2.0514809850880056e-09, + 2.052057856971601e-09, + 2.05182382195801e-09 + ], + "bp_grad_norms_F": [ + 8.002187314559706e-06, + 8.025331510452816e-08, + 7.266314838716426e-08, + 7.2638087544874e-08, + 7.268938162496852e-08 + ], + "gamma_dfa": 0.11267373809823766, + "acc_eval": 0.310546875, + "loss_eval": 1.9348869323730469, + "epoch": 21 + }, + { + "hidden_norms": [ + 17153.216796875, + 2908610.25, + 17831918.0, + 27718528.0, + 28682196.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.43127067531168e-07, + 2.0134633960111614e-09, + 1.908325941712974e-09, + 1.9070569567958273e-09, + 1.9050578892176873e-09 + ], + "bp_grad_norms_F": [ + 7.550354439445073e-06, + 7.309487415341209e-08, + 6.660556550741603e-08, + 6.657593587533484e-08, + 6.66217090383725e-08 + ], + "gamma_dfa": 0.11266892295680009, + "acc_eval": 0.310546875, + "loss_eval": 1.9210036993026733, + "epoch": 22 + }, + { + "hidden_norms": [ + 17796.001953125, + 3236156.25, + 20246900.0, + 31494576.0, + 32571052.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3518946673229948e-07, + 1.8474217711172969e-09, + 1.7507182370479768e-09, + 1.7496273319039801e-09, + 1.7511733174657707e-09 + ], + "bp_grad_norms_F": [ + 7.284599632839672e-06, + 6.709063882226474e-08, + 6.151606157800416e-08, + 6.149030440383285e-08, + 6.153235432293513e-08 + ], + "gamma_dfa": 0.11186322406865656, + "acc_eval": 0.3115234375, + "loss_eval": 1.9283114671707153, + "epoch": 23 + }, + { + "hidden_norms": [ + 18460.63671875, + 3604280.25, + 22626418.0, + 35429216.0, + 36622356.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3137012899733236e-07, + 1.7567419741126855e-09, + 1.6593408869169934e-09, + 1.6595901319860218e-09, + 1.6608053821087765e-09 + ], + "bp_grad_norms_F": [ + 7.130098310881294e-06, + 6.264485108431472e-08, + 5.731577701340029e-08, + 5.729528851361465e-08, + 5.733248187311801e-08 + ], + "gamma_dfa": 0.11299802124267444, + "acc_eval": 0.2978515625, + "loss_eval": 1.942992925643921, + "epoch": 24 + }, + { + "hidden_norms": [ + 19115.904296875, + 4038094.25, + 25405536.0, + 39835936.0, + 41154148.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2640579427625198e-07, + 1.5953075527264104e-09, + 1.5003157605164574e-09, + 1.4991035079958692e-09, + 1.4979777418488993e-09 + ], + "bp_grad_norms_F": [ + 6.799941729696002e-06, + 5.7522207441706996e-08, + 5.297441418861126e-08, + 5.2952817242157835e-08, + 5.298943506204523e-08 + ], + "gamma_dfa": 0.11197824770351872, + "acc_eval": 0.298828125, + "loss_eval": 1.9319748878479004, + "epoch": 25 + }, + { + "hidden_norms": [ + 19780.572265625, + 4490110.5, + 28153634.0, + 44291160.0, + 45731404.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2269519800156559e-07, + 1.4798114955638653e-09, + 1.4102843337582271e-09, + 1.4097069067631196e-09, + 1.4109671209183716e-09 + ], + "bp_grad_norms_F": [ + 6.577545264008222e-06, + 5.327013141709358e-08, + 4.94958669605694e-08, + 4.9476955865657146e-08, + 4.950964083150211e-08 + ], + "gamma_dfa": 0.11252723945653997, + "acc_eval": 0.3115234375, + "loss_eval": 1.9247620105743408, + "epoch": 26 + }, + { + "hidden_norms": [ + 20381.6796875, + 4929967.0, + 30880866.0, + 48905308.0, + 50483824.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1911821928833888e-07, + 1.377626124288156e-09, + 1.3317531522005766e-09, + 1.3313244950907688e-09, + 1.3306112878197496e-09 + ], + "bp_grad_norms_F": [ + 6.326347829599399e-06, + 4.955709798082353e-08, + 4.649340468176888e-08, + 4.6477893533847237e-08, + 4.650862805988254e-08 + ], + "gamma_dfa": 0.11152978462632746, + "acc_eval": 0.2978515625, + "loss_eval": 1.9170689582824707, + "epoch": 27 + }, + { + "hidden_norms": [ + 21001.544921875, + 5444194.5, + 33907076.0, + 53832084.0, + 55554724.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1559290413742929e-07, + 1.3061883796794405e-09, + 1.2378150726632953e-09, + 1.2379912650573033e-09, + 1.2384089309591673e-09 + ], + "bp_grad_norms_F": [ + 6.23212235950632e-06, + 4.7021419646853246e-08, + 4.3998962695468435e-08, + 4.3984215380987735e-08, + 4.4011432720481025e-08 + ], + "gamma_dfa": 0.11285935762862209, + "acc_eval": 0.3193359375, + "loss_eval": 1.9198743104934692, + "epoch": 28 + }, + { + "hidden_norms": [ + 21623.64453125, + 5895143.0, + 37025488.0, + 58791348.0, + 60687928.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1377478870144841e-07, + 1.2547849426169932e-09, + 1.1888731110687445e-09, + 1.1877619998656996e-09, + 1.1896320595283782e-09 + ], + "bp_grad_norms_F": [ + 6.024939921189798e-06, + 4.443810297516393e-08, + 4.161294953064498e-08, + 4.159920763413538e-08, + 4.162497546644772e-08 + ], + "gamma_dfa": 0.11188641694025137, + "acc_eval": 0.3115234375, + "loss_eval": 1.917163372039795, + "epoch": 29 + }, + { + "hidden_norms": [ + 22195.29296875, + 6369258.5, + 40117404.0, + 64235468.0, + 66270544.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1021134582733794e-07, + 1.153794726427293e-09, + 1.1123471033158694e-09, + 1.1119479781385166e-09, + 1.1122585075185043e-09 + ], + "bp_grad_norms_F": [ + 5.96408472119947e-06, + 4.2022573865097e-08, + 3.954471239353552e-08, + 3.953241289877951e-08, + 3.955623029128219e-08 + ], + "gamma_dfa": 0.11316103948047385, + "acc_eval": 0.3125, + "loss_eval": 1.9332935810089111, + "epoch": 30 + }, + { + "hidden_norms": [ + 22786.513671875, + 6899202.5, + 43496572.0, + 69758712.0, + 71960648.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0609301170916297e-07, + 1.1096534802135238e-09, + 1.05872854927469e-09, + 1.0590027743617725e-09, + 1.0579482845329835e-09 + ], + "bp_grad_norms_F": [ + 5.711301128030755e-06, + 3.962547268088201e-08, + 3.742779952631281e-08, + 3.741677900848117e-08, + 3.743992138538488e-08 + ], + "gamma_dfa": 0.11225346029095817, + "acc_eval": 0.31640625, + "loss_eval": 1.9247596263885498, + "epoch": 31 + }, + { + "hidden_norms": [ + 23367.078125, + 7480530.0, + 47061616.0, + 75610000.0, + 77981320.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.054115728038596e-07, + 1.0618838031106748e-09, + 1.0191184562913236e-09, + 1.01949926278877e-09, + 1.0192180432966325e-09 + ], + "bp_grad_norms_F": [ + 5.768360097135883e-06, + 3.826109207238915e-08, + 3.593911657162607e-08, + 3.592855790657268e-08, + 3.594948694285449e-08 + ], + "gamma_dfa": 0.11492819089471595, + "acc_eval": 0.314453125, + "loss_eval": 1.939026117324829, + "epoch": 32 + }, + { + "hidden_norms": [ + 23912.85546875, + 8053234.0, + 51027352.0, + 81931568.0, + 84515616.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0266481353937706e-07, + 9.919576271499864e-10, + 9.572211912001194e-10, + 9.572932446744176e-10, + 9.577664217275128e-10 + ], + "bp_grad_norms_F": [ + 5.472421435115393e-06, + 3.587240016145188e-08, + 3.39712649122248e-08, + 3.396091940999213e-08, + 3.398050552050336e-08 + ], + "gamma_dfa": 0.11253271601162851, + "acc_eval": 0.3125, + "loss_eval": 1.9187253713607788, + "epoch": 33 + }, + { + "hidden_norms": [ + 24486.8359375, + 8682399.0, + 55030492.0, + 88236184.0, + 91025880.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0101911129822838e-07, + 9.702203485062455e-10, + 9.30652499508966e-10, + 9.30728105696943e-10, + 9.303261494508774e-10 + ], + "bp_grad_norms_F": [ + 5.286908617563313e-06, + 3.4072087373715476e-08, + 3.2386065385026086e-08, + 3.2376764380614986e-08, + 3.2396076932172946e-08 + ], + "gamma_dfa": 0.11125053715659305, + "acc_eval": 0.3125, + "loss_eval": 1.9214520454406738, + "epoch": 34 + }, + { + "hidden_norms": [ + 25051.91796875, + 9255517.0, + 58776788.0, + 94748472.0, + 97725744.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.793318156425812e-08, + 9.150468716079274e-10, + 8.747003676923271e-10, + 8.746902091516517e-10, + 8.743750723461119e-10 + ], + "bp_grad_norms_F": [ + 5.294927632348845e-06, + 3.279593840943562e-08, + 3.115108881956985e-08, + 3.114205782139834e-08, + 3.115993862934374e-08 + ], + "gamma_dfa": 0.11356210591475246, + "acc_eval": 0.314453125, + "loss_eval": 1.9334189891815186, + "epoch": 35 + }, + { + "hidden_norms": [ + 25539.400390625, + 9852175.0, + 62733436.0, + 101270040.0, + 104412528.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.590952032567657e-08, + 8.831190223546059e-10, + 8.506708115696426e-10, + 8.503630022360653e-10, + 8.506205184666271e-10 + ], + "bp_grad_norms_F": [ + 5.156022325536469e-06, + 3.1347209272780674e-08, + 2.992178593785866e-08, + 2.9913682197957314e-08, + 2.9930919964726854e-08 + ], + "gamma_dfa": 0.11300312746607233, + "acc_eval": 0.3291015625, + "loss_eval": 1.9240946769714355, + "epoch": 36 + }, + { + "hidden_norms": [ + 26058.23046875, + 10503947.0, + 66954420.0, + 108182184.0, + 111535672.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.312070403666439e-08, + 8.298656206662258e-10, + 8.076765367626138e-10, + 8.076487811869981e-10, + 8.083505531608637e-10 + ], + "bp_grad_norms_F": [ + 5.084062195237493e-06, + 3.008365112577849e-08, + 2.8773875726528786e-08, + 2.8766294235538226e-08, + 2.878227967073599e-08 + ], + "gamma_dfa": 0.11286510003083094, + "acc_eval": 0.322265625, + "loss_eval": 1.9284429550170898, + "epoch": 37 + }, + { + "hidden_norms": [ + 26547.951171875, + 11128081.0, + 71119440.0, + 115305784.0, + 118851064.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.278523549482998e-08, + 8.024952369289906e-10, + 7.701798643289237e-10, + 7.699446635811569e-10, + 7.706733029522184e-10 + ], + "bp_grad_norms_F": [ + 4.915013960271608e-06, + 2.8781727223758935e-08, + 2.7522533585511155e-08, + 2.751522920618754e-08, + 2.7530596469205193e-08 + ], + "gamma_dfa": 0.11193350053144968, + "acc_eval": 0.3046875, + "loss_eval": 1.9189305305480957, + "epoch": 38 + }, + { + "hidden_norms": [ + 27052.158203125, + 11815623.0, + 75267568.0, + 122747224.0, + 126538816.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.042137349979384e-08, + 7.699976212194315e-10, + 7.406790181185841e-10, + 7.406811275423308e-10, + 7.407266466863405e-10 + ], + "bp_grad_norms_F": [ + 4.783120857609902e-06, + 2.7648876965713498e-08, + 2.6492134708178128e-08, + 2.6485189152936073e-08, + 2.6500073246893407e-08 + ], + "gamma_dfa": 0.1119252087228233, + "acc_eval": 0.3076171875, + "loss_eval": 1.9200191497802734, + "epoch": 39 + }, + { + "hidden_norms": [ + 27573.439453125, + 12446571.0, + 79631776.0, + 129906592.0, + 133912576.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.999781897500725e-08, + 7.431448234562765e-10, + 7.212022645752825e-10, + 7.211930497241781e-10, + 7.215293917894883e-10 + ], + "bp_grad_norms_F": [ + 4.7411135710717645e-06, + 2.6746526771148638e-08, + 2.567137080689008e-08, + 2.566465262532347e-08, + 2.5678824400188205e-08 + ], + "gamma_dfa": 0.1126710368462227, + "acc_eval": 0.3291015625, + "loss_eval": 1.9156131744384766, + "epoch": 40 + }, + { + "hidden_norms": [ + 28020.1953125, + 13139046.0, + 84357848.0, + 137652880.0, + 141892912.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.93968845616655e-08, + 7.234106647047156e-10, + 7.015109604324721e-10, + 7.013014613477253e-10, + 7.019884118442121e-10 + ], + "bp_grad_norms_F": [ + 4.706852905655978e-06, + 2.5948086346261334e-08, + 2.480862271170281e-08, + 2.4802661258149783e-08, + 2.4816182886411298e-08 + ], + "gamma_dfa": 0.11299434299689892, + "acc_eval": 0.3134765625, + "loss_eval": 1.917637825012207, + "epoch": 41 + }, + { + "hidden_norms": [ + 28489.8828125, + 13728548.0, + 88388480.0, + 144432224.0, + 148906448.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.832166287220389e-08, + 7.007013858029154e-10, + 6.849794620400473e-10, + 6.849559253119253e-10, + 6.857461820608535e-10 + ], + "bp_grad_norms_F": [ + 4.678155619330937e-06, + 2.5201579489930737e-08, + 2.418770428391781e-08, + 2.4181909807907687e-08, + 2.419472266979028e-08 + ], + "gamma_dfa": 0.11410953500489995, + "acc_eval": 0.314453125, + "loss_eval": 1.9333336353302002, + "epoch": 42 + }, + { + "hidden_norms": [ + 28918.5546875, + 14414132.0, + 92681240.0, + 151898304.0, + 156571040.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.454645694655483e-08, + 6.792187368098723e-10, + 6.553820264265653e-10, + 6.554308207284976e-10, + 6.556304388283252e-10 + ], + "bp_grad_norms_F": [ + 4.511462066147942e-06, + 2.4275013998931172e-08, + 2.338800797474505e-08, + 2.338238225263467e-08, + 2.3394919779207157e-08 + ], + "gamma_dfa": 0.11213390928969602, + "acc_eval": 0.3037109375, + "loss_eval": 1.9155462980270386, + "epoch": 43 + }, + { + "hidden_norms": [ + 29332.80078125, + 15055747.0, + 96975336.0, + 159279984.0, + 164189344.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.274933804841567e-08, + 6.447524736330479e-10, + 6.278008113369538e-10, + 6.277455777414787e-10, + 6.275664987676066e-10 + ], + "bp_grad_norms_F": [ + 4.426053692441201e-06, + 2.3487833900048827e-08, + 2.272233956546188e-08, + 2.2717028258512073e-08, + 2.272915367029782e-08 + ], + "gamma_dfa": 0.11223121372131573, + "acc_eval": 0.3173828125, + "loss_eval": 1.9162096977233887, + "epoch": 44 + }, + { + "hidden_norms": [ + 29736.349609375, + 15823423.0, + 101458080.0, + 166481584.0, + 171638352.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.434898290943238e-08, + 6.55440757224568e-10, + 6.384029416217629e-10, + 6.384751061183636e-10, + 6.382625539202991e-10 + ], + "bp_grad_norms_F": [ + 4.4675143726635724e-06, + 2.308258295613541e-08, + 2.2235047580920764e-08, + 2.2229942331364327e-08, + 2.2241332331418562e-08 + ], + "gamma_dfa": 0.11349940555010107, + "acc_eval": 0.3134765625, + "loss_eval": 1.935542106628418, + "epoch": 45 + }, + { + "hidden_norms": [ + 30168.33984375, + 16512403.0, + 106240736.0, + 174293312.0, + 179686352.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.255891259523196e-08, + 6.180955192114368e-10, + 6.070984825967685e-10, + 6.070359770404821e-10, + 6.068190394614703e-10 + ], + "bp_grad_norms_F": [ + 4.380563041195273e-06, + 2.227099038520919e-08, + 2.156298606337259e-08, + 2.1558207663474604e-08, + 2.1569489305761635e-08 + ], + "gamma_dfa": 0.11322060551538016, + "acc_eval": 0.3212890625, + "loss_eval": 1.9260894060134888, + "epoch": 46 + }, + { + "hidden_norms": [ + 30560.10546875, + 17240642.0, + 111300408.0, + 182109792.0, + 187762288.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.14508851476603e-08, + 6.030238530740917e-10, + 5.890909982042558e-10, + 5.890405385677866e-10, + 5.88881721164114e-10 + ], + "bp_grad_norms_F": [ + 4.2523201955191325e-06, + 2.1578937747790405e-08, + 2.0878760054188206e-08, + 2.0874194817110947e-08, + 2.08853556671329e-08 + ], + "gamma_dfa": 0.11227845895700739, + "acc_eval": 0.3193359375, + "loss_eval": 1.9136857986450195, + "epoch": 47 + }, + { + "hidden_norms": [ + 30927.453125, + 17981622.0, + 115698520.0, + 189446720.0, + 195329056.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.999796736157805e-08, + 5.827110460820961e-10, + 5.688347570753649e-10, + 5.688115534141502e-10, + 5.69402469619007e-10 + ], + "bp_grad_norms_F": [ + 4.254153282090556e-06, + 2.1111715042820833e-08, + 2.044158087244341e-08, + 2.043698899001356e-08, + 2.0447874504725405e-08 + ], + "gamma_dfa": 0.11285097184736514, + "acc_eval": 0.3251953125, + "loss_eval": 1.9130818843841553, + "epoch": 48 + }, + { + "hidden_norms": [ + 31297.09765625, + 18680606.0, + 120312440.0, + 197032272.0, + 203114064.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.911415877970285e-08, + 5.74776504169705e-10, + 5.532440061628563e-10, + 5.531197722064007e-10, + 5.533422053893844e-10 + ], + "bp_grad_norms_F": [ + 4.17833052779315e-06, + 2.0621358842731752e-08, + 1.9960678443453617e-08, + 1.9956562624656726e-08, + 1.9966993392017685e-08 + ], + "gamma_dfa": 0.11243592749451636, + "acc_eval": 0.3125, + "loss_eval": 1.9191365242004395, + "epoch": 49 + }, + { + "hidden_norms": [ + 31637.244140625, + 19360764.0, + 124754384.0, + 204064768.0, + 210382992.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.003268447964729e-08, + 5.749308251701279e-10, + 5.599746222273438e-10, + 5.599968821989876e-10, + 5.599694041791281e-10 + ], + "bp_grad_norms_F": [ + 4.128593900531996e-06, + 2.0178502424528233e-08, + 1.9575201903876405e-08, + 1.9571228193626666e-08, + 1.9581117172151608e-08 + ], + "gamma_dfa": 0.11233749791426817, + "acc_eval": 0.330078125, + "loss_eval": 1.9152377843856812, + "epoch": 50 + }, + { + "hidden_norms": [ + 31964.60546875, + 20067444.0, + 128969536.0, + 211772368.0, + 218247696.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.774531951554309e-08, + 5.427598370744136e-10, + 5.298457228519737e-10, + 5.297982053065198e-10, + 5.30141264221129e-10 + ], + "bp_grad_norms_F": [ + 4.058078957314137e-06, + 1.9621586133666824e-08, + 1.90722975190738e-08, + 1.9068517431719556e-08, + 1.907839575210346e-08 + ], + "gamma_dfa": 0.11183859535958618, + "acc_eval": 0.328125, + "loss_eval": 1.9089019298553467, + "epoch": 51 + }, + { + "hidden_norms": [ + 32292.658203125, + 20829408.0, + 133566216.0, + 219264704.0, + 225938912.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.692310788343093e-08, + 5.312774109533791e-10, + 5.173871886476888e-10, + 5.171740258269608e-10, + 5.173406147918058e-10 + ], + "bp_grad_norms_F": [ + 4.047169568366371e-06, + 1.926170511978853e-08, + 1.867934962263007e-08, + 1.8675748947316606e-08, + 1.868521692927061e-08 + ], + "gamma_dfa": 0.11216733865148854, + "acc_eval": 0.330078125, + "loss_eval": 1.917893886566162, + "epoch": 52 + }, + { + "hidden_norms": [ + 32582.02734375, + 21555154.0, + 138235216.0, + 226622112.0, + 233550816.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.588336359276582e-08, + 5.294207294781472e-10, + 5.160025184913763e-10, + 5.156744475875996e-10, + 5.168100947194887e-10 + ], + "bp_grad_norms_F": [ + 3.991732683061855e-06, + 1.8877956975416055e-08, + 1.8321758332717764e-08, + 1.831830331866513e-08, + 1.832757234865312e-08 + ], + "gamma_dfa": 0.11230919507215731, + "acc_eval": 0.314453125, + "loss_eval": 1.913461685180664, + "epoch": 53 + }, + { + "hidden_norms": [ + 32871.28125, + 22246662.0, + 142493184.0, + 233885040.0, + 241005264.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.552973357860537e-08, + 5.124695112712629e-10, + 4.966513311721599e-10, + 4.966223543512172e-10, + 4.969377687125132e-10 + ], + "bp_grad_norms_F": [ + 4.012842964584706e-06, + 1.8570215587487837e-08, + 1.8001765411668202e-08, + 1.799840099181438e-08, + 1.800739823920594e-08 + ], + "gamma_dfa": 0.11296637258055853, + "acc_eval": 0.33203125, + "loss_eval": 1.9206554889678955, + "epoch": 54 + }, + { + "hidden_norms": [ + 33169.98828125, + 22902584.0, + 146822496.0, + 241191920.0, + 248487904.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.486269026912851e-08, + 4.992010138593628e-10, + 4.874242676145002e-10, + 4.874663450671335e-10, + 4.884102011715186e-10 + ], + "bp_grad_norms_F": [ + 3.938752797694178e-06, + 1.8166964821375586e-08, + 1.767327617585579e-08, + 1.7670013008341812e-08, + 1.7678777552987412e-08 + ], + "gamma_dfa": 0.11258088904469332, + "acc_eval": 0.3134765625, + "loss_eval": 1.913904070854187, + "epoch": 55 + }, + { + "hidden_norms": [ + 33456.9140625, + 23628216.0, + 151346624.0, + 248325424.0, + 255824304.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.482947239623172e-08, + 5.02439700955648e-10, + 4.890933769097217e-10, + 4.891700933207233e-10, + 4.892242166931737e-10 + ], + "bp_grad_norms_F": [ + 3.895439022016944e-06, + 1.781435265968412e-08, + 1.7326955870089478e-08, + 1.7324007117736073e-08, + 1.7332443036366385e-08 + ], + "gamma_dfa": 0.11223017568408977, + "acc_eval": 0.314453125, + "loss_eval": 1.9154590368270874, + "epoch": 56 + }, + { + "hidden_norms": [ + 33716.85546875, + 24280678.0, + 155270816.0, + 255050304.0, + 262737184.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.482827157900829e-08, + 4.958616850458952e-10, + 4.826584132366918e-10, + 4.826221089437865e-10, + 4.828137889489881e-10 + ], + "bp_grad_norms_F": [ + 3.898983777617104e-06, + 1.7600514823357116e-08, + 1.7106302152569697e-08, + 1.7103344518432095e-08, + 1.7111482009113388e-08 + ], + "gamma_dfa": 0.11287979638109391, + "acc_eval": 0.30859375, + "loss_eval": 1.9285999536514282, + "epoch": 57 + }, + { + "hidden_norms": [ + 33981.390625, + 24925848.0, + 159148752.0, + 261662432.0, + 269540768.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.396101153744894e-08, + 4.846232304345222e-10, + 4.728849534174628e-10, + 4.72891226177552e-10, + 4.725210223099907e-10 + ], + "bp_grad_norms_F": [ + 3.847520019917283e-06, + 1.7274359720431676e-08, + 1.6806101399424733e-08, + 1.6803195279635474e-08, + 1.681126526875687e-08 + ], + "gamma_dfa": 0.11251267153238587, + "acc_eval": 0.330078125, + "loss_eval": 1.913767695426941, + "epoch": 58 + }, + { + "hidden_norms": [ + 34242.87890625, + 25494510.0, + 162965072.0, + 268190960.0, + 276245600.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.276207725226413e-08, + 4.64974586611433e-10, + 4.573621481540613e-10, + 4.5720988106623395e-10, + 4.578690204759539e-10 + ], + "bp_grad_norms_F": [ + 3.846054823952727e-06, + 1.7068730429059542e-08, + 1.6637597965996065e-08, + 1.663470783341836e-08, + 1.6642776046182917e-08 + ], + "gamma_dfa": 0.11268835317605408, + "acc_eval": 0.318359375, + "loss_eval": 1.9175846576690674, + "epoch": 59 + }, + { + "hidden_norms": [ + 34498.37890625, + 26013872.0, + 166717360.0, + 274736192.0, + 282985952.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.275441760157264e-08, + 4.638447681504232e-10, + 4.554343846496778e-10, + 4.5541673210358624e-10, + 4.558452226799403e-10 + ], + "bp_grad_norms_F": [ + 3.7814804727531737e-06, + 1.6729790885960938e-08, + 1.629800472358056e-08, + 1.629528156854576e-08, + 1.630315793477166e-08 + ], + "gamma_dfa": 0.11192971542368468, + "acc_eval": 0.3125, + "loss_eval": 1.9148613214492798, + "epoch": 60 + }, + { + "hidden_norms": [ + 34741.75390625, + 26574266.0, + 170266464.0, + 280835296.0, + 289264896.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.206668328763044e-08, + 4.543688481017938e-10, + 4.4642781138470866e-10, + 4.464762171085823e-10, + 4.4638817642272954e-10 + ], + "bp_grad_norms_F": [ + 3.800365902861813e-06, + 1.6550599113429598e-08, + 1.6135599523181554e-08, + 1.6132924329781417e-08, + 1.6140655034746487e-08 + ], + "gamma_dfa": 0.11263992198291817, + "acc_eval": 0.328125, + "loss_eval": 1.9202332496643066, + "epoch": 61 + }, + { + "hidden_norms": [ + 34981.7578125, + 27132752.0, + 173824032.0, + 286969856.0, + 295549056.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.146741154429037e-08, + 4.5107212409689623e-10, + 4.4140177624107935e-10, + 4.4141457156143815e-10, + 4.4168110835407504e-10 + ], + "bp_grad_norms_F": [ + 3.7655997857655166e-06, + 1.6349241960256222e-08, + 1.5922701379622595e-08, + 1.5920058160645567e-08, + 1.592757570278991e-08 + ], + "gamma_dfa": 0.11310465578208095, + "acc_eval": 0.314453125, + "loss_eval": 1.9224812984466553, + "epoch": 62 + }, + { + "hidden_norms": [ + 35201.25, + 27683016.0, + 177040880.0, + 292723872.0, + 301473504.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.122528700165276e-08, + 4.486005733550513e-10, + 4.4048292791032395e-10, + 4.4043477198663084e-10, + 4.4109013663806707e-10 + ], + "bp_grad_norms_F": [ + 3.748537892533932e-06, + 1.6115603074240425e-08, + 1.5725172275438126e-08, + 1.572264451965566e-08, + 1.5729948898979274e-08 + ], + "gamma_dfa": 0.11326105792613816, + "acc_eval": 0.3095703125, + "loss_eval": 1.9233062267303467, + "epoch": 63 + }, + { + "hidden_norms": [ + 35399.75390625, + 28156860.0, + 180111792.0, + 298457728.0, + 307298976.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.082014974457707e-08, + 4.4495629403229486e-10, + 4.324987312731565e-10, + 4.3260212079232474e-10, + 4.3259393289751813e-10 + ], + "bp_grad_norms_F": [ + 3.685790488816565e-06, + 1.5895359695150546e-08, + 1.5473323955461638e-08, + 1.547100403342938e-08, + 1.5478214265840506e-08 + ], + "gamma_dfa": 0.11222807004196511, + "acc_eval": 0.3125, + "loss_eval": 1.9198863506317139, + "epoch": 64 + }, + { + "hidden_norms": [ + 35584.6640625, + 28666806.0, + 183522992.0, + 303940064.0, + 312955008.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.149574088316513e-08, + 4.4883607941414994e-10, + 4.353337967888393e-10, + 4.3539158389727106e-10, + 4.35594643688475e-10 + ], + "bp_grad_norms_F": [ + 3.6930814530933276e-06, + 1.5769751726679715e-08, + 1.5353194271483517e-08, + 1.535078197889561e-08, + 1.5357914051605803e-08 + ], + "gamma_dfa": 0.11321029500413715, + "acc_eval": 0.3095703125, + "loss_eval": 1.9162211418151855, + "epoch": 65 + }, + { + "hidden_norms": [ + 35768.86328125, + 29145662.0, + 186551392.0, + 308909184.0, + 318089856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.985555245364594e-08, + 4.355726057614362e-10, + 4.2523776166980554e-10, + 4.251851093428627e-10, + 4.2568140679044575e-10 + ], + "bp_grad_norms_F": [ + 3.7230390717013506e-06, + 1.5615523096812467e-08, + 1.523139303571952e-08, + 1.522908021911462e-08, + 1.5236116368555486e-08 + ], + "gamma_dfa": 0.11393742701784504, + "acc_eval": 0.31640625, + "loss_eval": 1.9276196956634521, + "epoch": 66 + }, + { + "hidden_norms": [ + 35944.30859375, + 29545796.0, + 189503824.0, + 313822880.0, + 323180096.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.027381343505112e-08, + 4.2508935260698877e-10, + 4.156285593470699e-10, + 4.156731903126598e-10, + 4.1562600583411324e-10 + ], + "bp_grad_norms_F": [ + 3.67820075553027e-06, + 1.5450812185235918e-08, + 1.5081118576176777e-08, + 1.5078812864999236e-08, + 1.5085870330722173e-08 + ], + "gamma_dfa": 0.11295431066082529, + "acc_eval": 0.3251953125, + "loss_eval": 1.9145984649658203, + "epoch": 67 + }, + { + "hidden_norms": [ + 36107.91015625, + 29963964.0, + 192509232.0, + 318614048.0, + 328116416.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.995779955332182e-08, + 4.257695862541766e-10, + 4.1527120631101866e-10, + 4.1522696392348735e-10, + 4.1541275974665837e-10 + ], + "bp_grad_norms_F": [ + 3.6363949220685754e-06, + 1.5271682585193957e-08, + 1.4899570466297973e-08, + 1.4897324263074552e-08, + 1.4904214751254585e-08 + ], + "gamma_dfa": 0.11261070579712396, + "acc_eval": 0.322265625, + "loss_eval": 1.9148796796798706, + "epoch": 68 + }, + { + "hidden_norms": [ + 36263.38671875, + 30397186.0, + 195132224.0, + 323205344.0, + 332809856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.94296602432587e-08, + 4.221426264106043e-10, + 4.1666703420872864e-10, + 4.166992584320184e-10, + 4.166444134146019e-10 + ], + "bp_grad_norms_F": [ + 3.677051836348255e-06, + 1.5217779036902357e-08, + 1.486149248108859e-08, + 1.4859250718757266e-08, + 1.4866162523219373e-08 + ], + "gamma_dfa": 0.11349719034842565, + "acc_eval": 0.3134765625, + "loss_eval": 1.9238262176513672, + "epoch": 69 + }, + { + "hidden_norms": [ + 36417.9921875, + 30770712.0, + 197719328.0, + 327539232.0, + 337245152.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.906716976118332e-08, + 4.1953429619212557e-10, + 4.080901727654407e-10, + 4.080701054842706e-10, + 4.0843109450072745e-10 + ], + "bp_grad_norms_F": [ + 3.6080327845411375e-06, + 1.500828084033401e-08, + 1.4656276192681617e-08, + 1.465407439837918e-08, + 1.466091692492455e-08 + ], + "gamma_dfa": 0.11264980123269197, + "acc_eval": 0.3115234375, + "loss_eval": 1.9172749519348145, + "epoch": 70 + }, + { + "hidden_norms": [ + 36554.734375, + 31127202.0, + 200166992.0, + 331766240.0, + 341638624.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.895474768953136e-08, + 4.153002663986882e-10, + 4.053070101761591e-10, + 4.0528172484677327e-10, + 4.0563402636806245e-10 + ], + "bp_grad_norms_F": [ + 3.5790299079963006e-06, + 1.4871366360580396e-08, + 1.4521869928785236e-08, + 1.4519704549798007e-08, + 1.4526481351140319e-08 + ], + "gamma_dfa": 0.1125820265888251, + "acc_eval": 0.3291015625, + "loss_eval": 1.90960693359375, + "epoch": 71 + }, + { + "hidden_norms": [ + 36685.06640625, + 31478428.0, + 202703456.0, + 335890528.0, + 345860736.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.840604527269534e-08, + 4.11831152513642e-10, + 4.0155134772845713e-10, + 4.014005239305618e-10, + 4.018080868029017e-10 + ], + "bp_grad_norms_F": [ + 3.5732464311877266e-06, + 1.4777253198872131e-08, + 1.4430981742918902e-08, + 1.4428859884674239e-08, + 1.443555053270984e-08 + ], + "gamma_dfa": 0.11229235199152754, + "acc_eval": 0.3095703125, + "loss_eval": 1.912062644958496, + "epoch": 72 + }, + { + "hidden_norms": [ + 36808.640625, + 31756406.0, + 205006400.0, + 339625888.0, + 349722048.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.845510824859957e-08, + 4.056126268192628e-10, + 3.9775802096464474e-10, + 3.9773195847914167e-10, + 3.978435358931165e-10 + ], + "bp_grad_norms_F": [ + 3.601402113417862e-06, + 1.4699119255112691e-08, + 1.434870711136682e-08, + 1.4346603904868971e-08, + 1.4353199517813664e-08 + ], + "gamma_dfa": 0.11323098125649267, + "acc_eval": 0.3271484375, + "loss_eval": 1.9194645881652832, + "epoch": 73 + }, + { + "hidden_norms": [ + 36922.67578125, + 32105574.0, + 207090144.0, + 343260640.0, + 353436544.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.8447327805643e-08, + 4.050982882475296e-10, + 3.977037865698918e-10, + 3.9765896131527256e-10, + 3.979234441953139e-10 + ], + "bp_grad_norms_F": [ + 3.603466893764562e-06, + 1.4652233204515142e-08, + 1.4306199780378392e-08, + 1.4304094797523703e-08, + 1.4310627349800598e-08 + ], + "gamma_dfa": 0.11329636031587142, + "acc_eval": 0.3056640625, + "loss_eval": 1.922640323638916, + "epoch": 74 + }, + { + "hidden_norms": [ + 37024.05859375, + 32409028.0, + 208845456.0, + 346325312.0, + 356587104.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.819700359983472e-08, + 4.0326031403026263e-10, + 3.9583156197231517e-10, + 3.9586384170675615e-10, + 3.9581374289276994e-10 + ], + "bp_grad_norms_F": [ + 3.5432237837085268e-06, + 1.4486117194678627e-08, + 1.4156262828635136e-08, + 1.4154186267489877e-08, + 1.4160684180808403e-08 + ], + "gamma_dfa": 0.11267639175457589, + "acc_eval": 0.31640625, + "loss_eval": 1.9154051542282104, + "epoch": 75 + }, + { + "hidden_norms": [ + 37125.02734375, + 32663892.0, + 210781344.0, + 349533728.0, + 359873568.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.772787486397647e-08, + 3.9591485645473767e-10, + 3.875866017022389e-10, + 3.8754283115949306e-10, + 3.8766378995802597e-10 + ], + "bp_grad_norms_F": [ + 3.5503553590388037e-06, + 1.4420066918319208e-08, + 1.40893732236691e-08, + 1.4087291333453322e-08, + 1.4093810563053921e-08 + ], + "gamma_dfa": 0.11297615164312447, + "acc_eval": 0.32421875, + "loss_eval": 1.913941502571106, + "epoch": 76 + }, + { + "hidden_norms": [ + 37216.296875, + 32930840.0, + 212456432.0, + 352475008.0, + 362884992.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.74248425980295e-08, + 3.9426073517034865e-10, + 3.872507869928654e-10, + 3.8720734951702696e-10, + 3.8765768373139053e-10 + ], + "bp_grad_norms_F": [ + 3.55011752617429e-06, + 1.4357588895563822e-08, + 1.402936344874206e-08, + 1.402732330291201e-08, + 1.4033815887160017e-08 + ], + "gamma_dfa": 0.11311322844358074, + "acc_eval": 0.3203125, + "loss_eval": 1.914380431175232, + "epoch": 77 + }, + { + "hidden_norms": [ + 37298.37890625, + 33147848.0, + 214118832.0, + 355022880.0, + 365529568.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.774458682912154e-08, + 3.987353780487979e-10, + 3.904769285689724e-10, + 3.904657153164237e-10, + 3.907260348601227e-10 + ], + "bp_grad_norms_F": [ + 3.509487669361988e-06, + 1.4249152968659473e-08, + 1.3931584774695693e-08, + 1.3929625453101835e-08, + 1.3936028331329453e-08 + ], + "gamma_dfa": 0.11238172389857937, + "acc_eval": 0.314453125, + "loss_eval": 1.9106721878051758, + "epoch": 78 + }, + { + "hidden_norms": [ + 37372.10546875, + 33388374.0, + 215761392.0, + 357596800.0, + 368190304.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.751073300392818e-08, + 3.9374201121766816e-10, + 3.8655822987010424e-10, + 3.866116038420131e-10, + 3.8653891198947576e-10 + ], + "bp_grad_norms_F": [ + 3.537302973199985e-06, + 1.4222394817409167e-08, + 1.3910858243093571e-08, + 1.3908881157931319e-08, + 1.3915280483445258e-08 + ], + "gamma_dfa": 0.11306001050525083, + "acc_eval": 0.322265625, + "loss_eval": 1.9138463735580444, + "epoch": 79 + }, + { + "hidden_norms": [ + 37442.84375, + 33566284.0, + 216908128.0, + 359755968.0, + 370379136.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.704155453007843e-08, + 3.923593672183756e-10, + 3.850708640840139e-10, + 3.8509884170423447e-10, + 3.849042473635933e-10 + ], + "bp_grad_norms_F": [ + 3.509628641040763e-06, + 1.4144676541150147e-08, + 1.3834353218555862e-08, + 1.3832397449675682e-08, + 1.3838723056380786e-08 + ], + "gamma_dfa": 0.11266809623703011, + "acc_eval": 0.3251953125, + "loss_eval": 1.9121947288513184, + "epoch": 80 + }, + { + "hidden_norms": [ + 37512.11328125, + 33717608.0, + 218115872.0, + 361736960.0, + 372400416.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.701832688804643e-08, + 3.917752788851203e-10, + 3.835655681960759e-10, + 3.835243511662867e-10, + 3.835320394607322e-10 + ], + "bp_grad_norms_F": [ + 3.5144942103215726e-06, + 1.4111047441645042e-08, + 1.3798888254257236e-08, + 1.3796943143518092e-08, + 1.3803241216692186e-08 + ], + "gamma_dfa": 0.11281233225781762, + "acc_eval": 0.3193359375, + "loss_eval": 1.9152591228485107, + "epoch": 81 + }, + { + "hidden_norms": [ + 37568.84375, + 33899664.0, + 219258560.0, + 363709504.0, + 374424128.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.695909604559347e-08, + 3.8868031015937277e-10, + 3.823757421805851e-10, + 3.8241659838789133e-10, + 3.8222841558521736e-10 + ], + "bp_grad_norms_F": [ + 3.516150854920852e-06, + 1.40706539752955e-08, + 1.3756586092483758e-08, + 1.375462410635464e-08, + 1.3760891093284044e-08 + ], + "gamma_dfa": 0.11307295318874822, + "acc_eval": 0.326171875, + "loss_eval": 1.9149377346038818, + "epoch": 82 + }, + { + "hidden_norms": [ + 37613.421875, + 34060644.0, + 220322080.0, + 365325472.0, + 376109056.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.71154296583154e-08, + 3.8974332094987574e-10, + 3.834943751446218e-10, + 3.8340422503502225e-10, + 3.8375369548759863e-10 + ], + "bp_grad_norms_F": [ + 3.4982940633199178e-06, + 1.4013506799415154e-08, + 1.370163893454901e-08, + 1.3699707146486162e-08, + 1.3705942158992457e-08 + ], + "gamma_dfa": 0.1128659905607492, + "acc_eval": 0.3212890625, + "loss_eval": 1.912517786026001, + "epoch": 83 + }, + { + "hidden_norms": [ + 37660.46875, + 34177292.0, + 221168784.0, + 366778016.0, + 377600544.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.68943869186478e-08, + 3.894674860394076e-10, + 3.8076572450584933e-10, + 3.8073258434856427e-10, + 3.8100084198688933e-10 + ], + "bp_grad_norms_F": [ + 3.4944750950671732e-06, + 1.397998961039093e-08, + 1.3671985321650482e-08, + 1.3670069520799188e-08, + 1.3676272558882374e-08 + ], + "gamma_dfa": 0.11273636969053769, + "acc_eval": 0.318359375, + "loss_eval": 1.9171113967895508, + "epoch": 84 + }, + { + "hidden_norms": [ + 37701.8671875, + 34327872.0, + 222020640.0, + 368143552.0, + 379001216.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.639802307972786e-08, + 3.87883669628053e-10, + 3.8044753458699176e-10, + 3.804264403495239e-10, + 3.8037359373355173e-10 + ], + "bp_grad_norms_F": [ + 3.4919537483801832e-06, + 1.3943878052202763e-08, + 1.3639727569625393e-08, + 1.3637805551525162e-08, + 1.364400148418099e-08 + ], + "gamma_dfa": 0.11286781356830033, + "acc_eval": 0.328125, + "loss_eval": 1.9123945236206055, + "epoch": 85 + }, + { + "hidden_norms": [ + 37739.8125, + 34429904.0, + 222737072.0, + 369295712.0, + 380185984.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.741821323430486e-08, + 3.8846115213431176e-10, + 3.8069486452130263e-10, + 3.8060576912357647e-10, + 3.809500215279371e-10 + ], + "bp_grad_norms_F": [ + 3.500515958876349e-06, + 1.3945418153582523e-08, + 1.364027113481825e-08, + 1.3638369544821671e-08, + 1.364453350305439e-08 + ], + "gamma_dfa": 0.11293645015939546, + "acc_eval": 0.3154296875, + "loss_eval": 1.917877197265625, + "epoch": 86 + }, + { + "hidden_norms": [ + 37773.1484375, + 34523684.0, + 223309680.0, + 370332384.0, + 381249280.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.685363729275196e-08, + 3.8528755186284513e-10, + 3.7927344598287505e-10, + 3.7934516639026583e-10, + 3.7926364826468273e-10 + ], + "bp_grad_norms_F": [ + 3.4931999834952876e-06, + 1.3911479967987361e-08, + 1.360801249461474e-08, + 1.3606110904618163e-08, + 1.3612289961884017e-08 + ], + "gamma_dfa": 0.11282484548610228, + "acc_eval": 0.322265625, + "loss_eval": 1.9136494398117065, + "epoch": 87 + }, + { + "hidden_norms": [ + 37800.29296875, + 34600436.0, + 223845264.0, + 371228288.0, + 382171744.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.65767956320451e-08, + 3.853606878045923e-10, + 3.7911099259879677e-10, + 3.789283054000947e-10, + 3.791919833684432e-10 + ], + "bp_grad_norms_F": [ + 3.4772997423715424e-06, + 1.3876966242776234e-08, + 1.3575736979021258e-08, + 1.3573847823522556e-08, + 1.3580010893576855e-08 + ], + "gamma_dfa": 0.11266115616490424, + "acc_eval": 0.318359375, + "loss_eval": 1.912358045578003, + "epoch": 88 + }, + { + "hidden_norms": [ + 37822.953125, + 34659448.0, + 224278352.0, + 371994688.0, + 382956800.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.695878340678973e-08, + 3.8400196911148043e-10, + 3.7754030457470833e-10, + 3.775957047036371e-10, + 3.7752789783240814e-10 + ], + "bp_grad_norms_F": [ + 3.488719130473328e-06, + 1.387363113281026e-08, + 1.3571511026100325e-08, + 1.3569623646958462e-08, + 1.3575775170693305e-08 + ], + "gamma_dfa": 0.11286654848299804, + "acc_eval": 0.318359375, + "loss_eval": 1.9152348041534424, + "epoch": 89 + }, + { + "hidden_norms": [ + 37843.71484375, + 34715836.0, + 224633712.0, + 372602496.0, + 383583840.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.682009967562408e-08, + 3.831650552399424e-10, + 3.7603772873318064e-10, + 3.7600736413345714e-10, + 3.763372669052245e-10 + ], + "bp_grad_norms_F": [ + 3.4864976896642474e-06, + 1.3852580416084948e-08, + 1.355203504971314e-08, + 1.3550148558749697e-08, + 1.3556297417949281e-08 + ], + "gamma_dfa": 0.11291119743145828, + "acc_eval": 0.326171875, + "loss_eval": 1.914948582649231, + "epoch": 90 + }, + { + "hidden_norms": [ + 37859.484375, + 34761876.0, + 224938096.0, + 373110784.0, + 384106720.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.677319674963655e-08, + 3.8410433167435087e-10, + 3.768680645332978e-10, + 3.768474976517666e-10, + 3.767945122579164e-10 + ], + "bp_grad_norms_F": [ + 3.480063014649204e-06, + 1.3833711953736838e-08, + 1.3534608989118624e-08, + 1.3532734044474637e-08, + 1.3538858922856889e-08 + ], + "gamma_dfa": 0.1127637956833496, + "acc_eval": 0.322265625, + "loss_eval": 1.9153952598571777, + "epoch": 91 + }, + { + "hidden_norms": [ + 37872.0625, + 34797108.0, + 225202544.0, + 373570400.0, + 384579200.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.67909034746117e-08, + 3.821318816932262e-10, + 3.753052590926842e-10, + 3.7535435870594824e-10, + 3.7532754681990355e-10 + ], + "bp_grad_norms_F": [ + 3.4843556022678968e-06, + 1.3827068379157481e-08, + 1.352985190550271e-08, + 1.3527971631788205e-08, + 1.3534107168311493e-08 + ], + "gamma_dfa": 0.1129197701375233, + "acc_eval": 0.318359375, + "loss_eval": 1.9156945943832397, + "epoch": 92 + }, + { + "hidden_norms": [ + 37881.54296875, + 34826116.0, + 225403072.0, + 373889952.0, + 384906848.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.663099583192889e-08, + 3.844494445015556e-10, + 3.765425748980533e-10, + 3.7651176620911997e-10, + 3.7661743168548867e-10 + ], + "bp_grad_norms_F": [ + 3.480702616798226e-06, + 1.382177039488397e-08, + 1.3523890451949683e-08, + 1.3522016395484115e-08, + 1.3528141273866368e-08 + ], + "gamma_dfa": 0.11285195982236473, + "acc_eval": 0.322265625, + "loss_eval": 1.9148646593093872, + "epoch": 93 + }, + { + "hidden_norms": [ + 37889.18359375, + 34847784.0, + 225551344.0, + 374143840.0, + 385168448.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.623226767032975e-08, + 3.819731198007048e-10, + 3.7512581929632915e-10, + 3.752123889366743e-10, + 3.7511962980296687e-10 + ], + "bp_grad_norms_F": [ + 3.4782924558385275e-06, + 1.3813751031932497e-08, + 1.3516644692401769e-08, + 1.3514763530508844e-08, + 1.3520896402496874e-08 + ], + "gamma_dfa": 0.11281965267244232, + "acc_eval": 0.318359375, + "loss_eval": 1.9142093658447266, + "epoch": 94 + }, + { + "hidden_norms": [ + 37895.046875, + 34865808.0, + 225670928.0, + 374345440.0, + 385375392.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.64825137164371e-08, + 3.829765116147854e-10, + 3.7528671836817296e-10, + 3.7535685670775365e-10, + 3.752768373832538e-10 + ], + "bp_grad_norms_F": [ + 3.4792733458743896e-06, + 1.3809607679604596e-08, + 1.3512363672418815e-08, + 1.3510485175061149e-08, + 1.351661271797866e-08 + ], + "gamma_dfa": 0.11288163481003721, + "acc_eval": 0.32421875, + "loss_eval": 1.9146695137023926, + "epoch": 95 + }, + { + "hidden_norms": [ + 37898.87109375, + 34878456.0, + 225750400.0, + 374473248.0, + 385506496.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.652722817079848e-08, + 3.8302755411834255e-10, + 3.759152988891401e-10, + 3.7595143664859165e-10, + 3.7588568368995823e-10 + ], + "bp_grad_norms_F": [ + 3.480078930806485e-06, + 1.3808159060602065e-08, + 1.3511034957502943e-08, + 1.3509157348323697e-08, + 1.351528045034911e-08 + ], + "gamma_dfa": 0.1128929610213163, + "acc_eval": 0.3203125, + "loss_eval": 1.9147298336029053, + "epoch": 96 + }, + { + "hidden_norms": [ + 37900.7109375, + 34885860.0, + 225787696.0, + 374537472.0, + 385572896.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.630104820715133e-08, + 3.8308795025088216e-10, + 3.7579228617801164e-10, + 3.7582850720419003e-10, + 3.7576297629016153e-10 + ], + "bp_grad_norms_F": [ + 3.4770955608109944e-06, + 1.3803015619373582e-08, + 1.3505847995531894e-08, + 1.3503973050887907e-08, + 1.3510093488378061e-08 + ], + "gamma_dfa": 0.11285188281362935, + "acc_eval": 0.3212890625, + "loss_eval": 1.9143996238708496, + "epoch": 97 + }, + { + "hidden_norms": [ + 37902.46875, + 34890740.0, + 225820192.0, + 374593792.0, + 385630976.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.624973991620209e-08, + 3.8267702895389277e-10, + 3.7545791475857015e-10, + 3.7555664134103495e-10, + 3.75430270205257e-10 + ], + "bp_grad_norms_F": [ + 3.476953224890167e-06, + 1.3801756182374447e-08, + 1.350452816240022e-08, + 1.3502653217756233e-08, + 1.3508774543424806e-08 + ], + "gamma_dfa": 0.11284657929081732, + "acc_eval": 0.3203125, + "loss_eval": 1.9143402576446533, + "epoch": 98 + }, + { + "hidden_norms": [ + 37903.22265625, + 34893256.0, + 225836736.0, + 374620576.0, + 385658624.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.627380599866228e-08, + 3.8272779390169376e-10, + 3.7550038078926207e-10, + 3.7559910737172686e-10, + 3.7547268072479767e-10 + ], + "bp_grad_norms_F": [ + 3.477006657703896e-06, + 1.3801344067587706e-08, + 1.3504034335198867e-08, + 1.350215939055488e-08, + 1.3508279828045033e-08 + ], + "gamma_dfa": 0.11284785682073561, + "acc_eval": 0.3203125, + "loss_eval": 1.9143691062927246, + "epoch": 99 + }, + { + "hidden_norms": [ + 37903.25, + 34893376.0, + 225837280.0, + 374621408.0, + 385659456.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.626758874972438e-08, + 3.826984007471168e-10, + 3.755481758904722e-10, + 3.756469302285126e-10, + 3.755204758260078e-10 + ], + "bp_grad_norms_F": [ + 3.476960500847781e-06, + 1.3801311204986177e-08, + 1.3503997919883659e-08, + 1.3502122975239672e-08, + 1.3508243412729826e-08 + ], + "gamma_dfa": 0.11284651984533411, + "acc_eval": 0.3203125, + "loss_eval": 1.9143500328063965, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s42.json b/results/snapshot_evolution_v2/snapshot_evolution_s42.json new file mode 100644 index 0000000..fb4a73e --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_evolution_s42.json @@ -0,0 +1,5473 @@ +{ + "config": { + "output_dir": "results/snapshot_evolution_v2", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": NaN, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 77.06888580322266, + 79.12034606933594, + 82.7389144897461, + 87.31297302246094, + 93.80765533447266 + ], + "bp_grad_norms_per_sample_med": [ + 5.941955532762222e-05, + 5.619435978587717e-05, + 5.499917097040452e-05, + 5.5899512517498806e-05, + 5.7389137509744614e-05 + ], + "bp_grad_norms_F": [ + 0.0026216788683086634, + 0.0023027872666716576, + 0.002111479640007019, + 0.002080164849758148, + 0.0021061261650174856 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3798828125, + "loss_eval": 1.6751981973648071, + "epoch": 1 + }, + { + "hidden_norms": [ + 98.86981201171875, + 98.9476089477539, + 102.55016326904297, + 106.3559341430664, + 112.6939697265625 + ], + "bp_grad_norms_per_sample_med": [ + 4.658113539335318e-05, + 4.402571721584536e-05, + 4.2862800910370424e-05, + 4.381770850159228e-05, + 4.3870313675142825e-05 + ], + "bp_grad_norms_F": [ + 0.00196655560284853, + 0.0018041934818029404, + 0.0016866555670276284, + 0.0016513779992237687, + 0.0016559252981096506 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4541015625, + "loss_eval": 1.5228025913238525, + "epoch": 2 + }, + { + "hidden_norms": [ + 110.40647888183594, + 112.07202911376953, + 114.70049285888672, + 117.17343139648438, + 124.54205322265625 + ], + "bp_grad_norms_per_sample_med": [ + 4.4490061554824933e-05, + 4.3751915654866025e-05, + 4.270448334864341e-05, + 4.182140401098877e-05, + 4.151134271523915e-05 + ], + "bp_grad_norms_F": [ + 0.0019047901732847095, + 0.0017693191766738892, + 0.0016821600729599595, + 0.0016251102788373828, + 0.0015800207620486617 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4697265625, + "loss_eval": 1.4416429996490479, + "epoch": 3 + }, + { + "hidden_norms": [ + 125.09136199951172, + 126.65565490722656, + 128.4573974609375, + 130.39990234375, + 138.1091766357422 + ], + "bp_grad_norms_per_sample_med": [ + 4.1048842831514776e-05, + 4.0168823034036905e-05, + 3.916600326192565e-05, + 3.953508348786272e-05, + 3.938759255106561e-05 + ], + "bp_grad_norms_F": [ + 0.0017511667683720589, + 0.001639657886698842, + 0.0015659942291676998, + 0.0015107291983440518, + 0.0014574137749150395 + ], + "gamma_dfa": NaN, + "acc_eval": 0.50390625, + "loss_eval": 1.3718887567520142, + "epoch": 4 + }, + { + "hidden_norms": [ + 139.76705932617188, + 139.05606079101562, + 139.5422821044922, + 141.0078582763672, + 148.9493865966797 + ], + "bp_grad_norms_per_sample_med": [ + 3.957379158237018e-05, + 4.0101109334500507e-05, + 3.9158370782388374e-05, + 3.927717261831276e-05, + 3.796629243879579e-05 + ], + "bp_grad_norms_F": [ + 0.0017042789841070771, + 0.001630594371818006, + 0.0015700262738391757, + 0.0015037605771794915, + 0.0014294973807409406 + ], + "gamma_dfa": NaN, + "acc_eval": 0.498046875, + "loss_eval": 1.367867112159729, + "epoch": 5 + }, + { + "hidden_norms": [ + 147.73207092285156, + 148.01638793945312, + 148.1798553466797, + 149.07754516601562, + 156.61810302734375 + ], + "bp_grad_norms_per_sample_med": [ + 3.987981835962273e-05, + 3.9670325350016356e-05, + 3.970034231315367e-05, + 3.8273319660220295e-05, + 3.6929654015693814e-05 + ], + "bp_grad_norms_F": [ + 0.0017687880899757147, + 0.001693942816928029, + 0.0016310750506818295, + 0.0015193652361631393, + 0.0014129421906545758 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5234375, + "loss_eval": 1.3461639881134033, + "epoch": 6 + }, + { + "hidden_norms": [ + 159.30731201171875, + 158.4180450439453, + 158.36903381347656, + 158.61819458007812, + 165.9392547607422 + ], + "bp_grad_norms_per_sample_med": [ + 3.744649075088091e-05, + 3.805281448876485e-05, + 3.727989678736776e-05, + 3.5814937291434035e-05, + 3.422912777750753e-05 + ], + "bp_grad_norms_F": [ + 0.0017357978504151106, + 0.0016663926653563976, + 0.0016097063198685646, + 0.0014966910239309072, + 0.001379394088871777 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5283203125, + "loss_eval": 1.3227663040161133, + "epoch": 7 + }, + { + "hidden_norms": [ + 171.02230834960938, + 169.76348876953125, + 168.44949340820312, + 168.26429748535156, + 176.89520263671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.716369246831164e-05, + 3.8349648093571886e-05, + 3.801397542702034e-05, + 3.6082456063013524e-05, + 3.359258334967308e-05 + ], + "bp_grad_norms_F": [ + 0.0016445739893242717, + 0.001604317338205874, + 0.0015634173760190606, + 0.0014586447505280375, + 0.0013399318559095263 + ], + "gamma_dfa": NaN, + "acc_eval": 0.541015625, + "loss_eval": 1.2933616638183594, + "epoch": 8 + }, + { + "hidden_norms": [ + 177.41796875, + 177.29603576660156, + 175.89486694335938, + 175.0777587890625, + 181.38400268554688 + ], + "bp_grad_norms_per_sample_med": [ + 3.602267679525539e-05, + 3.6796918720938265e-05, + 3.648500933195464e-05, + 3.566688246792182e-05, + 3.4070406400132924e-05 + ], + "bp_grad_norms_F": [ + 0.0015903833555057645, + 0.0015696624759584665, + 0.0015270623844116926, + 0.0014402325032278895, + 0.0013178731314837933 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5478515625, + "loss_eval": 1.2806801795959473, + "epoch": 9 + }, + { + "hidden_norms": [ + 187.4056854248047, + 186.72698974609375, + 186.21583557128906, + 185.0518035888672, + 193.2371063232422 + ], + "bp_grad_norms_per_sample_med": [ + 3.3276784961344674e-05, + 3.436602492001839e-05, + 3.432494486332871e-05, + 3.371347702341154e-05, + 3.1834206311032176e-05 + ], + "bp_grad_norms_F": [ + 0.0014970082556828856, + 0.0014613966923207045, + 0.001435543643310666, + 0.001374539453536272, + 0.0012561712646856904 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2740942239761353, + "epoch": 10 + }, + { + "hidden_norms": [ + 194.4965057373047, + 191.25531005859375, + 189.80703735351562, + 188.18850708007812, + 195.7776336669922 + ], + "bp_grad_norms_per_sample_med": [ + 3.298965748399496e-05, + 3.40789083566051e-05, + 3.381206624908373e-05, + 3.3352327591273934e-05, + 3.1442876206710935e-05 + ], + "bp_grad_norms_F": [ + 0.0015152172418311238, + 0.001501554623246193, + 0.0014814225723966956, + 0.001403055852279067, + 0.001272345893085003 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.265188455581665, + "epoch": 11 + }, + { + "hidden_norms": [ + 200.5504913330078, + 197.28366088867188, + 195.27011108398438, + 192.64669799804688, + 200.8507843017578 + ], + "bp_grad_norms_per_sample_med": [ + 3.453825775068253e-05, + 3.5414250305620953e-05, + 3.575523442123085e-05, + 3.455601472523995e-05, + 3.2858857593964785e-05 + ], + "bp_grad_norms_F": [ + 0.001518857548944652, + 0.001502488274127245, + 0.0014838415663689375, + 0.001404650043696165, + 0.0012748484732583165 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5458984375, + "loss_eval": 1.2733395099639893, + "epoch": 12 + }, + { + "hidden_norms": [ + 207.21469116210938, + 202.24969482421875, + 198.8241424560547, + 197.5497283935547, + 207.32147216796875 + ], + "bp_grad_norms_per_sample_med": [ + 3.2123080018209293e-05, + 3.345572258695029e-05, + 3.3888838515849784e-05, + 3.344774086144753e-05, + 3.095310239586979e-05 + ], + "bp_grad_norms_F": [ + 0.0014620382571592927, + 0.0014708929229527712, + 0.0014657732099294662, + 0.0013834136771038175, + 0.0012381445849314332 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2357412576675415, + "epoch": 13 + }, + { + "hidden_norms": [ + 214.6268310546875, + 208.3655242919922, + 205.5032501220703, + 202.8442840576172, + 211.64646911621094 + ], + "bp_grad_norms_per_sample_med": [ + 3.207657573511824e-05, + 3.362155257491395e-05, + 3.38435493176803e-05, + 3.330525942146778e-05, + 3.142434434266761e-05 + ], + "bp_grad_norms_F": [ + 0.0014900992391631007, + 0.0015044353203848004, + 0.001489310641773045, + 0.0014063691487535834, + 0.0012448005145415664 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2451550960540771, + "epoch": 14 + }, + { + "hidden_norms": [ + 220.40109252929688, + 213.53439331054688, + 209.3384552001953, + 206.62062072753906, + 213.82391357421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.227095294278115e-05, + 3.415472019696608e-05, + 3.4918764868052676e-05, + 3.409514465602115e-05, + 3.082074908888899e-05 + ], + "bp_grad_norms_F": [ + 0.0015189005061984062, + 0.001544533297419548, + 0.0015320393722504377, + 0.0014468894805759192, + 0.0012609416153281927 + ], + "gamma_dfa": NaN, + "acc_eval": 0.564453125, + "loss_eval": 1.248854398727417, + "epoch": 15 + }, + { + "hidden_norms": [ + 226.32350158691406, + 219.70506286621094, + 213.84132385253906, + 210.67050170898438, + 219.11776733398438 + ], + "bp_grad_norms_per_sample_med": [ + 3.360298796906136e-05, + 3.4720324038062245e-05, + 3.473780452623032e-05, + 3.412307341932319e-05, + 3.0327399144880474e-05 + ], + "bp_grad_norms_F": [ + 0.0014919604873284698, + 0.0015073713148012757, + 0.001499581034295261, + 0.001411686884239316, + 0.0012323390692472458 + ], + "gamma_dfa": NaN, + "acc_eval": 0.57421875, + "loss_eval": 1.2207037210464478, + "epoch": 16 + }, + { + "hidden_norms": [ + 230.78538513183594, + 223.432373046875, + 216.73037719726562, + 212.86383056640625, + 220.8701171875 + ], + "bp_grad_norms_per_sample_med": [ + 3.253064278396778e-05, + 3.3939610148081556e-05, + 3.490943709039129e-05, + 3.4084565413650125e-05, + 3.0307599445222877e-05 + ], + "bp_grad_norms_F": [ + 0.0015068502398207784, + 0.0015421892749145627, + 0.0015326113207265735, + 0.0014369196724146605, + 0.0012492147507146 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.216906189918518, + "epoch": 17 + }, + { + "hidden_norms": [ + 234.5084991455078, + 225.73875427246094, + 219.08822631835938, + 214.42320251464844, + 222.92369079589844 + ], + "bp_grad_norms_per_sample_med": [ + 3.451363227213733e-05, + 3.6047003959538415e-05, + 3.654924512375146e-05, + 3.617065158323385e-05, + 3.275999551988207e-05 + ], + "bp_grad_norms_F": [ + 0.001566705177538097, + 0.0015968933003023267, + 0.0015981856267899275, + 0.0014931216137483716, + 0.0012800253462046385 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5556640625, + "loss_eval": 1.2483153343200684, + "epoch": 18 + }, + { + "hidden_norms": [ + 238.0281219482422, + 229.677734375, + 223.0265350341797, + 217.872314453125, + 225.45947265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.4922632039524615e-05, + 3.6500507121672854e-05, + 3.762893902603537e-05, + 3.615105015342124e-05, + 3.2680742151569575e-05 + ], + "bp_grad_norms_F": [ + 0.0015319561352953315, + 0.001577642629854381, + 0.001574998372234404, + 0.0014754259027540684, + 0.0012637749314308167 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5576171875, + "loss_eval": 1.2469550371170044, + "epoch": 19 + }, + { + "hidden_norms": [ + 241.45298767089844, + 233.28753662109375, + 226.9265899658203, + 222.43453979492188, + 229.83859252929688 + ], + "bp_grad_norms_per_sample_med": [ + 3.368386751390062e-05, + 3.570445187506266e-05, + 3.622082658694126e-05, + 3.5024619137402624e-05, + 3.180970816174522e-05 + ], + "bp_grad_norms_F": [ + 0.0015120706520974636, + 0.0015433274675160646, + 0.0015402185963466763, + 0.0014465245185419917, + 0.001252179266884923 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5634765625, + "loss_eval": 1.2113828659057617, + "epoch": 20 + }, + { + "hidden_norms": [ + 246.53602600097656, + 236.25527954101562, + 231.07940673828125, + 227.7357940673828, + 235.99017333984375 + ], + "bp_grad_norms_per_sample_med": [ + 3.2015348551794887e-05, + 3.388321783859283e-05, + 3.521092003211379e-05, + 3.46749002346769e-05, + 3.079533780692145e-05 + ], + "bp_grad_norms_F": [ + 0.0014757646713405848, + 0.001517578144557774, + 0.0015156606677919626, + 0.00144051609095186, + 0.0012491638772189617 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.2042850255966187, + "epoch": 21 + }, + { + "hidden_norms": [ + 250.74209594726562, + 241.11993408203125, + 232.76829528808594, + 228.410400390625, + 237.100341796875 + ], + "bp_grad_norms_per_sample_med": [ + 3.173810910084285e-05, + 3.328004459035583e-05, + 3.405071402085014e-05, + 3.34872274834197e-05, + 3.07901827909518e-05 + ], + "bp_grad_norms_F": [ + 0.0014801323413848877, + 0.0015176001470535994, + 0.0015198889886960387, + 0.0014302636263892055, + 0.001232756651006639 + ], + "gamma_dfa": NaN, + "acc_eval": 0.587890625, + "loss_eval": 1.1819555759429932, + "epoch": 22 + }, + { + "hidden_norms": [ + 251.96310424804688, + 242.98260498046875, + 235.83056640625, + 229.86978149414062, + 238.271240234375 + ], + "bp_grad_norms_per_sample_med": [ + 3.078249574173242e-05, + 3.301461765659042e-05, + 3.3559550502104685e-05, + 3.2682331948308274e-05, + 2.9418402846204117e-05 + ], + "bp_grad_norms_F": [ + 0.00149905972648412, + 0.0015357647789642215, + 0.0015457755653187633, + 0.0014610268408432603, + 0.0012446421897038817 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5732421875, + "loss_eval": 1.1770297288894653, + "epoch": 23 + }, + { + "hidden_norms": [ + 255.878662109375, + 244.79376220703125, + 236.5006561279297, + 233.29434204101562, + 239.50732421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.191530049662106e-05, + 3.370656486367807e-05, + 3.539594035828486e-05, + 3.486185596557334e-05, + 3.131559424218722e-05 + ], + "bp_grad_norms_F": [ + 0.001507170731201768, + 0.0015490618534386158, + 0.0015714912442490458, + 0.0014840371441096067, + 0.0012607484823092818 + ], + "gamma_dfa": NaN, + "acc_eval": 0.572265625, + "loss_eval": 1.2011631727218628, + "epoch": 24 + }, + { + "hidden_norms": [ + 256.66448974609375, + 244.18772888183594, + 236.46058654785156, + 231.88583374023438, + 238.06246948242188 + ], + "bp_grad_norms_per_sample_med": [ + 3.2962809200398624e-05, + 3.441200897214003e-05, + 3.570063927327283e-05, + 3.488562651909888e-05, + 3.0770879675401375e-05 + ], + "bp_grad_norms_F": [ + 0.0015825299778953195, + 0.0016350955702364445, + 0.0016404123743996024, + 0.0015316286589950323, + 0.0012829666957259178 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5703125, + "loss_eval": 1.192138433456421, + "epoch": 25 + }, + { + "hidden_norms": [ + 259.5942687988281, + 247.43173217773438, + 239.85533142089844, + 233.21835327148438, + 241.53346252441406 + ], + "bp_grad_norms_per_sample_med": [ + 3.1691903132013977e-05, + 3.34988217218779e-05, + 3.45351618307177e-05, + 3.441058288444765e-05, + 3.0752617021789774e-05 + ], + "bp_grad_norms_F": [ + 0.0015797498635947704, + 0.0016322932206094265, + 0.001641901326365769, + 0.0015325341373682022, + 0.0012732355389744043 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5791015625, + "loss_eval": 1.1775751113891602, + "epoch": 26 + }, + { + "hidden_norms": [ + 260.6902770996094, + 249.26528930664062, + 240.86239624023438, + 235.91477966308594, + 242.1553497314453 + ], + "bp_grad_norms_per_sample_med": [ + 3.32598174281884e-05, + 3.471180752967484e-05, + 3.609888517530635e-05, + 3.496996214380488e-05, + 3.091244798270054e-05 + ], + "bp_grad_norms_F": [ + 0.0015408779727295041, + 0.001589508610777557, + 0.0016157848294824362, + 0.0015165223740041256, + 0.0012689991854131222 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5859375, + "loss_eval": 1.1941479444503784, + "epoch": 27 + }, + { + "hidden_norms": [ + 265.0726623535156, + 253.6020050048828, + 244.876953125, + 239.7056427001953, + 248.2157440185547 + ], + "bp_grad_norms_per_sample_med": [ + 3.255613773944788e-05, + 3.457435013842769e-05, + 3.5964570997748524e-05, + 3.529110108502209e-05, + 3.089939127676189e-05 + ], + "bp_grad_norms_F": [ + 0.001513357157818973, + 0.0015594394644722342, + 0.0015772230690345168, + 0.001489063142798841, + 0.0012491336092352867 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5810546875, + "loss_eval": 1.1790356636047363, + "epoch": 28 + }, + { + "hidden_norms": [ + 266.9394836425781, + 253.8067169189453, + 243.13002014160156, + 236.81365966796875, + 245.42434692382812 + ], + "bp_grad_norms_per_sample_med": [ + 3.378500332473777e-05, + 3.5516346542863175e-05, + 3.742165063158609e-05, + 3.6865043512079865e-05, + 3.170729542034678e-05 + ], + "bp_grad_norms_F": [ + 0.0015557212755084038, + 0.0016067115357145667, + 0.001632526982575655, + 0.0015416526002809405, + 0.0012708577560260892 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.1785690784454346, + "epoch": 29 + }, + { + "hidden_norms": [ + 271.3736572265625, + 257.6708984375, + 246.3377685546875, + 240.7875213623047, + 248.55162048339844 + ], + "bp_grad_norms_per_sample_med": [ + 3.2452040613861755e-05, + 3.456772174104117e-05, + 3.550515975803137e-05, + 3.530189496814273e-05, + 3.098960587522015e-05 + ], + "bp_grad_norms_F": [ + 0.0015420741401612759, + 0.0016120158834382892, + 0.0016289768973365426, + 0.0015373170608654618, + 0.0012695658951997757 + ], + "gamma_dfa": NaN, + "acc_eval": 0.57421875, + "loss_eval": 1.1686367988586426, + "epoch": 30 + }, + { + "hidden_norms": [ + 270.6155090332031, + 256.5137634277344, + 246.4404296875, + 238.71493530273438, + 245.14651489257812 + ], + "bp_grad_norms_per_sample_med": [ + 3.4225693525513634e-05, + 3.6208981327945367e-05, + 3.771808042074554e-05, + 3.671547892736271e-05, + 3.175914389430545e-05 + ], + "bp_grad_norms_F": [ + 0.0016278985422104597, + 0.00169221474789083, + 0.0017131771892309189, + 0.0016123101813718677, + 0.001308745937421918 + ], + "gamma_dfa": NaN, + "acc_eval": 0.572265625, + "loss_eval": 1.1706045866012573, + "epoch": 31 + }, + { + "hidden_norms": [ + 271.2703552246094, + 258.5479431152344, + 247.48568725585938, + 241.0449676513672, + 248.61419677734375 + ], + "bp_grad_norms_per_sample_med": [ + 3.370125705259852e-05, + 3.563391510397196e-05, + 3.776583253056742e-05, + 3.622193253249861e-05, + 3.1177536584436893e-05 + ], + "bp_grad_norms_F": [ + 0.001631051884032786, + 0.0016799280419945717, + 0.0016939701745286584, + 0.001596588990651071, + 0.0012989162933081388 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.1757416725158691, + "epoch": 32 + }, + { + "hidden_norms": [ + 271.5987854003906, + 257.3157043457031, + 247.04425048828125, + 239.22933959960938, + 247.08534240722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.276485949754715e-05, + 3.4356282412773e-05, + 3.570897752069868e-05, + 3.5391843994148076e-05, + 3.004215977853164e-05 + ], + "bp_grad_norms_F": [ + 0.0015858211554586887, + 0.0016445693327113986, + 0.0016775003168731928, + 0.0015801271656528115, + 0.0012829708866775036 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5947265625, + "loss_eval": 1.1316245794296265, + "epoch": 33 + }, + { + "hidden_norms": [ + 276.85565185546875, + 262.14959716796875, + 248.80125427246094, + 239.6945037841797, + 246.55982971191406 + ], + "bp_grad_norms_per_sample_med": [ + 3.424682654440403e-05, + 3.617212496465072e-05, + 3.731884135049768e-05, + 3.583814759622328e-05, + 3.1317249522544444e-05 + ], + "bp_grad_norms_F": [ + 0.001694253645837307, + 0.0017545269802212715, + 0.0017868074355646968, + 0.0016729168128222227, + 0.0013285611057654023 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.1637687683105469, + "epoch": 34 + }, + { + "hidden_norms": [ + 274.4824523925781, + 260.23223876953125, + 249.41390991210938, + 242.22657775878906, + 248.33303833007812 + ], + "bp_grad_norms_per_sample_med": [ + 3.4118878829758614e-05, + 3.6190944229019806e-05, + 3.7162455555517226e-05, + 3.6398294469108805e-05, + 3.1276995287043974e-05 + ], + "bp_grad_norms_F": [ + 0.0016947221010923386, + 0.0017584856832399964, + 0.0017846780829131603, + 0.0016663862625136971, + 0.0013457784662023187 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5830078125, + "loss_eval": 1.1625440120697021, + "epoch": 35 + }, + { + "hidden_norms": [ + 279.3048095703125, + 263.830810546875, + 250.07839965820312, + 242.9677276611328, + 248.742431640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.378376641194336e-05, + 3.623673183028586e-05, + 3.8036723708501086e-05, + 3.8026879337849095e-05, + 3.20856343023479e-05 + ], + "bp_grad_norms_F": [ + 0.0016582749085500836, + 0.001725532696582377, + 0.0017548021860420704, + 0.0016622358234599233, + 0.0013314742827787995 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58203125, + "loss_eval": 1.1663323640823364, + "epoch": 36 + }, + { + "hidden_norms": [ + 277.88153076171875, + 263.3263244628906, + 254.0471954345703, + 246.00294494628906, + 251.6592559814453 + ], + "bp_grad_norms_per_sample_med": [ + 3.402382935746573e-05, + 3.644815296866e-05, + 3.812061549979262e-05, + 3.8299189327517524e-05, + 3.244871550123207e-05 + ], + "bp_grad_norms_F": [ + 0.0016575837507843971, + 0.001726161572150886, + 0.0017651193775236607, + 0.001658888068050146, + 0.001325216144323349 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5849609375, + "loss_eval": 1.1578618288040161, + "epoch": 37 + }, + { + "hidden_norms": [ + 278.96038818359375, + 264.09832763671875, + 252.11532592773438, + 243.7300567626953, + 250.29537963867188 + ], + "bp_grad_norms_per_sample_med": [ + 3.398891203687526e-05, + 3.60828016710002e-05, + 3.8209349440876395e-05, + 3.6874149373034015e-05, + 3.130899858660996e-05 + ], + "bp_grad_norms_F": [ + 0.0016938851913437247, + 0.0017578925471752882, + 0.0017999019473791122, + 0.0016839306335896254, + 0.0013463495997712016 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1660709381103516, + "epoch": 38 + }, + { + "hidden_norms": [ + 279.11102294921875, + 262.8247375488281, + 250.32635498046875, + 241.73477172851562, + 246.8911590576172 + ], + "bp_grad_norms_per_sample_med": [ + 3.476023630355485e-05, + 3.673156606964767e-05, + 3.8200654671527445e-05, + 3.745179856196046e-05, + 3.111823389190249e-05 + ], + "bp_grad_norms_F": [ + 0.0017367384862154722, + 0.001807119813747704, + 0.0018404393922537565, + 0.0017188042402267456, + 0.0013523433590307832 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.1548914909362793, + "epoch": 39 + }, + { + "hidden_norms": [ + 278.79083251953125, + 263.49237060546875, + 252.0679931640625, + 243.65948486328125, + 249.34564208984375 + ], + "bp_grad_norms_per_sample_med": [ + 3.3709933632053435e-05, + 3.595885937102139e-05, + 3.795271186390892e-05, + 3.70899579138495e-05, + 3.1362116715172306e-05 + ], + "bp_grad_norms_F": [ + 0.0017184949247166514, + 0.0017862631939351559, + 0.0018348938319832087, + 0.0017180118011310697, + 0.0013606568099930882 + ], + "gamma_dfa": NaN, + "acc_eval": 0.591796875, + "loss_eval": 1.159794569015503, + "epoch": 40 + }, + { + "hidden_norms": [ + 281.3595886230469, + 263.4467468261719, + 250.73536682128906, + 243.140380859375, + 247.22425842285156 + ], + "bp_grad_norms_per_sample_med": [ + 3.411353100091219e-05, + 3.656598346424289e-05, + 3.8585232687182724e-05, + 3.752345946850255e-05, + 3.1474613933824e-05 + ], + "bp_grad_norms_F": [ + 0.0017623946769163013, + 0.0018276257906109095, + 0.0018694576574489474, + 0.0017436364432796836, + 0.0013814391568303108 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.153226375579834, + "epoch": 41 + }, + { + "hidden_norms": [ + 279.79888916015625, + 263.5989685058594, + 252.2397918701172, + 243.49703979492188, + 248.86973571777344 + ], + "bp_grad_norms_per_sample_med": [ + 3.528413435560651e-05, + 3.805026790359989e-05, + 4.0152310248231515e-05, + 3.962377377320081e-05, + 3.250985173508525e-05 + ], + "bp_grad_norms_F": [ + 0.0017320383340120316, + 0.0018105976050719619, + 0.001847731531597674, + 0.0017405269900336862, + 0.0013762396993115544 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.1387929916381836, + "epoch": 42 + }, + { + "hidden_norms": [ + 280.80633544921875, + 263.2684326171875, + 251.36338806152344, + 242.25201416015625, + 245.46954345703125 + ], + "bp_grad_norms_per_sample_med": [ + 3.463789835222997e-05, + 3.694587940117344e-05, + 3.909278166247532e-05, + 3.8173999200807884e-05, + 3.152083809254691e-05 + ], + "bp_grad_norms_F": [ + 0.001763346022926271, + 0.0018382675480097532, + 0.0018745084526017308, + 0.0017674838891252875, + 0.0013920797500759363 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1115086078643799, + "epoch": 43 + }, + { + "hidden_norms": [ + 278.4877624511719, + 261.4671630859375, + 247.66079711914062, + 240.21690368652344, + 244.1111602783203 + ], + "bp_grad_norms_per_sample_med": [ + 3.559369361028075e-05, + 3.895946065313183e-05, + 4.048463233630173e-05, + 3.892362292390317e-05, + 3.229418143746443e-05 + ], + "bp_grad_norms_F": [ + 0.0018469772767275572, + 0.0019197544315829873, + 0.001963041489943862, + 0.0018302135867998004, + 0.001429378753527999 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.16768217086792, + "epoch": 44 + }, + { + "hidden_norms": [ + 280.8171691894531, + 263.16705322265625, + 251.45835876464844, + 243.88563537597656, + 246.92945861816406 + ], + "bp_grad_norms_per_sample_med": [ + 3.3486583561170846e-05, + 3.533214839990251e-05, + 3.789112452068366e-05, + 3.651758743217215e-05, + 3.081141403526999e-05 + ], + "bp_grad_norms_F": [ + 0.0017694556154310703, + 0.0018461478175595403, + 0.0018877091351896524, + 0.001781664090231061, + 0.0014001834206283092 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1236202716827393, + "epoch": 45 + }, + { + "hidden_norms": [ + 280.0203552246094, + 261.3996887207031, + 248.5751953125, + 240.40728759765625, + 243.84178161621094 + ], + "bp_grad_norms_per_sample_med": [ + 3.66695094271563e-05, + 3.912827742169611e-05, + 4.0782215364743024e-05, + 3.97856165363919e-05, + 3.258495053160004e-05 + ], + "bp_grad_norms_F": [ + 0.0018954386468976736, + 0.0019765326287597418, + 0.0020179273560643196, + 0.0018787897424772382, + 0.0014408754650503397 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5947265625, + "loss_eval": 1.142503261566162, + "epoch": 46 + }, + { + "hidden_norms": [ + 278.37445068359375, + 260.7147521972656, + 247.63418579101562, + 239.64564514160156, + 241.75396728515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.824803570751101e-05, + 4.062152947881259e-05, + 4.1070070437854156e-05, + 4.01996003347449e-05, + 3.288290827185847e-05 + ], + "bp_grad_norms_F": [ + 0.001872657099738717, + 0.0019627343863248825, + 0.002008425537496805, + 0.0018816223600879312, + 0.001456336583942175 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6064453125, + "loss_eval": 1.137413740158081, + "epoch": 47 + }, + { + "hidden_norms": [ + 281.14813232421875, + 263.6340637207031, + 250.13082885742188, + 242.0965118408203, + 244.81060791015625 + ], + "bp_grad_norms_per_sample_med": [ + 3.531872062012553e-05, + 3.7883237382629886e-05, + 4.0227863792097196e-05, + 3.96844552597031e-05, + 3.296942304586992e-05 + ], + "bp_grad_norms_F": [ + 0.0018434273079037666, + 0.0019304269226267934, + 0.0019746439065784216, + 0.0018603875068947673, + 0.0014465745771303773 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.1396205425262451, + "epoch": 48 + }, + { + "hidden_norms": [ + 281.31280517578125, + 262.5829772949219, + 247.9232940673828, + 239.8461456298828, + 242.20977783203125 + ], + "bp_grad_norms_per_sample_med": [ + 3.71285859728232e-05, + 3.963968629250303e-05, + 4.135111521463841e-05, + 4.0518349123885855e-05, + 3.323471173644066e-05 + ], + "bp_grad_norms_F": [ + 0.00189371092710644, + 0.0019808171782642603, + 0.002019244944676757, + 0.001904282602481544, + 0.0014800610952079296 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1411675214767456, + "epoch": 49 + }, + { + "hidden_norms": [ + 278.64208984375, + 260.1700744628906, + 246.7251434326172, + 239.43145751953125, + 240.350830078125 + ], + "bp_grad_norms_per_sample_med": [ + 3.6054647353012115e-05, + 3.858766285702586e-05, + 4.05439204769209e-05, + 4.046479079988785e-05, + 3.3791853638831526e-05 + ], + "bp_grad_norms_F": [ + 0.0018870895728468895, + 0.00198533502407372, + 0.0020502021070569754, + 0.001929490827023983, + 0.0014933926286175847 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1310430765151978, + "epoch": 50 + }, + { + "hidden_norms": [ + 281.7696533203125, + 261.5150451660156, + 247.67295837402344, + 239.7654266357422, + 240.27789306640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.671262675197795e-05, + 3.92102992918808e-05, + 4.1406125092180446e-05, + 4.029196497867815e-05, + 3.32514064211864e-05 + ], + "bp_grad_norms_F": [ + 0.001880357856862247, + 0.001981948269531131, + 0.0020440546795725822, + 0.0019350070506334305, + 0.0014877711655572057 + ], + "gamma_dfa": NaN, + "acc_eval": 0.60546875, + "loss_eval": 1.1188440322875977, + "epoch": 51 + }, + { + "hidden_norms": [ + 279.01318359375, + 259.6091003417969, + 244.6603240966797, + 235.1455535888672, + 237.438232421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.0185608668252826e-05, + 4.309232099330984e-05, + 4.5118234993424267e-05, + 4.371534669189714e-05, + 3.5620210837805644e-05 + ], + "bp_grad_norms_F": [ + 0.0020104716531932354, + 0.002107330597937107, + 0.002167000202462077, + 0.0020260754972696304, + 0.0015411453787237406 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.1525764465332031, + "epoch": 52 + }, + { + "hidden_norms": [ + 278.2245178222656, + 257.14617919921875, + 243.9732666015625, + 234.4013214111328, + 236.68521118164062 + ], + "bp_grad_norms_per_sample_med": [ + 3.85418206860777e-05, + 4.142443503951654e-05, + 4.363177140476182e-05, + 4.2996281990781426e-05, + 3.424972965149209e-05 + ], + "bp_grad_norms_F": [ + 0.0020445864647626877, + 0.002142493613064289, + 0.0022005243226885796, + 0.002054274780675769, + 0.0015541499014943838 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59765625, + "loss_eval": 1.162191390991211, + "epoch": 53 + }, + { + "hidden_norms": [ + 278.7825622558594, + 258.4292297363281, + 243.01690673828125, + 234.15765380859375, + 235.1446533203125 + ], + "bp_grad_norms_per_sample_med": [ + 3.855194881907664e-05, + 4.1293307731393725e-05, + 4.296215047361329e-05, + 4.1900369978975505e-05, + 3.372962964931503e-05 + ], + "bp_grad_norms_F": [ + 0.002041360829025507, + 0.0021457262337207794, + 0.0021996963769197464, + 0.0020641626324504614, + 0.001561368815600872 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.130479335784912, + "epoch": 54 + }, + { + "hidden_norms": [ + 275.3794860839844, + 256.83026123046875, + 242.16006469726562, + 231.49655151367188, + 232.30279541015625 + ], + "bp_grad_norms_per_sample_med": [ + 4.011294731753878e-05, + 4.240096313878894e-05, + 4.396942676976323e-05, + 4.347893627709709e-05, + 3.485888009890914e-05 + ], + "bp_grad_norms_F": [ + 0.0021268154960125685, + 0.002230642130598426, + 0.0022892621345818043, + 0.002145433332771063, + 0.0016037407331168652 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6005859375, + "loss_eval": 1.1599653959274292, + "epoch": 55 + }, + { + "hidden_norms": [ + 277.5028076171875, + 257.1715087890625, + 241.6505584716797, + 234.09323120117188, + 233.63377380371094 + ], + "bp_grad_norms_per_sample_med": [ + 3.876453047269024e-05, + 4.156330396654084e-05, + 4.3727923184633255e-05, + 4.2131912778131664e-05, + 3.510245369398035e-05 + ], + "bp_grad_norms_F": [ + 0.002074806485325098, + 0.002173666376620531, + 0.002245684852823615, + 0.0021073734387755394, + 0.0015908328350633383 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.144984245300293, + "epoch": 56 + }, + { + "hidden_norms": [ + 276.0826416015625, + 255.17193603515625, + 239.51519775390625, + 231.28643798828125, + 230.85292053222656 + ], + "bp_grad_norms_per_sample_med": [ + 3.960869798902422e-05, + 4.2907246097456664e-05, + 4.45116929768119e-05, + 4.3612952140392736e-05, + 3.500159073155373e-05 + ], + "bp_grad_norms_F": [ + 0.0021277335472404957, + 0.0022348251659423113, + 0.0022981096990406513, + 0.002155488822609186, + 0.001618923619389534 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1534931659698486, + "epoch": 57 + }, + { + "hidden_norms": [ + 275.6867370605469, + 254.65744018554688, + 238.1124267578125, + 229.36215209960938, + 227.90867614746094 + ], + "bp_grad_norms_per_sample_med": [ + 3.966662916354835e-05, + 4.33680324931629e-05, + 4.5270633563632146e-05, + 4.528860517893918e-05, + 3.5298704460728914e-05 + ], + "bp_grad_norms_F": [ + 0.002194908680394292, + 0.002305977512151003, + 0.0023776311427354813, + 0.002223761286586523, + 0.001651395345106721 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1494864225387573, + "epoch": 58 + }, + { + "hidden_norms": [ + 274.8414306640625, + 253.18215942382812, + 238.03150939941406, + 228.1765594482422, + 229.46058654785156 + ], + "bp_grad_norms_per_sample_med": [ + 4.132632238906808e-05, + 4.4773249101126567e-05, + 4.6669130824739113e-05, + 4.591346441884525e-05, + 3.6523833841783926e-05 + ], + "bp_grad_norms_F": [ + 0.0022293017245829105, + 0.002341218525543809, + 0.002405093051493168, + 0.0022504546213895082, + 0.0016715668607503176 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5927734375, + "loss_eval": 1.1698435544967651, + "epoch": 59 + }, + { + "hidden_norms": [ + 273.4884338378906, + 251.2228240966797, + 236.2550048828125, + 226.7325439453125, + 225.68386840820312 + ], + "bp_grad_norms_per_sample_med": [ + 4.192883352516219e-05, + 4.3471976823639125e-05, + 4.7195244405884296e-05, + 4.490713035920635e-05, + 3.646116965683177e-05 + ], + "bp_grad_norms_F": [ + 0.0022312228102236986, + 0.002349371323361993, + 0.0024164437782019377, + 0.002271530916914344, + 0.0016918154433369637 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1560128927230835, + "epoch": 60 + }, + { + "hidden_norms": [ + 273.4084777832031, + 250.5165557861328, + 236.19557189941406, + 227.0643768310547, + 226.594970703125 + ], + "bp_grad_norms_per_sample_med": [ + 4.2211744585074484e-05, + 4.488111881073564e-05, + 4.760283627547324e-05, + 4.589638047036715e-05, + 3.658623973024078e-05 + ], + "bp_grad_norms_F": [ + 0.0022313676308840513, + 0.002337696962058544, + 0.0024093035608530045, + 0.002264693146571517, + 0.0016880000475794077 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6044921875, + "loss_eval": 1.1498074531555176, + "epoch": 61 + }, + { + "hidden_norms": [ + 273.1318664550781, + 249.35223388671875, + 234.15737915039062, + 223.48074340820312, + 223.0059356689453 + ], + "bp_grad_norms_per_sample_med": [ + 4.4729218643624336e-05, + 4.768320650327951e-05, + 4.822494520340115e-05, + 4.791786341229454e-05, + 3.7625926779583097e-05 + ], + "bp_grad_norms_F": [ + 0.0023362624924629927, + 0.0024679312482476234, + 0.0025367215275764465, + 0.0023599599953740835, + 0.0017239096341654658 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.1377537250518799, + "epoch": 62 + }, + { + "hidden_norms": [ + 270.9543762207031, + 249.6943817138672, + 234.0796356201172, + 223.80093383789062, + 222.75062561035156 + ], + "bp_grad_norms_per_sample_med": [ + 4.4321575842332095e-05, + 4.7786033974261954e-05, + 4.9388974730391055e-05, + 4.749266372527927e-05, + 3.7502803024835885e-05 + ], + "bp_grad_norms_F": [ + 0.0023458057548850775, + 0.0024719720240682364, + 0.0025427823420614004, + 0.0023789280094206333, + 0.0017488099401816726 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1472076177597046, + "epoch": 63 + }, + { + "hidden_norms": [ + 270.6864318847656, + 249.71315002441406, + 233.9838409423828, + 223.17515563964844, + 222.17759704589844 + ], + "bp_grad_norms_per_sample_med": [ + 4.36245281889569e-05, + 4.725098915514536e-05, + 4.936556069878861e-05, + 4.7286572225857526e-05, + 3.7781614082632586e-05 + ], + "bp_grad_norms_F": [ + 0.0023510511964559555, + 0.0024691869039088488, + 0.0025394195690751076, + 0.0023858139757066965, + 0.0017493697814643383 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1437795162200928, + "epoch": 64 + }, + { + "hidden_norms": [ + 269.1813659667969, + 247.57632446289062, + 231.57135009765625, + 220.31541442871094, + 220.33135986328125 + ], + "bp_grad_norms_per_sample_med": [ + 4.363871266832575e-05, + 4.776224886882119e-05, + 4.8712514399085194e-05, + 4.777491994900629e-05, + 3.733497578650713e-05 + ], + "bp_grad_norms_F": [ + 0.0023870510049164295, + 0.0025214161723852158, + 0.0025991688016802073, + 0.0024342697579413652, + 0.0017686353530734777 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6123046875, + "loss_eval": 1.138253927230835, + "epoch": 65 + }, + { + "hidden_norms": [ + 268.92877197265625, + 245.84384155273438, + 230.63307189941406, + 220.8726806640625, + 219.60350036621094 + ], + "bp_grad_norms_per_sample_med": [ + 4.505042306846008e-05, + 4.780786548508331e-05, + 5.067480378784239e-05, + 4.878537220065482e-05, + 3.842872683890164e-05 + ], + "bp_grad_norms_F": [ + 0.00237255753017962, + 0.002493572887033224, + 0.0025717453099787235, + 0.0024270617868751287, + 0.0017787005053833127 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1350346803665161, + "epoch": 66 + }, + { + "hidden_norms": [ + 268.9022521972656, + 244.85621643066406, + 229.2279510498047, + 218.72445678710938, + 217.325439453125 + ], + "bp_grad_norms_per_sample_med": [ + 4.515323234954849e-05, + 4.8419675295008346e-05, + 5.0062186346622184e-05, + 4.777919821208343e-05, + 3.962183836847544e-05 + ], + "bp_grad_norms_F": [ + 0.0024519655853509903, + 0.002586368238553405, + 0.00266969739459455, + 0.0024983694311231375, + 0.001813769806176424 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.143377661705017, + "epoch": 67 + }, + { + "hidden_norms": [ + 267.7603454589844, + 245.58932495117188, + 229.04205322265625, + 219.0813446044922, + 217.887939453125 + ], + "bp_grad_norms_per_sample_med": [ + 4.398225064505823e-05, + 4.6881206799298525e-05, + 4.986919157090597e-05, + 4.9659283831715584e-05, + 3.928233854821883e-05 + ], + "bp_grad_norms_F": [ + 0.0024525129701942205, + 0.0025901535991579294, + 0.002675000112503767, + 0.0025050004478543997, + 0.0018165758810937405 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1445319652557373, + "epoch": 68 + }, + { + "hidden_norms": [ + 267.32110595703125, + 244.51095581054688, + 228.1964569091797, + 217.7543182373047, + 215.99093627929688 + ], + "bp_grad_norms_per_sample_med": [ + 4.567872019833885e-05, + 4.9028451030608267e-05, + 5.0534836191218346e-05, + 4.8578112910036e-05, + 3.865628605126403e-05 + ], + "bp_grad_norms_F": [ + 0.002467149868607521, + 0.0026051453314721584, + 0.0026927595026791096, + 0.002530105412006378, + 0.0018421142594888806 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.143081545829773, + "epoch": 69 + }, + { + "hidden_norms": [ + 266.6060791015625, + 242.973388671875, + 227.23739624023438, + 216.60504150390625, + 213.26922607421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.524671021499671e-05, + 4.8752917791716754e-05, + 5.0053116865456104e-05, + 4.897990220342763e-05, + 3.949753590859473e-05 + ], + "bp_grad_norms_F": [ + 0.002536450745537877, + 0.002682002494111657, + 0.002782325493171811, + 0.002600395353510976, + 0.0018774428172037005 + ], + "gamma_dfa": NaN, + "acc_eval": 0.607421875, + "loss_eval": 1.1569209098815918, + "epoch": 70 + }, + { + "hidden_norms": [ + 265.7056579589844, + 243.6046142578125, + 226.88746643066406, + 217.55291748046875, + 213.99151611328125 + ], + "bp_grad_norms_per_sample_med": [ + 4.667519897338934e-05, + 4.9728132580639794e-05, + 5.27437987329904e-05, + 5.151727600605227e-05, + 4.0550570702180266e-05 + ], + "bp_grad_norms_F": [ + 0.002509700832888484, + 0.0026521242689341307, + 0.0027410376351326704, + 0.002574845217168331, + 0.001871992484666407 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1381304264068604, + "epoch": 71 + }, + { + "hidden_norms": [ + 264.63116455078125, + 241.50344848632812, + 225.20465087890625, + 214.67364501953125, + 212.77584838867188 + ], + "bp_grad_norms_per_sample_med": [ + 4.526918928604573e-05, + 5.0124705012422055e-05, + 5.2680206863442436e-05, + 5.1697836170205846e-05, + 3.9593822293682024e-05 + ], + "bp_grad_norms_F": [ + 0.0025687876623123884, + 0.0027084490284323692, + 0.0027945584151893854, + 0.0026290949899703264, + 0.0018978636944666505 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.149982213973999, + "epoch": 72 + }, + { + "hidden_norms": [ + 264.168701171875, + 241.78074645996094, + 224.8336944580078, + 214.45762634277344, + 212.4181671142578 + ], + "bp_grad_norms_per_sample_med": [ + 4.745498517877422e-05, + 5.042303018854e-05, + 5.3622185077983886e-05, + 5.276402589515783e-05, + 4.0586572140455246e-05 + ], + "bp_grad_norms_F": [ + 0.0026231552474200726, + 0.002779489615932107, + 0.002866284688934684, + 0.00268669705837965, + 0.0019228557357564569 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.158836007118225, + "epoch": 73 + }, + { + "hidden_norms": [ + 263.89593505859375, + 240.3160858154297, + 223.6101531982422, + 212.4967803955078, + 210.63546752929688 + ], + "bp_grad_norms_per_sample_med": [ + 4.678544428315945e-05, + 5.029747626394965e-05, + 5.3069161367602646e-05, + 5.2157745813019574e-05, + 4.0450311644235626e-05 + ], + "bp_grad_norms_F": [ + 0.0026451845187693834, + 0.002798875328153372, + 0.0028935885056853294, + 0.0027081011794507504, + 0.001933218096382916 + ], + "gamma_dfa": NaN, + "acc_eval": 0.607421875, + "loss_eval": 1.1447510719299316, + "epoch": 74 + }, + { + "hidden_norms": [ + 262.4220275878906, + 239.43899536132812, + 223.32151794433594, + 212.5982666015625, + 209.80105590820312 + ], + "bp_grad_norms_per_sample_med": [ + 4.713214002549648e-05, + 5.087011959403753e-05, + 5.283053906168789e-05, + 5.280825644149445e-05, + 4.054068267578259e-05 + ], + "bp_grad_norms_F": [ + 0.002688886132091284, + 0.002841175301000476, + 0.002931408118456602, + 0.0027343749534338713, + 0.001953375292941928 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.1561517715454102, + "epoch": 75 + }, + { + "hidden_norms": [ + 262.65814208984375, + 240.0749969482422, + 223.0806121826172, + 212.08688354492188, + 209.22561645507812 + ], + "bp_grad_norms_per_sample_med": [ + 4.8153047828236595e-05, + 5.145415343577042e-05, + 5.4130876378621906e-05, + 5.3563955589197576e-05, + 4.1630475607234985e-05 + ], + "bp_grad_norms_F": [ + 0.0026582488790154457, + 0.0028067713137716055, + 0.00290639977902174, + 0.0027312941383570433, + 0.0019485733937472105 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1465811729431152, + "epoch": 76 + }, + { + "hidden_norms": [ + 262.0201721191406, + 239.08547973632812, + 222.36146545410156, + 211.62014770507812, + 208.1699676513672 + ], + "bp_grad_norms_per_sample_med": [ + 4.763290053233504e-05, + 5.171096199774183e-05, + 5.4121221182867885e-05, + 5.251873881206848e-05, + 4.096185875823721e-05 + ], + "bp_grad_norms_F": [ + 0.0027110630180686712, + 0.002856222679838538, + 0.002954155672341585, + 0.0027671835850924253, + 0.001963438233360648 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.140420913696289, + "epoch": 77 + }, + { + "hidden_norms": [ + 261.04132080078125, + 238.44912719726562, + 221.8912353515625, + 210.62893676757812, + 207.68223571777344 + ], + "bp_grad_norms_per_sample_med": [ + 4.7598918172298e-05, + 5.09894234710373e-05, + 5.384815813158639e-05, + 5.2337087254272774e-05, + 4.065291432198137e-05 + ], + "bp_grad_norms_F": [ + 0.00274560390971601, + 0.0029035566840320826, + 0.0030046424362808466, + 0.0028060651384294033, + 0.001984622096642852 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1556674242019653, + "epoch": 78 + }, + { + "hidden_norms": [ + 260.81304931640625, + 237.52015686035156, + 221.12814331054688, + 210.04925537109375, + 206.80441284179688 + ], + "bp_grad_norms_per_sample_med": [ + 4.8430883907712996e-05, + 5.440305176307447e-05, + 5.596410119323991e-05, + 5.4586391343036667e-05, + 4.195213477942161e-05 + ], + "bp_grad_norms_F": [ + 0.002767855068668723, + 0.002925564767792821, + 0.003015928901731968, + 0.002823467366397381, + 0.0020000736694782972 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.155595302581787, + "epoch": 79 + }, + { + "hidden_norms": [ + 260.0649108886719, + 236.74310302734375, + 220.48731994628906, + 209.0772247314453, + 205.55821228027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.8615416744723916e-05, + 5.309982589096762e-05, + 5.548154513235204e-05, + 5.3888015827396885e-05, + 4.1955223423428833e-05 + ], + "bp_grad_norms_F": [ + 0.0028222037944942713, + 0.0029849831480532885, + 0.003080391325056553, + 0.0028690374456346035, + 0.002019484294578433 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.151352882385254, + "epoch": 80 + }, + { + "hidden_norms": [ + 259.8204650878906, + 236.13253784179688, + 219.08865356445312, + 207.6793975830078, + 205.0387725830078 + ], + "bp_grad_norms_per_sample_med": [ + 4.734982212539762e-05, + 5.1937022362835705e-05, + 5.472155680763535e-05, + 5.394391337176785e-05, + 4.0832986996974796e-05 + ], + "bp_grad_norms_F": [ + 0.00282403570599854, + 0.0029848285485059023, + 0.0030928945634514093, + 0.002879998181015253, + 0.0020237534772604704 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.153958797454834, + "epoch": 81 + }, + { + "hidden_norms": [ + 259.70703125, + 235.5811767578125, + 218.87939453125, + 207.87005615234375, + 204.21360778808594 + ], + "bp_grad_norms_per_sample_med": [ + 4.972740134689957e-05, + 5.442327164928429e-05, + 5.538179539144039e-05, + 5.4411018936662003e-05, + 4.185390207567252e-05 + ], + "bp_grad_norms_F": [ + 0.002822998445481062, + 0.00298913661390543, + 0.0030840388499200344, + 0.0028817548882216215, + 0.0020279802847653627 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.153503656387329, + "epoch": 82 + }, + { + "hidden_norms": [ + 258.22747802734375, + 235.3745880126953, + 218.20066833496094, + 206.82144165039062, + 203.41139221191406 + ], + "bp_grad_norms_per_sample_med": [ + 5.077639434603043e-05, + 5.5536078434670344e-05, + 5.664999844157137e-05, + 5.608425635728054e-05, + 4.293184611015022e-05 + ], + "bp_grad_norms_F": [ + 0.002843277994543314, + 0.0030130224768072367, + 0.0031098793260753155, + 0.00290561281144619, + 0.0020425335969775915 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.1597235202789307, + "epoch": 83 + }, + { + "hidden_norms": [ + 258.78253173828125, + 234.73965454101562, + 217.91439819335938, + 207.1282958984375, + 203.4480743408203 + ], + "bp_grad_norms_per_sample_med": [ + 4.941036968375556e-05, + 5.3143365221330896e-05, + 5.529402187676169e-05, + 5.3718889830634e-05, + 4.207601887173951e-05 + ], + "bp_grad_norms_F": [ + 0.0028217420913279057, + 0.0029905554838478565, + 0.0030917164403945208, + 0.002896753139793873, + 0.00204362440854311 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1545956134796143, + "epoch": 84 + }, + { + "hidden_norms": [ + 258.10736083984375, + 234.35299682617188, + 217.81224060058594, + 206.38864135742188, + 202.70126342773438 + ], + "bp_grad_norms_per_sample_med": [ + 4.899106716038659e-05, + 5.2254512411309406e-05, + 5.481128755491227e-05, + 5.298088217386976e-05, + 4.121303936699405e-05 + ], + "bp_grad_norms_F": [ + 0.002849399344995618, + 0.0030259499326348305, + 0.0031236386857926846, + 0.002921136561781168, + 0.0020506957080215216 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.150564193725586, + "epoch": 85 + }, + { + "hidden_norms": [ + 258.50750732421875, + 234.4120330810547, + 217.49217224121094, + 205.7490692138672, + 202.62380981445312 + ], + "bp_grad_norms_per_sample_med": [ + 4.976892887498252e-05, + 5.383255484048277e-05, + 5.497025267686695e-05, + 5.391201557358727e-05, + 4.2558931454550475e-05 + ], + "bp_grad_norms_F": [ + 0.0028686418663710356, + 0.003045660676434636, + 0.0031442255713045597, + 0.002935740165412426, + 0.0020568587351590395 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.152902603149414, + "epoch": 86 + }, + { + "hidden_norms": [ + 258.063720703125, + 233.87294006347656, + 217.34030151367188, + 205.4007110595703, + 202.4425506591797 + ], + "bp_grad_norms_per_sample_med": [ + 5.047345257480629e-05, + 5.492625859915279e-05, + 5.640966628561728e-05, + 5.587706982623786e-05, + 4.286773400963284e-05 + ], + "bp_grad_norms_F": [ + 0.002875820267945528, + 0.003056521760299802, + 0.0031533341389149427, + 0.002944495528936386, + 0.0020668748766183853 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.152883529663086, + "epoch": 87 + }, + { + "hidden_norms": [ + 258.1524353027344, + 234.54095458984375, + 216.9737548828125, + 205.64048767089844, + 202.26617431640625 + ], + "bp_grad_norms_per_sample_med": [ + 4.9309845053358003e-05, + 5.373455860535614e-05, + 5.6388864322798327e-05, + 5.448140291264281e-05, + 4.2345352994743735e-05 + ], + "bp_grad_norms_F": [ + 0.0028876049909740686, + 0.0030658405739814043, + 0.0031632501631975174, + 0.002954283496364951, + 0.0020715948194265366 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.155066967010498, + "epoch": 88 + }, + { + "hidden_norms": [ + 257.7385559082031, + 233.87037658691406, + 216.7277069091797, + 205.37454223632812, + 202.0509033203125 + ], + "bp_grad_norms_per_sample_med": [ + 5.0028131227009e-05, + 5.394254549173638e-05, + 5.677127046510577e-05, + 5.581674486165866e-05, + 4.2508807382546365e-05 + ], + "bp_grad_norms_F": [ + 0.0028917219024151564, + 0.0030712694860994816, + 0.0031723883002996445, + 0.0029576809611171484, + 0.0020730902906507254 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1531357765197754, + "epoch": 89 + }, + { + "hidden_norms": [ + 257.52423095703125, + 233.51254272460938, + 216.73731994628906, + 205.52561950683594, + 202.19493103027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.9573794967727736e-05, + 5.4153944802237675e-05, + 5.742486973758787e-05, + 5.468217204906978e-05, + 4.2126855987589806e-05 + ], + "bp_grad_norms_F": [ + 0.0029005431570112705, + 0.0030793119221925735, + 0.003179334569722414, + 0.0029661250300705433, + 0.002075627911835909 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.155139684677124, + "epoch": 90 + }, + { + "hidden_norms": [ + 257.5526428222656, + 233.24456787109375, + 216.63601684570312, + 205.40318298339844, + 201.8704376220703 + ], + "bp_grad_norms_per_sample_med": [ + 4.996290954295546e-05, + 5.331254214979708e-05, + 5.576194598688744e-05, + 5.50017248315271e-05, + 4.1135557694360614e-05 + ], + "bp_grad_norms_F": [ + 0.002902554115280509, + 0.003083745948970318, + 0.0031855429988354445, + 0.0029742431361228228, + 0.002079661935567856 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.15346360206604, + "epoch": 91 + }, + { + "hidden_norms": [ + 257.3648681640625, + 233.42010498046875, + 216.6300506591797, + 204.97442626953125, + 201.4558868408203 + ], + "bp_grad_norms_per_sample_med": [ + 5.06279211549554e-05, + 5.411348683992401e-05, + 5.6813423725543544e-05, + 5.523188519873656e-05, + 4.197460293653421e-05 + ], + "bp_grad_norms_F": [ + 0.0029165328014642, + 0.003098647342994809, + 0.00319958315230906, + 0.002985388273373246, + 0.002088340697810054 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.155455470085144, + "epoch": 92 + }, + { + "hidden_norms": [ + 257.30535888671875, + 233.4147491455078, + 216.60826110839844, + 205.0714874267578, + 201.24066162109375 + ], + "bp_grad_norms_per_sample_med": [ + 5.053050699643791e-05, + 5.4108801123220474e-05, + 5.702309499611147e-05, + 5.574637179961428e-05, + 4.271106809028424e-05 + ], + "bp_grad_norms_F": [ + 0.002917014993727207, + 0.0030978922732174397, + 0.0031987964175641537, + 0.0029851715080440044, + 0.0020893686451017857 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1536216735839844, + "epoch": 93 + }, + { + "hidden_norms": [ + 257.18878173828125, + 232.8798370361328, + 216.17039489746094, + 204.66229248046875, + 201.07859802246094 + ], + "bp_grad_norms_per_sample_med": [ + 5.010717359255068e-05, + 5.397907079895958e-05, + 5.614722249447368e-05, + 5.553716255235486e-05, + 4.292877929401584e-05 + ], + "bp_grad_norms_F": [ + 0.0029321948532015085, + 0.003115386702120304, + 0.0032163059804588556, + 0.002997474977746606, + 0.002096242969855666 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6123046875, + "loss_eval": 1.1570696830749512, + "epoch": 94 + }, + { + "hidden_norms": [ + 257.0701904296875, + 232.91481018066406, + 216.06378173828125, + 204.648681640625, + 201.00148010253906 + ], + "bp_grad_norms_per_sample_med": [ + 4.9896454584086314e-05, + 5.386451448430307e-05, + 5.5900127335917205e-05, + 5.5407243053196e-05, + 4.247200922691263e-05 + ], + "bp_grad_norms_F": [ + 0.0029298008885234594, + 0.0031122476793825626, + 0.0032105366699397564, + 0.0029950770549476147, + 0.0020956522785127163 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1554739475250244, + "epoch": 95 + }, + { + "hidden_norms": [ + 257.0519104003906, + 232.83355712890625, + 216.1780242919922, + 204.67999267578125, + 201.0236358642578 + ], + "bp_grad_norms_per_sample_med": [ + 5.054255234426819e-05, + 5.421326932264492e-05, + 5.641246752929874e-05, + 5.574019087362103e-05, + 4.288824857212603e-05 + ], + "bp_grad_norms_F": [ + 0.0029319566674530506, + 0.0031146046239882708, + 0.003213704563677311, + 0.002997281262651086, + 0.0020963428542017937 + ], + "gamma_dfa": NaN, + "acc_eval": 0.607421875, + "loss_eval": 1.1545898914337158, + "epoch": 96 + }, + { + "hidden_norms": [ + 257.1473388671875, + 232.85020446777344, + 216.2519989013672, + 204.68023681640625, + 200.93080139160156 + ], + "bp_grad_norms_per_sample_med": [ + 5.0549009756650776e-05, + 5.3789182857144624e-05, + 5.673874693457037e-05, + 5.580837023444474e-05, + 4.2498151742620394e-05 + ], + "bp_grad_norms_F": [ + 0.0029327664524316788, + 0.0031159960199147463, + 0.003215631702914834, + 0.002998515497893095, + 0.0020966045558452606 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1546047925949097, + "epoch": 97 + }, + { + "hidden_norms": [ + 257.09906005859375, + 232.74813842773438, + 216.1462860107422, + 204.6047821044922, + 200.89031982421875 + ], + "bp_grad_norms_per_sample_med": [ + 5.086465898784809e-05, + 5.3742358431918547e-05, + 5.673644773196429e-05, + 5.5752621847204864e-05, + 4.2624127672752365e-05 + ], + "bp_grad_norms_F": [ + 0.0029341024346649647, + 0.003117120126262307, + 0.0032170764170587063, + 0.0029998423997312784, + 0.002097061835229397 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1545934677124023, + "epoch": 98 + }, + { + "hidden_norms": [ + 257.09326171875, + 232.7879638671875, + 216.1444091796875, + 204.5867919921875, + 200.89596557617188 + ], + "bp_grad_norms_per_sample_med": [ + 5.078025787952356e-05, + 5.40847031516023e-05, + 5.667618097504601e-05, + 5.571893780143e-05, + 4.271125726518221e-05 + ], + "bp_grad_norms_F": [ + 0.0029357182793319225, + 0.0031186225824058056, + 0.003218533471226692, + 0.0030010156333446503, + 0.002097515854984522 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.154747486114502, + "epoch": 99 + }, + { + "hidden_norms": [ + 257.0869140625, + 232.78091430664062, + 216.12852478027344, + 204.58143615722656, + 200.87417602539062 + ], + "bp_grad_norms_per_sample_med": [ + 5.08715384057723e-05, + 5.4204192565521225e-05, + 5.669457823387347e-05, + 5.573080852627754e-05, + 4.275495302863419e-05 + ], + "bp_grad_norms_F": [ + 0.002935809548944235, + 0.003118706401437521, + 0.0032186671160161495, + 0.003001126926392317, + 0.0020975489169359207 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1547397375106812, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": 0.007406219025142491, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 802.1658935546875, + 3058.3173828125, + 4910.8408203125, + 6491.31494140625, + 7304.1533203125 + ], + "bp_grad_norms_per_sample_med": [ + 2.526000798752648e-06, + 1.3625027577290894e-06, + 1.3747999219049234e-06, + 1.378283172925876e-06, + 1.3869492931917193e-06 + ], + "bp_grad_norms_F": [ + 0.00013306058826856315, + 7.476000610040501e-05, + 7.328101492021233e-05, + 7.293069211300462e-05, + 7.309897773666307e-05 + ], + "gamma_dfa": 0.08989996102172881, + "acc_eval": 0.310546875, + "loss_eval": 1.9283097982406616, + "epoch": 1 + }, + { + "hidden_norms": [ + 1580.1480712890625, + 13320.0517578125, + 22793.435546875, + 32440.041015625, + 37758.640625 + ], + "bp_grad_norms_per_sample_med": [ + 1.1427439403632889e-06, + 3.0901847480890865e-07, + 3.1107475706448895e-07, + 3.1377521736430936e-07, + 3.1722706239634135e-07 + ], + "bp_grad_norms_F": [ + 6.523138290503994e-05, + 2.3476462956750765e-05, + 2.0436000340851024e-05, + 1.96047385543352e-05, + 1.9654715288197622e-05 + ], + "gamma_dfa": 0.0858152944711037, + "acc_eval": 0.2880859375, + "loss_eval": 1.9359606504440308, + "epoch": 2 + }, + { + "hidden_norms": [ + 2343.090576171875, + 32438.32421875, + 58119.84375, + 87185.09375, + 104586.15625 + ], + "bp_grad_norms_per_sample_med": [ + 8.229510513046989e-07, + 1.3056541092737461e-07, + 1.2754330214193033e-07, + 1.2950138739142858e-07, + 1.2936459370394005e-07 + ], + "bp_grad_norms_F": [ + 0.0001579313538968563, + 2.960947858809959e-05, + 1.2371615412121173e-05, + 8.468440682918299e-06, + 7.067524620651966e-06 + ], + "gamma_dfa": 0.08629915304481983, + "acc_eval": 0.3017578125, + "loss_eval": 1.9288904666900635, + "epoch": 3 + }, + { + "hidden_norms": [ + 3129.4423828125, + 62780.5, + 117608.9375, + 182640.09375, + 223504.390625 + ], + "bp_grad_norms_per_sample_med": [ + 6.484323762379063e-07, + 7.041825256237644e-08, + 6.729855783760286e-08, + 6.816127040565334e-08, + 6.818439857170233e-08 + ], + "bp_grad_norms_F": [ + 2.9993034331710078e-05, + 2.8730657959386008e-06, + 2.3409718323819106e-06, + 2.367017486903933e-06, + 2.3597553990839515e-06 + ], + "gamma_dfa": 0.08862219587899745, + "acc_eval": 0.3076171875, + "loss_eval": 1.926429033279419, + "epoch": 4 + }, + { + "hidden_norms": [ + 3942.00390625, + 109015.7890625, + 203168.390625, + 329067.625, + 404167.84375 + ], + "bp_grad_norms_per_sample_med": [ + 5.148021386958135e-07, + 4.3746137379230277e-08, + 4.211498705330996e-08, + 4.271550579915129e-08, + 4.2616289164243426e-08 + ], + "bp_grad_norms_F": [ + 2.426102219033055e-05, + 1.769960135789006e-06, + 1.4341048881760798e-06, + 1.45279318530811e-06, + 1.44924592859752e-06 + ], + "gamma_dfa": 0.0876110177487135, + "acc_eval": 0.328125, + "loss_eval": 1.9219281673431396, + "epoch": 5 + }, + { + "hidden_norms": [ + 4737.880859375, + 173361.203125, + 331121.75, + 547707.8125, + 677363.375 + ], + "bp_grad_norms_per_sample_med": [ + 4.4596529846785415e-07, + 2.929639286719521e-08, + 2.8080462399771022e-08, + 2.8515311001342525e-08, + 2.847208158129888e-08 + ], + "bp_grad_norms_F": [ + 2.1308444047463126e-05, + 1.213497625940363e-06, + 9.622256129659945e-07, + 9.734020522955689e-07, + 9.715020041767275e-07 + ], + "gamma_dfa": 0.08417161786928773, + "acc_eval": 0.2919921875, + "loss_eval": 1.942756175994873, + "epoch": 6 + }, + { + "hidden_norms": [ + 5535.86865234375, + 258337.40625, + 501117.59375, + 823776.9375, + 1026549.875 + ], + "bp_grad_norms_per_sample_med": [ + 3.856409307445574e-07, + 2.2078769035260848e-08, + 2.0866384176088104e-08, + 2.09813144635973e-08, + 2.1003458527957264e-08 + ], + "bp_grad_norms_F": [ + 1.847265775722917e-05, + 8.849666528476519e-07, + 7.187628057181428e-07, + 7.262269718921743e-07, + 7.249743703141576e-07 + ], + "gamma_dfa": 0.08587896963581443, + "acc_eval": 0.2919921875, + "loss_eval": 1.9307396411895752, + "epoch": 7 + }, + { + "hidden_norms": [ + 6304.064453125, + 367445.5625, + 717525.125, + 1200281.0, + 1512872.125 + ], + "bp_grad_norms_per_sample_med": [ + 3.410295903449878e-07, + 1.670872862291617e-08, + 1.5770844186135946e-08, + 1.5891666649281433e-08, + 1.588542275499094e-08 + ], + "bp_grad_norms_F": [ + 1.6556636182940565e-05, + 6.716044254062581e-07, + 5.55544488634041e-07, + 5.606318040918268e-07, + 5.59783927656099e-07 + ], + "gamma_dfa": 0.08515941491350532, + "acc_eval": 0.306640625, + "loss_eval": 1.9279191493988037, + "epoch": 8 + }, + { + "hidden_norms": [ + 7086.48388671875, + 505478.71875, + 997925.8125, + 1708849.375, + 2150479.25 + ], + "bp_grad_norms_per_sample_med": [ + 3.013988703060022e-07, + 1.3297809964285534e-08, + 1.2481795153007624e-08, + 1.262175253202713e-08, + 1.2595491760691857e-08 + ], + "bp_grad_norms_F": [ + 1.4646101590187754e-05, + 5.195778953748231e-07, + 4.4164838186588895e-07, + 4.451969459751126e-07, + 4.4467057591646153e-07 + ], + "gamma_dfa": 0.08757842611521482, + "acc_eval": 0.318359375, + "loss_eval": 1.9144790172576904, + "epoch": 9 + }, + { + "hidden_norms": [ + 7891.7685546875, + 675713.625, + 1320934.25, + 2319375.25, + 2933561.75 + ], + "bp_grad_norms_per_sample_med": [ + 2.7613364750322944e-07, + 1.1096022767276281e-08, + 1.0442049891423721e-08, + 1.0500828651061056e-08, + 1.0485931234427426e-08 + ], + "bp_grad_norms_F": [ + 1.3369051885092631e-05, + 4.295688142974541e-07, + 3.6954631355001766e-07, + 3.72132660686475e-07, + 3.718281220699282e-07 + ], + "gamma_dfa": 0.08759273961186409, + "acc_eval": 0.3037109375, + "loss_eval": 1.928476095199585, + "epoch": 10 + }, + { + "hidden_norms": [ + 8605.7783203125, + 881309.9375, + 1719981.25, + 3048018.25, + 3848896.25 + ], + "bp_grad_norms_per_sample_med": [ + 2.546977952988527e-07, + 9.457612470953336e-09, + 8.959561981214392e-09, + 8.996098976865596e-09, + 8.995014511015142e-09 + ], + "bp_grad_norms_F": [ + 1.2278720532776788e-05, + 3.6486676435742993e-07, + 3.18511354180373e-07, + 3.204301890491479e-07, + 3.2022188634073245e-07 + ], + "gamma_dfa": 0.08920952118933201, + "acc_eval": 0.3017578125, + "loss_eval": 1.9193304777145386, + "epoch": 11 + }, + { + "hidden_norms": [ + 9378.4287109375, + 1120098.75, + 2197340.0, + 3930402.25, + 4945595.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.424853278171213e-07, + 8.285154784459792e-09, + 7.84627474104127e-09, + 7.900293752527432e-09, + 7.906582943917329e-09 + ], + "bp_grad_norms_F": [ + 1.1596725016715936e-05, + 3.161075028401683e-07, + 2.796709850372281e-07, + 2.81156104620095e-07, + 2.810372734529665e-07 + ], + "gamma_dfa": 0.09209982817992568, + "acc_eval": 0.287109375, + "loss_eval": 1.927558422088623, + "epoch": 12 + }, + { + "hidden_norms": [ + 10124.396484375, + 1412441.875, + 2752346.75, + 5010036.0, + 6325289.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.236940588318248e-07, + 7.092171738776187e-09, + 6.815563668993718e-09, + 6.8297678623707725e-09, + 6.830232379684276e-09 + ], + "bp_grad_norms_F": [ + 1.0770681910798885e-05, + 2.7517026524037647e-07, + 2.434409793750092e-07, + 2.4456548430862313e-07, + 2.445065661049739e-07 + ], + "gamma_dfa": 0.0919318727683276, + "acc_eval": 0.2900390625, + "loss_eval": 1.9280297756195068, + "epoch": 13 + }, + { + "hidden_norms": [ + 10873.9169921875, + 1726814.125, + 3365165.0, + 6225292.5, + 7941070.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.0750607632180618e-07, + 6.175024491739123e-09, + 5.938003866390318e-09, + 5.979505779407646e-09, + 5.979241990416995e-09 + ], + "bp_grad_norms_F": [ + 9.84854341368191e-06, + 2.3993459308258025e-07, + 2.1497004354387172e-07, + 2.1585482556929492e-07, + 2.1582005160780682e-07 + ], + "gamma_dfa": 0.09486197168007493, + "acc_eval": 0.2978515625, + "loss_eval": 1.9190003871917725, + "epoch": 14 + }, + { + "hidden_norms": [ + 11534.0087890625, + 2084976.25, + 4091674.75, + 7667605.5, + 9821730.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.9337822720899567e-07, + 5.5730837722478554e-09, + 5.387873702744628e-09, + 5.409793057964407e-09, + 5.415522696949893e-09 + ], + "bp_grad_norms_F": [ + 9.290296475228388e-06, + 2.1226249202754843e-07, + 1.9121620198347955e-07, + 1.9190700584204023e-07, + 1.9189823774468096e-07 + ], + "gamma_dfa": 0.09578572702594101, + "acc_eval": 0.28515625, + "loss_eval": 1.9317920207977295, + "epoch": 15 + }, + { + "hidden_norms": [ + 12231.0380859375, + 2494592.5, + 4969235.5, + 9387796.0, + 12017026.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7950755193396617e-07, + 4.997119606997558e-09, + 4.8298063326512874e-09, + 4.8657629037052175e-09, + 4.859395552614387e-09 + ], + "bp_grad_norms_F": [ + 8.774502930464223e-06, + 1.8752842834146577e-07, + 1.7071489821773866e-07, + 1.7126839679804107e-07, + 1.7126781415299774e-07 + ], + "gamma_dfa": 0.09745451644994318, + "acc_eval": 0.2978515625, + "loss_eval": 1.927154541015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 12895.0341796875, + 2937750.0, + 5861416.5, + 11095317.0, + 14303387.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7269709928768862e-07, + 4.551929055907067e-09, + 4.4097947515808755e-09, + 4.41813474694186e-09, + 4.416958798714177e-09 + ], + "bp_grad_norms_F": [ + 8.354931196663529e-06, + 1.7010511044190935e-07, + 1.556661288759642e-07, + 1.5612842219070444e-07, + 1.5612160098044114e-07 + ], + "gamma_dfa": 0.09986255329567939, + "acc_eval": 0.3115234375, + "loss_eval": 1.9158110618591309, + "epoch": 17 + }, + { + "hidden_norms": [ + 13624.58984375, + 3430302.75, + 6892795.0, + 13179784.0, + 16997646.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.642013387481711e-07, + 4.094950600830316e-09, + 4.012986831725129e-09, + 4.022568500516854e-09, + 4.023625876925507e-09 + ], + "bp_grad_norms_F": [ + 7.884121259849053e-06, + 1.54415545239317e-07, + 1.407240830531009e-07, + 1.411058434541701e-07, + 1.4110656820776057e-07 + ], + "gamma_dfa": 0.09882167540490627, + "acc_eval": 0.296875, + "loss_eval": 1.9182151556015015, + "epoch": 18 + }, + { + "hidden_norms": [ + 14323.6708984375, + 3985548.0, + 8076905.5, + 15465362.0, + 20015594.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.551940442823252e-07, + 3.79724474086629e-09, + 3.6876826037257615e-09, + 3.700401984829682e-09, + 3.6983835993709135e-09 + ], + "bp_grad_norms_F": [ + 7.607863608427579e-06, + 1.393282218487002e-07, + 1.283839452526081e-07, + 1.2869591614617093e-07, + 1.2869809040694236e-07 + ], + "gamma_dfa": 0.1002046266803518, + "acc_eval": 0.294921875, + "loss_eval": 1.9388974905014038, + "epoch": 19 + }, + { + "hidden_norms": [ + 14955.4462890625, + 4541631.5, + 9327444.0, + 17893654.0, + 23108114.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.4713883444983367e-07, + 3.464018405452407e-09, + 3.3744134153579353e-09, + 3.379040602879968e-09, + 3.381670721225305e-09 + ], + "bp_grad_norms_F": [ + 7.235442353703547e-06, + 1.2747574373861426e-07, + 1.1753004969250469e-07, + 1.1780696951291247e-07, + 1.1780796427274254e-07 + ], + "gamma_dfa": 0.10065551439765841, + "acc_eval": 0.30859375, + "loss_eval": 1.9343281984329224, + "epoch": 20 + }, + { + "hidden_norms": [ + 15583.8564453125, + 5145675.5, + 10628445.0, + 20547210.0, + 26561584.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.4314694851691456e-07, + 3.170894435911009e-09, + 3.083378885548882e-09, + 3.0910656256821767e-09, + 3.0932543193529227e-09 + ], + "bp_grad_norms_F": [ + 6.938716524018673e-06, + 1.1743370009753562e-07, + 1.0794892091325892e-07, + 1.0819184126376058e-07, + 1.0819199047773509e-07 + ], + "gamma_dfa": 0.10184943513013422, + "acc_eval": 0.3154296875, + "loss_eval": 1.9154099225997925, + "epoch": 21 + }, + { + "hidden_norms": [ + 16234.9208984375, + 5839592.5, + 12062968.0, + 23496628.0, + 30428386.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.379862197836701e-07, + 2.91886981251821e-09, + 2.8514124394973805e-09, + 2.8584146161136914e-09, + 2.860225389866855e-09 + ], + "bp_grad_norms_F": [ + 6.72459282213822e-06, + 1.0762735769276333e-07, + 9.920048427147776e-08, + 9.94118352082296e-08, + 9.941232548271728e-08 + ], + "gamma_dfa": 0.1024534439202398, + "acc_eval": 0.3095703125, + "loss_eval": 1.9225246906280518, + "epoch": 22 + }, + { + "hidden_norms": [ + 16833.765625, + 6566770.0, + 13630788.0, + 26729236.0, + 34665300.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.331996628550769e-07, + 2.688527622751735e-09, + 2.6381341555747895e-09, + 2.6441848710589966e-09, + 2.644968466469777e-09 + ], + "bp_grad_norms_F": [ + 6.5681074374879245e-06, + 9.902939268613409e-08, + 9.131563416531208e-08, + 9.149899682370233e-08, + 9.149922419737777e-08 + ], + "gamma_dfa": 0.10199526121141389, + "acc_eval": 0.30859375, + "loss_eval": 1.9233064651489258, + "epoch": 23 + }, + { + "hidden_norms": [ + 17456.634765625, + 7337101.0, + 15401232.0, + 30171576.0, + 39161244.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2747005939672817e-07, + 2.4809998500074926e-09, + 2.4282977850731413e-09, + 2.432346990488554e-09, + 2.431272960734532e-09 + ], + "bp_grad_norms_F": [ + 6.5036538217100315e-06, + 9.14754565428666e-08, + 8.484188640522916e-08, + 8.500099824004792e-08, + 8.500632731056612e-08 + ], + "gamma_dfa": 0.10456769005395472, + "acc_eval": 0.30078125, + "loss_eval": 1.9299731254577637, + "epoch": 24 + }, + { + "hidden_norms": [ + 18049.205078125, + 8139419.5, + 17132936.0, + 33801196.0, + 43890588.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2153788020441425e-07, + 2.2737314253618024e-09, + 2.2332342641817604e-09, + 2.232388940370811e-09, + 2.237900753598865e-09 + ], + "bp_grad_norms_F": [ + 6.099615802668268e-06, + 8.523231542767462e-08, + 7.842250226985925e-08, + 7.855853567662052e-08, + 7.856372263859157e-08 + ], + "gamma_dfa": 0.10287670505931601, + "acc_eval": 0.3232421875, + "loss_eval": 1.923604965209961, + "epoch": 25 + }, + { + "hidden_norms": [ + 18644.9375, + 9035569.0, + 19136636.0, + 37813052.0, + 49194300.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.212478508705317e-07, + 2.0938955014315752e-09, + 2.0560451119422396e-09, + 2.058360148993188e-09, + 2.061209425363586e-09 + ], + "bp_grad_norms_F": [ + 5.810702987218974e-06, + 7.886949049407121e-08, + 7.294480752761956e-08, + 7.307144755941408e-08, + 7.307325233796291e-08 + ], + "gamma_dfa": 0.10249267728067935, + "acc_eval": 0.3037109375, + "loss_eval": 1.9200568199157715, + "epoch": 26 + }, + { + "hidden_norms": [ + 19280.703125, + 9952065.0, + 21071430.0, + 41963900.0, + 54690120.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1414142875310063e-07, + 1.9668882078605066e-09, + 1.928355919389446e-09, + 1.9296169107008154e-09, + 1.929810311551705e-09 + ], + "bp_grad_norms_F": [ + 5.566818344959756e-06, + 7.357547104902551e-08, + 6.781976935599232e-08, + 6.792832607516175e-08, + 6.79302942785398e-08 + ], + "gamma_dfa": 0.10335587273584679, + "acc_eval": 0.310546875, + "loss_eval": 1.92685067653656, + "epoch": 27 + }, + { + "hidden_norms": [ + 19887.205078125, + 10899353.0, + 23080260.0, + 46142640.0, + 60105148.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1361055385350483e-07, + 1.8462845696731733e-09, + 1.815088412904231e-09, + 1.8113950339682106e-09, + 1.8156832704008252e-09 + ], + "bp_grad_norms_F": [ + 5.398809662437998e-06, + 6.89453401037099e-08, + 6.4051612014282e-08, + 6.414857267600382e-08, + 6.415204012455433e-08 + ], + "gamma_dfa": 0.10455695656128228, + "acc_eval": 0.302734375, + "loss_eval": 1.923227310180664, + "epoch": 28 + }, + { + "hidden_norms": [ + 20438.587890625, + 11953376.0, + 25259200.0, + 50259240.0, + 65732368.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1073134231764925e-07, + 1.7497674420496878e-09, + 1.7245866956727696e-09, + 1.7265968654811559e-09, + 1.727246901062074e-09 + ], + "bp_grad_norms_F": [ + 5.281461653794395e-06, + 6.489771209317041e-08, + 6.026093046784808e-08, + 6.034837696233808e-08, + 6.035197941400838e-08 + ], + "gamma_dfa": 0.10511547370697372, + "acc_eval": 0.326171875, + "loss_eval": 1.9300421476364136, + "epoch": 29 + }, + { + "hidden_norms": [ + 20991.0234375, + 13017462.0, + 27475572.0, + 54971628.0, + 71927184.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0625635837868685e-07, + 1.6529324575742521e-09, + 1.6255721213553898e-09, + 1.6247864165208625e-09, + 1.6244732226056158e-09 + ], + "bp_grad_norms_F": [ + 5.098012934467988e-06, + 6.077872427567854e-08, + 5.674080227890954e-08, + 5.681971870785674e-08, + 5.6821534144546604e-08 + ], + "gamma_dfa": 0.10590779440826736, + "acc_eval": 0.3017578125, + "loss_eval": 1.9211739301681519, + "epoch": 30 + }, + { + "hidden_norms": [ + 21617.34765625, + 14125094.0, + 29881326.0, + 59926964.0, + 78189832.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0433515029717455e-07, + 1.5471924852406005e-09, + 1.5234034034250499e-09, + 1.5246930384904545e-09, + 1.5239296491387222e-09 + ], + "bp_grad_norms_F": [ + 4.977115622750716e-06, + 5.780140810429657e-08, + 5.362210941939338e-08, + 5.3694908075385683e-08, + 5.369727773540944e-08 + ], + "gamma_dfa": 0.10481705865822732, + "acc_eval": 0.3212890625, + "loss_eval": 1.9209015369415283, + "epoch": 31 + }, + { + "hidden_norms": [ + 22126.13671875, + 15300531.0, + 32579362.0, + 65167536.0, + 85083400.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0149238249823611e-07, + 1.4551810867402537e-09, + 1.4291762218121562e-09, + 1.432274854273885e-09, + 1.4318950469771607e-09 + ], + "bp_grad_norms_F": [ + 4.9215527724300046e-06, + 5.434217342781267e-08, + 5.088266163966182e-08, + 5.094950239481477e-08, + 5.0953229191463834e-08 + ], + "gamma_dfa": 0.10599250381346792, + "acc_eval": 0.30859375, + "loss_eval": 1.9330241680145264, + "epoch": 32 + }, + { + "hidden_norms": [ + 22662.396484375, + 16481282.0, + 35263600.0, + 70793304.0, + 92166136.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.882934648430819e-08, + 1.3810197430075277e-09, + 1.3668104426045602e-09, + 1.3675354182396404e-09, + 1.366150526038723e-09 + ], + "bp_grad_norms_F": [ + 4.6740801735722926e-06, + 5.137474090588512e-08, + 4.796589792022132e-08, + 4.802501862855024e-08, + 4.8027377630432966e-08 + ], + "gamma_dfa": 0.10529429838061333, + "acc_eval": 0.3115234375, + "loss_eval": 1.9205418825149536, + "epoch": 33 + }, + { + "hidden_norms": [ + 23192.3125, + 17779744.0, + 38108720.0, + 76522688.0, + 99643120.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.530750588737646e-08, + 1.3089170858293642e-09, + 1.2901538726239892e-09, + 1.2906937740808644e-09, + 1.2914372904404559e-09 + ], + "bp_grad_norms_F": [ + 4.669429472414777e-06, + 4.88593805414439e-08, + 4.5740907950175824e-08, + 4.579441181817856e-08, + 4.5798362435789386e-08 + ], + "gamma_dfa": 0.1058788642694708, + "acc_eval": 0.30078125, + "loss_eval": 1.9393997192382812, + "epoch": 34 + }, + { + "hidden_norms": [ + 23683.251953125, + 18992256.0, + 40936536.0, + 82030200.0, + 106929248.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.458356942104729e-08, + 1.2407530558533608e-09, + 1.2231146095942336e-09, + 1.2233244417458877e-09, + 1.2247586278490985e-09 + ], + "bp_grad_norms_F": [ + 4.483116299525136e-06, + 4.651869289773458e-08, + 4.358627236911161e-08, + 4.363666050721804e-08, + 4.3638891611408326e-08 + ], + "gamma_dfa": 0.10620562738040462, + "acc_eval": 0.3251953125, + "loss_eval": 1.9221802949905396, + "epoch": 35 + }, + { + "hidden_norms": [ + 24223.7265625, + 20421224.0, + 43883308.0, + 87849264.0, + 114523200.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.247051480087976e-08, + 1.182353992490448e-09, + 1.1679496259020539e-09, + 1.169668362166476e-09, + 1.1697178781133744e-09 + ], + "bp_grad_norms_F": [ + 4.388592969917227e-06, + 4.4431864409943955e-08, + 4.157495325785021e-08, + 4.162143696362364e-08, + 4.16235543809762e-08 + ], + "gamma_dfa": 0.10484841075958684, + "acc_eval": 0.2998046875, + "loss_eval": 1.9306102991104126, + "epoch": 36 + }, + { + "hidden_norms": [ + 24732.05078125, + 21765008.0, + 46887340.0, + 93818392.0, + 122372552.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.012441637423763e-08, + 1.1452657711075176e-09, + 1.1280866241136778e-09, + 1.1283430856323662e-09, + 1.1287816237270931e-09 + ], + "bp_grad_norms_F": [ + 4.297942268749466e-06, + 4.29258228962226e-08, + 3.9989565436826524e-08, + 4.003141995667647e-08, + 4.003394948881578e-08 + ], + "gamma_dfa": 0.10523941312567331, + "acc_eval": 0.302734375, + "loss_eval": 1.9360214471817017, + "epoch": 37 + }, + { + "hidden_norms": [ + 25179.26953125, + 23094218.0, + 50076040.0, + 100053064.0, + 130605352.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.80345041309738e-08, + 1.0831726626747695e-09, + 1.0690409668612233e-09, + 1.0700328401114234e-09, + 1.0692404739387484e-09 + ], + "bp_grad_norms_F": [ + 4.235343567415839e-06, + 4.072955306355652e-08, + 3.817867622046833e-08, + 3.8218924913735464e-08, + 3.822109917450689e-08 + ], + "gamma_dfa": 0.10568258634884842, + "acc_eval": 0.3193359375, + "loss_eval": 1.927825689315796, + "epoch": 38 + }, + { + "hidden_norms": [ + 25586.23828125, + 24470240.0, + 53013036.0, + 105981368.0, + 138543408.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.783595717432036e-08, + 1.0381262516290235e-09, + 1.0265919225815878e-09, + 1.0273364381419015e-09, + 1.0274008310773297e-09 + ], + "bp_grad_norms_F": [ + 4.177269602223532e-06, + 3.924894187434802e-08, + 3.684685978555535e-08, + 3.688498040332888e-08, + 3.688741045948518e-08 + ], + "gamma_dfa": 0.10561428684741259, + "acc_eval": 0.302734375, + "loss_eval": 1.9321579933166504, + "epoch": 39 + }, + { + "hidden_norms": [ + 26049.974609375, + 25812240.0, + 56223324.0, + 112200904.0, + 146978224.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.555475972116255e-08, + 9.982903392824483e-10, + 9.87055215340149e-10, + 9.8631947054173e-10, + 9.876408579856388e-10 + ], + "bp_grad_norms_F": [ + 4.088252808287507e-06, + 3.767732792425704e-08, + 3.5331073178213046e-08, + 3.536514370239274e-08, + 3.5367978767908426e-08 + ], + "gamma_dfa": 0.10579964506905526, + "acc_eval": 0.318359375, + "loss_eval": 1.930686116218567, + "epoch": 40 + }, + { + "hidden_norms": [ + 26467.328125, + 27200558.0, + 59437036.0, + 118688848.0, + 155514592.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.46039256430231e-08, + 9.647596055373242e-10, + 9.512606258255119e-10, + 9.511659238015113e-10, + 9.522146404705722e-10 + ], + "bp_grad_norms_F": [ + 4.015588729089359e-06, + 3.636354861669133e-08, + 3.413835614196614e-08, + 3.417060767674229e-08, + 3.417307326003538e-08 + ], + "gamma_dfa": 0.10565257369307801, + "acc_eval": 0.314453125, + "loss_eval": 1.9317667484283447, + "epoch": 41 + }, + { + "hidden_norms": [ + 26919.3671875, + 28678974.0, + 62716300.0, + 125549296.0, + 163974208.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.232915860162393e-08, + 9.29719468079071e-10, + 9.197844152986079e-10, + 9.194760508535182e-10, + 9.196678418810222e-10 + ], + "bp_grad_norms_F": [ + 3.951602138840826e-06, + 3.508949220076829e-08, + 3.2971975372220186e-08, + 3.3001178678659926e-08, + 3.300409190387654e-08 + ], + "gamma_dfa": 0.10566475696396083, + "acc_eval": 0.3056640625, + "loss_eval": 1.9284584522247314, + "epoch": 42 + }, + { + "hidden_norms": [ + 27317.033203125, + 30078810.0, + 66046968.0, + 132107504.0, + 172659440.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.130339068657122e-08, + 9.03509489447174e-10, + 8.925334360476711e-10, + 8.917908633776506e-10, + 8.925368222278962e-10 + ], + "bp_grad_norms_F": [ + 3.9174719859147444e-06, + 3.398368519924588e-08, + 3.1965900149089066e-08, + 3.199273024279137e-08, + 3.199540898890518e-08 + ], + "gamma_dfa": 0.10646540904417634, + "acc_eval": 0.3115234375, + "loss_eval": 1.9241154193878174, + "epoch": 43 + }, + { + "hidden_norms": [ + 27715.529296875, + 31383778.0, + 69356640.0, + 138681856.0, + 181338928.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.031172171740764e-08, + 8.735605017129444e-10, + 8.597746958827202e-10, + 8.612066615398817e-10, + 8.621173774869817e-10 + ], + "bp_grad_norms_F": [ + 3.837071290035965e-06, + 3.286310601424702e-08, + 3.101721191001161e-08, + 3.104238288642591e-08, + 3.104513979224066e-08 + ], + "gamma_dfa": 0.10568622383289039, + "acc_eval": 0.2939453125, + "loss_eval": 1.938409447669983, + "epoch": 44 + }, + { + "hidden_norms": [ + 28149.3203125, + 32840858.0, + 72848112.0, + 145667440.0, + 190265088.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.894184506085367e-08, + 8.401777051858517e-10, + 8.299890774665641e-10, + 8.304122944835512e-10, + 8.303523979513727e-10 + ], + "bp_grad_norms_F": [ + 3.798121497311513e-06, + 3.184389640864538e-08, + 3.004597459721481e-08, + 3.0069060130699654e-08, + 3.007191295978373e-08 + ], + "gamma_dfa": 0.10558789351489395, + "acc_eval": 0.3037109375, + "loss_eval": 1.9300565719604492, + "epoch": 45 + }, + { + "hidden_norms": [ + 28522.55078125, + 34358040.0, + 76134080.0, + 152412848.0, + 198973936.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.830858095303483e-08, + 8.109956595170331e-10, + 8.036356025087343e-10, + 8.033995135825478e-10, + 8.031720843959533e-10 + ], + "bp_grad_norms_F": [ + 3.7768336369481403e-06, + 3.096561229654071e-08, + 2.9296373327269976e-08, + 2.9317961391939207e-08, + 2.9320871064442144e-08 + ], + "gamma_dfa": 0.10623026502435096, + "acc_eval": 0.3115234375, + "loss_eval": 1.930029273033142, + "epoch": 46 + }, + { + "hidden_norms": [ + 28924.912109375, + 35808620.0, + 79629336.0, + 159269824.0, + 208087264.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.754207587140627e-08, + 7.940589297206202e-10, + 7.852188899093449e-10, + 7.844204730211857e-10, + 7.861447048895798e-10 + ], + "bp_grad_norms_F": [ + 3.695072564369184e-06, + 3.0030403053160626e-08, + 2.8479737679276695e-08, + 2.849986913133762e-08, + 2.8502654458861798e-08 + ], + "gamma_dfa": 0.1059467513114214, + "acc_eval": 0.30078125, + "loss_eval": 1.9284684658050537, + "epoch": 47 + }, + { + "hidden_norms": [ + 29289.236328125, + 37312204.0, + 83049256.0, + 165977216.0, + 216710016.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.562951509498816e-08, + 7.782112176890621e-10, + 7.675478586044449e-10, + 7.666810519779688e-10, + 7.681388303204528e-10 + ], + "bp_grad_norms_F": [ + 3.6269300380809e-06, + 2.9297559933638695e-08, + 2.782604902051844e-08, + 2.7844757610751003e-08, + 2.7847393724300673e-08 + ], + "gamma_dfa": 0.10581977141555399, + "acc_eval": 0.3037109375, + "loss_eval": 1.9282777309417725, + "epoch": 48 + }, + { + "hidden_norms": [ + 29638.296875, + 38754036.0, + 86627536.0, + 172893504.0, + 225686464.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.50456763398688e-08, + 7.526539391733422e-10, + 7.443530236628249e-10, + 7.439299176681402e-10, + 7.444729277494844e-10 + ], + "bp_grad_norms_F": [ + 3.6355218071548734e-06, + 2.845291824371543e-08, + 2.7127033064289208e-08, + 2.714476821097378e-08, + 2.7147471826083347e-08 + ], + "gamma_dfa": 0.1066790189652238, + "acc_eval": 0.3056640625, + "loss_eval": 1.925389051437378, + "epoch": 49 + }, + { + "hidden_norms": [ + 29950.615234375, + 40150236.0, + 90007640.0, + 179977856.0, + 235206976.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.382724476201474e-08, + 7.370593024802474e-10, + 7.280710478951846e-10, + 7.283330605289962e-10, + 7.279294389483937e-10 + ], + "bp_grad_norms_F": [ + 3.5918935736845015e-06, + 2.7770946431360244e-08, + 2.6450262424759785e-08, + 2.6465910352158062e-08, + 2.6468752523101102e-08 + ], + "gamma_dfa": 0.10654840966162737, + "acc_eval": 0.3076171875, + "loss_eval": 1.929931402206421, + "epoch": 50 + }, + { + "hidden_norms": [ + 30266.310546875, + 41604512.0, + 93401064.0, + 187075808.0, + 244203616.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.343555097349963e-08, + 7.144400626657443e-10, + 7.057154305378788e-10, + 7.05836944447924e-10, + 7.073042707084198e-10 + ], + "bp_grad_norms_F": [ + 3.5134323752572527e-06, + 2.7063506990998576e-08, + 2.580901536930469e-08, + 2.582418012764265e-08, + 2.582707381293403e-08 + ], + "gamma_dfa": 0.10640880587743595, + "acc_eval": 0.314453125, + "loss_eval": 1.9268465042114258, + "epoch": 51 + }, + { + "hidden_norms": [ + 30588.291015625, + 43073320.0, + 96898208.0, + 193783280.0, + 253267328.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.257300893570573e-08, + 6.925075513031231e-10, + 6.871804236752155e-10, + 6.855109813130866e-10, + 6.860176871015256e-10 + ], + "bp_grad_norms_F": [ + 3.4990612221008632e-06, + 2.652852693074692e-08, + 2.5297810068991566e-08, + 2.5311907236869047e-08, + 2.531497678148753e-08 + ], + "gamma_dfa": 0.10629434209840838, + "acc_eval": 0.3125, + "loss_eval": 1.932523488998413, + "epoch": 52 + }, + { + "hidden_norms": [ + 30898.34765625, + 44412940.0, + 100019336.0, + 199966816.0, + 261667760.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.140450719589353e-08, + 6.861456958162648e-10, + 6.789319106914604e-10, + 6.784582895491553e-10, + 6.785109696316738e-10 + ], + "bp_grad_norms_F": [ + 3.470987167020212e-06, + 2.5969489669819268e-08, + 2.478421379237261e-08, + 2.479695204726795e-08, + 2.4800137055080995e-08 + ], + "gamma_dfa": 0.1070190458704019, + "acc_eval": 0.310546875, + "loss_eval": 1.932159662246704, + "epoch": 53 + }, + { + "hidden_norms": [ + 31188.375, + 45820600.0, + 103429992.0, + 206547120.0, + 270181600.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.079076169702603e-08, + 6.688025688816879e-10, + 6.633480986728557e-10, + 6.629659043966285e-10, + 6.630911930649575e-10 + ], + "bp_grad_norms_F": [ + 3.4183981370006222e-06, + 2.540217280966317e-08, + 2.4278467236626966e-08, + 2.4290830680229192e-08, + 2.429379897250783e-08 + ], + "gamma_dfa": 0.10550818023330066, + "acc_eval": 0.2998046875, + "loss_eval": 1.9357173442840576, + "epoch": 54 + }, + { + "hidden_norms": [ + 31478.2109375, + 47178892.0, + 107044784.0, + 213196560.0, + 278895232.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.016877390242371e-08, + 6.609012226377331e-10, + 6.520708972779232e-10, + 6.519841333485488e-10, + 6.530669338644657e-10 + ], + "bp_grad_norms_F": [ + 3.405668167033582e-06, + 2.4965938649756936e-08, + 2.3893584000234114e-08, + 2.390493669679472e-08, + 2.390810749375305e-08 + ], + "gamma_dfa": 0.10673638083972037, + "acc_eval": 0.294921875, + "loss_eval": 1.9359304904937744, + "epoch": 55 + }, + { + "hidden_norms": [ + 31753.5859375, + 48563264.0, + 110454832.0, + 219550528.0, + 287320896.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.007908919831607e-08, + 6.483197867446222e-10, + 6.408613084651904e-10, + 6.410805775125539e-10, + 6.409432429244077e-10 + ], + "bp_grad_norms_F": [ + 3.369002797626308e-06, + 2.447991498399915e-08, + 2.3494733270013057e-08, + 2.350535943662635e-08, + 2.350850003551841e-08 + ], + "gamma_dfa": 0.10726616549072787, + "acc_eval": 0.3076171875, + "loss_eval": 1.9281866550445557, + "epoch": 56 + }, + { + "hidden_norms": [ + 32002.76953125, + 49866268.0, + 113724368.0, + 225759120.0, + 295231328.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.914736161434121e-08, + 6.332004365283694e-10, + 6.232644400583354e-10, + 6.233273341926804e-10, + 6.240686856173738e-10 + ], + "bp_grad_norms_F": [ + 3.3845158213807736e-06, + 2.415495181651295e-08, + 2.3192731291032942e-08, + 2.3202973764568924e-08, + 2.3206132127029377e-08 + ], + "gamma_dfa": 0.10715722179156728, + "acc_eval": 0.3095703125, + "loss_eval": 1.9343407154083252, + "epoch": 57 + }, + { + "hidden_norms": [ + 32277.291015625, + 51206064.0, + 116617608.0, + 231756352.0, + 303064864.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.926612172719615e-08, + 6.240719607752965e-10, + 6.182420131395361e-10, + 6.17405682135086e-10, + 6.178215161689593e-10 + ], + "bp_grad_norms_F": [ + 3.317889877507696e-06, + 2.3704412654979024e-08, + 2.2745311412109004e-08, + 2.2754765183208292e-08, + 2.2757769002623718e-08 + ], + "gamma_dfa": 0.10657632350921631, + "acc_eval": 0.302734375, + "loss_eval": 1.9305057525634766, + "epoch": 58 + }, + { + "hidden_norms": [ + 32521.890625, + 52538716.0, + 119605040.0, + 237773904.0, + 310920672.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.805787933217289e-08, + 6.190028489783117e-10, + 6.10553496649402e-10, + 6.107545580391616e-10, + 6.10922701316241e-10 + ], + "bp_grad_norms_F": [ + 3.2823897981870687e-06, + 2.3313557306892108e-08, + 2.2385792775025948e-08, + 2.239448981811165e-08, + 2.239757002087117e-08 + ], + "gamma_dfa": 0.10671919275773689, + "acc_eval": 0.302734375, + "loss_eval": 1.9269468784332275, + "epoch": 59 + }, + { + "hidden_norms": [ + 32717.80859375, + 53698120.0, + 122676120.0, + 243745136.0, + 318772768.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.75130422678194e-08, + 6.033377686343044e-10, + 5.948920800413759e-10, + 5.949861159315617e-10, + 5.951407144877408e-10 + ], + "bp_grad_norms_F": [ + 3.2588357044005534e-06, + 2.2926835541170476e-08, + 2.205681148836902e-08, + 2.206508220581327e-08, + 2.2068283200837868e-08 + ], + "gamma_dfa": 0.10711025857017376, + "acc_eval": 0.314453125, + "loss_eval": 1.9273767471313477, + "epoch": 60 + }, + { + "hidden_norms": [ + 32950.74609375, + 54885932.0, + 125689616.0, + 249312240.0, + 326217856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.673791119737871e-08, + 5.923626589243725e-10, + 5.863842189590684e-10, + 5.866296337586618e-10, + 5.870876007563197e-10 + ], + "bp_grad_norms_F": [ + 3.2307948458765168e-06, + 2.2597017590442192e-08, + 2.1738133071380616e-08, + 2.1745805156569986e-08, + 2.1749071876797643e-08 + ], + "gamma_dfa": 0.10673619594308548, + "acc_eval": 0.31640625, + "loss_eval": 1.9271256923675537, + "epoch": 61 + }, + { + "hidden_norms": [ + 33148.1328125, + 55976648.0, + 128534072.0, + 254655232.0, + 333162784.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.663199769718631e-08, + 5.852057172184288e-10, + 5.787633705622852e-10, + 5.792484825128952e-10, + 5.793157620281875e-10 + ], + "bp_grad_norms_F": [ + 3.197097157681128e-06, + 2.2320827852695402e-08, + 2.1484760637235922e-08, + 2.149219824332249e-08, + 2.1495376145708178e-08 + ], + "gamma_dfa": 0.10659754439257085, + "acc_eval": 0.310546875, + "loss_eval": 1.9244905710220337, + "epoch": 62 + }, + { + "hidden_norms": [ + 33369.18359375, + 57164716.0, + 131352720.0, + 259876736.0, + 339964160.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.583201184184873e-08, + 5.737598174349046e-10, + 5.67273561458137e-10, + 5.66656666034504e-10, + 5.665773961105458e-10 + ], + "bp_grad_norms_F": [ + 3.2037539767770795e-06, + 2.2096731555620863e-08, + 2.127841902677119e-08, + 2.1285371687440602e-08, + 2.1288625973170383e-08 + ], + "gamma_dfa": 0.10679806087864563, + "acc_eval": 0.3154296875, + "loss_eval": 1.9308257102966309, + "epoch": 63 + }, + { + "hidden_norms": [ + 33540.88671875, + 58301528.0, + 133722112.0, + 264798368.0, + 346396256.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.606099844930213e-08, + 5.686319748399171e-10, + 5.629098853709991e-10, + 5.619399945366865e-10, + 5.626447086015673e-10 + ], + "bp_grad_norms_F": [ + 3.1530219075648347e-06, + 2.1766210167584177e-08, + 2.0992644067518995e-08, + 2.0999330274662498e-08, + 2.1002534822400776e-08 + ], + "gamma_dfa": 0.10647483140928671, + "acc_eval": 0.3115234375, + "loss_eval": 1.925765037536621, + "epoch": 64 + }, + { + "hidden_norms": [ + 33728.984375, + 59420104.0, + 136277376.0, + 270265568.0, + 353408672.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.57889458466343e-08, + 5.627094901150542e-10, + 5.575621631059846e-10, + 5.567652450189087e-10, + 5.571588745922895e-10 + ], + "bp_grad_norms_F": [ + 3.138873807984055e-06, + 2.1483266721133987e-08, + 2.0736742101234995e-08, + 2.0742897177683517e-08, + 2.0746110607205992e-08 + ], + "gamma_dfa": 0.10677585859230021, + "acc_eval": 0.3154296875, + "loss_eval": 1.9289934635162354, + "epoch": 65 + }, + { + "hidden_norms": [ + 33919.515625, + 60492864.0, + 138846208.0, + 275456896.0, + 359821632.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.451340084367985e-08, + 5.607461717183071e-10, + 5.556192728128906e-10, + 5.553609239150603e-10, + 5.557289628477236e-10 + ], + "bp_grad_norms_F": [ + 3.125772991552367e-06, + 2.1269308092541905e-08, + 2.0518179155715188e-08, + 2.052397540808215e-08, + 2.0527094690692138e-08 + ], + "gamma_dfa": 0.10671760967670707, + "acc_eval": 0.3125, + "loss_eval": 1.9296305179595947, + "epoch": 66 + }, + { + "hidden_norms": [ + 34098.5, + 61508056.0, + 141295472.0, + 280204000.0, + 365860768.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.474934366451635e-08, + 5.519530943409734e-10, + 5.459506735583375e-10, + 5.446967876743258e-10, + 5.452004958605983e-10 + ], + "bp_grad_norms_F": [ + 3.1189638320938684e-06, + 2.1083655710185667e-08, + 2.0349753881987453e-08, + 2.0355370722313637e-08, + 2.0358520202989894e-08 + ], + "gamma_dfa": 0.10652847628807649, + "acc_eval": 0.3046875, + "loss_eval": 1.9298161268234253, + "epoch": 67 + }, + { + "hidden_norms": [ + 34267.96875, + 62529272.0, + 143621744.0, + 284772064.0, + 371754336.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.392743046035321e-08, + 5.466314068058864e-10, + 5.412825743178473e-10, + 5.413390846698007e-10, + 5.416116999334974e-10 + ], + "bp_grad_norms_F": [ + 3.0790877190156607e-06, + 2.0871810946232472e-08, + 2.0159163227617682e-08, + 2.0164401703937074e-08, + 2.0167590264463797e-08 + ], + "gamma_dfa": 0.10652959482831648, + "acc_eval": 0.298828125, + "loss_eval": 1.926388144493103, + "epoch": 68 + }, + { + "hidden_norms": [ + 34420.42578125, + 63473892.0, + 145906128.0, + 289224256.0, + 377581856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.427427479138714e-08, + 5.377295275721394e-10, + 5.307561612433176e-10, + 5.305922923248829e-10, + 5.308011252758149e-10 + ], + "bp_grad_norms_F": [ + 3.096157115578535e-06, + 2.067219107004803e-08, + 2.0005694878477698e-08, + 2.001087118230771e-08, + 2.001400645212925e-08 + ], + "gamma_dfa": 0.10710431921324925, + "acc_eval": 0.310546875, + "loss_eval": 1.9277684688568115, + "epoch": 69 + }, + { + "hidden_norms": [ + 34573.87890625, + 64328388.0, + 148036320.0, + 293257856.0, + 382751104.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.389419127117435e-08, + 5.373848033229933e-10, + 5.314943485323909e-10, + 5.314927387090052e-10, + 5.31539035009132e-10 + ], + "bp_grad_norms_F": [ + 3.072862682529376e-06, + 2.049388392322271e-08, + 1.98319511923728e-08, + 1.9836669196138246e-08, + 1.9840014076066836e-08 + ], + "gamma_dfa": 0.10700461147644091, + "acc_eval": 0.3076171875, + "loss_eval": 1.9307092428207397, + "epoch": 70 + }, + { + "hidden_norms": [ + 34690.74609375, + 65142160.0, + 150006800.0, + 297046144.0, + 387685792.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.348407310952098e-08, + 5.322000062868426e-10, + 5.271332259582096e-10, + 5.264539360005926e-10, + 5.263872671079639e-10 + ], + "bp_grad_norms_F": [ + 3.055365141335642e-06, + 2.0346906381973895e-08, + 1.9688986441224188e-08, + 1.969357477094036e-08, + 1.969680063496071e-08 + ], + "gamma_dfa": 0.10688555391971022, + "acc_eval": 0.314453125, + "loss_eval": 1.9277830123901367, + "epoch": 71 + }, + { + "hidden_norms": [ + 34818.79296875, + 65891160.0, + 151813680.0, + 300644832.0, + 392342848.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.302482802311715e-08, + 5.310150652526602e-10, + 5.265936020570905e-10, + 5.26124921407245e-10, + 5.26482579754628e-10 + ], + "bp_grad_norms_F": [ + 3.027237426067586e-06, + 2.0201985861945104e-08, + 1.9550000729395833e-08, + 1.955433681644081e-08, + 1.9557578667672715e-08 + ], + "gamma_dfa": 0.10652808679151349, + "acc_eval": 0.2998046875, + "loss_eval": 1.9273805618286133, + "epoch": 72 + }, + { + "hidden_norms": [ + 34951.515625, + 66590476.0, + 153730848.0, + 304118720.0, + 396925408.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.403244157127119e-08, + 5.26472032635894e-10, + 5.205495479110311e-10, + 5.201504782448296e-10, + 5.20502474454787e-10 + ], + "bp_grad_norms_F": [ + 3.0631524623458972e-06, + 2.0121730059941e-08, + 1.9494045488954725e-08, + 1.9498189729461046e-08, + 1.950143335704979e-08 + ], + "gamma_dfa": 0.1070192107144976, + "acc_eval": 0.3017578125, + "loss_eval": 1.934456467628479, + "epoch": 73 + }, + { + "hidden_norms": [ + 35056.31640625, + 67311408.0, + 155368816.0, + 307494752.0, + 401124448.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.303329769252741e-08, + 5.209726539057158e-10, + 5.160313842900166e-10, + 5.156270965755994e-10, + 5.161130411934778e-10 + ], + "bp_grad_norms_F": [ + 3.0127189347695094e-06, + 1.993531562050066e-08, + 1.93110221147208e-08, + 1.9314887467203334e-08, + 1.9318180832783582e-08 + ], + "gamma_dfa": 0.10658633662387729, + "acc_eval": 0.3076171875, + "loss_eval": 1.9260145425796509, + "epoch": 74 + }, + { + "hidden_norms": [ + 35158.68359375, + 67933192.0, + 157091536.0, + 310654048.0, + 405321344.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.339039515523837e-08, + 5.170803230036825e-10, + 5.107546607874269e-10, + 5.104218714357955e-10, + 5.108970468903351e-10 + ], + "bp_grad_norms_F": [ + 3.0164017061906634e-06, + 1.9819051289005074e-08, + 1.921591774589615e-08, + 1.921967651696832e-08, + 1.9223040936822144e-08 + ], + "gamma_dfa": 0.10703902837121859, + "acc_eval": 0.3095703125, + "loss_eval": 1.927987813949585, + "epoch": 75 + }, + { + "hidden_norms": [ + 35270.68359375, + 68510120.0, + 158496816.0, + 313641408.0, + 409130592.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.246813200050383e-08, + 5.133981018090594e-10, + 5.070178166199923e-10, + 5.070903141835004e-10, + 5.071925657240683e-10 + ], + "bp_grad_norms_F": [ + 3.004009158757981e-06, + 1.970923690919335e-08, + 1.910464320076244e-08, + 1.9108172821802327e-08, + 1.9111526583515115e-08 + ], + "gamma_dfa": 0.1070477613247931, + "acc_eval": 0.3193359375, + "loss_eval": 1.9260926246643066, + "epoch": 76 + }, + { + "hidden_norms": [ + 35364.3125, + 69078320.0, + 159830400.0, + 316294976.0, + 412518496.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.217867820623724e-08, + 5.12098419225282e-10, + 5.052269158589695e-10, + 5.058938268298618e-10, + 5.053178431246863e-10 + ], + "bp_grad_norms_F": [ + 2.9913805974501884e-06, + 1.9599063705300068e-08, + 1.900307999846973e-08, + 1.9006522578024487e-08, + 1.9009846141671005e-08 + ], + "gamma_dfa": 0.10688473540358245, + "acc_eval": 0.3076171875, + "loss_eval": 1.926918864250183, + "epoch": 77 + }, + { + "hidden_norms": [ + 35441.375, + 69602704.0, + 161117808.0, + 318818240.0, + 415766208.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.249013040360296e-08, + 5.102671063461628e-10, + 5.039960671027188e-10, + 5.038492956188634e-10, + 5.034740402365401e-10 + ], + "bp_grad_norms_F": [ + 2.9863124382245587e-06, + 1.9512324200832154e-08, + 1.8926254341522508e-08, + 1.8929529943534362e-08, + 1.8932860612608238e-08 + ], + "gamma_dfa": 0.10701000291737728, + "acc_eval": 0.306640625, + "loss_eval": 1.9271972179412842, + "epoch": 78 + }, + { + "hidden_norms": [ + 35514.78125, + 70081152.0, + 162190624.0, + 321009312.0, + 418699392.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.149930698029493e-08, + 5.099357047733122e-10, + 5.055039165036135e-10, + 5.048302331722709e-10, + 5.054044960317583e-10 + ], + "bp_grad_norms_F": [ + 2.969128445329261e-06, + 1.9427163877594467e-08, + 1.883810085701043e-08, + 1.884115441441736e-08, + 1.884450639977331e-08 + ], + "gamma_dfa": 0.10680000087450026, + "acc_eval": 0.3017578125, + "loss_eval": 1.9285144805908203, + "epoch": 79 + }, + { + "hidden_norms": [ + 35582.9765625, + 70499392.0, + 163284976.0, + 323095264.0, + 421363552.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.187113399391819e-08, + 5.05410657769545e-10, + 4.990756696798826e-10, + 4.979930912085706e-10, + 4.985904467069702e-10 + ], + "bp_grad_norms_F": [ + 2.9715449727518717e-06, + 1.9354965630213883e-08, + 1.877567434860339e-08, + 1.8778711918798763e-08, + 1.8782076338652587e-08 + ], + "gamma_dfa": 0.10694103027344681, + "acc_eval": 0.310546875, + "loss_eval": 1.92802095413208, + "epoch": 80 + }, + { + "hidden_norms": [ + 35639.56640625, + 70899536.0, + 164253712.0, + 324923200.0, + 423745824.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.238182237439105e-08, + 5.018311322046998e-10, + 4.970572842211141e-10, + 4.953790155859394e-10, + 4.961450694729308e-10 + ], + "bp_grad_norms_F": [ + 2.971921048811055e-06, + 1.9296171771543413e-08, + 1.872837351868384e-08, + 1.8731368456315067e-08, + 1.873476662694884e-08 + ], + "gamma_dfa": 0.10704115682892734, + "acc_eval": 0.3076171875, + "loss_eval": 1.926428198814392, + "epoch": 81 + }, + { + "hidden_norms": [ + 35689.78515625, + 71256024.0, + 165127008.0, + 326618208.0, + 425949792.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.238117578050151e-08, + 4.972192657604069e-10, + 4.926972718699574e-10, + 4.921834606541609e-10, + 4.923969565417963e-10 + ], + "bp_grad_norms_F": [ + 2.9655700473085744e-06, + 1.9235280035445612e-08, + 1.8671270751724478e-08, + 1.8674217727721043e-08, + 1.8677596358429582e-08 + ], + "gamma_dfa": 0.10696214074414456, + "acc_eval": 0.3056640625, + "loss_eval": 1.924986481666565, + "epoch": 82 + }, + { + "hidden_norms": [ + 35742.58984375, + 71595640.0, + 165912336.0, + 328130016.0, + 427838752.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.213700487478491e-08, + 4.983659041002397e-10, + 4.936055453264032e-10, + 4.941617670617404e-10, + 4.939196274200697e-10 + ], + "bp_grad_norms_F": [ + 2.951217993540922e-06, + 1.919361736213432e-08, + 1.863161003257119e-08, + 1.8634468190725784e-08, + 1.8637845045077484e-08 + ], + "gamma_dfa": 0.10690056857129093, + "acc_eval": 0.3046875, + "loss_eval": 1.9250625371932983, + "epoch": 83 + }, + { + "hidden_norms": [ + 35784.6640625, + 71885704.0, + 166691376.0, + 329546848.0, + 429668704.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.175997668833588e-08, + 4.971995593017198e-10, + 4.919967211414189e-10, + 4.91977791838849e-10, + 4.926699603835516e-10 + ], + "bp_grad_norms_F": [ + 2.9550594717875356e-06, + 1.9144454910247077e-08, + 1.8583381944381472e-08, + 1.858614595562358e-08, + 1.8589524586332118e-08 + ], + "gamma_dfa": 0.10689649073174223, + "acc_eval": 0.3076171875, + "loss_eval": 1.926330327987671, + "epoch": 84 + }, + { + "hidden_norms": [ + 35822.33984375, + 72122744.0, + 167344016.0, + 330816224.0, + 431313312.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.139300978702522e-08, + 4.980582613001161e-10, + 4.935602482269985e-10, + 4.934832542602408e-10, + 4.934415098745148e-10 + ], + "bp_grad_norms_F": [ + 2.9577784061984858e-06, + 1.9112555094125128e-08, + 1.8551357783280764e-08, + 1.8553992120473595e-08, + 1.8557404501962083e-08 + ], + "gamma_dfa": 0.10689723303948995, + "acc_eval": 0.3056640625, + "loss_eval": 1.9307332038879395, + "epoch": 85 + }, + { + "hidden_norms": [ + 35859.390625, + 72358304.0, + 167947920.0, + 331984992.0, + 432823232.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.135296359843778e-08, + 4.947317000514317e-10, + 4.903184525062443e-10, + 4.896648087004962e-10, + 4.905649775288623e-10 + ], + "bp_grad_norms_F": [ + 2.9511427328543505e-06, + 1.906450464161935e-08, + 1.8504644927475056e-08, + 1.8507259724742653e-08, + 1.8510663224446944e-08 + ], + "gamma_dfa": 0.10684622721601045, + "acc_eval": 0.314453125, + "loss_eval": 1.9271869659423828, + "epoch": 86 + }, + { + "hidden_norms": [ + 35888.20703125, + 72553136.0, + 168401376.0, + 332911328.0, + 434057600.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.163116239576993e-08, + 4.935953312745767e-10, + 4.904400219274407e-10, + 4.890517990574494e-10, + 4.891231308867816e-10 + ], + "bp_grad_norms_F": [ + 2.9438597266562283e-06, + 1.902795432329185e-08, + 1.8475304841558682e-08, + 1.8477877006262133e-08, + 1.848129471682114e-08 + ], + "gamma_dfa": 0.10682923735294025, + "acc_eval": 0.30859375, + "loss_eval": 1.9263050556182861, + "epoch": 87 + }, + { + "hidden_norms": [ + 35914.35546875, + 72735848.0, + 168823680.0, + 333752736.0, + 435137376.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.153870657499283e-08, + 4.920966967247864e-10, + 4.894144534084433e-10, + 4.876969939004994e-10, + 4.884483928435657e-10 + ], + "bp_grad_norms_F": [ + 2.9408777209027903e-06, + 1.8999060102942167e-08, + 1.8450597494279464e-08, + 1.8453114591920894e-08, + 1.84565323024799e-08 + ], + "gamma_dfa": 0.10694600266288035, + "acc_eval": 0.3115234375, + "loss_eval": 1.9252078533172607, + "epoch": 88 + }, + { + "hidden_norms": [ + 35936.5546875, + 72887360.0, + 169178624.0, + 334467840.0, + 436061952.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.168602340039797e-08, + 4.908231043820876e-10, + 4.854965318656923e-10, + 4.846267276370497e-10, + 4.847209300606892e-10 + ], + "bp_grad_norms_F": [ + 2.945510459539946e-06, + 1.8982424521141184e-08, + 1.8438125692910035e-08, + 1.844062857969675e-08, + 1.8444072935608347e-08 + ], + "gamma_dfa": 0.10697454003093299, + "acc_eval": 0.3134765625, + "loss_eval": 1.9264906644821167, + "epoch": 89 + }, + { + "hidden_norms": [ + 35955.3671875, + 73005808.0, + 169498240.0, + 335085920.0, + 436862656.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.152810527737529e-08, + 4.922047214250824e-10, + 4.872572900715966e-10, + 4.873856318532432e-10, + 4.87353157829773e-10 + ], + "bp_grad_norms_F": [ + 2.9327068205020623e-06, + 1.8955052638602865e-08, + 1.8409036073308016e-08, + 1.8411496327530585e-08, + 1.841491403808959e-08 + ], + "gamma_dfa": 0.10689280136284651, + "acc_eval": 0.3095703125, + "loss_eval": 1.9255037307739258, + "epoch": 90 + }, + { + "hidden_norms": [ + 35973.34375, + 73111368.0, + 169770208.0, + 335584768.0, + 437507744.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.107820382794671e-08, + 4.92519802719471e-10, + 4.876242187812352e-10, + 4.871342773604681e-10, + 4.873002001914983e-10 + ], + "bp_grad_norms_F": [ + 2.9368579816946294e-06, + 1.8944499302619988e-08, + 1.839602603581625e-08, + 1.8398441881117833e-08, + 1.8401848933535803e-08 + ], + "gamma_dfa": 0.10685028225998394, + "acc_eval": 0.306640625, + "loss_eval": 1.9265596866607666, + "epoch": 91 + }, + { + "hidden_norms": [ + 35985.046875, + 73193336.0, + 169984976.0, + 335981920.0, + 438037376.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.100844984757714e-08, + 4.92902163529152e-10, + 4.862484304091197e-10, + 4.871591463562197e-10, + 4.871424374996991e-10 + ], + "bp_grad_norms_F": [ + 2.930574055426405e-06, + 1.8926412437281215e-08, + 1.8379486377284593e-08, + 1.8381888011731462e-08, + 1.8385312827717826e-08 + ], + "gamma_dfa": 0.106783474504482, + "acc_eval": 0.30859375, + "loss_eval": 1.9269328117370605, + "epoch": 92 + }, + { + "hidden_norms": [ + 35994.07421875, + 73256784.0, + 170148048.0, + 336300032.0, + 438460544.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.113810968599864e-08, + 4.918689899824358e-10, + 4.860293834063611e-10, + 4.857191315821296e-10, + 4.859731506101639e-10 + ], + "bp_grad_norms_F": [ + 2.9313273444131482e-06, + 1.8918141719836967e-08, + 1.8372302790226058e-08, + 1.837469731924557e-08, + 1.8378123911588773e-08 + ], + "gamma_dfa": 0.10685011067107553, + "acc_eval": 0.3095703125, + "loss_eval": 1.9262909889221191, + "epoch": 93 + }, + { + "hidden_norms": [ + 36002.55078125, + 73308792.0, + 170289472.0, + 336572864.0, + 438812896.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.121508988599089e-08, + 4.917221074762779e-10, + 4.853899504553283e-10, + 4.847242052186118e-10, + 4.849394219519354e-10 + ], + "bp_grad_norms_F": [ + 2.933722271336592e-06, + 1.8911242349872737e-08, + 1.8366764109600808e-08, + 1.836915508590664e-08, + 1.8372583454606684e-08 + ], + "gamma_dfa": 0.10693995938345324, + "acc_eval": 0.3076171875, + "loss_eval": 1.9261877536773682, + "epoch": 94 + }, + { + "hidden_norms": [ + 36008.01953125, + 73348264.0, + 170386624.0, + 336761248.0, + 439049248.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.123732987362018e-08, + 4.916126949972011e-10, + 4.860848945575924e-10, + 4.87389184566922e-10, + 4.868180303319036e-10 + ], + "bp_grad_norms_F": [ + 2.9306668238859857e-06, + 1.8901717524499873e-08, + 1.835805107930355e-08, + 1.8360427844754668e-08, + 1.836385976616839e-08 + ], + "gamma_dfa": 0.10689331469620811, + "acc_eval": 0.30859375, + "loss_eval": 1.9260027408599854, + "epoch": 95 + }, + { + "hidden_norms": [ + 36011.9296875, + 73372720.0, + 170447072.0, + 336878464.0, + 439192800.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.115104156378948e-08, + 4.911633877391353e-10, + 4.862875657707377e-10, + 4.868677128122556e-10, + 4.867456437906981e-10 + ], + "bp_grad_norms_F": [ + 2.9297382297954755e-06, + 1.889710254943111e-08, + 1.8353631503487122e-08, + 1.835600293986772e-08, + 1.8359434861281443e-08 + ], + "gamma_dfa": 0.1068731502891751, + "acc_eval": 0.306640625, + "loss_eval": 1.9261021614074707, + "epoch": 96 + }, + { + "hidden_norms": [ + 36014.109375, + 73385416.0, + 170481184.0, + 336945120.0, + 439280128.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.12362214269524e-08, + 4.916780316222003e-10, + 4.858832225451692e-10, + 4.867402036978774e-10, + 4.862423241824843e-10 + ], + "bp_grad_norms_F": [ + 2.930293021563557e-06, + 1.8895260467388653e-08, + 1.8352444897118403e-08, + 1.835481810985584e-08, + 1.8358248254912723e-08 + ], + "gamma_dfa": 0.10688256371940952, + "acc_eval": 0.3095703125, + "loss_eval": 1.926184892654419, + "epoch": 97 + }, + { + "hidden_norms": [ + 36015.9375, + 73396752.0, + 170510784.0, + 337001056.0, + 439352832.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.120947659837839e-08, + 4.916590468084792e-10, + 4.857179658479538e-10, + 4.86417739420375e-10, + 4.85919415815772e-10 + ], + "bp_grad_norms_F": [ + 2.930209348050994e-06, + 1.889360845552801e-08, + 1.835070939648631e-08, + 1.8353080832866908e-08, + 1.835651275428063e-08 + ], + "gamma_dfa": 0.10688149025372695, + "acc_eval": 0.306640625, + "loss_eval": 1.9262256622314453, + "epoch": 98 + }, + { + "hidden_norms": [ + 36016.734375, + 73401888.0, + 170523312.0, + 337026592.0, + 439384864.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.119820028516187e-08, + 4.917350415745148e-10, + 4.857160784688119e-10, + 4.860361002556601e-10, + 4.855379431845108e-10 + ], + "bp_grad_norms_F": [ + 2.9303794235602254e-06, + 1.8893027586841526e-08, + 1.835026353091962e-08, + 1.835263319094338e-08, + 1.83560651123571e-08 + ], + "gamma_dfa": 0.10688879482768243, + "acc_eval": 0.3076171875, + "loss_eval": 1.926223874092102, + "epoch": 99 + }, + { + "hidden_norms": [ + 36016.7734375, + 73401992.0, + 170523904.0, + 337027392.0, + 439386048.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.120198747794348e-08, + 4.91758134213427e-10, + 4.857037549932386e-10, + 4.860785107752008e-10, + 4.855802981929003e-10 + ], + "bp_grad_norms_F": [ + 2.9303721476026112e-06, + 1.8893056008550957e-08, + 1.8350315045267962e-08, + 1.8352682928934883e-08, + 1.8356114850348604e-08 + ], + "gamma_dfa": 0.1068887785077095, + "acc_eval": 0.3076171875, + "loss_eval": 1.926220417022705, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s456.json b/results/snapshot_evolution_v2/snapshot_evolution_s456.json new file mode 100644 index 0000000..f78065f --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_evolution_s456.json @@ -0,0 +1,5473 @@ +{ + "config": { + "output_dir": "results/snapshot_evolution_v2", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 456, + "depth": 4, + "d_hidden": 256, + "log_every": 1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010079912608489394, + 0.0010035138111561537, + 0.0009970925748348236, + 0.0009936393471434712, + 0.000986678060144186 + ], + "bp_grad_norms_F": [ + 0.035574451088905334, + 0.035288579761981964, + 0.035048045217990875, + 0.0346725769340992, + 0.03439188003540039 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.4863264560699463, + "epoch": 0 + }, + { + "hidden_norms": [ + 79.9596176147461, + 82.38219451904297, + 86.97193145751953, + 92.46615600585938, + 99.17337799072266 + ], + "bp_grad_norms_per_sample_med": [ + 5.704927025362849e-05, + 5.414035331341438e-05, + 5.3104751714272425e-05, + 5.354730456019752e-05, + 5.5780339607736096e-05 + ], + "bp_grad_norms_F": [ + 0.00240120361559093, + 0.0021707164123654366, + 0.002052225871011615, + 0.0020026240963488817, + 0.002049861242994666 + ], + "gamma_dfa": NaN, + "acc_eval": 0.400390625, + "loss_eval": 1.6942739486694336, + "epoch": 1 + }, + { + "hidden_norms": [ + 95.21885681152344, + 97.9500732421875, + 101.84932708740234, + 108.15538787841797, + 115.16011810302734 + ], + "bp_grad_norms_per_sample_med": [ + 4.467168764676899e-05, + 4.3202508095419034e-05, + 4.3004638428101316e-05, + 4.286228431737982e-05, + 4.4292191887507215e-05 + ], + "bp_grad_norms_F": [ + 0.0018949288642033935, + 0.0017146588070318103, + 0.0016399234300479293, + 0.001598119386471808, + 0.0016228299355134368 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4599609375, + "loss_eval": 1.5051867961883545, + "epoch": 2 + }, + { + "hidden_norms": [ + 112.65824890136719, + 111.87681579589844, + 114.76032257080078, + 118.74363708496094, + 125.05441284179688 + ], + "bp_grad_norms_per_sample_med": [ + 4.4033156882505864e-05, + 4.2794465116458014e-05, + 4.2031828343169764e-05, + 4.134616028750315e-05, + 4.226301462040283e-05 + ], + "bp_grad_norms_F": [ + 0.0018527565989643335, + 0.0017638156423345208, + 0.0016669610049575567, + 0.0015881577273830771, + 0.0015705813420936465 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4931640625, + "loss_eval": 1.4331163167953491, + "epoch": 3 + }, + { + "hidden_norms": [ + 126.20967102050781, + 125.90274810791016, + 128.2918243408203, + 131.685302734375, + 136.71499633789062 + ], + "bp_grad_norms_per_sample_med": [ + 4.358301157481037e-05, + 4.267259282642044e-05, + 4.196130612399429e-05, + 4.08500200137496e-05, + 4.0281276596942917e-05 + ], + "bp_grad_norms_F": [ + 0.0018887611804530025, + 0.0017927174922078848, + 0.0016837789444252849, + 0.0015876276884227991, + 0.0015263468958437443 + ], + "gamma_dfa": NaN, + "acc_eval": 0.490234375, + "loss_eval": 1.4055290222167969, + "epoch": 4 + }, + { + "hidden_norms": [ + 137.673583984375, + 136.8435516357422, + 138.64651489257812, + 141.41473388671875, + 147.87835693359375 + ], + "bp_grad_norms_per_sample_med": [ + 4.085261025466025e-05, + 4.06657018174883e-05, + 3.941181785194203e-05, + 3.858502532239072e-05, + 3.7998870539013296e-05 + ], + "bp_grad_norms_F": [ + 0.001770049100741744, + 0.0016922445502132177, + 0.0016029543476179242, + 0.0015241446672007442, + 0.0014664788031950593 + ], + "gamma_dfa": NaN, + "acc_eval": 0.50390625, + "loss_eval": 1.3763911724090576, + "epoch": 5 + }, + { + "hidden_norms": [ + 150.45315551757812, + 148.60609436035156, + 150.3750457763672, + 152.9460906982422, + 158.2902069091797 + ], + "bp_grad_norms_per_sample_med": [ + 3.8344696804415435e-05, + 3.8422465877374634e-05, + 3.834897142951377e-05, + 3.7070902180857956e-05, + 3.6289642594056204e-05 + ], + "bp_grad_norms_F": [ + 0.0017990845954045653, + 0.001743242726661265, + 0.0016358466818928719, + 0.0015305348206311464, + 0.0014392968732863665 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5166015625, + "loss_eval": 1.373401165008545, + "epoch": 6 + }, + { + "hidden_norms": [ + 162.06126403808594, + 159.53811645507812, + 158.62655639648438, + 160.54307556152344, + 165.60415649414062 + ], + "bp_grad_norms_per_sample_med": [ + 3.797870522248559e-05, + 3.766914960579015e-05, + 3.7873480323469266e-05, + 3.735603968380019e-05, + 3.6521956644719467e-05 + ], + "bp_grad_norms_F": [ + 0.001707478309981525, + 0.0016470234841108322, + 0.0015834521036595106, + 0.001506388420239091, + 0.001406461582519114 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5283203125, + "loss_eval": 1.3223559856414795, + "epoch": 7 + }, + { + "hidden_norms": [ + 169.8936309814453, + 168.42221069335938, + 169.54115295410156, + 171.452880859375, + 176.4298553466797 + ], + "bp_grad_norms_per_sample_med": [ + 3.760562321986072e-05, + 3.8139285607030615e-05, + 3.7332967622205615e-05, + 3.670771184260957e-05, + 3.4867567592300475e-05 + ], + "bp_grad_norms_F": [ + 0.001674071652814746, + 0.0016396756982430816, + 0.001556537114083767, + 0.001464220928028226, + 0.0013669237960129976 + ], + "gamma_dfa": NaN, + "acc_eval": 0.529296875, + "loss_eval": 1.3310301303863525, + "epoch": 8 + }, + { + "hidden_norms": [ + 177.821044921875, + 176.60687255859375, + 177.76409912109375, + 179.53733825683594, + 184.176513671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.643108357209712e-05, + 3.605252277338877e-05, + 3.6002034903503954e-05, + 3.529640525812283e-05, + 3.386645403224975e-05 + ], + "bp_grad_norms_F": [ + 0.0016080558998510242, + 0.0015692447777837515, + 0.0014910849276930094, + 0.0014210963854566216, + 0.0013221093686297536 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5390625, + "loss_eval": 1.3072502613067627, + "epoch": 9 + }, + { + "hidden_norms": [ + 188.1353759765625, + 184.39834594726562, + 184.91822814941406, + 185.82460021972656, + 191.45692443847656 + ], + "bp_grad_norms_per_sample_med": [ + 3.544713035807945e-05, + 3.5891316656488925e-05, + 3.613864828366786e-05, + 3.507022120174952e-05, + 3.361281778779812e-05 + ], + "bp_grad_norms_F": [ + 0.0015651460271328688, + 0.0015296414494514465, + 0.0014787326799705625, + 0.0014131872449070215, + 0.0013114992761984468 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5537109375, + "loss_eval": 1.2935423851013184, + "epoch": 10 + }, + { + "hidden_norms": [ + 193.53599548339844, + 189.33700561523438, + 190.08908081054688, + 192.31288146972656, + 198.0936737060547 + ], + "bp_grad_norms_per_sample_med": [ + 3.3899334084708244e-05, + 3.468272552709095e-05, + 3.463856774033047e-05, + 3.383589137229137e-05, + 3.240162550355308e-05 + ], + "bp_grad_norms_F": [ + 0.001495138043537736, + 0.0014781414065510035, + 0.0014301009941846132, + 0.0013711795909330249, + 0.0012839946430176497 + ], + "gamma_dfa": NaN, + "acc_eval": 0.544921875, + "loss_eval": 1.2766207456588745, + "epoch": 11 + }, + { + "hidden_norms": [ + 199.85023498535156, + 194.9699249267578, + 193.4657440185547, + 194.60928344726562, + 199.97662353515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.289094092906453e-05, + 3.539410317898728e-05, + 3.491900861263275e-05, + 3.4397991839796305e-05, + 3.252939859521575e-05 + ], + "bp_grad_norms_F": [ + 0.0015656249597668648, + 0.0015614606672897935, + 0.0015110056847333908, + 0.0014306820230558515, + 0.00130200176499784 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5439453125, + "loss_eval": 1.2812860012054443, + "epoch": 12 + }, + { + "hidden_norms": [ + 206.15440368652344, + 199.86099243164062, + 199.35470581054688, + 201.66831970214844, + 206.71054077148438 + ], + "bp_grad_norms_per_sample_med": [ + 3.430957076488994e-05, + 3.5125638532917947e-05, + 3.523785198922269e-05, + 3.404217568458989e-05, + 3.245573316235095e-05 + ], + "bp_grad_norms_F": [ + 0.0015102275647222996, + 0.0015037795528769493, + 0.001468595233745873, + 0.0013989906292408705, + 0.0012804438592866063 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5517578125, + "loss_eval": 1.2559274435043335, + "epoch": 13 + }, + { + "hidden_norms": [ + 209.39404296875, + 203.8543243408203, + 201.63771057128906, + 202.7413787841797, + 209.64585876464844 + ], + "bp_grad_norms_per_sample_med": [ + 3.3599189919186756e-05, + 3.511353497742675e-05, + 3.4795291867339984e-05, + 3.415898390812799e-05, + 3.225719046895392e-05 + ], + "bp_grad_norms_F": [ + 0.0015785910654813051, + 0.0015854343073442578, + 0.0015357385855168104, + 0.00144979078322649, + 0.0013052559224888682 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5478515625, + "loss_eval": 1.2778449058532715, + "epoch": 14 + }, + { + "hidden_norms": [ + 214.74293518066406, + 208.2928924560547, + 206.78591918945312, + 207.79452514648438, + 213.0249481201172 + ], + "bp_grad_norms_per_sample_med": [ + 3.347836172906682e-05, + 3.457088314462453e-05, + 3.509481393848546e-05, + 3.4477459848858416e-05, + 3.169552292092703e-05 + ], + "bp_grad_norms_F": [ + 0.0015018024714663625, + 0.0015100837917998433, + 0.0014814585447311401, + 0.0014098759274929762, + 0.0012745971325784922 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5693359375, + "loss_eval": 1.2316113710403442, + "epoch": 15 + }, + { + "hidden_norms": [ + 223.09906005859375, + 214.6353302001953, + 211.16726684570312, + 210.60520935058594, + 214.28952026367188 + ], + "bp_grad_norms_per_sample_med": [ + 3.5336081054992974e-05, + 3.693878170452081e-05, + 3.7104789953446016e-05, + 3.635902612586506e-05, + 3.3355980121996254e-05 + ], + "bp_grad_norms_F": [ + 0.0015461220173165202, + 0.0015768769662827253, + 0.0015498694265261292, + 0.001453379518352449, + 0.0013068238040432334 + ], + "gamma_dfa": NaN, + "acc_eval": 0.55078125, + "loss_eval": 1.2516858577728271, + "epoch": 16 + }, + { + "hidden_norms": [ + 225.36517333984375, + 217.36669921875, + 214.27880859375, + 215.62054443359375, + 219.76197814941406 + ], + "bp_grad_norms_per_sample_med": [ + 3.474476397968829e-05, + 3.609717168728821e-05, + 3.612042564782314e-05, + 3.547673986759037e-05, + 3.216006007278338e-05 + ], + "bp_grad_norms_F": [ + 0.001510953065007925, + 0.0015347315929830074, + 0.0015160846523940563, + 0.001440546941012144, + 0.0012782461708411574 + ], + "gamma_dfa": NaN, + "acc_eval": 0.583984375, + "loss_eval": 1.2262325286865234, + "epoch": 17 + }, + { + "hidden_norms": [ + 230.7099151611328, + 222.3380889892578, + 218.67819213867188, + 217.3147735595703, + 221.999755859375 + ], + "bp_grad_norms_per_sample_med": [ + 3.285402272013016e-05, + 3.4367294574622065e-05, + 3.490627204882912e-05, + 3.413260492379777e-05, + 3.064925112994388e-05 + ], + "bp_grad_norms_F": [ + 0.0015693235909566283, + 0.0015950833912938833, + 0.0015582602936774492, + 0.001467122812755406, + 0.0012723723193630576 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5751953125, + "loss_eval": 1.2127145528793335, + "epoch": 18 + }, + { + "hidden_norms": [ + 235.28932189941406, + 226.01202392578125, + 222.56756591796875, + 222.25152587890625, + 226.0247344970703 + ], + "bp_grad_norms_per_sample_med": [ + 3.336059671710245e-05, + 3.488900983938947e-05, + 3.518831363180652e-05, + 3.5047873097937554e-05, + 3.1955056329024956e-05 + ], + "bp_grad_norms_F": [ + 0.0015264152316376567, + 0.0015387749299407005, + 0.0015209508128464222, + 0.001451890799216926, + 0.00127940543461591 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5673828125, + "loss_eval": 1.2340281009674072, + "epoch": 19 + }, + { + "hidden_norms": [ + 239.98486328125, + 230.95614624023438, + 226.7176513671875, + 225.3818359375, + 231.0238037109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.4207379940198734e-05, + 3.5167759051546454e-05, + 3.5256896808277816e-05, + 3.462574022705667e-05, + 3.117474989267066e-05 + ], + "bp_grad_norms_F": [ + 0.0015223841182887554, + 0.0015598630998283625, + 0.0015445069875568151, + 0.0014689662493765354, + 0.0012761331163346767 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2441283464431763, + "epoch": 20 + }, + { + "hidden_norms": [ + 245.0663299560547, + 233.2012939453125, + 227.60426330566406, + 226.96006774902344, + 229.30145263671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.25386063195765e-05, + 3.39963698934298e-05, + 3.503257903503254e-05, + 3.4624255931703374e-05, + 3.013665264006704e-05 + ], + "bp_grad_norms_F": [ + 0.001554132904857397, + 0.0015968671068549156, + 0.001575724920257926, + 0.0014765377854928374, + 0.0012655528262257576 + ], + "gamma_dfa": NaN, + "acc_eval": 0.595703125, + "loss_eval": 1.1905839443206787, + "epoch": 21 + }, + { + "hidden_norms": [ + 246.93258666992188, + 235.25485229492188, + 232.71095275878906, + 231.27796936035156, + 235.4611358642578 + ], + "bp_grad_norms_per_sample_med": [ + 3.248557914048433e-05, + 3.448772622505203e-05, + 3.525316424202174e-05, + 3.4218086511828005e-05, + 2.997798401338514e-05 + ], + "bp_grad_norms_F": [ + 0.001511804643087089, + 0.0015418389812111855, + 0.001536028808914125, + 0.0014609270729124546, + 0.001262559788301587 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.2032543420791626, + "epoch": 22 + }, + { + "hidden_norms": [ + 251.2838592529297, + 237.0211639404297, + 234.6432342529297, + 233.30433654785156, + 238.11598205566406 + ], + "bp_grad_norms_per_sample_med": [ + 3.3030770282493904e-05, + 3.484229455352761e-05, + 3.59142868546769e-05, + 3.533583367243409e-05, + 3.1214847695082426e-05 + ], + "bp_grad_norms_F": [ + 0.0015120860189199448, + 0.00155613012611866, + 0.0015533699188381433, + 0.001477457000873983, + 0.0012758751399815083 + ], + "gamma_dfa": NaN, + "acc_eval": 0.568359375, + "loss_eval": 1.220862627029419, + "epoch": 23 + }, + { + "hidden_norms": [ + 253.3640594482422, + 242.6001739501953, + 237.11773681640625, + 237.31105041503906, + 241.1314697265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.295885835541412e-05, + 3.492692485451698e-05, + 3.562758502084762e-05, + 3.515293064992875e-05, + 3.0970571970101446e-05 + ], + "bp_grad_norms_F": [ + 0.001516172313131392, + 0.0015499184373766184, + 0.0015383078716695309, + 0.0014658188447356224, + 0.0012659834465011954 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.1925604343414307, + "epoch": 24 + }, + { + "hidden_norms": [ + 258.6325378417969, + 245.05575561523438, + 239.04722595214844, + 237.04385375976562, + 240.51011657714844 + ], + "bp_grad_norms_per_sample_med": [ + 3.258220021962188e-05, + 3.459660729276948e-05, + 3.553628994268365e-05, + 3.461805317783728e-05, + 3.001722870976664e-05 + ], + "bp_grad_norms_F": [ + 0.0015354488277807832, + 0.001572331297211349, + 0.0015721773961558938, + 0.0014915125211700797, + 0.0012740870006382465 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58203125, + "loss_eval": 1.1843492984771729, + "epoch": 25 + }, + { + "hidden_norms": [ + 262.35577392578125, + 247.456298828125, + 241.52687072753906, + 239.8603057861328, + 242.48818969726562 + ], + "bp_grad_norms_per_sample_med": [ + 3.335328074172139e-05, + 3.581988130463287e-05, + 3.6700876080431044e-05, + 3.52635579474736e-05, + 3.091046164627187e-05 + ], + "bp_grad_norms_F": [ + 0.0015506797935813665, + 0.0016048819525167346, + 0.0016078166663646698, + 0.0015189298428595066, + 0.001287299208343029 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.2021183967590332, + "epoch": 26 + }, + { + "hidden_norms": [ + 262.69769287109375, + 248.58924865722656, + 243.61415100097656, + 242.7408905029297, + 243.58761596679688 + ], + "bp_grad_norms_per_sample_med": [ + 3.363215728313662e-05, + 3.542406557244249e-05, + 3.617940456024371e-05, + 3.522956103552133e-05, + 3.093081613769755e-05 + ], + "bp_grad_norms_F": [ + 0.0015515872510150075, + 0.0015918170101940632, + 0.0015870564384385943, + 0.0015067857457324862, + 0.001285396981984377 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.1753299236297607, + "epoch": 27 + }, + { + "hidden_norms": [ + 264.57330322265625, + 252.62904357910156, + 246.43833923339844, + 245.4523468017578, + 247.43896484375 + ], + "bp_grad_norms_per_sample_med": [ + 3.3458851248724386e-05, + 3.510742317303084e-05, + 3.596700116759166e-05, + 3.530932735884562e-05, + 3.0871200578985736e-05 + ], + "bp_grad_norms_F": [ + 0.0015561054460704327, + 0.0015992044936865568, + 0.0016016490990296006, + 0.0015203922521322966, + 0.001274992828257382 + ], + "gamma_dfa": NaN, + "acc_eval": 0.587890625, + "loss_eval": 1.1872658729553223, + "epoch": 28 + }, + { + "hidden_norms": [ + 268.63336181640625, + 253.74609375, + 247.2230224609375, + 244.07066345214844, + 248.91635131835938 + ], + "bp_grad_norms_per_sample_med": [ + 3.388441837159917e-05, + 3.55305674020201e-05, + 3.711709723575041e-05, + 3.565939550753683e-05, + 3.06438232655637e-05 + ], + "bp_grad_norms_F": [ + 0.0015880814753472805, + 0.001632494037039578, + 0.0016352345701307058, + 0.001542495796456933, + 0.001282386132515967 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1748178005218506, + "epoch": 29 + }, + { + "hidden_norms": [ + 269.5155944824219, + 254.65687561035156, + 249.08070373535156, + 246.4084930419922, + 248.03065490722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.340150215080939e-05, + 3.542837657732889e-05, + 3.656153057818301e-05, + 3.62997452612035e-05, + 3.134588405373506e-05 + ], + "bp_grad_norms_F": [ + 0.0015988025115802884, + 0.0016428054077550769, + 0.0016343789175152779, + 0.00154898373875767, + 0.001290567102842033 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.184614658355713, + "epoch": 30 + }, + { + "hidden_norms": [ + 273.0482482910156, + 255.88157653808594, + 249.6538543701172, + 246.09181213378906, + 250.09861755371094 + ], + "bp_grad_norms_per_sample_med": [ + 3.485401612124406e-05, + 3.613552325987257e-05, + 3.727355215232819e-05, + 3.6410303437151015e-05, + 3.111722253379412e-05 + ], + "bp_grad_norms_F": [ + 0.0016218513483181596, + 0.001677986583672464, + 0.0016929754056036472, + 0.001593436230905354, + 0.0013143697287887335 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5673828125, + "loss_eval": 1.2012369632720947, + "epoch": 31 + }, + { + "hidden_norms": [ + 274.05010986328125, + 255.77792358398438, + 247.96664428710938, + 246.15379333496094, + 248.44847106933594 + ], + "bp_grad_norms_per_sample_med": [ + 3.431778895901516e-05, + 3.609380655689165e-05, + 3.7377911212388426e-05, + 3.6012417695019394e-05, + 3.0985673220129684e-05 + ], + "bp_grad_norms_F": [ + 0.0016116296174004674, + 0.0016683804569765925, + 0.0016786488704383373, + 0.0015687323175370693, + 0.001289981184527278 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1654620170593262, + "epoch": 32 + }, + { + "hidden_norms": [ + 274.6156921386719, + 257.166259765625, + 251.9473876953125, + 251.01661682128906, + 252.84222412109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.185174864483997e-05, + 3.433173696976155e-05, + 3.572784407879226e-05, + 3.4680619137361646e-05, + 2.997389128722716e-05 + ], + "bp_grad_norms_F": [ + 0.0015743848634883761, + 0.001610185718163848, + 0.0016222007106989622, + 0.0015360275283455849, + 0.0012806184822693467 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.1679120063781738, + "epoch": 33 + }, + { + "hidden_norms": [ + 274.3385009765625, + 256.1404724121094, + 249.90264892578125, + 247.3904266357422, + 249.5623016357422 + ], + "bp_grad_norms_per_sample_med": [ + 3.419954009586945e-05, + 3.6830995668424293e-05, + 3.8464357203338295e-05, + 3.64230691047851e-05, + 3.0958552088122815e-05 + ], + "bp_grad_norms_F": [ + 0.0016346886986866593, + 0.0016823107143864036, + 0.0016956342151388526, + 0.0015958002768456936, + 0.0013100137002766132 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5927734375, + "loss_eval": 1.1599082946777344, + "epoch": 34 + }, + { + "hidden_norms": [ + 276.65985107421875, + 258.50543212890625, + 251.1997833251953, + 247.7036895751953, + 248.07545471191406 + ], + "bp_grad_norms_per_sample_med": [ + 3.384043520782143e-05, + 3.567537714843638e-05, + 3.686825220938772e-05, + 3.5754670534515753e-05, + 3.0301211154437624e-05 + ], + "bp_grad_norms_F": [ + 0.0016451155534014106, + 0.0016956959152594209, + 0.001703266054391861, + 0.0016015227884054184, + 0.0013142916141077876 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.148215889930725, + "epoch": 35 + }, + { + "hidden_norms": [ + 279.6298522949219, + 261.1481018066406, + 253.67742919921875, + 250.86221313476562, + 250.6768035888672 + ], + "bp_grad_norms_per_sample_med": [ + 3.341220144648105e-05, + 3.499272861517966e-05, + 3.6701327189803123e-05, + 3.602671858971007e-05, + 3.081390605075285e-05 + ], + "bp_grad_norms_F": [ + 0.0016287019243463874, + 0.0016769150970503688, + 0.0016951658762991428, + 0.0015969424275681376, + 0.0013187138829380274 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.1451219320297241, + "epoch": 36 + }, + { + "hidden_norms": [ + 277.2866516113281, + 258.4331359863281, + 251.4995880126953, + 249.0448455810547, + 248.5166015625 + ], + "bp_grad_norms_per_sample_med": [ + 3.2723561162129045e-05, + 3.4428499930072576e-05, + 3.571901106624864e-05, + 3.4436179703334346e-05, + 2.9252587410155684e-05 + ], + "bp_grad_norms_F": [ + 0.0016638770466670394, + 0.0017149352934211493, + 0.0017208203207701445, + 0.0016291715437546372, + 0.0013402353506535292 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.145239233970642, + "epoch": 37 + }, + { + "hidden_norms": [ + 279.7109680175781, + 259.3131103515625, + 250.73587036132812, + 247.214111328125, + 249.20944213867188 + ], + "bp_grad_norms_per_sample_med": [ + 3.449835639912635e-05, + 3.682902752188966e-05, + 3.780073166126385e-05, + 3.652105442597531e-05, + 3.046718666155357e-05 + ], + "bp_grad_norms_F": [ + 0.001753124757669866, + 0.0018144651548936963, + 0.0018306451383978128, + 0.0017095789080485702, + 0.001379602705128491 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5908203125, + "loss_eval": 1.1677792072296143, + "epoch": 38 + }, + { + "hidden_norms": [ + 279.9946594238281, + 260.2458190917969, + 252.0008087158203, + 250.56716918945312, + 250.73135375976562 + ], + "bp_grad_norms_per_sample_med": [ + 3.489958180580288e-05, + 3.730110984179191e-05, + 3.791403287323192e-05, + 3.650010330602527e-05, + 3.076100256294012e-05 + ], + "bp_grad_norms_F": [ + 0.0017145961755886674, + 0.0017580300336703658, + 0.001775139826349914, + 0.0016669962788000703, + 0.0013597821816802025 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1510668992996216, + "epoch": 39 + }, + { + "hidden_norms": [ + 280.5132751464844, + 260.75970458984375, + 252.2814178466797, + 249.84548950195312, + 248.41783142089844 + ], + "bp_grad_norms_per_sample_med": [ + 3.552919588400982e-05, + 3.777973688556813e-05, + 3.952483166358434e-05, + 3.783141073654406e-05, + 3.1490348192164674e-05 + ], + "bp_grad_norms_F": [ + 0.0017431442392989993, + 0.0017984459409490228, + 0.0018199888290837407, + 0.0017078405944630504, + 0.0013792469399049878 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1412110328674316, + "epoch": 40 + }, + { + "hidden_norms": [ + 279.3873596191406, + 259.55096435546875, + 251.9462432861328, + 247.29443359375, + 247.82852172851562 + ], + "bp_grad_norms_per_sample_med": [ + 3.456972990534268e-05, + 3.654780448414385e-05, + 3.848340566037223e-05, + 3.736113285413012e-05, + 3.1597948691342026e-05 + ], + "bp_grad_norms_F": [ + 0.0017544032307341695, + 0.0018107325304299593, + 0.0018319039372727275, + 0.0017261328175663948, + 0.0013868761016055942 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1418483257293701, + "epoch": 41 + }, + { + "hidden_norms": [ + 282.4360656738281, + 261.22149658203125, + 251.49090576171875, + 247.5189208984375, + 247.03427124023438 + ], + "bp_grad_norms_per_sample_med": [ + 3.5179280530428514e-05, + 3.728548108483665e-05, + 3.779769394895993e-05, + 3.6327692214399576e-05, + 3.026284321094863e-05 + ], + "bp_grad_norms_F": [ + 0.0017881252570077777, + 0.0018441356951370835, + 0.0018691252917051315, + 0.0017487212317064404, + 0.0013921407517045736 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1468144655227661, + "epoch": 42 + }, + { + "hidden_norms": [ + 283.1267395019531, + 261.29425048828125, + 252.38563537597656, + 248.00192260742188, + 246.58505249023438 + ], + "bp_grad_norms_per_sample_med": [ + 3.485176421236247e-05, + 3.699021544889547e-05, + 3.812833165284246e-05, + 3.7145182432141155e-05, + 3.1198313081404194e-05 + ], + "bp_grad_norms_F": [ + 0.0017692983383312821, + 0.0018438888946548104, + 0.001876220339909196, + 0.0017641744343563914, + 0.0014044356066733599 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1329892873764038, + "epoch": 43 + }, + { + "hidden_norms": [ + 281.29327392578125, + 259.43359375, + 249.52906799316406, + 246.0892333984375, + 243.162109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.586204911698587e-05, + 3.787377499975264e-05, + 3.9215286960825324e-05, + 3.7436715501826257e-05, + 3.160976120852865e-05 + ], + "bp_grad_norms_F": [ + 0.0018376735970377922, + 0.0019067999674007297, + 0.0019337635021656752, + 0.0017983472207561135, + 0.001438757055439055 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.144508957862854, + "epoch": 44 + }, + { + "hidden_norms": [ + 282.5230407714844, + 259.55322265625, + 248.72308349609375, + 245.0394287109375, + 243.0651092529297 + ], + "bp_grad_norms_per_sample_med": [ + 3.6309906136011705e-05, + 3.868114436045289e-05, + 4.0484872442903e-05, + 3.8203681469894946e-05, + 3.144023139611818e-05 + ], + "bp_grad_norms_F": [ + 0.0018340122187510133, + 0.0019134157337248325, + 0.0019425065256655216, + 0.0018252682639285922, + 0.001443033921532333 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.1290326118469238, + "epoch": 45 + }, + { + "hidden_norms": [ + 280.8598327636719, + 260.14111328125, + 250.84779357910156, + 245.9561767578125, + 243.0910186767578 + ], + "bp_grad_norms_per_sample_med": [ + 3.4626806154847145e-05, + 3.693445250974037e-05, + 3.8311845855787396e-05, + 3.7721722037531435e-05, + 3.145459049846977e-05 + ], + "bp_grad_norms_F": [ + 0.0018591763218864799, + 0.0019209657330065966, + 0.0019388735527172685, + 0.001830682042054832, + 0.001447839429602027 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1423537731170654, + "epoch": 46 + }, + { + "hidden_norms": [ + 280.17266845703125, + 259.26568603515625, + 248.45452880859375, + 243.45750427246094, + 241.2735137939453 + ], + "bp_grad_norms_per_sample_med": [ + 3.609486884670332e-05, + 3.887504499289207e-05, + 4.01619981857948e-05, + 3.9294092857744545e-05, + 3.1412804673891515e-05 + ], + "bp_grad_norms_F": [ + 0.0018975000130012631, + 0.0019804267212748528, + 0.002001592656597495, + 0.0018729616422206163, + 0.0014571875799447298 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.1366385221481323, + "epoch": 47 + }, + { + "hidden_norms": [ + 281.79833984375, + 259.25860595703125, + 249.18551635742188, + 244.24977111816406, + 240.67100524902344 + ], + "bp_grad_norms_per_sample_med": [ + 3.47710374626331e-05, + 3.7153975426917896e-05, + 3.885528349201195e-05, + 3.792768620769493e-05, + 3.113777347607538e-05 + ], + "bp_grad_norms_F": [ + 0.0019318967824801803, + 0.0019981141667813063, + 0.0020311782136559486, + 0.0018996316939592361, + 0.0014788025291636586 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6162109375, + "loss_eval": 1.138331651687622, + "epoch": 48 + }, + { + "hidden_norms": [ + 282.3840637207031, + 258.1807861328125, + 248.13995361328125, + 243.45587158203125, + 239.51858520507812 + ], + "bp_grad_norms_per_sample_med": [ + 3.68369001080282e-05, + 3.935660788556561e-05, + 4.189974788459949e-05, + 3.9929436752572656e-05, + 3.188087430316955e-05 + ], + "bp_grad_norms_F": [ + 0.0019372758688405156, + 0.0020036858040839434, + 0.0020287453662604094, + 0.001896715839393437, + 0.0014835885958746076 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1377842426300049, + "epoch": 49 + }, + { + "hidden_norms": [ + 280.9283142089844, + 257.81524658203125, + 248.47984313964844, + 241.96157836914062, + 238.4756317138672 + ], + "bp_grad_norms_per_sample_med": [ + 3.7310775951482356e-05, + 3.98769298044499e-05, + 4.1753111872822046e-05, + 4.021048516733572e-05, + 3.21856678056065e-05 + ], + "bp_grad_norms_F": [ + 0.0019433718407526612, + 0.0020235073752701283, + 0.002055324148386717, + 0.0019370814552530646, + 0.0015049076173454523 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.133098840713501, + "epoch": 50 + }, + { + "hidden_norms": [ + 279.66400146484375, + 256.7322082519531, + 246.65223693847656, + 241.45947265625, + 236.65582275390625 + ], + "bp_grad_norms_per_sample_med": [ + 3.620017014327459e-05, + 3.800772174145095e-05, + 4.072795491083525e-05, + 3.888807259500027e-05, + 3.182498039677739e-05 + ], + "bp_grad_norms_F": [ + 0.0019729172345250845, + 0.002036863239482045, + 0.0020802877843379974, + 0.0019662927370518446, + 0.0015235996106639504 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1315571069717407, + "epoch": 51 + }, + { + "hidden_norms": [ + 280.00152587890625, + 258.0238037109375, + 247.4223175048828, + 240.8101348876953, + 237.3229217529297 + ], + "bp_grad_norms_per_sample_med": [ + 3.6401659599505365e-05, + 3.855170143651776e-05, + 4.065703978994861e-05, + 3.844475213554688e-05, + 3.1645795388612896e-05 + ], + "bp_grad_norms_F": [ + 0.0019983802922070026, + 0.0020701857283711433, + 0.002107742242515087, + 0.001981276087462902, + 0.0015306670684367418 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.137194037437439, + "epoch": 52 + }, + { + "hidden_norms": [ + 278.19708251953125, + 255.23036193847656, + 245.5857696533203, + 239.48196411132812, + 235.09983825683594 + ], + "bp_grad_norms_per_sample_med": [ + 3.97727417293936e-05, + 4.185501529718749e-05, + 4.392741175252013e-05, + 4.302372326492332e-05, + 3.48737376043573e-05 + ], + "bp_grad_norms_F": [ + 0.002044696593657136, + 0.00211329385638237, + 0.002144050318747759, + 0.0020148823969066143, + 0.0015573638956993818 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1354646682739258, + "epoch": 53 + }, + { + "hidden_norms": [ + 276.7043762207031, + 255.62408447265625, + 243.71484375, + 238.2984161376953, + 233.8153076171875 + ], + "bp_grad_norms_per_sample_med": [ + 3.715257116709836e-05, + 3.887641287292354e-05, + 4.099323268746957e-05, + 3.948296944145113e-05, + 3.221148654120043e-05 + ], + "bp_grad_norms_F": [ + 0.0020365805830806494, + 0.00209893099963665, + 0.0021342532709240913, + 0.0020123852882534266, + 0.0015702869277447462 + ], + "gamma_dfa": NaN, + "acc_eval": 0.623046875, + "loss_eval": 1.1295127868652344, + "epoch": 54 + }, + { + "hidden_norms": [ + 279.308349609375, + 255.30587768554688, + 243.6786651611328, + 237.71823120117188, + 232.89991760253906 + ], + "bp_grad_norms_per_sample_med": [ + 3.9407084841514006e-05, + 4.1900668293237686e-05, + 4.364689812064171e-05, + 4.154618363827467e-05, + 3.264051701989956e-05 + ], + "bp_grad_norms_F": [ + 0.0021011638455092907, + 0.002175872679799795, + 0.002217113971710205, + 0.002071501687169075, + 0.0015880379360169172 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1201554536819458, + "epoch": 55 + }, + { + "hidden_norms": [ + 276.9933166503906, + 253.379638671875, + 244.23390197753906, + 238.01930236816406, + 233.3076171875 + ], + "bp_grad_norms_per_sample_med": [ + 3.799827391048893e-05, + 4.017200990347192e-05, + 4.2665858927648515e-05, + 4.083341627847403e-05, + 3.210103386663832e-05 + ], + "bp_grad_norms_F": [ + 0.002064710482954979, + 0.0021362933330237865, + 0.0021728368010371923, + 0.0020478416699916124, + 0.0015873984666541219 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.1222728490829468, + "epoch": 56 + }, + { + "hidden_norms": [ + 276.41168212890625, + 251.91033935546875, + 241.81382751464844, + 234.8279266357422, + 230.53956604003906 + ], + "bp_grad_norms_per_sample_med": [ + 3.770063631236553e-05, + 3.94962407881394e-05, + 4.150882887188345e-05, + 4.040042040287517e-05, + 3.2475280022481456e-05 + ], + "bp_grad_norms_F": [ + 0.002123177284374833, + 0.0021965675987303257, + 0.00223328173160553, + 0.0020905195269733667, + 0.0016039537731558084 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.1091526746749878, + "epoch": 57 + }, + { + "hidden_norms": [ + 274.760986328125, + 250.0972442626953, + 239.511474609375, + 233.29798889160156, + 228.16070556640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.728809315362014e-05, + 4.0525967051507905e-05, + 4.239326517563313e-05, + 4.087138222530484e-05, + 3.216422919649631e-05 + ], + "bp_grad_norms_F": [ + 0.0021635335870087147, + 0.0022461507469415665, + 0.0022873859852552414, + 0.002144098049029708, + 0.001636566361412406 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6416015625, + "loss_eval": 1.1180500984191895, + "epoch": 58 + }, + { + "hidden_norms": [ + 273.91064453125, + 249.49452209472656, + 238.54373168945312, + 232.80734252929688, + 225.6833953857422 + ], + "bp_grad_norms_per_sample_med": [ + 3.966117583331652e-05, + 4.1986208088928834e-05, + 4.316144259064458e-05, + 4.332280877861194e-05, + 3.44519030477386e-05 + ], + "bp_grad_norms_F": [ + 0.0021825931034982204, + 0.0022617392241954803, + 0.0023092019837349653, + 0.00216560042463243, + 0.0016612708568572998 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.131789207458496, + "epoch": 59 + }, + { + "hidden_norms": [ + 274.90008544921875, + 250.0712127685547, + 238.57467651367188, + 231.15719604492188, + 225.55587768554688 + ], + "bp_grad_norms_per_sample_med": [ + 4.130819797865115e-05, + 4.363877815194428e-05, + 4.489632920012809e-05, + 4.4512398744700477e-05, + 3.470887531875633e-05 + ], + "bp_grad_norms_F": [ + 0.002240521367639303, + 0.002310203853994608, + 0.0023576009552925825, + 0.002204722724854946, + 0.0016799044096842408 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.1323366165161133, + "epoch": 60 + }, + { + "hidden_norms": [ + 275.4504699707031, + 249.5341796875, + 237.540283203125, + 230.39208984375, + 224.43321228027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.056218676851131e-05, + 4.288182390155271e-05, + 4.5818003854947165e-05, + 4.356648423708975e-05, + 3.492152245598845e-05 + ], + "bp_grad_norms_F": [ + 0.002249655080959201, + 0.0023316002916544676, + 0.002382595557719469, + 0.002231382764875889, + 0.00168902100995183 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1275749206542969, + "epoch": 61 + }, + { + "hidden_norms": [ + 273.6263122558594, + 248.43479919433594, + 234.8235321044922, + 228.0020751953125, + 222.4278106689453 + ], + "bp_grad_norms_per_sample_med": [ + 4.0597744373371825e-05, + 4.323143730289303e-05, + 4.647616151487455e-05, + 4.4688425987260416e-05, + 3.521826511132531e-05 + ], + "bp_grad_norms_F": [ + 0.002307126997038722, + 0.0023877634666860104, + 0.0024417925160378218, + 0.0022813305258750916, + 0.001714664394967258 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1252907514572144, + "epoch": 62 + }, + { + "hidden_norms": [ + 271.7508239746094, + 246.79209899902344, + 233.84280395507812, + 226.96934509277344, + 220.57888793945312 + ], + "bp_grad_norms_per_sample_med": [ + 4.177554728812538e-05, + 4.393904600874521e-05, + 4.635817458620295e-05, + 4.428510874276981e-05, + 3.396430111024529e-05 + ], + "bp_grad_norms_F": [ + 0.002355988370254636, + 0.0024527544155716896, + 0.0025022663176059723, + 0.0023387460969388485, + 0.0017370774876326323 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1249933242797852, + "epoch": 63 + }, + { + "hidden_norms": [ + 271.7035217285156, + 246.70675659179688, + 233.96661376953125, + 226.53175354003906, + 220.52359008789062 + ], + "bp_grad_norms_per_sample_med": [ + 4.2499312257859856e-05, + 4.503092714003287e-05, + 4.670799171435647e-05, + 4.5866876462241635e-05, + 3.720118911587633e-05 + ], + "bp_grad_norms_F": [ + 0.002408105880022049, + 0.0024944571778178215, + 0.002545328810811043, + 0.002381332218647003, + 0.0017641197191551328 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1418037414550781, + "epoch": 64 + }, + { + "hidden_norms": [ + 271.0970153808594, + 246.78770446777344, + 234.2436065673828, + 226.7012176513672, + 219.61680603027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.040581188746728e-05, + 4.3224725231993943e-05, + 4.4494401663541794e-05, + 4.3532105337362736e-05, + 3.4612559829838574e-05 + ], + "bp_grad_norms_F": [ + 0.0024068003986030817, + 0.002485552802681923, + 0.002538430504500866, + 0.002368941670283675, + 0.0017652952810749412 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1279454231262207, + "epoch": 65 + }, + { + "hidden_norms": [ + 270.66473388671875, + 244.8525390625, + 232.8356475830078, + 224.2222137451172, + 217.24554443359375 + ], + "bp_grad_norms_per_sample_med": [ + 4.1549992602085695e-05, + 4.493525193538517e-05, + 4.7448877012357116e-05, + 4.479651397559792e-05, + 3.5401590139372274e-05 + ], + "bp_grad_norms_F": [ + 0.002463088370859623, + 0.002551029436290264, + 0.002594881458207965, + 0.0024160456378012896, + 0.001803302438929677 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6376953125, + "loss_eval": 1.1330325603485107, + "epoch": 66 + }, + { + "hidden_norms": [ + 269.8645935058594, + 243.50497436523438, + 231.37692260742188, + 222.27967834472656, + 215.22059631347656 + ], + "bp_grad_norms_per_sample_med": [ + 4.1519095248077065e-05, + 4.487609476200305e-05, + 4.708006963483058e-05, + 4.4878328480990604e-05, + 3.578457108233124e-05 + ], + "bp_grad_norms_F": [ + 0.0024854058865457773, + 0.0025721373967826366, + 0.0026270432863384485, + 0.0024401266127824783, + 0.0018134783022105694 + ], + "gamma_dfa": NaN, + "acc_eval": 0.63671875, + "loss_eval": 1.123876690864563, + "epoch": 67 + }, + { + "hidden_norms": [ + 269.28570556640625, + 242.04359436035156, + 229.53497314453125, + 221.24327087402344, + 215.1306610107422 + ], + "bp_grad_norms_per_sample_med": [ + 4.279898348613642e-05, + 4.6176737669156864e-05, + 4.813459236174822e-05, + 4.609950337908231e-05, + 3.566763552953489e-05 + ], + "bp_grad_norms_F": [ + 0.0024860126432031393, + 0.002575797727331519, + 0.0026342689525336027, + 0.0024608916137367487, + 0.0018216874450445175 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.122079849243164, + "epoch": 68 + }, + { + "hidden_norms": [ + 268.3481140136719, + 242.3759765625, + 229.19241333007812, + 220.78233337402344, + 213.58587646484375 + ], + "bp_grad_norms_per_sample_med": [ + 4.163750054431148e-05, + 4.50872685178183e-05, + 4.8797548515722156e-05, + 4.597716542775743e-05, + 3.505409767967649e-05 + ], + "bp_grad_norms_F": [ + 0.0025033215060830116, + 0.002596172271296382, + 0.002654082840308547, + 0.002480126451700926, + 0.0018305372213944793 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6328125, + "loss_eval": 1.1238645315170288, + "epoch": 69 + }, + { + "hidden_norms": [ + 267.92425537109375, + 239.90985107421875, + 228.08212280273438, + 219.12835693359375, + 212.38052368164062 + ], + "bp_grad_norms_per_sample_med": [ + 4.42373457190115e-05, + 4.6515069698216394e-05, + 4.823393464903347e-05, + 4.762738535646349e-05, + 3.6444154829951e-05 + ], + "bp_grad_norms_F": [ + 0.0025684935972094536, + 0.002675230847671628, + 0.0027295781765133142, + 0.0025394319090992212, + 0.0018643162911757827 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.135793685913086, + "epoch": 70 + }, + { + "hidden_norms": [ + 266.2279052734375, + 239.37680053710938, + 226.3264923095703, + 218.04910278320312, + 210.68836975097656 + ], + "bp_grad_norms_per_sample_med": [ + 4.4824198994319886e-05, + 4.7638000978622586e-05, + 4.962517414242029e-05, + 4.7396664740517735e-05, + 3.5957502404926345e-05 + ], + "bp_grad_norms_F": [ + 0.002600227715447545, + 0.002714222064241767, + 0.002763595897704363, + 0.0025755097158253193, + 0.0018772372277453542 + ], + "gamma_dfa": NaN, + "acc_eval": 0.623046875, + "loss_eval": 1.123576283454895, + "epoch": 71 + }, + { + "hidden_norms": [ + 266.4837951660156, + 239.67581176757812, + 227.51805114746094, + 218.58811950683594, + 211.26596069335938 + ], + "bp_grad_norms_per_sample_med": [ + 4.245663512847386e-05, + 4.560768138617277e-05, + 4.797001020051539e-05, + 4.539322981145233e-05, + 3.4807548217941076e-05 + ], + "bp_grad_norms_F": [ + 0.0025984421372413635, + 0.002703956561163068, + 0.002762222196906805, + 0.002577459439635277, + 0.0018865292659029365 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.1362444162368774, + "epoch": 72 + }, + { + "hidden_norms": [ + 264.8100891113281, + 237.96121215820312, + 226.14822387695312, + 217.3454132080078, + 208.98077392578125 + ], + "bp_grad_norms_per_sample_med": [ + 4.217765308567323e-05, + 4.603620618581772e-05, + 4.735886977869086e-05, + 4.5346474507823586e-05, + 3.594472218537703e-05 + ], + "bp_grad_norms_F": [ + 0.0026375274173915386, + 0.0027397233061492443, + 0.0028012648690491915, + 0.0026011927984654903, + 0.0018980697495862842 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6318359375, + "loss_eval": 1.1286330223083496, + "epoch": 73 + }, + { + "hidden_norms": [ + 264.8172302246094, + 238.0478057861328, + 225.0303497314453, + 217.1344757080078, + 209.569580078125 + ], + "bp_grad_norms_per_sample_med": [ + 4.242224895278923e-05, + 4.6696859499206766e-05, + 4.831598562304862e-05, + 4.5893459173385054e-05, + 3.54531584889628e-05 + ], + "bp_grad_norms_F": [ + 0.0026500027161091566, + 0.002760941395536065, + 0.0028223067056387663, + 0.0026202781591564417, + 0.001915424014441669 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1304678916931152, + "epoch": 74 + }, + { + "hidden_norms": [ + 264.7013854980469, + 237.4438018798828, + 225.43527221679688, + 216.18502807617188, + 208.08302307128906 + ], + "bp_grad_norms_per_sample_med": [ + 4.43761091446504e-05, + 4.801220347872004e-05, + 4.9817157560028136e-05, + 4.829527097172104e-05, + 3.73583534383215e-05 + ], + "bp_grad_norms_F": [ + 0.002686889609321952, + 0.0028029615059494972, + 0.002866453491151333, + 0.002669648267328739, + 0.0019349679350852966 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.1350867748260498, + "epoch": 75 + }, + { + "hidden_norms": [ + 264.3004455566406, + 236.1824188232422, + 223.4772186279297, + 214.64682006835938, + 207.52272033691406 + ], + "bp_grad_norms_per_sample_med": [ + 4.3003376049455255e-05, + 4.6196739276638255e-05, + 4.8772617446957156e-05, + 4.7264005843317136e-05, + 3.6179160815663636e-05 + ], + "bp_grad_norms_F": [ + 0.0027191757690161467, + 0.0028310383204370737, + 0.0028950762934982777, + 0.002689448418095708, + 0.0019433586858212948 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.1378443241119385, + "epoch": 76 + }, + { + "hidden_norms": [ + 262.62811279296875, + 235.80126953125, + 222.7261199951172, + 213.42430114746094, + 205.99493408203125 + ], + "bp_grad_norms_per_sample_med": [ + 4.4399519538274035e-05, + 4.737091148854233e-05, + 4.900431667920202e-05, + 4.768445069203153e-05, + 3.608842962421477e-05 + ], + "bp_grad_norms_F": [ + 0.0027450472116470337, + 0.0028562990482896566, + 0.0029378861654549837, + 0.0027161173056811094, + 0.0019581648521125317 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6220703125, + "loss_eval": 1.137312889099121, + "epoch": 77 + }, + { + "hidden_norms": [ + 262.612060546875, + 235.62489318847656, + 222.1566925048828, + 212.93875122070312, + 205.24142456054688 + ], + "bp_grad_norms_per_sample_med": [ + 4.443951911525801e-05, + 4.7095887566683814e-05, + 4.906025424133986e-05, + 4.8352503654314205e-05, + 3.6001758417114615e-05 + ], + "bp_grad_norms_F": [ + 0.002745443256571889, + 0.002859732834622264, + 0.002942001214250922, + 0.002725319005548954, + 0.001969744684174657 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.126712441444397, + "epoch": 78 + }, + { + "hidden_norms": [ + 262.6611633300781, + 235.52174377441406, + 221.89093017578125, + 213.1799774169922, + 204.9930877685547 + ], + "bp_grad_norms_per_sample_med": [ + 4.5766752009512857e-05, + 4.834473293158226e-05, + 5.181043525226414e-05, + 4.826926306122914e-05, + 3.573719732230529e-05 + ], + "bp_grad_norms_F": [ + 0.0027218428440392017, + 0.002838012296706438, + 0.002919211983680725, + 0.0027209871914237738, + 0.001970200566574931 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1352139711380005, + "epoch": 79 + }, + { + "hidden_norms": [ + 261.58856201171875, + 234.9381103515625, + 221.2636260986328, + 211.9308624267578, + 204.54647827148438 + ], + "bp_grad_norms_per_sample_med": [ + 4.5460306864697486e-05, + 4.857210296904668e-05, + 4.9856924306368455e-05, + 4.823243580176495e-05, + 3.731804099516012e-05 + ], + "bp_grad_norms_F": [ + 0.002767088357359171, + 0.0028805267065763474, + 0.0029621378052979708, + 0.00275496207177639, + 0.001986011164262891 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.134087324142456, + "epoch": 80 + }, + { + "hidden_norms": [ + 261.3812561035156, + 234.79383850097656, + 220.678955078125, + 211.66114807128906, + 203.9405517578125 + ], + "bp_grad_norms_per_sample_med": [ + 4.64644399471581e-05, + 5.052189590060152e-05, + 5.2927574870409444e-05, + 5.0570299208629876e-05, + 3.7252495530992746e-05 + ], + "bp_grad_norms_F": [ + 0.0027735778130590916, + 0.002885127207264304, + 0.0029686433263123035, + 0.002763227093964815, + 0.0019980284851044416 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.135728359222412, + "epoch": 81 + }, + { + "hidden_norms": [ + 261.2560729980469, + 233.66014099121094, + 220.25682067871094, + 211.13511657714844, + 203.18130493164062 + ], + "bp_grad_norms_per_sample_med": [ + 4.6268629375845194e-05, + 4.9701800890034065e-05, + 5.169105133973062e-05, + 5.069339385954663e-05, + 3.80978781322483e-05 + ], + "bp_grad_norms_F": [ + 0.0028223153203725815, + 0.0029419492930173874, + 0.0030234854202717543, + 0.002805375959724188, + 0.002015760401263833 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1317980289459229, + "epoch": 82 + }, + { + "hidden_norms": [ + 260.62255859375, + 233.12937927246094, + 219.89907836914062, + 210.4191436767578, + 202.494873046875 + ], + "bp_grad_norms_per_sample_med": [ + 4.5126867917133495e-05, + 4.8572586820228025e-05, + 5.1520797569537535e-05, + 4.971070302417502e-05, + 3.838812335743569e-05 + ], + "bp_grad_norms_F": [ + 0.0028271761257201433, + 0.002944816369563341, + 0.003029909450560808, + 0.0028170389123260975, + 0.002025141380727291 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.1392892599105835, + "epoch": 83 + }, + { + "hidden_norms": [ + 260.0465393066406, + 232.27760314941406, + 218.845458984375, + 209.7770233154297, + 201.92831420898438 + ], + "bp_grad_norms_per_sample_med": [ + 4.730001455754973e-05, + 5.118208355270326e-05, + 5.1580365834524855e-05, + 4.936498589813709e-05, + 3.706002826220356e-05 + ], + "bp_grad_norms_F": [ + 0.0028656981885433197, + 0.002991823712363839, + 0.0030798574443906546, + 0.0028517318423837423, + 0.0020406947005540133 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1393200159072876, + "epoch": 84 + }, + { + "hidden_norms": [ + 259.99285888671875, + 232.2432403564453, + 218.6685333251953, + 209.5802001953125, + 201.7836456298828 + ], + "bp_grad_norms_per_sample_med": [ + 4.4883607188239694e-05, + 4.9325379222864285e-05, + 5.1563201850512996e-05, + 4.9446705816080794e-05, + 3.641278817667626e-05 + ], + "bp_grad_norms_F": [ + 0.002843427937477827, + 0.0029685739427804947, + 0.0030620063189417124, + 0.0028350763022899628, + 0.0020346841774880886 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.136763572692871, + "epoch": 85 + }, + { + "hidden_norms": [ + 259.7002868652344, + 232.1937713623047, + 218.6339569091797, + 209.42572021484375, + 201.48532104492188 + ], + "bp_grad_norms_per_sample_med": [ + 4.557083229883574e-05, + 5.006462743040174e-05, + 5.1964529120596126e-05, + 5.040188261773437e-05, + 3.70733359886799e-05 + ], + "bp_grad_norms_F": [ + 0.002866365248337388, + 0.0029951538890600204, + 0.0030862949788570404, + 0.0028592217713594437, + 0.002047886373475194 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.139750361442566, + "epoch": 86 + }, + { + "hidden_norms": [ + 259.22808837890625, + 232.3558807373047, + 218.42848205566406, + 209.1579132080078, + 201.5212860107422 + ], + "bp_grad_norms_per_sample_med": [ + 4.5765504182782024e-05, + 4.875436570728198e-05, + 5.104453521198593e-05, + 5.005718412576243e-05, + 3.675639891298488e-05 + ], + "bp_grad_norms_F": [ + 0.002878013998270035, + 0.003002135781571269, + 0.0030916042160242796, + 0.002861205255612731, + 0.0020479748491197824 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1344283819198608, + "epoch": 87 + }, + { + "hidden_norms": [ + 259.1551513671875, + 232.05300903320312, + 218.15708923339844, + 208.9161834716797, + 201.6800537109375 + ], + "bp_grad_norms_per_sample_med": [ + 4.611797339748591e-05, + 4.964259278494865e-05, + 5.252738264971413e-05, + 5.0600574468262494e-05, + 3.820879283011891e-05 + ], + "bp_grad_norms_F": [ + 0.0028855716809630394, + 0.003010405693203211, + 0.0031016215216368437, + 0.002874146681278944, + 0.0020545709412544966 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.135157823562622, + "epoch": 88 + }, + { + "hidden_norms": [ + 259.21893310546875, + 231.72747802734375, + 217.7665252685547, + 208.59022521972656, + 201.1155548095703 + ], + "bp_grad_norms_per_sample_med": [ + 4.6835561079205945e-05, + 5.060776311438531e-05, + 5.325842721504159e-05, + 5.128757766215131e-05, + 3.774667493416928e-05 + ], + "bp_grad_norms_F": [ + 0.002893448108807206, + 0.0030188425444066525, + 0.0031124993693083525, + 0.002883171197026968, + 0.002058332087472081 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6298828125, + "loss_eval": 1.1357543468475342, + "epoch": 89 + }, + { + "hidden_norms": [ + 258.88385009765625, + 230.9880828857422, + 217.33352661132812, + 208.3406524658203, + 200.54083251953125 + ], + "bp_grad_norms_per_sample_med": [ + 4.6940938773332164e-05, + 5.0942355301231146e-05, + 5.368283382267691e-05, + 5.184212204767391e-05, + 3.746367656276561e-05 + ], + "bp_grad_norms_F": [ + 0.0029224599711596966, + 0.0030530549120157957, + 0.003145798807963729, + 0.0029114321805536747, + 0.0020718672312796116 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.1398890018463135, + "epoch": 90 + }, + { + "hidden_norms": [ + 258.7764587402344, + 231.19357299804688, + 217.22779846191406, + 207.97528076171875, + 199.982421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.70306295028422e-05, + 5.185308327781968e-05, + 5.281997437123209e-05, + 5.1426530262688175e-05, + 3.7254685594234616e-05 + ], + "bp_grad_norms_F": [ + 0.002924826927483082, + 0.0030514320824295282, + 0.0031429482623934746, + 0.0029119658283889294, + 0.0020754521246999502 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.138663411140442, + "epoch": 91 + }, + { + "hidden_norms": [ + 258.7837829589844, + 230.58901977539062, + 217.062255859375, + 207.7244873046875, + 199.89395141601562 + ], + "bp_grad_norms_per_sample_med": [ + 4.688404078478925e-05, + 5.141457950230688e-05, + 5.3491079597733915e-05, + 5.087396493763663e-05, + 3.739634121302515e-05 + ], + "bp_grad_norms_F": [ + 0.0029230716172605753, + 0.0030518025159835815, + 0.0031419326551258564, + 0.002910938812419772, + 0.00207503535784781 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1365739107131958, + "epoch": 92 + }, + { + "hidden_norms": [ + 258.7561950683594, + 230.4254913330078, + 217.07546997070312, + 207.6160125732422, + 199.7816162109375 + ], + "bp_grad_norms_per_sample_med": [ + 4.680828351411037e-05, + 5.096250242786482e-05, + 5.211709503782913e-05, + 5.09246347064618e-05, + 3.779645703616552e-05 + ], + "bp_grad_norms_F": [ + 0.002931967144832015, + 0.0030605625361204147, + 0.00315046776086092, + 0.0029180829878896475, + 0.002077121753245592 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1363377571105957, + "epoch": 93 + }, + { + "hidden_norms": [ + 258.76409912109375, + 230.5386505126953, + 216.76475524902344, + 207.16859436035156, + 199.2827911376953 + ], + "bp_grad_norms_per_sample_med": [ + 4.749056097352877e-05, + 5.2020419389009476e-05, + 5.3769603255204856e-05, + 5.178397987037897e-05, + 3.789216498262249e-05 + ], + "bp_grad_norms_F": [ + 0.0029493479523807764, + 0.0030784173868596554, + 0.0031682881526649, + 0.0029316784348338842, + 0.002084067091345787 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6298828125, + "loss_eval": 1.1382873058319092, + "epoch": 94 + }, + { + "hidden_norms": [ + 258.7884826660156, + 230.40945434570312, + 216.70376586914062, + 207.1806182861328, + 199.41917419433594 + ], + "bp_grad_norms_per_sample_med": [ + 4.741501834359951e-05, + 5.169968062546104e-05, + 5.352263542590663e-05, + 5.053802306065336e-05, + 3.758866660064086e-05 + ], + "bp_grad_norms_F": [ + 0.002947731176391244, + 0.003076745430007577, + 0.0031680618412792683, + 0.0029321794863790274, + 0.0020845714025199413 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.1382077932357788, + "epoch": 95 + }, + { + "hidden_norms": [ + 258.766845703125, + 230.38992309570312, + 216.7628173828125, + 207.26092529296875, + 199.36366271972656 + ], + "bp_grad_norms_per_sample_med": [ + 4.718741183751263e-05, + 5.1928480388596654e-05, + 5.3666040912503377e-05, + 5.089692058390938e-05, + 3.752821430680342e-05 + ], + "bp_grad_norms_F": [ + 0.002943811472505331, + 0.003073457395657897, + 0.0031646883580833673, + 0.0029298998415470123, + 0.002084212377667427 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.138296365737915, + "epoch": 96 + }, + { + "hidden_norms": [ + 258.8481140136719, + 230.38389587402344, + 216.7748260498047, + 207.24560546875, + 199.39401245117188 + ], + "bp_grad_norms_per_sample_med": [ + 4.728109706775285e-05, + 5.156427505426109e-05, + 5.3663239668821916e-05, + 5.139272616361268e-05, + 3.7748181057395414e-05 + ], + "bp_grad_norms_F": [ + 0.002947240835055709, + 0.003076959168538451, + 0.0031680231913924217, + 0.0029323517810553312, + 0.0020851469598710537 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1388041973114014, + "epoch": 97 + }, + { + "hidden_norms": [ + 258.77734375, + 230.3692626953125, + 216.7212677001953, + 207.1890869140625, + 199.34091186523438 + ], + "bp_grad_norms_per_sample_med": [ + 4.7204313887050375e-05, + 5.154019163455814e-05, + 5.373918611439876e-05, + 5.1062332204310223e-05, + 3.7904177588643506e-05 + ], + "bp_grad_norms_F": [ + 0.0029484080150723457, + 0.0030780842062085867, + 0.0031695417128503323, + 0.0029333126731216908, + 0.002085541607812047 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.138832688331604, + "epoch": 98 + }, + { + "hidden_norms": [ + 258.7897644042969, + 230.38552856445312, + 216.73997497558594, + 207.1963653564453, + 199.38656616210938 + ], + "bp_grad_norms_per_sample_med": [ + 4.726059705717489e-05, + 5.1730185077758506e-05, + 5.3854040743317455e-05, + 5.0960083171958104e-05, + 3.793121504713781e-05 + ], + "bp_grad_norms_F": [ + 0.00294809159822762, + 0.003077775239944458, + 0.003169153118506074, + 0.0029330949764698744, + 0.0020853858441114426 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1388249397277832, + "epoch": 99 + }, + { + "hidden_norms": [ + 258.7891845703125, + 230.38888549804688, + 216.73963928222656, + 207.19769287109375, + 199.4077606201172 + ], + "bp_grad_norms_per_sample_med": [ + 4.725577309727669e-05, + 5.174486432224512e-05, + 5.38085114385467e-05, + 5.098402107250877e-05, + 3.7933263229206204e-05 + ], + "bp_grad_norms_F": [ + 0.002948042470961809, + 0.0030777468346059322, + 0.003169137053191662, + 0.002933081705123186, + 0.0020853858441114426 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.1387826204299927, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010079912608489394, + 0.0010035138111561537, + 0.0009970925748348236, + 0.0009936393471434712, + 0.000986678060144186 + ], + "bp_grad_norms_F": [ + 0.035574451088905334, + 0.035288579761981964, + 0.035048045217990875, + 0.0346725769340992, + 0.03439188003540039 + ], + "gamma_dfa": 0.0033523982419865206, + "acc_eval": 0.0927734375, + "loss_eval": 2.4863264560699463, + "epoch": 0 + }, + { + "hidden_norms": [ + 900.3377685546875, + 3463.92626953125, + 6660.5166015625, + 10478.5126953125, + 13466.513671875 + ], + "bp_grad_norms_per_sample_med": [ + 2.017142833210528e-06, + 7.972002435963077e-07, + 7.783806381667091e-07, + 7.758338256280695e-07, + 7.810436954969191e-07 + ], + "bp_grad_norms_F": [ + 0.00013047464017290622, + 7.321321754716337e-05, + 7.131113670766354e-05, + 7.113779429346323e-05, + 7.09498199285008e-05 + ], + "gamma_dfa": 0.1028625147882849, + "acc_eval": 0.2861328125, + "loss_eval": 1.970402717590332, + "epoch": 1 + }, + { + "hidden_norms": [ + 1784.805419921875, + 14085.2138671875, + 36523.9375, + 61422.50390625, + 73870.3359375 + ], + "bp_grad_norms_per_sample_med": [ + 9.087140711017128e-07, + 1.772240381114898e-07, + 1.705584367073243e-07, + 1.7156033038645546e-07, + 1.728751612972701e-07 + ], + "bp_grad_norms_F": [ + 4.7445286327274516e-05, + 1.1973520486208145e-05, + 9.698592293716501e-06, + 9.335580216429662e-06, + 9.154121471510734e-06 + ], + "gamma_dfa": 0.09588160619023256, + "acc_eval": 0.298828125, + "loss_eval": 1.9628738164901733, + "epoch": 2 + }, + { + "hidden_norms": [ + 2670.88134765625, + 35761.4921875, + 99927.7890625, + 170223.953125, + 201448.390625 + ], + "bp_grad_norms_per_sample_med": [ + 5.815078338855528e-07, + 7.772520405069372e-08, + 7.527528111950232e-08, + 7.557918735301428e-08, + 7.57173737042649e-08 + ], + "bp_grad_norms_F": [ + 2.8944486984983087e-05, + 3.2005805223889183e-06, + 2.6765355869429186e-06, + 2.639568720042007e-06, + 2.6436800908413716e-06 + ], + "gamma_dfa": 0.09442083747126162, + "acc_eval": 0.2900390625, + "loss_eval": 1.9821033477783203, + "epoch": 3 + }, + { + "hidden_norms": [ + 3506.001220703125, + 70233.9375, + 205054.078125, + 348792.375, + 416698.5625 + ], + "bp_grad_norms_per_sample_med": [ + 4.5228594558466284e-07, + 4.338783554658221e-08, + 4.114394869247917e-08, + 4.122260932604149e-08, + 4.124275321260029e-08 + ], + "bp_grad_norms_F": [ + 2.319143823115155e-05, + 1.7165241388283903e-06, + 1.3772670399703202e-06, + 1.3777447520624264e-06, + 1.3796359326079255e-06 + ], + "gamma_dfa": 0.09172606549691409, + "acc_eval": 0.298828125, + "loss_eval": 1.9661527872085571, + "epoch": 4 + }, + { + "hidden_norms": [ + 4351.04052734375, + 120982.0390625, + 361547.03125, + 633667.3125, + 764198.75 + ], + "bp_grad_norms_per_sample_med": [ + 3.632259790720127e-07, + 2.6118947005215887e-08, + 2.4913996199416033e-08, + 2.494128636953974e-08, + 2.4942012899487054e-08 + ], + "bp_grad_norms_F": [ + 1.894752676889766e-05, + 1.1090510270150844e-06, + 8.424218549407669e-07, + 8.403117703892349e-07, + 8.407336054006009e-07 + ], + "gamma_dfa": 0.08992433547973633, + "acc_eval": 0.2900390625, + "loss_eval": 1.980475664138794, + "epoch": 5 + }, + { + "hidden_norms": [ + 5174.9833984375, + 189817.0625, + 576763.3125, + 1012734.125, + 1235217.5 + ], + "bp_grad_norms_per_sample_med": [ + 3.340334444601467e-07, + 1.826493090106851e-08, + 1.7263264595612782e-08, + 1.730784759956805e-08, + 1.7305337607353977e-08 + ], + "bp_grad_norms_F": [ + 1.7139096598839387e-05, + 7.582453918075771e-07, + 5.794162802885694e-07, + 5.812879635413992e-07, + 5.813373604723893e-07 + ], + "gamma_dfa": 0.08752730302512646, + "acc_eval": 0.3056640625, + "loss_eval": 1.9696743488311768, + "epoch": 6 + }, + { + "hidden_norms": [ + 5963.3935546875, + 276686.75, + 861517.375, + 1555059.75, + 1913322.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.834741223978199e-07, + 1.3120247110975924e-08, + 1.2326365705916942e-08, + 1.2353129186237766e-08, + 1.2349524958210623e-08 + ], + "bp_grad_norms_F": [ + 1.4978587387304287e-05, + 5.169860628484457e-07, + 4.2094282548532647e-07, + 4.222391680741566e-07, + 4.222146685606276e-07 + ], + "gamma_dfa": 0.08884745300747454, + "acc_eval": 0.2919921875, + "loss_eval": 1.9592503309249878, + "epoch": 7 + }, + { + "hidden_norms": [ + 6751.1630859375, + 390990.65625, + 1268157.625, + 2303462.75, + 2850455.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.5272595394199016e-07, + 9.644952392307005e-09, + 9.213153795428752e-09, + 9.189856875480018e-09, + 9.217835383878992e-09 + ], + "bp_grad_norms_F": [ + 1.3214407772466075e-05, + 3.7820277043465467e-07, + 3.14011003865744e-07, + 3.1468064776163374e-07, + 3.146610936255456e-07 + ], + "gamma_dfa": 0.08774545323103666, + "acc_eval": 0.3115234375, + "loss_eval": 1.9636309146881104, + "epoch": 8 + }, + { + "hidden_norms": [ + 7557.10302734375, + 541741.25, + 1767146.375, + 3237576.25, + 4005094.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.3122942138797953e-07, + 7.519741274109037e-09, + 7.2226606917524805e-09, + 7.218183384338772e-09, + 7.221534037427091e-09 + ], + "bp_grad_norms_F": [ + 1.196970697492361e-05, + 2.9184533900661336e-07, + 2.4720966962377133e-07, + 2.4752529270699597e-07, + 2.4754368155299744e-07 + ], + "gamma_dfa": 0.08941872720606625, + "acc_eval": 0.2900390625, + "loss_eval": 1.9587393999099731, + "epoch": 9 + }, + { + "hidden_norms": [ + 8353.015625, + 720288.5625, + 2367034.25, + 4437438.5, + 5500873.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.1009967099416826e-07, + 6.096115612308495e-09, + 5.8281148795913396e-09, + 5.816529036195561e-09, + 5.823292070772368e-09 + ], + "bp_grad_norms_F": [ + 1.0853039384528529e-05, + 2.2833219759377243e-07, + 1.979581298883204e-07, + 1.9814572738141578e-07, + 1.9820384977720096e-07 + ], + "gamma_dfa": 0.09132041316479445, + "acc_eval": 0.2978515625, + "loss_eval": 1.9605882167816162, + "epoch": 10 + }, + { + "hidden_norms": [ + 9134.4443359375, + 924688.8125, + 3108971.25, + 5809310.0, + 7180875.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.9402843065563502e-07, + 4.977510403847418e-09, + 4.8141264308299014e-09, + 4.791541829973767e-09, + 4.794175723077387e-09 + ], + "bp_grad_norms_F": [ + 1.0063903573609423e-05, + 1.9364638603747153e-07, + 1.6622837506474752e-07, + 1.6636218447274587e-07, + 1.6641583044929575e-07 + ], + "gamma_dfa": 0.08994872949551791, + "acc_eval": 0.2822265625, + "loss_eval": 1.9717106819152832, + "epoch": 11 + }, + { + "hidden_norms": [ + 9934.0107421875, + 1171186.5, + 4059807.75, + 7477705.0, + 9248714.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.802942222184356e-07, + 4.213630333538276e-09, + 4.032348677185382e-09, + 4.031016409555832e-09, + 4.033940292913485e-09 + ], + "bp_grad_norms_F": [ + 9.375374247611035e-06, + 1.60658984782458e-07, + 1.398711617639492e-07, + 1.399746452079853e-07, + 1.4004145043600147e-07 + ], + "gamma_dfa": 0.09168496390338987, + "acc_eval": 0.2998046875, + "loss_eval": 1.9513648748397827, + "epoch": 12 + }, + { + "hidden_norms": [ + 10690.2216796875, + 1474348.375, + 5210694.5, + 9539616.0, + 11795722.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7011585384807404e-07, + 3.5948770626959003e-09, + 3.444458496204561e-09, + 3.439692752849055e-09, + 3.4398179860062328e-09 + ], + "bp_grad_norms_F": [ + 8.913790225051343e-06, + 1.346561759874021e-07, + 1.1880944583708697e-07, + 1.1887690476442003e-07, + 1.1894194784645151e-07 + ], + "gamma_dfa": 0.0931803259300068, + "acc_eval": 0.3134765625, + "loss_eval": 1.959463357925415, + "epoch": 13 + }, + { + "hidden_norms": [ + 11428.3076171875, + 1789460.25, + 6431273.0, + 11810251.0, + 14610525.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5823535193248972e-07, + 3.1298097447063356e-09, + 3.012203153573978e-09, + 3.010908633527265e-09, + 3.010648619294898e-09 + ], + "bp_grad_norms_F": [ + 8.233506378019229e-06, + 1.1668681310084139e-07, + 1.0298786889961775e-07, + 1.0303519104581937e-07, + 1.0309597797686365e-07 + ], + "gamma_dfa": 0.09336384548805654, + "acc_eval": 0.2861328125, + "loss_eval": 1.9515889883041382, + "epoch": 14 + }, + { + "hidden_norms": [ + 12175.4384765625, + 2177908.0, + 7886216.5, + 14475684.0, + 17927020.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5137742082060868e-07, + 2.705691448667835e-09, + 2.5981530260565933e-09, + 2.5995214869567462e-09, + 2.6000293029682098e-09 + ], + "bp_grad_norms_F": [ + 7.800716048222966e-06, + 1.0053086896277819e-07, + 8.984200405848242e-08, + 8.987952071493055e-08, + 8.993622913067156e-08 + ], + "gamma_dfa": 0.09357930033002049, + "acc_eval": 0.2978515625, + "loss_eval": 1.9580912590026855, + "epoch": 15 + }, + { + "hidden_norms": [ + 12918.6787109375, + 2622644.5, + 9573671.0, + 17460572.0, + 21682046.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.432233602827182e-07, + 2.359643591631766e-09, + 2.2714441438864696e-09, + 2.2688442236074025e-09, + 2.2694950363444377e-09 + ], + "bp_grad_norms_F": [ + 7.43454029361601e-06, + 8.846858889910436e-08, + 7.942762891843813e-08, + 7.945371294226788e-08, + 7.950914238108453e-08 + ], + "gamma_dfa": 0.09332277777139097, + "acc_eval": 0.30859375, + "loss_eval": 1.9656270742416382, + "epoch": 16 + }, + { + "hidden_norms": [ + 13676.931640625, + 3144179.5, + 11421599.0, + 20832254.0, + 25907438.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3402345189206244e-07, + 2.1064472388587774e-09, + 2.0263852817947736e-09, + 2.0199610872850826e-09, + 2.0222397090208233e-09 + ], + "bp_grad_norms_F": [ + 6.909830062795663e-06, + 7.773559929091789e-08, + 7.076827301943922e-08, + 7.077783692466255e-08, + 7.082799413637986e-08 + ], + "gamma_dfa": 0.0945073509356007, + "acc_eval": 0.296875, + "loss_eval": 1.9510960578918457, + "epoch": 17 + }, + { + "hidden_norms": [ + 14410.64453125, + 3691622.0, + 13302875.0, + 24659928.0, + 30700242.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2569752527724631e-07, + 1.8540845525549798e-09, + 1.8018908587436044e-09, + 1.8003264434796051e-09, + 1.802896276714705e-09 + ], + "bp_grad_norms_F": [ + 6.58303315503872e-06, + 6.894391191281102e-08, + 6.3350469758916e-08, + 6.336826174901944e-08, + 6.340740554833246e-08 + ], + "gamma_dfa": 0.09388192358892411, + "acc_eval": 0.30859375, + "loss_eval": 1.9456725120544434, + "epoch": 18 + }, + { + "hidden_norms": [ + 15102.634765625, + 4270070.0, + 15687016.0, + 28858048.0, + 35882240.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2314617947595252e-07, + 1.6925943979728686e-09, + 1.6383979728473719e-09, + 1.6367472932543592e-09, + 1.6394127166918793e-09 + ], + "bp_grad_norms_F": [ + 6.343140285025584e-06, + 6.240136940505181e-08, + 5.757489418556361e-08, + 5.7587019597349354e-08, + 5.7624333749117795e-08 + ], + "gamma_dfa": 0.09518493304494768, + "acc_eval": 0.302734375, + "loss_eval": 1.9497833251953125, + "epoch": 19 + }, + { + "hidden_norms": [ + 15809.6728515625, + 4913181.0, + 18109688.0, + 33281892.0, + 41436228.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1704661773137559e-07, + 1.533212445892218e-09, + 1.483607681151966e-09, + 1.4837684414459318e-09, + 1.4838255069093975e-09 + ], + "bp_grad_norms_F": [ + 6.079233116906835e-06, + 5.7217945936827164e-08, + 5.270470992968512e-08, + 5.2718213794378244e-08, + 5.2752689327917324e-08 + ], + "gamma_dfa": 0.09407007653499022, + "acc_eval": 0.2958984375, + "loss_eval": 1.961036205291748, + "epoch": 20 + }, + { + "hidden_norms": [ + 16522.783203125, + 5620503.0, + 20819020.0, + 38391960.0, + 47723272.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1146808986950418e-07, + 1.4118024527220996e-09, + 1.3678460586419305e-09, + 1.3669514409286876e-09, + 1.3668450815629285e-09 + ], + "bp_grad_norms_F": [ + 5.778397280664649e-06, + 5.162353389209784e-08, + 4.8153967924235985e-08, + 4.816252285877454e-08, + 4.8193449231348495e-08 + ], + "gamma_dfa": 0.09494083630852401, + "acc_eval": 0.2958984375, + "loss_eval": 1.9576481580734253, + "epoch": 21 + }, + { + "hidden_norms": [ + 17230.27734375, + 6437730.5, + 23789486.0, + 43960328.0, + 54569096.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0952022932997352e-07, + 1.2858689668604484e-09, + 1.246260317167014e-09, + 1.2462959553261044e-09, + 1.2484926426026277e-09 + ], + "bp_grad_norms_F": [ + 5.637425147142494e-06, + 4.732414282671016e-08, + 4.430494371376881e-08, + 4.431280586913999e-08, + 4.434128086927558e-08 + ], + "gamma_dfa": 0.09481688600499183, + "acc_eval": 0.2900390625, + "loss_eval": 1.9625442028045654, + "epoch": 22 + }, + { + "hidden_norms": [ + 17916.12890625, + 7217473.5, + 26969020.0, + 49888804.0, + 62010184.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.043977349013403e-07, + 1.1912204556097095e-09, + 1.159051632448893e-09, + 1.1590449711107453e-09, + 1.159014662022173e-09 + ], + "bp_grad_norms_F": [ + 5.385433269111672e-06, + 4.3334623001101136e-08, + 4.083162963297582e-08, + 4.0836408032873805e-08, + 4.0863898931320364e-08 + ], + "gamma_dfa": 0.0946647283853963, + "acc_eval": 0.2939453125, + "loss_eval": 1.9656811952590942, + "epoch": 23 + }, + { + "hidden_norms": [ + 18617.46875, + 8095365.0, + 30241864.0, + 56059896.0, + 69702984.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.001103129283365e-07, + 1.1034658742303805e-09, + 1.0674757744411068e-09, + 1.0666105776380164e-09, + 1.0677670969627684e-09 + ], + "bp_grad_norms_F": [ + 5.150916877028067e-06, + 3.999087283546032e-08, + 3.779740609388682e-08, + 3.780221291549424e-08, + 3.782682256314729e-08 + ], + "gamma_dfa": 0.09509630355751142, + "acc_eval": 0.296875, + "loss_eval": 1.9476948976516724, + "epoch": 24 + }, + { + "hidden_norms": [ + 19248.7890625, + 9047595.0, + 33634812.0, + 62495088.0, + 77796536.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.749370377676314e-08, + 1.0280801765460978e-09, + 9.980430926148642e-10, + 9.978470272287154e-10, + 9.990493987643845e-10 + ], + "bp_grad_norms_F": [ + 5.017087005398935e-06, + 3.7442834610601494e-08, + 3.536156611971819e-08, + 3.536548476290591e-08, + 3.538822213045023e-08 + ], + "gamma_dfa": 0.09479212731821463, + "acc_eval": 0.2861328125, + "loss_eval": 1.9604804515838623, + "epoch": 25 + }, + { + "hidden_norms": [ + 19902.470703125, + 10030725.0, + 37252656.0, + 69351704.0, + 86270768.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.411947843318558e-08, + 9.563448921667828e-10, + 9.361866837309663e-10, + 9.359075736625755e-10, + 9.361766917237446e-10 + ], + "bp_grad_norms_F": [ + 4.873440502706217e-06, + 3.4947159832654506e-08, + 3.313299146157078e-08, + 3.3137865784738096e-08, + 3.315915364510147e-08 + ], + "gamma_dfa": 0.09510701123508625, + "acc_eval": 0.2978515625, + "loss_eval": 1.9498941898345947, + "epoch": 26 + }, + { + "hidden_norms": [ + 20513.66796875, + 11086393.0, + 41223968.0, + 76828584.0, + 95694480.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.249640697817085e-08, + 9.003223166992314e-10, + 8.743661350507637e-10, + 8.736535939135592e-10, + 8.752278901624777e-10 + ], + "bp_grad_norms_F": [ + 4.75014485346037e-06, + 3.290759664764664e-08, + 3.1125043875590563e-08, + 3.1127818544973707e-08, + 3.11488683735206e-08 + ], + "gamma_dfa": 0.09552363055991009, + "acc_eval": 0.2841796875, + "loss_eval": 1.9527215957641602, + "epoch": 27 + }, + { + "hidden_norms": [ + 21161.345703125, + 12263719.0, + 45533684.0, + 84877296.0, + 105753224.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.900443049242313e-08, + 8.457264888406257e-10, + 8.261510919815862e-10, + 8.261567541190118e-10, + 8.276057061884501e-10 + ], + "bp_grad_norms_F": [ + 4.624974280886818e-06, + 3.0792985938887796e-08, + 2.9227694042788244e-08, + 2.9232776199705768e-08, + 2.9251353339532216e-08 + ], + "gamma_dfa": 0.09527035459177569, + "acc_eval": 0.2890625, + "loss_eval": 1.950648307800293, + "epoch": 28 + }, + { + "hidden_norms": [ + 21787.568359375, + 13358760.0, + 49723396.0, + 92840264.0, + 115901424.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.79872459336184e-08, + 8.034463094830357e-10, + 7.846168159630906e-10, + 7.837334670135476e-10, + 7.841179927581265e-10 + ], + "bp_grad_norms_F": [ + 4.530191290541552e-06, + 2.9184068495169413e-08, + 2.7723606521590227e-08, + 2.7726789753046432e-08, + 2.7744931685447227e-08 + ], + "gamma_dfa": 0.09598725114483386, + "acc_eval": 0.2919921875, + "loss_eval": 1.9504928588867188, + "epoch": 29 + }, + { + "hidden_norms": [ + 22378.34765625, + 14611837.0, + 54335560.0, + 101350864.0, + 126710488.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.497670478391228e-08, + 7.560595483013799e-10, + 7.353461728420996e-10, + 7.342743080229752e-10, + 7.348425756781296e-10 + ], + "bp_grad_norms_F": [ + 4.383283339848276e-06, + 2.7485034692631416e-08, + 2.6182895851434296e-08, + 2.618475392068831e-08, + 2.620201833281044e-08 + ], + "gamma_dfa": 0.09509110247017816, + "acc_eval": 0.2958984375, + "loss_eval": 1.9564056396484375, + "epoch": 30 + }, + { + "hidden_norms": [ + 22972.798828125, + 15931348.0, + 59291124.0, + 110237776.0, + 138020368.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.252197858382715e-08, + 7.193445838993284e-10, + 6.977300404109599e-10, + 6.966639487515636e-10, + 6.977723399081981e-10 + ], + "bp_grad_norms_F": [ + 4.255563453625655e-06, + 2.5971447215056287e-08, + 2.4833044065530885e-08, + 2.4835205891804435e-08, + 2.4851219748711628e-08 + ], + "gamma_dfa": 0.0951943755208049, + "acc_eval": 0.30859375, + "loss_eval": 1.9508299827575684, + "epoch": 31 + }, + { + "hidden_norms": [ + 23525.689453125, + 17283022.0, + 64234984.0, + 119317480.0, + 149347744.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.036072784989301e-08, + 6.884249836858203e-10, + 6.666004415123439e-10, + 6.656397100179845e-10, + 6.674217845059616e-10 + ], + "bp_grad_norms_F": [ + 4.212505245959619e-06, + 2.4864668546342727e-08, + 2.375563212808629e-08, + 2.3757841915994504e-08, + 2.3773273127858374e-08 + ], + "gamma_dfa": 0.09534151147818193, + "acc_eval": 0.294921875, + "loss_eval": 1.95639967918396, + "epoch": 32 + }, + { + "hidden_norms": [ + 24102.95703125, + 18811968.0, + 69193392.0, + 128823560.0, + 161700704.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.921565980950618e-08, + 6.526117424243694e-10, + 6.390621365426341e-10, + 6.381262185328751e-10, + 6.384171524764781e-10 + ], + "bp_grad_norms_F": [ + 4.09630820286111e-06, + 2.3687046990517047e-08, + 2.2686869272092736e-08, + 2.2687553169475905e-08, + 2.2702355551018627e-08 + ], + "gamma_dfa": 0.0947199320216896, + "acc_eval": 0.2880859375, + "loss_eval": 1.960526943206787, + "epoch": 33 + }, + { + "hidden_norms": [ + 24687.955078125, + 20313542.0, + 74389296.0, + 138258576.0, + 173791248.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.937118340350935e-08, + 6.360312831965587e-10, + 6.205357339084117e-10, + 6.196035906569364e-10, + 6.196675395031548e-10 + ], + "bp_grad_norms_F": [ + 4.070574505021796e-06, + 2.2864428572688666e-08, + 2.1894738466698982e-08, + 2.1895061763643753e-08, + 2.1909569269951135e-08 + ], + "gamma_dfa": 0.09556430295924656, + "acc_eval": 0.2822265625, + "loss_eval": 1.97263765335083, + "epoch": 34 + }, + { + "hidden_norms": [ + 25226.55078125, + 21851366.0, + 80000824.0, + 148574480.0, + 186595952.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.592127104771862e-08, + 6.044152955908544e-10, + 5.892630272619215e-10, + 5.896260146798227e-10, + 5.900769872724254e-10 + ], + "bp_grad_norms_F": [ + 3.966818894696189e-06, + 2.1824051898988728e-08, + 2.093374718015184e-08, + 2.093443285389185e-08, + 2.0947767964685227e-08 + ], + "gamma_dfa": 0.09587649442255497, + "acc_eval": 0.298828125, + "loss_eval": 1.9495991468429565, + "epoch": 35 + }, + { + "hidden_norms": [ + 25759.50390625, + 23391128.0, + 85561480.0, + 158667136.0, + 198961760.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.493858333873504e-08, + 5.860726903783586e-10, + 5.731417562770957e-10, + 5.733850616529423e-10, + 5.73569580719635e-10 + ], + "bp_grad_norms_F": [ + 3.896147973136976e-06, + 2.099926454945944e-08, + 2.0218029916918567e-08, + 2.0218159590967844e-08, + 2.0230830344303286e-08 + ], + "gamma_dfa": 0.09563440945930779, + "acc_eval": 0.294921875, + "loss_eval": 1.954901099205017, + "epoch": 36 + }, + { + "hidden_norms": [ + 26267.0859375, + 25111884.0, + 91593392.0, + 169479968.0, + 212491408.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.387680511783401e-08, + 5.612941222921108e-10, + 5.475105369079358e-10, + 5.468157038279742e-10, + 5.479569020749864e-10 + ], + "bp_grad_norms_F": [ + 3.838411430479027e-06, + 2.0261547106770195e-08, + 1.9493551661753372e-08, + 1.949278782831243e-08, + 1.9505332460312275e-08 + ], + "gamma_dfa": 0.09528586096712388, + "acc_eval": 0.302734375, + "loss_eval": 1.9556396007537842, + "epoch": 37 + }, + { + "hidden_norms": [ + 26761.587890625, + 26706742.0, + 97554944.0, + 180407616.0, + 226265728.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.260722156843258e-08, + 5.407673198121188e-10, + 5.32608401826451e-10, + 5.31698407524317e-10, + 5.328552044048251e-10 + ], + "bp_grad_norms_F": [ + 3.7372303722804645e-06, + 1.9519287519642603e-08, + 1.8807236656925852e-08, + 1.8806394663783976e-08, + 1.8818212765836506e-08 + ], + "gamma_dfa": 0.09491665422683582, + "acc_eval": 0.2890625, + "loss_eval": 1.963973879814148, + "epoch": 38 + }, + { + "hidden_norms": [ + 27302.328125, + 28336562.0, + 103781320.0, + 191401696.0, + 240130064.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.187927053564636e-08, + 5.305865746763061e-10, + 5.205576525391109e-10, + 5.20661624925367e-10, + 5.217564713611011e-10 + ], + "bp_grad_norms_F": [ + 3.734877054739627e-06, + 1.88775892695503e-08, + 1.8220953634795478e-08, + 1.8220212893993448e-08, + 1.8231482101782603e-08 + ], + "gamma_dfa": 0.0957885464449646, + "acc_eval": 0.302734375, + "loss_eval": 1.9604723453521729, + "epoch": 39 + }, + { + "hidden_norms": [ + 27801.44140625, + 30051226.0, + 109945288.0, + 203002704.0, + 254881776.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.894305215610075e-08, + 5.044222262107212e-10, + 4.932855790507062e-10, + 4.934126440758746e-10, + 4.940316489232544e-10 + ], + "bp_grad_norms_F": [ + 3.610647127061384e-06, + 1.8150354108570355e-08, + 1.753623024569606e-08, + 1.7534704355171016e-08, + 1.7545806585417267e-08 + ], + "gamma_dfa": 0.09517717303242534, + "acc_eval": 0.2958984375, + "loss_eval": 1.9589688777923584, + "epoch": 40 + }, + { + "hidden_norms": [ + 28266.703125, + 31897594.0, + 116263888.0, + 215162448.0, + 270215296.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.807566421684896e-08, + 4.835814526593651e-10, + 4.775287942848649e-10, + 4.773109685274335e-10, + 4.784843632421598e-10 + ], + "bp_grad_norms_F": [ + 3.590413371057366e-06, + 1.7596850199197434e-08, + 1.705259222717359e-08, + 1.7050926004458233e-08, + 1.7061644541627174e-08 + ], + "gamma_dfa": 0.0961545761092566, + "acc_eval": 0.30859375, + "loss_eval": 1.9595096111297607, + "epoch": 41 + }, + { + "hidden_norms": [ + 28755.66015625, + 33582328.0, + 122605680.0, + 226378480.0, + 284438688.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.689399612014313e-08, + 4.746543713629592e-10, + 4.678599174745557e-10, + 4.68083238835959e-10, + 4.683119447790318e-10 + ], + "bp_grad_norms_F": [ + 3.5121436212648405e-06, + 1.7124380136124273e-08, + 1.6555107507087996e-08, + 1.655343240258844e-08, + 1.656368908697914e-08 + ], + "gamma_dfa": 0.09569378412561491, + "acc_eval": 0.287109375, + "loss_eval": 1.9612011909484863, + "epoch": 42 + }, + { + "hidden_norms": [ + 29227.5703125, + 35443612.0, + 129229904.0, + 238040368.0, + 299000064.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.582912703834154e-08, + 4.575871348500016e-10, + 4.493441174702184e-10, + 4.48520082185766e-10, + 4.485415650012925e-10 + ], + "bp_grad_norms_F": [ + 3.4321058137720684e-06, + 1.6602150765265833e-08, + 1.6083028242519504e-08, + 1.6080972997656318e-08, + 1.609118882583971e-08 + ], + "gamma_dfa": 0.09606127908773487, + "acc_eval": 0.306640625, + "loss_eval": 1.9551353454589844, + "epoch": 43 + }, + { + "hidden_norms": [ + 29665.798828125, + 37243032.0, + 135839760.0, + 250377328.0, + 314433920.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.588776813032382e-08, + 4.4936304677278827e-10, + 4.4115311403913893e-10, + 4.406963405312325e-10, + 4.4055534220710513e-10 + ], + "bp_grad_norms_F": [ + 3.3984799756581197e-06, + 1.6157997606569552e-08, + 1.564128204734061e-08, + 1.5638891071034777e-08, + 1.564865925729464e-08 + ], + "gamma_dfa": 0.09547593681054423, + "acc_eval": 0.2900390625, + "loss_eval": 1.9503705501556396, + "epoch": 44 + }, + { + "hidden_norms": [ + 30096.123046875, + 39014544.0, + 141817168.0, + 261217760.0, + 328197248.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.549055342475185e-08, + 4.3991607578952596e-10, + 4.348142956800416e-10, + 4.3428130536149467e-10, + 4.349899329625373e-10 + ], + "bp_grad_norms_F": [ + 3.382166596566094e-06, + 1.5776649320287106e-08, + 1.5299850275596327e-08, + 1.5297549893489304e-08, + 1.5307026757227504e-08 + ], + "gamma_dfa": 0.09610002994304523, + "acc_eval": 0.2998046875, + "loss_eval": 1.952854037284851, + "epoch": 45 + }, + { + "hidden_norms": [ + 30554.974609375, + 40873780.0, + 148087312.0, + 272436128.0, + 342258336.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.514299855098216e-08, + 4.291983157767021e-10, + 4.228755678958862e-10, + 4.2251957488304015e-10, + 4.227345695717588e-10 + ], + "bp_grad_norms_F": [ + 3.3793355669331504e-06, + 1.5485536408732514e-08, + 1.4993654318118388e-08, + 1.499121538017789e-08, + 1.5000590991576246e-08 + ], + "gamma_dfa": 0.09557013235462364, + "acc_eval": 0.3017578125, + "loss_eval": 1.9633105993270874, + "epoch": 46 + }, + { + "hidden_norms": [ + 30981.4765625, + 42548124.0, + 153904848.0, + 283882112.0, + 356627616.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.343542224840348e-08, + 4.1842326825580756e-10, + 4.139384113255318e-10, + 4.141494092113618e-10, + 4.1477912771092917e-10 + ], + "bp_grad_norms_F": [ + 3.3046233056666097e-06, + 1.508391989091251e-08, + 1.4620022525946297e-08, + 1.4617588028897899e-08, + 1.462664656060042e-08 + ], + "gamma_dfa": 0.09567815247282851, + "acc_eval": 0.296875, + "loss_eval": 1.958325982093811, + "epoch": 47 + }, + { + "hidden_norms": [ + 31383.2578125, + 44333160.0, + 160058736.0, + 295685184.0, + 371288096.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.18988522660402e-08, + 4.057836289206307e-10, + 4.0004452528386025e-10, + 3.9987613220660023e-10, + 4.004964138104583e-10 + ], + "bp_grad_norms_F": [ + 3.2255043151963037e-06, + 1.4663311453944061e-08, + 1.4252069746589768e-08, + 1.424969386931707e-08, + 1.4258660918642363e-08 + ], + "gamma_dfa": 0.09609431066201068, + "acc_eval": 0.302734375, + "loss_eval": 1.9508600234985352, + "epoch": 48 + }, + { + "hidden_norms": [ + 31750.03125, + 46204072.0, + 166757840.0, + 307620864.0, + 385856832.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.133605978675405e-08, + 3.9670436380312424e-10, + 3.904292722456404e-10, + 3.9002356899686674e-10, + 3.9039230181892037e-10 + ], + "bp_grad_norms_F": [ + 3.2063508115243167e-06, + 1.4354414545891814e-08, + 1.3938280751801813e-08, + 1.3935605558401676e-08, + 1.394456727865645e-08 + ], + "gamma_dfa": 0.09565898558139452, + "acc_eval": 0.310546875, + "loss_eval": 1.9467211961746216, + "epoch": 49 + }, + { + "hidden_norms": [ + 32133.1484375, + 47907484.0, + 173083168.0, + 319475424.0, + 400677984.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.030914079246941e-08, + 3.8645733835274143e-10, + 3.81215115030642e-10, + 3.812981042017327e-10, + 3.811861937208505e-10 + ], + "bp_grad_norms_F": [ + 3.177025973855052e-06, + 1.4072985443647212e-08, + 1.368274382684831e-08, + 1.3679918531295243e-08, + 1.368857649453048e-08 + ], + "gamma_dfa": 0.09606298332801089, + "acc_eval": 0.30078125, + "loss_eval": 1.9524433612823486, + "epoch": 50 + }, + { + "hidden_norms": [ + 32483.716796875, + 49794588.0, + 179046160.0, + 330962240.0, + 414954912.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.051003254015086e-08, + 3.794887737385011e-10, + 3.751928767670165e-10, + 3.752734789586043e-10, + 3.7574471312140645e-10 + ], + "bp_grad_norms_F": [ + 3.154751766487607e-06, + 1.3766489281863414e-08, + 1.339402011524271e-08, + 1.3391274755747418e-08, + 1.3399712450734569e-08 + ], + "gamma_dfa": 0.09573800596626825, + "acc_eval": 0.3046875, + "loss_eval": 1.952356219291687, + "epoch": 51 + }, + { + "hidden_norms": [ + 32825.296875, + 51662352.0, + 185889568.0, + 343223360.0, + 430225696.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.9168662858155585e-08, + 3.7636679883767954e-10, + 3.7184264001233203e-10, + 3.7154498921943e-10, + 3.7157116272723556e-10 + ], + "bp_grad_norms_F": [ + 3.0909043289284455e-06, + 1.346105005239906e-08, + 1.3102917861829155e-08, + 1.3100156515122308e-08, + 1.3108366836434016e-08 + ], + "gamma_dfa": 0.09539097778178984, + "acc_eval": 0.291015625, + "loss_eval": 1.9585516452789307, + "epoch": 52 + }, + { + "hidden_norms": [ + 33148.9453125, + 53487464.0, + 192413680.0, + 354830112.0, + 444651488.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.949418024897568e-08, + 3.692673389288359e-10, + 3.6510769407804844e-10, + 3.6480282683548637e-10, + 3.65057900575394e-10 + ], + "bp_grad_norms_F": [ + 3.0807416351308348e-06, + 1.3205962545725924e-08, + 1.2856014031115137e-08, + 1.2853148767533185e-08, + 1.2861222309368259e-08 + ], + "gamma_dfa": 0.09566472223013989, + "acc_eval": 0.2880859375, + "loss_eval": 1.9538320302963257, + "epoch": 53 + }, + { + "hidden_norms": [ + 33465.359375, + 55258308.0, + 198680688.0, + 365875680.0, + 458634560.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.9228732141036744e-08, + 3.640579226971141e-10, + 3.6045816331764513e-10, + 3.6029040861862427e-10, + 3.6025293859154317e-10 + ], + "bp_grad_norms_F": [ + 3.058711854464491e-06, + 1.294814744312589e-08, + 1.2619584488504643e-08, + 1.2616848898971966e-08, + 1.2624772338654111e-08 + ], + "gamma_dfa": 0.09607254836737411, + "acc_eval": 0.2998046875, + "loss_eval": 1.9489495754241943, + "epoch": 54 + }, + { + "hidden_norms": [ + 33763.53125, + 56920656.0, + 204554208.0, + 376681216.0, + 472155680.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.756867338391203e-08, + 3.4894195866108646e-10, + 3.4671995829960167e-10, + 3.464649955819965e-10, + 3.4666045034548176e-10 + ], + "bp_grad_norms_F": [ + 3.092292217843351e-06, + 1.2733584853208413e-08, + 1.2427238793577544e-08, + 1.2424394846277664e-08, + 1.2432122886707475e-08 + ], + "gamma_dfa": 0.09629741777825984, + "acc_eval": 0.3017578125, + "loss_eval": 1.9477816820144653, + "epoch": 55 + }, + { + "hidden_norms": [ + 34061.03125, + 58650568.0, + 210577584.0, + 387585472.0, + 485747168.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.70959208801014e-08, + 3.4928168690662176e-10, + 3.46003392603933e-10, + 3.4562114281655454e-10, + 3.4606426058125805e-10 + ], + "bp_grad_norms_F": [ + 3.178826091243536e-06, + 1.2512856528701377e-08, + 1.2208544397651622e-08, + 1.2205639166040783e-08, + 1.2213387634574246e-08 + ], + "gamma_dfa": 0.09542209599749185, + "acc_eval": 0.3046875, + "loss_eval": 1.9549853801727295, + "epoch": 56 + }, + { + "hidden_norms": [ + 34344.76171875, + 60294200.0, + 216821792.0, + 398493824.0, + 499371840.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.7367511629990986e-08, + 3.416208427253764e-10, + 3.378898272288211e-10, + 3.377436663676292e-10, + 3.386138314187548e-10 + ], + "bp_grad_norms_F": [ + 3.2603361432848033e-06, + 1.2295201301526504e-08, + 1.2022674411582557e-08, + 1.2019833128817936e-08, + 1.2027326690144946e-08 + ], + "gamma_dfa": 0.09621504079404986, + "acc_eval": 0.294921875, + "loss_eval": 1.9597327709197998, + "epoch": 57 + }, + { + "hidden_norms": [ + 34621.87109375, + 62004936.0, + 222707536.0, + 409299680.0, + 512662208.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.6534943837505125e-08, + 3.356194766546139e-10, + 3.3068575655548216e-10, + 3.3087257933495096e-10, + 3.3104252672444545e-10 + ], + "bp_grad_norms_F": [ + 3.325955731270369e-06, + 1.2073825494951507e-08, + 1.1812358202689666e-08, + 1.1809524025352403e-08, + 1.1816909228912209e-08 + ], + "gamma_dfa": 0.09621665377926547, + "acc_eval": 0.3017578125, + "loss_eval": 1.9411261081695557, + "epoch": 58 + }, + { + "hidden_norms": [ + 34892.69921875, + 63619864.0, + 228332912.0, + 419524224.0, + 525474048.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.6131870707076814e-08, + 3.3116545616884707e-10, + 3.281262206389357e-10, + 3.2806185545908306e-10, + 3.281940552657403e-10 + ], + "bp_grad_norms_F": [ + 3.306513235656894e-06, + 1.1909767394513437e-08, + 1.165356344756674e-08, + 1.1650684861308491e-08, + 1.1658000786951561e-08 + ], + "gamma_dfa": 0.09604647590094828, + "acc_eval": 0.30078125, + "loss_eval": 1.9494699239730835, + "epoch": 59 + }, + { + "hidden_norms": [ + 35134.12890625, + 65285940.0, + 233831760.0, + 429654048.0, + 537931904.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.542536740676951e-08, + 3.2549649087165733e-10, + 3.224807365587168e-10, + 3.2198288479889925e-10, + 3.2189514942437825e-10 + ], + "bp_grad_norms_F": [ + 3.2077998639579164e-06, + 1.1713971126425804e-08, + 1.1479991179896842e-08, + 1.147721562233528e-08, + 1.1484392992144876e-08 + ], + "gamma_dfa": 0.09610223810159368, + "acc_eval": 0.298828125, + "loss_eval": 1.947687029838562, + "epoch": 60 + }, + { + "hidden_norms": [ + 35383.89453125, + 66896316.0, + 239557328.0, + 439032672.0, + 549329344.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.55890657949476e-08, + 3.2204855449080583e-10, + 3.1836161484832814e-10, + 3.185524344306856e-10, + 3.1883792828146795e-10 + ], + "bp_grad_norms_F": [ + 3.19811397275771e-06, + 1.1587792059231106e-08, + 1.1364262419988336e-08, + 1.1361324325775968e-08, + 1.1368459951199839e-08 + ], + "gamma_dfa": 0.09620415412791772, + "acc_eval": 0.3046875, + "loss_eval": 1.9550621509552002, + "epoch": 61 + }, + { + "hidden_norms": [ + 35603.75390625, + 68393976.0, + 244906672.0, + 448738336.0, + 561222784.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.4847117070266904e-08, + 3.208481536010055e-10, + 3.1700905789300293e-10, + 3.1679742162893376e-10, + 3.169834394967097e-10 + ], + "bp_grad_norms_F": [ + 3.1413667329616146e-06, + 1.1423910706298557e-08, + 1.1206890526693769e-08, + 1.1204000394116065e-08, + 1.1211046313519546e-08 + ], + "gamma_dfa": 0.09554143912100699, + "acc_eval": 0.302734375, + "loss_eval": 1.9572508335113525, + "epoch": 62 + }, + { + "hidden_norms": [ + 35840.75, + 69909448.0, + 249732624.0, + 457790144.0, + 572499584.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.482150200464275e-08, + 3.132541726014182e-10, + 3.1085201079861235e-10, + 3.1094149477439714e-10, + 3.1132280087220465e-10 + ], + "bp_grad_norms_F": [ + 3.1111580938159022e-06, + 1.1274166489272375e-08, + 1.1068144623038734e-08, + 1.1065306892987792e-08, + 1.1072265770906142e-08 + ], + "gamma_dfa": 0.09598036286843126, + "acc_eval": 0.2939453125, + "loss_eval": 1.9514048099517822, + "epoch": 63 + }, + { + "hidden_norms": [ + 36044.14453125, + 71301840.0, + 254043168.0, + 466339968.0, + 583323328.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.41697069422753e-08, + 3.088812261520246e-10, + 3.0549318630335165e-10, + 3.051613683968668e-10, + 3.050981411956144e-10 + ], + "bp_grad_norms_F": [ + 3.063583790208213e-06, + 1.1131353616633533e-08, + 1.0936378025405702e-08, + 1.0933466576545925e-08, + 1.0940373940115933e-08 + ], + "gamma_dfa": 0.09560732997124433, + "acc_eval": 0.3076171875, + "loss_eval": 1.9496949911117554, + "epoch": 64 + }, + { + "hidden_norms": [ + 36240.3046875, + 72753064.0, + 259111488.0, + 475471840.0, + 594591872.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.367900612895937e-08, + 3.0714322751812517e-10, + 3.043856555695612e-10, + 3.04040070897571e-10, + 3.043043039774318e-10 + ], + "bp_grad_norms_F": [ + 3.096502268817858e-06, + 1.1002981636920595e-08, + 1.0808172135057248e-08, + 1.0805252692591694e-08, + 1.0812099660029162e-08 + ], + "gamma_dfa": 0.09588889799488243, + "acc_eval": 0.2978515625, + "loss_eval": 1.951111078262329, + "epoch": 65 + }, + { + "hidden_norms": [ + 36427.96484375, + 74044192.0, + 263715872.0, + 483414560.0, + 604480512.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.3715726977543454e-08, + 3.022930794571721e-10, + 2.992986969374556e-10, + 2.9908994725325044e-10, + 2.9924074329557016e-10 + ], + "bp_grad_norms_F": [ + 3.0333421818795614e-06, + 1.0890616408687492e-08, + 1.0706762587631147e-08, + 1.0703858244198727e-08, + 1.071066169089363e-08 + ], + "gamma_dfa": 0.09630945282333414, + "acc_eval": 0.30078125, + "loss_eval": 1.949332594871521, + "epoch": 66 + }, + { + "hidden_norms": [ + 36613.015625, + 75303768.0, + 267802576.0, + 490809920.0, + 613719616.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.348211473688025e-08, + 3.012197435925401e-10, + 2.9878169383046327e-10, + 2.9841951132425493e-10, + 2.984068825373498e-10 + ], + "bp_grad_norms_F": [ + 3.008998646691907e-06, + 1.0781116444036343e-08, + 1.0603616651394532e-08, + 1.0600682998074262e-08, + 1.0607434930420823e-08 + ], + "gamma_dfa": 0.0960872639734589, + "acc_eval": 0.310546875, + "loss_eval": 1.9464266300201416, + "epoch": 67 + }, + { + "hidden_norms": [ + 36784.2265625, + 76478576.0, + 271792224.0, + 498011968.0, + 622710336.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.403291680750044e-08, + 3.0129157502223336e-10, + 2.977850743768329e-10, + 2.975975854635493e-10, + 2.9797145306709183e-10 + ], + "bp_grad_norms_F": [ + 2.9997727324371226e-06, + 1.0701310948491027e-08, + 1.052768094922385e-08, + 1.0524773941256171e-08, + 1.0531463701113353e-08 + ], + "gamma_dfa": 0.09624087948759552, + "acc_eval": 0.2939453125, + "loss_eval": 1.9560136795043945, + "epoch": 68 + }, + { + "hidden_norms": [ + 36953.8671875, + 77622176.0, + 275419712.0, + 504592704.0, + 630923392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.3204310290766443e-08, + 2.9739929963135125e-10, + 2.9424951364376284e-10, + 2.9405439194718497e-10, + 2.94715835069681e-10 + ], + "bp_grad_norms_F": [ + 2.95851918963308e-06, + 1.0595774924127e-08, + 1.0427880781094245e-08, + 1.042505370918434e-08, + 1.0431726593651547e-08 + ], + "gamma_dfa": 0.09637677710998105, + "acc_eval": 0.2978515625, + "loss_eval": 1.950129747390747, + "epoch": 69 + }, + { + "hidden_norms": [ + 37103.0546875, + 78713944.0, + 279082240.0, + 511376384.0, + 639270976.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.3287564583115454e-08, + 2.9558042125010786e-10, + 2.94046592630437e-10, + 2.936023091315576e-10, + 2.9353278141464045e-10 + ], + "bp_grad_norms_F": [ + 2.9398986498563318e-06, + 1.0504810354916572e-08, + 1.034081797968156e-08, + 1.0337980249630618e-08, + 1.0344593626143705e-08 + ], + "gamma_dfa": 0.09638382289995207, + "acc_eval": 0.29296875, + "loss_eval": 1.9502758979797363, + "epoch": 70 + }, + { + "hidden_norms": [ + 37248.1015625, + 79737480.0, + 282511072.0, + 517720224.0, + 647238976.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.260229585246634e-08, + 2.899096518405031e-10, + 2.8717414557455356e-10, + 2.8704966181791747e-10, + 2.871551885164081e-10 + ], + "bp_grad_norms_F": [ + 2.9307011573109776e-06, + 1.0423523377767197e-08, + 1.0264206373733487e-08, + 1.0261346439222052e-08, + 1.0267889649639983e-08 + ], + "gamma_dfa": 0.0963258501906239, + "acc_eval": 0.3017578125, + "loss_eval": 1.949232816696167, + "epoch": 71 + }, + { + "hidden_norms": [ + 37381.0390625, + 80657776.0, + 285833920.0, + 523738208.0, + 654706368.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.2669339112298985e-08, + 2.929272380214343e-10, + 2.8994415202099333e-10, + 2.898675188767186e-10, + 2.900694684448979e-10 + ], + "bp_grad_norms_F": [ + 2.912831860157894e-06, + 1.0341300260563457e-08, + 1.018425699328418e-08, + 1.0181377518847512e-08, + 1.0187909182945987e-08 + ], + "gamma_dfa": 0.09613002402329585, + "acc_eval": 0.2958984375, + "loss_eval": 1.9482614994049072, + "epoch": 72 + }, + { + "hidden_norms": [ + 37505.28515625, + 81612512.0, + 289044000.0, + 529475296.0, + 661837376.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.200942965188915e-08, + 2.875680804592662e-10, + 2.8434027354862224e-10, + 2.8415880759524725e-10, + 2.840882251664567e-10 + ], + "bp_grad_norms_F": [ + 2.9117632038833108e-06, + 1.0266585803719863e-08, + 1.0111568471415922e-08, + 1.0108765380323348e-08, + 1.0115227766505086e-08 + ], + "gamma_dfa": 0.09620579873444512, + "acc_eval": 0.2958984375, + "loss_eval": 1.949747085571289, + "epoch": 73 + }, + { + "hidden_norms": [ + 37622.05078125, + 82508960.0, + 292035424.0, + 534928544.0, + 668760064.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.211632014834322e-08, + 2.8521121575586506e-10, + 2.8250474182200946e-10, + 2.822122813217476e-10, + 2.8265498275281686e-10 + ], + "bp_grad_norms_F": [ + 2.9012180675636046e-06, + 1.0211213208322079e-08, + 1.0059093114023199e-08, + 1.0056256272150677e-08, + 1.0062689348444565e-08 + ], + "gamma_dfa": 0.09616703895881074, + "acc_eval": 0.2998046875, + "loss_eval": 1.9510722160339355, + "epoch": 74 + }, + { + "hidden_norms": [ + 37739.125, + 83378024.0, + 294890528.0, + 540384832.0, + 675452224.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.20015284166675e-08, + 2.812508559379978e-10, + 2.7935267987722057e-10, + 2.7908611532900807e-10, + 2.792987507937994e-10 + ], + "bp_grad_norms_F": [ + 2.858193283827859e-06, + 1.0136964156970407e-08, + 9.987989102455685e-09, + 9.985158477832101e-09, + 9.991581784163373e-09 + ], + "gamma_dfa": 0.09625962336212979, + "acc_eval": 0.306640625, + "loss_eval": 1.949669599533081, + "epoch": 75 + }, + { + "hidden_norms": [ + 37841.23828125, + 84099792.0, + 297324992.0, + 545087552.0, + 681202944.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.180555717743118e-08, + 2.81841883165157e-10, + 2.790032094246442e-10, + 2.7877883335136744e-10, + 2.790592201762365e-10 + ], + "bp_grad_norms_F": [ + 2.8341921733954223e-06, + 1.0072185752107998e-08, + 9.925220645357058e-09, + 9.922425547870262e-09, + 9.928815103421584e-09 + ], + "gamma_dfa": 0.09619013674819143, + "acc_eval": 0.2958984375, + "loss_eval": 1.947105884552002, + "epoch": 76 + }, + { + "hidden_norms": [ + 37933.76953125, + 84846568.0, + 299677280.0, + 549384448.0, + 686714688.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.136923775239666e-08, + 2.810240096184913e-10, + 2.7924595968897847e-10, + 2.7894245246962157e-10, + 2.789228015220857e-10 + ], + "bp_grad_norms_F": [ + 2.822413307512761e-06, + 1.0021487639733095e-08, + 9.876163886701761e-09, + 9.873332373899757e-09, + 9.879697948633748e-09 + ], + "gamma_dfa": 0.09583658421615837, + "acc_eval": 0.306640625, + "loss_eval": 1.9495177268981934, + "epoch": 77 + }, + { + "hidden_norms": [ + 38020.0, + 85562224.0, + 301864096.0, + 553597760.0, + 691941760.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.160018545780076e-08, + 2.8198060553208393e-10, + 2.797063691772905e-10, + 2.7946911451692813e-10, + 2.796869680299352e-10 + ], + "bp_grad_norms_F": [ + 2.7969890652457252e-06, + 9.96650406648314e-09, + 9.82430670148915e-09, + 9.821477853222405e-09, + 9.827816782603804e-09 + ], + "gamma_dfa": 0.09604255547674256, + "acc_eval": 0.298828125, + "loss_eval": 1.9492969512939453, + "epoch": 78 + }, + { + "hidden_norms": [ + 38095.6171875, + 86194680.0, + 304047168.0, + 557639872.0, + 696924224.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.120950063997043e-08, + 2.782411523405415e-10, + 2.750368821580196e-10, + 2.7475391406461824e-10, + 2.748750949077561e-10 + ], + "bp_grad_norms_F": [ + 2.7781038625107612e-06, + 9.913026843832995e-09, + 9.771905951083681e-09, + 9.769114406310564e-09, + 9.775444453907767e-09 + ], + "gamma_dfa": 0.09590470486728009, + "acc_eval": 0.3037109375, + "loss_eval": 1.9471888542175293, + "epoch": 79 + }, + { + "hidden_norms": [ + 38161.02734375, + 86761784.0, + 305935040.0, + 560989248.0, + 701039488.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.1234330555871566e-08, + 2.762826911695271e-10, + 2.737765292248895e-10, + 2.7344454478495095e-10, + 2.735327242486818e-10 + ], + "bp_grad_norms_F": [ + 2.7851888262375724e-06, + 9.883654783493512e-09, + 9.742406881230181e-09, + 9.73962688277652e-09, + 9.74590719238222e-09 + ], + "gamma_dfa": 0.0961023918025603, + "acc_eval": 0.306640625, + "loss_eval": 1.9466722011566162, + "epoch": 80 + }, + { + "hidden_norms": [ + 38225.30859375, + 87283448.0, + 307635232.0, + 564114432.0, + 704943360.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.112997669698416e-08, + 2.7494201360056536e-10, + 2.7230390164945106e-10, + 2.724628855865774e-10, + 2.7264715485308955e-10 + ], + "bp_grad_norms_F": [ + 2.775808070509811e-06, + 9.851329529908526e-09, + 9.711465409623088e-09, + 9.708682746634167e-09, + 9.714950621741991e-09 + ], + "gamma_dfa": 0.09609865310994792, + "acc_eval": 0.30078125, + "loss_eval": 1.9487848281860352, + "epoch": 81 + }, + { + "hidden_norms": [ + 38286.74609375, + 87760048.0, + 309161312.0, + 566976960.0, + 708521920.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.100326561091606e-08, + 2.750530914141791e-10, + 2.7221699894219853e-10, + 2.720162428637707e-10, + 2.72086408958927e-10 + ], + "bp_grad_norms_F": [ + 2.76197988569038e-06, + 9.813816426174071e-09, + 9.67496749382235e-09, + 9.672206147115503e-09, + 9.678448265049155e-09 + ], + "gamma_dfa": 0.09604053818475222, + "acc_eval": 0.3017578125, + "loss_eval": 1.946324110031128, + "epoch": 82 + }, + { + "hidden_norms": [ + 38345.609375, + 88198008.0, + 310597792.0, + 569628928.0, + 711849600.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.150431903189201e-08, + 2.739733162560043e-10, + 2.706747326275405e-10, + 2.703801071923806e-10, + 2.703643420254309e-10 + ], + "bp_grad_norms_F": [ + 2.754284651018679e-06, + 9.79015535307326e-09, + 9.652834087603424e-09, + 9.650069188182897e-09, + 9.656329069684944e-09 + ], + "gamma_dfa": 0.09618356187274912, + "acc_eval": 0.3017578125, + "loss_eval": 1.952025294303894, + "epoch": 83 + }, + { + "hidden_norms": [ + 38393.00390625, + 88631992.0, + 311868064.0, + 571956672.0, + 714769600.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.135545677603659e-08, + 2.741361304625656e-10, + 2.7016161530113436e-10, + 2.7007868164119486e-10, + 2.702876256144293e-10 + ], + "bp_grad_norms_F": [ + 2.7439270979812136e-06, + 9.758214680744004e-09, + 9.621899721423688e-09, + 9.619145480144198e-09, + 9.625373387223135e-09 + ], + "gamma_dfa": 0.09624775896372739, + "acc_eval": 0.302734375, + "loss_eval": 1.9458943605422974, + "epoch": 84 + }, + { + "hidden_norms": [ + 38432.8515625, + 89003520.0, + 313081504.0, + 574038272.0, + 717387392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.1023032909824906e-08, + 2.709044100157598e-10, + 2.6825267007701825e-10, + 2.6804419794856926e-10, + 2.6862953528272726e-10 + ], + "bp_grad_norms_F": [ + 2.7511816824699054e-06, + 9.751657259471358e-09, + 9.615223284242802e-09, + 9.612453943930177e-09, + 9.618667640154399e-09 + ], + "gamma_dfa": 0.09613665863071219, + "acc_eval": 0.3095703125, + "loss_eval": 1.9508092403411865, + "epoch": 85 + }, + { + "hidden_norms": [ + 38471.12890625, + 89306096.0, + 314023616.0, + 575863488.0, + 719706496.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.104102740460803e-08, + 2.722161940305057e-10, + 2.698590240157728e-10, + 2.697040091259595e-10, + 2.698894441266475e-10 + ], + "bp_grad_norms_F": [ + 2.731306722125737e-06, + 9.717195048608573e-09, + 9.582218574166745e-09, + 9.579466997422514e-09, + 9.585680693646736e-09 + ], + "gamma_dfa": 0.09615167022275273, + "acc_eval": 0.296875, + "loss_eval": 1.9497017860412598, + "epoch": 86 + }, + { + "hidden_norms": [ + 38506.49609375, + 89593104.0, + 314968672.0, + 577511168.0, + 721761728.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.099763100702148e-08, + 2.7151769721456276e-10, + 2.698610224172171e-10, + 2.6943663966605413e-10, + 2.6953861365086595e-10 + ], + "bp_grad_norms_F": [ + 2.73057457889081e-06, + 9.698882585951196e-09, + 9.564125491579034e-09, + 9.561379243905321e-09, + 9.567577841096409e-09 + ], + "gamma_dfa": 0.09604650201799814, + "acc_eval": 0.2998046875, + "loss_eval": 1.948227882385254, + "epoch": 87 + }, + { + "hidden_norms": [ + 38536.46875, + 89827632.0, + 315715328.0, + 578913664.0, + 723505408.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.074277709127273e-08, + 2.7221166987168033e-10, + 2.7026783588901537e-10, + 2.700663026544703e-10, + 2.7004307123768e-10 + ], + "bp_grad_norms_F": [ + 2.727413175307447e-06, + 9.684548274435656e-09, + 9.549998125635284e-09, + 9.547248325247892e-09, + 9.553437152476363e-09 + ], + "gamma_dfa": 0.09602321147394832, + "acc_eval": 0.2978515625, + "loss_eval": 1.9482835531234741, + "epoch": 88 + }, + { + "hidden_norms": [ + 38560.86328125, + 90036944.0, + 316345728.0, + 580143808.0, + 725043392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.10075821580358e-08, + 2.70407807256845e-10, + 2.6787719265009e-10, + 2.677959520802631e-10, + 2.679190480581184e-10 + ], + "bp_grad_norms_F": [ + 2.7208343453821726e-06, + 9.672045386821537e-09, + 9.538242196072133e-09, + 9.535500389290519e-09, + 9.541698986481606e-09 + ], + "gamma_dfa": 0.09616725159867201, + "acc_eval": 0.3017578125, + "loss_eval": 1.9490463733673096, + "epoch": 89 + }, + { + "hidden_norms": [ + 38581.62890625, + 90197056.0, + 316901888.0, + 581085248.0, + 726214080.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.062888064344406e-08, + 2.7050772732906125e-10, + 2.680498045748436e-10, + 2.6770730077174676e-10, + 2.6768456895531756e-10 + ], + "bp_grad_norms_F": [ + 2.7148839762958232e-06, + 9.659022026653474e-09, + 9.525311206459719e-09, + 9.522568511499685e-09, + 9.528759115084995e-09 + ], + "gamma_dfa": 0.09604255046724575, + "acc_eval": 0.2998046875, + "loss_eval": 1.9472681283950806, + "epoch": 90 + }, + { + "hidden_norms": [ + 38598.60546875, + 90331488.0, + 317399072.0, + 581959360.0, + 727306816.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.070089059699967e-08, + 2.706254109696715e-10, + 2.6912555517455417e-10, + 2.687201572371123e-10, + 2.686441624710767e-10 + ], + "bp_grad_norms_F": [ + 2.7157270778843667e-06, + 9.650602983413137e-09, + 9.516874399650987e-09, + 9.514130816512534e-09, + 9.520310761956807e-09 + ], + "gamma_dfa": 0.09604466614109697, + "acc_eval": 0.296875, + "loss_eval": 1.9475460052490234, + "epoch": 91 + }, + { + "hidden_norms": [ + 38612.046875, + 90438432.0, + 317761152.0, + 582634240.0, + 728132928.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.071476039120171e-08, + 2.693741063541921e-10, + 2.670912935265335e-10, + 2.670463572496118e-10, + 2.6704632949403617e-10 + ], + "bp_grad_norms_F": [ + 2.7161215712112607e-06, + 9.646365484172748e-09, + 9.512908683007026e-09, + 9.51017486983119e-09, + 9.516351262561784e-09 + ], + "gamma_dfa": 0.09614986698579742, + "acc_eval": 0.3017578125, + "loss_eval": 1.947176218032837, + "epoch": 92 + }, + { + "hidden_norms": [ + 38622.60546875, + 90514344.0, + 318023872.0, + 583138880.0, + 728758976.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.0669719087181875e-08, + 2.7007937553058525e-10, + 2.6770055616687216e-10, + 2.676309729388038e-10, + 2.678066102212995e-10 + ], + "bp_grad_norms_F": [ + 2.715124537644442e-06, + 9.639773423941733e-09, + 9.506337939058085e-09, + 9.503595244098051e-09, + 9.509768084114967e-09 + ], + "gamma_dfa": 0.09608547511743382, + "acc_eval": 0.30078125, + "loss_eval": 1.9474897384643555, + "epoch": 93 + }, + { + "hidden_norms": [ + 38631.16796875, + 90589928.0, + 318254208.0, + 583549632.0, + 729273152.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.0695071251993795e-08, + 2.704435009270867e-10, + 2.6853075318911124e-10, + 2.682237765228024e-10, + 2.6814858666845964e-10 + ], + "bp_grad_norms_F": [ + 2.7134594802191714e-06, + 9.634878672670766e-09, + 9.501549769197482e-09, + 9.498809738772707e-09, + 9.504978137897524e-09 + ], + "gamma_dfa": 0.0960953844114556, + "acc_eval": 0.2978515625, + "loss_eval": 1.9472770690917969, + "epoch": 94 + }, + { + "hidden_norms": [ + 38638.31640625, + 90643280.0, + 318415136.0, + 583858560.0, + 729656640.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.078240761235975e-08, + 2.6967122979115743e-10, + 2.669718335290838e-10, + 2.6691132637424175e-10, + 2.6697202781811313e-10 + ], + "bp_grad_norms_F": [ + 2.711297611313057e-06, + 9.631804687160184e-09, + 9.498727138179675e-09, + 9.495988884111739e-09, + 9.502159947771815e-09 + ], + "gamma_dfa": 0.09613717825050117, + "acc_eval": 0.2998046875, + "loss_eval": 1.94759202003479, + "epoch": 95 + }, + { + "hidden_norms": [ + 38642.26171875, + 90677816.0, + 318520992.0, + 584046976.0, + 729889984.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.069002995128358e-08, + 2.6985705336990407e-10, + 2.6735619274020905e-10, + 2.671637633344659e-10, + 2.6708837919109385e-10 + ], + "bp_grad_norms_F": [ + 2.7110704650112893e-06, + 9.629748554118578e-09, + 9.496692321420142e-09, + 9.493953179173786e-09, + 9.500122466477023e-09 + ], + "gamma_dfa": 0.09612438916155952, + "acc_eval": 0.2998046875, + "loss_eval": 1.9474642276763916, + "epoch": 96 + }, + { + "hidden_norms": [ + 38644.16015625, + 90695256.0, + 318576288.0, + 584137856.0, + 730003328.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.070784681038276e-08, + 2.6936791686082984e-10, + 2.671484977678773e-10, + 2.668835430430505e-10, + 2.671484977678773e-10 + ], + "bp_grad_norms_F": [ + 2.710563421715051e-06, + 9.628578823139833e-09, + 9.495578545681838e-09, + 9.492838515257063e-09, + 9.499009578917139e-09 + ], + "gamma_dfa": 0.09612188487153617, + "acc_eval": 0.298828125, + "loss_eval": 1.9476267099380493, + "epoch": 97 + }, + { + "hidden_norms": [ + 38646.0625, + 90710400.0, + 318627968.0, + 584229760.0, + 730119232.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.075278863841959e-08, + 2.692224221334527e-10, + 2.671664001141494e-10, + 2.669355292361786e-10, + 2.6700280875147087e-10 + ], + "bp_grad_norms_F": [ + 2.7103426418761956e-06, + 9.62763913037179e-09, + 9.494667274623225e-09, + 9.49192813237687e-09, + 9.498098307858527e-09 + ], + "gamma_dfa": 0.09612667236069683, + "acc_eval": 0.2998046875, + "loss_eval": 1.9476723670959473, + "epoch": 98 + }, + { + "hidden_norms": [ + 38646.953125, + 90717408.0, + 318651872.0, + 584275776.0, + 730176960.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.076975639894954e-08, + 2.691815659261465e-10, + 2.671429466527542e-10, + 2.669321430559535e-10, + 2.669318377446217e-10 + ], + "bp_grad_norms_F": [ + 2.7102296371595003e-06, + 9.62716750763093e-09, + 9.494214303629178e-09, + 9.491475161382823e-09, + 9.4976462250429e-09 + ], + "gamma_dfa": 0.09612801273397054, + "acc_eval": 0.2998046875, + "loss_eval": 1.9476864337921143, + "epoch": 99 + }, + { + "hidden_norms": [ + 38646.98046875, + 90717592.0, + 318652416.0, + 584276736.0, + 730178112.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.076372033840926e-08, + 2.692036038531853e-10, + 2.6715371581609304e-10, + 2.669119369969053e-10, + 2.6695023969125486e-10 + ], + "bp_grad_norms_F": [ + 2.710211447265465e-06, + 9.627171060344608e-09, + 9.494216968164437e-09, + 9.491476937739662e-09, + 9.497648001399739e-09 + ], + "gamma_dfa": 0.09612751441454748, + "acc_eval": 0.2998046875, + "loss_eval": 1.947685956954956, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_evolution_v2/snapshot_fa_canonical_s42.json b/results/snapshot_evolution_v2/snapshot_fa_canonical_s42.json new file mode 100644 index 0000000..d29ad2d --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_fa_canonical_s42.json @@ -0,0 +1,2734 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": NaN, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 634.95556640625, + 4686.67578125, + 8548.919921875, + 9006.0517578125, + 8484.302734375 + ], + "bp_grad_norms_per_sample_med": [ + 2.975244342451333e-06, + 1.1454501418484142e-06, + 1.1543062328200904e-06, + 1.164633545158722e-06, + 1.1064564660046017e-06 + ], + "bp_grad_norms_F": [ + 0.0001923188247019425, + 9.00624945643358e-05, + 6.289214798016474e-05, + 5.813155075884424e-05, + 5.113427323522046e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.27734375, + "loss_eval": 1.9464800357818604, + "epoch": 1 + }, + { + "hidden_norms": [ + 838.77099609375, + 8185.21484375, + 20076.259765625, + 21714.076171875, + 19607.720703125 + ], + "bp_grad_norms_per_sample_med": [ + 2.675848463695729e-06, + 5.853078732798167e-07, + 5.769501285612932e-07, + 5.794665298708424e-07, + 5.573179464590794e-07 + ], + "bp_grad_norms_F": [ + 0.00015455791435670108, + 2.4559509256505407e-05, + 2.031458825513255e-05, + 2.0197476260364056e-05, + 1.898946902656462e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2958984375, + "loss_eval": 1.932114601135254, + "epoch": 2 + }, + { + "hidden_norms": [ + 966.05859375, + 10760.646484375, + 31344.212890625, + 35515.1015625, + 30314.041015625 + ], + "bp_grad_norms_per_sample_med": [ + 2.748855649770121e-06, + 4.3298211949149845e-07, + 4.17521391682385e-07, + 4.17111380102142e-07, + 3.9905967241793405e-07 + ], + "bp_grad_norms_F": [ + 0.00015430455096065998, + 1.7030582966981456e-05, + 1.4290850231191143e-05, + 1.4243430996430106e-05, + 1.3498008229362313e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3203125, + "loss_eval": 1.9043192863464355, + "epoch": 3 + }, + { + "hidden_norms": [ + 1071.293212890625, + 12608.09765625, + 40531.1171875, + 47819.078125, + 38897.390625 + ], + "bp_grad_norms_per_sample_med": [ + 2.733014980549342e-06, + 3.670443504688592e-07, + 3.5215543903177604e-07, + 3.5238662121628295e-07, + 3.3813631716839154e-07 + ], + "bp_grad_norms_F": [ + 0.0001624817814445123, + 1.4486134205071721e-05, + 1.1960014489886817e-05, + 1.1927315426873975e-05, + 1.1350254681019578e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.898539662361145, + "epoch": 4 + }, + { + "hidden_norms": [ + 1170.5045166015625, + 14295.359375, + 49885.03515625, + 61276.62890625, + 47640.921875 + ], + "bp_grad_norms_per_sample_med": [ + 2.690757355594542e-06, + 3.267070951551432e-07, + 3.0663491656923725e-07, + 3.0629081493316335e-07, + 2.9683877755815047e-07 + ], + "bp_grad_norms_F": [ + 0.0001624024735065177, + 1.2482374586397782e-05, + 1.0314163773728069e-05, + 1.0298784218321089e-05, + 9.855078133114148e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.322265625, + "loss_eval": 1.877720832824707, + "epoch": 5 + }, + { + "hidden_norms": [ + 1288.9276123046875, + 15613.23046875, + 57501.26171875, + 73376.796875, + 54583.2109375 + ], + "bp_grad_norms_per_sample_med": [ + 2.7759115255321376e-06, + 3.0544967444257054e-07, + 2.801086793624563e-07, + 2.7996006224384473e-07, + 2.7101373234472703e-07 + ], + "bp_grad_norms_F": [ + 0.00017124316946137697, + 1.1784563866967801e-05, + 9.484625479672104e-06, + 9.465281436860096e-06, + 9.092000254895538e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.8702466487884521, + "epoch": 6 + }, + { + "hidden_norms": [ + 1437.197021484375, + 16777.841796875, + 65706.7109375, + 87232.4140625, + 61590.078125 + ], + "bp_grad_norms_per_sample_med": [ + 2.883781235141214e-06, + 2.9475407359313976e-07, + 2.6204861569567584e-07, + 2.6302603828298743e-07, + 2.5517954327369807e-07 + ], + "bp_grad_norms_F": [ + 0.00017113517969846725, + 1.1177045962540433e-05, + 8.825853001326323e-06, + 8.807965969026554e-06, + 8.485528269375209e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33984375, + "loss_eval": 1.8411049842834473, + "epoch": 7 + }, + { + "hidden_norms": [ + 1575.2144775390625, + 17884.404296875, + 73215.0, + 101692.0703125, + 67757.890625 + ], + "bp_grad_norms_per_sample_med": [ + 2.8855845357611543e-06, + 2.785824051443342e-07, + 2.509512739834463e-07, + 2.5104517931140435e-07, + 2.451099874178908e-07 + ], + "bp_grad_norms_F": [ + 0.0001778283913154155, + 1.0928491974482313e-05, + 8.524083568772767e-06, + 8.510252882842906e-06, + 8.22034417069517e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.349609375, + "loss_eval": 1.8426380157470703, + "epoch": 8 + }, + { + "hidden_norms": [ + 1746.853515625, + 18578.95703125, + 80693.078125, + 117047.6171875, + 73706.9765625 + ], + "bp_grad_norms_per_sample_med": [ + 2.964599843835458e-06, + 2.738325974860345e-07, + 2.414699338260107e-07, + 2.418815370219818e-07, + 2.3542932581221976e-07 + ], + "bp_grad_norms_F": [ + 0.0001854781003203243, + 1.0656134691089392e-05, + 8.172302841558121e-06, + 8.16663850855548e-06, + 7.904830454208422e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3671875, + "loss_eval": 1.8274496793746948, + "epoch": 9 + }, + { + "hidden_norms": [ + 1938.662109375, + 19766.384765625, + 88785.7734375, + 134051.8125, + 79702.1796875 + ], + "bp_grad_norms_per_sample_med": [ + 2.93986431643134e-06, + 2.6766733185468183e-07, + 2.3016899319827644e-07, + 2.3030897011722118e-07, + 2.2565886581560335e-07 + ], + "bp_grad_norms_F": [ + 0.0001912089210236445, + 1.0689387636375614e-05, + 7.921232281660195e-06, + 7.924772944534197e-06, + 7.683997864660341e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3505859375, + "loss_eval": 1.8229554891586304, + "epoch": 10 + }, + { + "hidden_norms": [ + 2088.147705078125, + 20979.9453125, + 96985.96875, + 150667.6875, + 85126.3359375 + ], + "bp_grad_norms_per_sample_med": [ + 2.9922123303549597e-06, + 2.649965722412162e-07, + 2.2647282094112597e-07, + 2.272310553053103e-07, + 2.2135814958801348e-07 + ], + "bp_grad_norms_F": [ + 0.00019602400425355881, + 1.0553159881965257e-05, + 7.715923857176676e-06, + 7.728580385446548e-06, + 7.498896593460813e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.375, + "loss_eval": 1.8172534704208374, + "epoch": 11 + }, + { + "hidden_norms": [ + 2276.7451171875, + 22148.2578125, + 105343.15625, + 167593.515625, + 90718.5 + ], + "bp_grad_norms_per_sample_med": [ + 3.033006578334607e-06, + 2.6026333443951444e-07, + 2.1839655062194652e-07, + 2.189913459460513e-07, + 2.1411695172446343e-07 + ], + "bp_grad_norms_F": [ + 0.00019336632976774126, + 1.0404637578176335e-05, + 7.483776698791189e-06, + 7.508507223974448e-06, + 7.2862567321863025e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.349609375, + "loss_eval": 1.8100277185440063, + "epoch": 12 + }, + { + "hidden_norms": [ + 2470.05517578125, + 22943.138671875, + 111998.0078125, + 181164.46875, + 93911.8515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0791732115176274e-06, + 2.678765156360896e-07, + 2.2002203081683547e-07, + 2.2065630389533908e-07, + 2.1573649178208143e-07 + ], + "bp_grad_norms_F": [ + 0.00020370102720335126, + 1.0737571756180841e-05, + 7.488396931876196e-06, + 7.527175512223039e-06, + 7.304198788915528e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3447265625, + "loss_eval": 1.8219082355499268, + "epoch": 13 + }, + { + "hidden_norms": [ + 2655.71875, + 23620.771484375, + 118446.4453125, + 194098.046875, + 97110.40625 + ], + "bp_grad_norms_per_sample_med": [ + 3.03382375932415e-06, + 2.674543395642104e-07, + 2.1672505567948974e-07, + 2.1837567487636989e-07, + 2.127215310565589e-07 + ], + "bp_grad_norms_F": [ + 0.00019606151909101754, + 1.0727502740337513e-05, + 7.367311354755657e-06, + 7.4189733823004644e-06, + 7.2012962846201845e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3447265625, + "loss_eval": 1.800294041633606, + "epoch": 14 + }, + { + "hidden_norms": [ + 2864.51904296875, + 23962.1328125, + 123932.375, + 204264.46875, + 99147.40625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0961696211306844e-06, + 2.757700485744863e-07, + 2.1832956065281905e-07, + 2.1977299979880627e-07, + 2.1560039442647394e-07 + ], + "bp_grad_norms_F": [ + 0.00020294770365580916, + 1.0936742910416797e-05, + 7.422260750900023e-06, + 7.487843049602816e-06, + 7.265869498951361e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.349609375, + "loss_eval": 1.8283555507659912, + "epoch": 15 + }, + { + "hidden_norms": [ + 3058.654296875, + 24515.28515625, + 129439.953125, + 215162.921875, + 101313.0703125 + ], + "bp_grad_norms_per_sample_med": [ + 3.0670128126075724e-06, + 2.704452413127001e-07, + 2.1300424180026312e-07, + 2.1552395423896087e-07, + 2.103476077763844e-07 + ], + "bp_grad_norms_F": [ + 0.00020699974265880883, + 1.1274227290414274e-05, + 7.348373856075341e-06, + 7.4233907980669755e-06, + 7.201060725492425e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3603515625, + "loss_eval": 1.8033101558685303, + "epoch": 16 + }, + { + "hidden_norms": [ + 3205.80859375, + 24759.69921875, + 132512.875, + 221758.34375, + 102296.3515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0818489449302433e-06, + 2.7902248689315456e-07, + 2.1470867750394973e-07, + 2.1584412479569437e-07, + 2.1120550286468642e-07 + ], + "bp_grad_norms_F": [ + 0.00019346778572071344, + 1.1271905350440647e-05, + 7.35169760446297e-06, + 7.441570687660715e-06, + 7.2173174885392655e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3623046875, + "loss_eval": 1.789717197418213, + "epoch": 17 + }, + { + "hidden_norms": [ + 3365.503173828125, + 24903.955078125, + 137239.453125, + 228336.28125, + 103774.4140625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0317510208988097e-06, + 2.810125181440526e-07, + 2.1507479175397748e-07, + 2.1818523521233146e-07, + 2.1249555004487775e-07 + ], + "bp_grad_norms_F": [ + 0.00019401832832954824, + 1.144540510722436e-05, + 7.354777153523173e-06, + 7.453731996065471e-06, + 7.234774784592446e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3515625, + "loss_eval": 1.7909660339355469, + "epoch": 18 + }, + { + "hidden_norms": [ + 3517.615478515625, + 25088.482421875, + 140183.171875, + 234581.5, + 105112.640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0766200325160753e-06, + 2.8522768502625695e-07, + 2.1497518787327863e-07, + 2.1691003837531753e-07, + 2.1271530670219363e-07 + ], + "bp_grad_norms_F": [ + 0.00020355181186459959, + 1.1879135854542255e-05, + 7.4169261097267736e-06, + 7.52632467992953e-06, + 7.302520316443406e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.34765625, + "loss_eval": 1.8049894571304321, + "epoch": 19 + }, + { + "hidden_norms": [ + 3643.212890625, + 25572.47265625, + 143095.625, + 240103.59375, + 106815.9609375 + ], + "bp_grad_norms_per_sample_med": [ + 2.9240111416584114e-06, + 2.7889984721696237e-07, + 2.1295824126355e-07, + 2.145163620070889e-07, + 2.1029546815043432e-07 + ], + "bp_grad_norms_F": [ + 0.00019266517483629286, + 1.1654319678200409e-05, + 7.349848146986915e-06, + 7.464911050192313e-06, + 7.246624591061845e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3681640625, + "loss_eval": 1.7967158555984497, + "epoch": 20 + }, + { + "hidden_norms": [ + 3727.509521484375, + 26266.642578125, + 147179.796875, + 243896.734375, + 107961.3359375 + ], + "bp_grad_norms_per_sample_med": [ + 3.034621840924956e-06, + 2.95065575528497e-07, + 2.1733650612532074e-07, + 2.1865858457204013e-07, + 2.140783124104928e-07 + ], + "bp_grad_norms_F": [ + 0.00019002222688868642, + 1.179500304715475e-05, + 7.40604900784092e-06, + 7.5316506809031125e-06, + 7.309085049200803e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3603515625, + "loss_eval": 1.7879303693771362, + "epoch": 21 + }, + { + "hidden_norms": [ + 3814.343994140625, + 26307.63671875, + 149997.296875, + 248837.015625, + 109946.75 + ], + "bp_grad_norms_per_sample_med": [ + 3.0296112072392134e-06, + 2.891725046083593e-07, + 2.132598950765896e-07, + 2.164179448982395e-07, + 2.1202281175192184e-07 + ], + "bp_grad_norms_F": [ + 0.00019085934036411345, + 1.1828436981886625e-05, + 7.313527476071613e-06, + 7.4397207754373085e-06, + 7.220100542326691e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3798828125, + "loss_eval": 1.769087791442871, + "epoch": 22 + }, + { + "hidden_norms": [ + 3903.16357421875, + 26762.390625, + 151661.765625, + 252546.703125, + 112163.4375 + ], + "bp_grad_norms_per_sample_med": [ + 3.10251039081777e-06, + 2.9397492085081467e-07, + 2.119260216204566e-07, + 2.151843716546864e-07, + 2.0996778005155647e-07 + ], + "bp_grad_norms_F": [ + 0.0001914280146593228, + 1.1861766324727796e-05, + 7.28844088371261e-06, + 7.418064342346042e-06, + 7.190795258793514e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.349609375, + "loss_eval": 1.7941722869873047, + "epoch": 23 + }, + { + "hidden_norms": [ + 3989.95361328125, + 27301.33984375, + 155319.25, + 259232.390625, + 115495.6796875 + ], + "bp_grad_norms_per_sample_med": [ + 2.962329745059833e-06, + 2.8580453204085643e-07, + 2.0789140364740888e-07, + 2.0986689719393326e-07, + 2.051628200661071e-07 + ], + "bp_grad_norms_F": [ + 0.00018467944755684584, + 1.1658386029012036e-05, + 7.1250747168960515e-06, + 7.254411684698425e-06, + 7.026835191936698e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3642578125, + "loss_eval": 1.772944450378418, + "epoch": 24 + }, + { + "hidden_norms": [ + 4044.4833984375, + 27958.3046875, + 158277.765625, + 265767.4375, + 119247.171875 + ], + "bp_grad_norms_per_sample_med": [ + 2.939599653473124e-06, + 2.9012642244197195e-07, + 2.0495993169333815e-07, + 2.0806970724152052e-07, + 2.0302766756685742e-07 + ], + "bp_grad_norms_F": [ + 0.00017772591672837734, + 1.151475134975044e-05, + 7.005810857663164e-06, + 7.14335192242288e-06, + 6.918045983184129e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.359375, + "loss_eval": 1.7681654691696167, + "epoch": 25 + }, + { + "hidden_norms": [ + 4102.31298828125, + 28819.13671875, + 162886.59375, + 274888.375, + 124251.71875 + ], + "bp_grad_norms_per_sample_med": [ + 3.00775354844518e-06, + 2.8842808319495816e-07, + 1.9920004490359133e-07, + 2.0228824837431603e-07, + 1.9777876048010512e-07 + ], + "bp_grad_norms_F": [ + 0.00017743176431395113, + 1.1497872947074939e-05, + 6.855066203570459e-06, + 6.992981980147306e-06, + 6.764100362488534e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.361328125, + "loss_eval": 1.7643167972564697, + "epoch": 26 + }, + { + "hidden_norms": [ + 4156.68994140625, + 29263.09765625, + 167567.5625, + 286674.25, + 130533.7578125 + ], + "bp_grad_norms_per_sample_med": [ + 2.9521122542064404e-06, + 2.7994269657938275e-07, + 1.9472663836950233e-07, + 1.9846331156259112e-07, + 1.9457104372122558e-07 + ], + "bp_grad_norms_F": [ + 0.0001732901146169752, + 1.1156066648254637e-05, + 6.697610388073372e-06, + 6.834617579443147e-06, + 6.61404874335858e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.357421875, + "loss_eval": 1.7718162536621094, + "epoch": 27 + }, + { + "hidden_norms": [ + 4236.7529296875, + 30445.798828125, + 173905.171875, + 301198.6875, + 138844.546875 + ], + "bp_grad_norms_per_sample_med": [ + 2.825209094226011e-06, + 2.710314390697022e-07, + 1.868730663545648e-07, + 1.8901035048202175e-07, + 1.8439881444010098e-07 + ], + "bp_grad_norms_F": [ + 0.00016928529657889158, + 1.0838041816896293e-05, + 6.40136795482249e-06, + 6.533743089676136e-06, + 6.317317456705496e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3740234375, + "loss_eval": 1.7575714588165283, + "epoch": 28 + }, + { + "hidden_norms": [ + 4307.15966796875, + 30990.375, + 179990.59375, + 314925.53125, + 146306.109375 + ], + "bp_grad_norms_per_sample_med": [ + 2.882675744331209e-06, + 2.69783697603998e-07, + 1.8120582012670639e-07, + 1.8295163783932367e-07, + 1.7808179109124467e-07 + ], + "bp_grad_norms_F": [ + 0.0001705507020233199, + 1.0706517059588805e-05, + 6.220788691280177e-06, + 6.352388027153211e-06, + 6.134147952252533e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.38671875, + "loss_eval": 1.765124797821045, + "epoch": 29 + }, + { + "hidden_norms": [ + 4360.767578125, + 32488.16015625, + 189370.28125, + 333218.25, + 156773.703125 + ], + "bp_grad_norms_per_sample_med": [ + 2.8181013931316556e-06, + 2.653597448443179e-07, + 1.7396521911905438e-07, + 1.755686014348612e-07, + 1.7160699883334019e-07 + ], + "bp_grad_norms_F": [ + 0.00016797029820736498, + 1.0374783414590638e-05, + 5.9415992836875375e-06, + 6.068700713512953e-06, + 5.864551440026844e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3564453125, + "loss_eval": 1.755420207977295, + "epoch": 30 + }, + { + "hidden_norms": [ + 4420.99462890625, + 33248.23046875, + 197272.421875, + 350132.625, + 166295.0625 + ], + "bp_grad_norms_per_sample_med": [ + 2.8225279038451845e-06, + 2.5861882591016183e-07, + 1.676798291327941e-07, + 1.704754311049328e-07, + 1.6635479482829396e-07 + ], + "bp_grad_norms_F": [ + 0.00016677004168741405, + 1.0174546332564205e-05, + 5.748868716182187e-06, + 5.872501787962392e-06, + 5.676161890733056e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.365234375, + "loss_eval": 1.749579906463623, + "epoch": 31 + }, + { + "hidden_norms": [ + 4467.9111328125, + 34465.12109375, + 206817.0625, + 370568.6875, + 177992.796875 + ], + "bp_grad_norms_per_sample_med": [ + 2.797579327307176e-06, + 2.4461206749037956e-07, + 1.6084129583759932e-07, + 1.623946417339539e-07, + 1.5842591949422058e-07 + ], + "bp_grad_norms_F": [ + 0.0001667520118644461, + 9.997165761888027e-06, + 5.521564617083641e-06, + 5.637548838421935e-06, + 5.447109742817702e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3818359375, + "loss_eval": 1.7478370666503906, + "epoch": 32 + }, + { + "hidden_norms": [ + 4500.455078125, + 35232.3984375, + 215903.1875, + 387229.5, + 187304.4375 + ], + "bp_grad_norms_per_sample_med": [ + 2.744678795352229e-06, + 2.4473743565067707e-07, + 1.5567927391657577e-07, + 1.5809170861302846e-07, + 1.5448634371750813e-07 + ], + "bp_grad_norms_F": [ + 0.00016586907440796494, + 9.867669177765492e-06, + 5.356784186005825e-06, + 5.468943072628463e-06, + 5.285164206725312e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.380859375, + "loss_eval": 1.748937964439392, + "epoch": 33 + }, + { + "hidden_norms": [ + 4559.64990234375, + 36405.82421875, + 224989.71875, + 406526.59375, + 197279.796875 + ], + "bp_grad_norms_per_sample_med": [ + 2.676637450349517e-06, + 2.350530081685065e-07, + 1.5119638874239172e-07, + 1.5273755593625538e-07, + 1.4942507675641536e-07 + ], + "bp_grad_norms_F": [ + 0.00016609806334599853, + 9.700875125417951e-06, + 5.207733465795172e-06, + 5.317946943250718e-06, + 5.140104349266039e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.38671875, + "loss_eval": 1.747586965560913, + "epoch": 34 + }, + { + "hidden_norms": [ + 4600.470703125, + 37569.390625, + 234249.046875, + 424273.0625, + 207188.484375 + ], + "bp_grad_norms_per_sample_med": [ + 2.6595262170303613e-06, + 2.3298444773445226e-07, + 1.4830226291451254e-07, + 1.5017273824469157e-07, + 1.4676733428586886e-07 + ], + "bp_grad_norms_F": [ + 0.0001615065266378224, + 9.520201274426654e-06, + 5.091071670904057e-06, + 5.198567123443354e-06, + 5.027129645895911e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.375, + "loss_eval": 1.7455894947052002, + "epoch": 35 + }, + { + "hidden_norms": [ + 4655.232421875, + 38777.5, + 243977.203125, + 443307.78125, + 217682.03125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7372755084797973e-06, + 2.3094322898487007e-07, + 1.4448018248458538e-07, + 1.465641616960056e-07, + 1.4282748850291682e-07 + ], + "bp_grad_norms_F": [ + 0.00016169788432307541, + 9.384648365085013e-06, + 4.931174771627411e-06, + 5.035632966610137e-06, + 4.871027158515062e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3779296875, + "loss_eval": 1.739393949508667, + "epoch": 36 + }, + { + "hidden_norms": [ + 4674.50634765625, + 39366.46875, + 253330.671875, + 458747.40625, + 225757.234375 + ], + "bp_grad_norms_per_sample_med": [ + 2.720141083045746e-06, + 2.3003921967301721e-07, + 1.4151289917663235e-07, + 1.4314728957742773e-07, + 1.4079574839342968e-07 + ], + "bp_grad_norms_F": [ + 0.00016218192467931658, + 9.336513357993681e-06, + 4.852768142882269e-06, + 4.95553604196175e-06, + 4.79518030260806e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3818359375, + "loss_eval": 1.7406929731369019, + "epoch": 37 + }, + { + "hidden_norms": [ + 4730.9697265625, + 40562.7578125, + 261285.078125, + 476049.71875, + 235002.046875 + ], + "bp_grad_norms_per_sample_med": [ + 2.727818809944438e-06, + 2.3385531733310927e-07, + 1.4104001877512928e-07, + 1.4261416936278692e-07, + 1.39172499302731e-07 + ], + "bp_grad_norms_F": [ + 0.00016533929738216102, + 9.380160008731764e-06, + 4.782661108038155e-06, + 4.884728696197271e-06, + 4.725173766928492e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3759765625, + "loss_eval": 1.7494721412658691, + "epoch": 38 + }, + { + "hidden_norms": [ + 4769.4833984375, + 41614.734375, + 272033.25, + 494194.5, + 244904.296875 + ], + "bp_grad_norms_per_sample_med": [ + 2.728792651396361e-06, + 2.2869069482567284e-07, + 1.3784755026335915e-07, + 1.3816679711453617e-07, + 1.3538770815557655e-07 + ], + "bp_grad_norms_F": [ + 0.0001621924457140267, + 9.226439942722209e-06, + 4.664412244892446e-06, + 4.759738658322021e-06, + 4.6096511141513474e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.380859375, + "loss_eval": 1.744396686553955, + "epoch": 39 + }, + { + "hidden_norms": [ + 4807.61669921875, + 41796.7890625, + 279173.46875, + 509024.46875, + 251937.796875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7552744086278835e-06, + 2.2436680069404247e-07, + 1.334142893938406e-07, + 1.3510819485418324e-07, + 1.3202044613080943e-07 + ], + "bp_grad_norms_F": [ + 0.00016327289631590247, + 9.199145097227301e-06, + 4.6049044613027945e-06, + 4.701471880252939e-06, + 4.55197186965961e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.37890625, + "loss_eval": 1.738051176071167, + "epoch": 40 + }, + { + "hidden_norms": [ + 4846.89013671875, + 43419.1953125, + 288358.6875, + 526415.1875, + 261093.328125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7159530873177573e-06, + 2.2739833127616293e-07, + 1.3493598771674442e-07, + 1.3701293255508062e-07, + 1.3374133800425625e-07 + ], + "bp_grad_norms_F": [ + 0.00016205597785301507, + 9.20344336918788e-06, + 4.573969818011392e-06, + 4.670639100368135e-06, + 4.519301455729874e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3759765625, + "loss_eval": 1.769773244857788, + "epoch": 41 + }, + { + "hidden_norms": [ + 4880.62109375, + 44368.0, + 297320.0, + 543147.8125, + 270529.90625 + ], + "bp_grad_norms_per_sample_med": [ + 2.704309054024634e-06, + 2.2085772855007235e-07, + 1.31169457517899e-07, + 1.3294274481268076e-07, + 1.296902354397389e-07 + ], + "bp_grad_norms_F": [ + 0.000160810406669043, + 9.048065294336993e-06, + 4.454658665054012e-06, + 4.546407581074163e-06, + 4.4059761421522126e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.388671875, + "loss_eval": 1.7465946674346924, + "epoch": 42 + }, + { + "hidden_norms": [ + 4899.1767578125, + 45389.57421875, + 307315.8125, + 560231.5625, + 278935.6875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7406351819081465e-06, + 2.2317071568522806e-07, + 1.2826720308112272e-07, + 1.3064222059711028e-07, + 1.270270928444006e-07 + ], + "bp_grad_norms_F": [ + 0.00016026092635001987, + 8.999614692584146e-06, + 4.385735792311607e-06, + 4.476342382986331e-06, + 4.342015927250031e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.38671875, + "loss_eval": 1.73671293258667, + "epoch": 43 + }, + { + "hidden_norms": [ + 4931.53857421875, + 45391.578125, + 314715.1875, + 576663.1875, + 287751.21875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7501505428517703e-06, + 2.1621856660658523e-07, + 1.2502815138759615e-07, + 1.2642922797567735e-07, + 1.2348743894108338e-07 + ], + "bp_grad_norms_F": [ + 0.00015757110668346286, + 8.882019756129012e-06, + 4.295293820177903e-06, + 4.383605300972704e-06, + 4.2555047912173904e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.376953125, + "loss_eval": 1.7194021940231323, + "epoch": 44 + }, + { + "hidden_norms": [ + 4952.10205078125, + 46544.41015625, + 321747.78125, + 590124.0, + 293778.09375 + ], + "bp_grad_norms_per_sample_med": [ + 2.7445450996310683e-06, + 2.20402526451835e-07, + 1.2519362257989997e-07, + 1.2609659449935862e-07, + 1.243117537796934e-07 + ], + "bp_grad_norms_F": [ + 0.00015927865752018988, + 8.919399988371879e-06, + 4.280226676200982e-06, + 4.3682503019226715e-06, + 4.240421731083188e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.376953125, + "loss_eval": 1.7289605140686035, + "epoch": 45 + }, + { + "hidden_norms": [ + 4985.6728515625, + 47313.03515625, + 330026.15625, + 605693.8125, + 301341.84375 + ], + "bp_grad_norms_per_sample_med": [ + 2.751742158579873e-06, + 2.1928519799985224e-07, + 1.2418719563811464e-07, + 1.259736563952174e-07, + 1.2327782883403415e-07 + ], + "bp_grad_norms_F": [ + 0.0001606208534212783, + 8.962500942288898e-06, + 4.251486188877607e-06, + 4.337850896263262e-06, + 4.2124443098146e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.390625, + "loss_eval": 1.7371184825897217, + "epoch": 46 + }, + { + "hidden_norms": [ + 4993.990234375, + 47521.25390625, + 335434.3125, + 618341.0625, + 307157.4375 + ], + "bp_grad_norms_per_sample_med": [ + 2.7009368750441354e-06, + 2.1855973386664118e-07, + 1.2373016033961903e-07, + 1.255795467614007e-07, + 1.2245830305346317e-07 + ], + "bp_grad_norms_F": [ + 0.00015943347534630448, + 8.89301736606285e-06, + 4.223482847010018e-06, + 4.306960363464896e-06, + 4.1826651795418e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.384765625, + "loss_eval": 1.737732172012329, + "epoch": 47 + }, + { + "hidden_norms": [ + 5012.49951171875, + 48445.1953125, + 344918.46875, + 633703.8125, + 314618.65625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7400287763157394e-06, + 2.1858940613128652e-07, + 1.2219133793678338e-07, + 1.242535176970705e-07, + 1.2144892025389709e-07 + ], + "bp_grad_norms_F": [ + 0.0001590315659996122, + 8.84339078766061e-06, + 4.180086762062274e-06, + 4.265210009180009e-06, + 4.143982550885994e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.375, + "loss_eval": 1.7298643589019775, + "epoch": 48 + }, + { + "hidden_norms": [ + 5054.08984375, + 49201.015625, + 353929.5625, + 650649.9375, + 323234.34375 + ], + "bp_grad_norms_per_sample_med": [ + 2.710038643272128e-06, + 2.1170153274852055e-07, + 1.1893747853264358e-07, + 1.2112403169339814e-07, + 1.1869307314782418e-07 + ], + "bp_grad_norms_F": [ + 0.00015847652684897184, + 8.75549994816538e-06, + 4.11285736845457e-06, + 4.190015260974178e-06, + 4.073814125149511e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7279736995697021, + "epoch": 49 + }, + { + "hidden_norms": [ + 5079.68505859375, + 49818.85546875, + 363584.96875, + 665326.4375, + 330221.40625 + ], + "bp_grad_norms_per_sample_med": [ + 2.728055960687925e-06, + 2.1385960735642584e-07, + 1.1923917497824732e-07, + 1.2005260430214548e-07, + 1.1790963583280245e-07 + ], + "bp_grad_norms_F": [ + 0.00015702334349043667, + 8.663697371957824e-06, + 4.082327905052807e-06, + 4.160873686487321e-06, + 4.0494828681403305e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7221198081970215, + "epoch": 50 + }, + { + "hidden_norms": [ + 5103.2626953125, + 50236.62109375, + 366800.8125, + 675614.9375, + 334505.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.6967995836457703e-06, + 2.110563741553051e-07, + 1.1874865890604269e-07, + 1.1944737821067974e-07, + 1.17826154166778e-07 + ], + "bp_grad_norms_F": [ + 0.00015892359078861773, + 8.714905561646447e-06, + 4.066732344654156e-06, + 4.143567366554635e-06, + 4.033038294437574e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3955078125, + "loss_eval": 1.7186274528503418, + "epoch": 51 + }, + { + "hidden_norms": [ + 5129.00830078125, + 51124.4453125, + 375390.84375, + 689126.5, + 340674.15625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7418275294621708e-06, + 2.1331975119665003e-07, + 1.1826992363239697e-07, + 1.1942577771151264e-07, + 1.1719654224862097e-07 + ], + "bp_grad_norms_F": [ + 0.00015799023094587028, + 8.683533451403491e-06, + 4.048787559440825e-06, + 4.127006377530051e-06, + 4.019248081021942e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7216696739196777, + "epoch": 52 + }, + { + "hidden_norms": [ + 5147.63671875, + 51383.28515625, + 382888.34375, + 701867.8125, + 346661.03125 + ], + "bp_grad_norms_per_sample_med": [ + 2.725489366639522e-06, + 2.1360351354360319e-07, + 1.1696960910967391e-07, + 1.1808428013182493e-07, + 1.1615074413384718e-07 + ], + "bp_grad_norms_F": [ + 0.0001584803540026769, + 8.698161764186807e-06, + 4.018610525235999e-06, + 4.092659764864948e-06, + 3.9867554733064026e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.39453125, + "loss_eval": 1.7209246158599854, + "epoch": 53 + }, + { + "hidden_norms": [ + 5179.68603515625, + 52093.16796875, + 388203.75, + 712999.25, + 350465.40625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7409823815105483e-06, + 2.16206004211017e-07, + 1.1817400746849671e-07, + 1.1920442943846865e-07, + 1.1731118831903586e-07 + ], + "bp_grad_norms_F": [ + 0.00015836946840863675, + 8.735608389542904e-06, + 4.036091922898777e-06, + 4.111263024242362e-06, + 4.005241407867288e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3837890625, + "loss_eval": 1.7180767059326172, + "epoch": 54 + }, + { + "hidden_norms": [ + 5197.8408203125, + 53041.44140625, + 398597.125, + 728487.4375, + 358157.9375 + ], + "bp_grad_norms_per_sample_med": [ + 2.763840029729181e-06, + 2.1291030805059563e-07, + 1.1598489635389342e-07, + 1.1754219286785883e-07, + 1.1593917292884726e-07 + ], + "bp_grad_norms_F": [ + 0.0001594589266460389, + 8.711985174159054e-06, + 4.000611625087913e-06, + 4.07353172704461e-06, + 3.971201294916682e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.38671875, + "loss_eval": 1.7179795503616333, + "epoch": 55 + }, + { + "hidden_norms": [ + 5217.0146484375, + 53347.57421875, + 403986.625, + 738288.125, + 361666.125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7599005534284515e-06, + 2.135690380100641e-07, + 1.1644724651205252e-07, + 1.166295646726212e-07, + 1.1492483054098557e-07 + ], + "bp_grad_norms_F": [ + 0.0001592675835127011, + 8.73087174113607e-06, + 4.000759417976951e-06, + 4.0730465116212144e-06, + 3.972524154960411e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.390625, + "loss_eval": 1.719031810760498, + "epoch": 56 + }, + { + "hidden_norms": [ + 5245.46875, + 53932.046875, + 410963.8125, + 750011.5, + 367171.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.727937499003019e-06, + 2.1207910094744875e-07, + 1.1586875103830607e-07, + 1.1747369654813156e-07, + 1.1563617619003708e-07 + ], + "bp_grad_norms_F": [ + 0.0001595055073266849, + 8.686207365826704e-06, + 3.98215252062073e-06, + 4.0539648580306675e-06, + 3.954477506340481e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3837890625, + "loss_eval": 1.7162381410598755, + "epoch": 57 + }, + { + "hidden_norms": [ + 5273.81396484375, + 54359.40234375, + 415035.71875, + 757034.5, + 368386.46875 + ], + "bp_grad_norms_per_sample_med": [ + 2.8185475002828753e-06, + 2.183954137535693e-07, + 1.180805142553254e-07, + 1.196149383986267e-07, + 1.1741713734636505e-07 + ], + "bp_grad_norms_F": [ + 0.00016158133803401142, + 8.819352842692751e-06, + 4.027346676593879e-06, + 4.101018930668943e-06, + 3.999525233666645e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3828125, + "loss_eval": 1.7294056415557861, + "epoch": 58 + }, + { + "hidden_norms": [ + 5279.26513671875, + 54860.85546875, + 420308.09375, + 767223.875, + 372461.6875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7814132863568375e-06, + 2.1827422358455806e-07, + 1.1745117944883532e-07, + 1.1896155172053113e-07, + 1.1699857083158349e-07 + ], + "bp_grad_norms_F": [ + 0.0001601481344550848, + 8.751929271966219e-06, + 4.01089027946e-06, + 4.083126441400964e-06, + 3.984826435043942e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3740234375, + "loss_eval": 1.7233260869979858, + "epoch": 59 + }, + { + "hidden_norms": [ + 5281.876953125, + 55172.76171875, + 426239.0, + 777712.75, + 377365.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.729702600845485e-06, + 2.1274833272855176e-07, + 1.14989177291136e-07, + 1.1596039684036441e-07, + 1.1409560585207146e-07 + ], + "bp_grad_norms_F": [ + 0.00016002384654711932, + 8.679173333803192e-06, + 3.97576059185667e-06, + 4.045130026497645e-06, + 3.949881829612423e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.392578125, + "loss_eval": 1.7190814018249512, + "epoch": 60 + }, + { + "hidden_norms": [ + 5293.4951171875, + 55554.5703125, + 430637.53125, + 784743.25, + 379242.96875 + ], + "bp_grad_norms_per_sample_med": [ + 2.768365220617852e-06, + 2.1479348788489006e-07, + 1.1614937989179452e-07, + 1.1718410775074517e-07, + 1.1549084888429206e-07 + ], + "bp_grad_norms_F": [ + 0.00016024228534661233, + 8.705451364221517e-06, + 3.991565336036729e-06, + 4.061004801769741e-06, + 3.96601899410598e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3837890625, + "loss_eval": 1.7091575860977173, + "epoch": 61 + }, + { + "hidden_norms": [ + 5305.26953125, + 56114.8203125, + 436835.59375, + 794036.0, + 382300.59375 + ], + "bp_grad_norms_per_sample_med": [ + 2.793117346300278e-06, + 2.1690949836283835e-07, + 1.1630865515144251e-07, + 1.1756346651736749e-07, + 1.1506058683607989e-07 + ], + "bp_grad_norms_F": [ + 0.00016134958423208445, + 8.74852321430808e-06, + 3.9943656702234875e-06, + 4.064597760589095e-06, + 3.969457793573383e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3798828125, + "loss_eval": 1.7154879570007324, + "epoch": 62 + }, + { + "hidden_norms": [ + 5302.8837890625, + 56558.90625, + 441340.78125, + 802203.0625, + 385590.65625 + ], + "bp_grad_norms_per_sample_med": [ + 2.8357644623611122e-06, + 2.1830236107689416e-07, + 1.174595283259805e-07, + 1.1849279246689548e-07, + 1.1699435020773308e-07 + ], + "bp_grad_norms_F": [ + 0.00016155940829776227, + 8.755636372370645e-06, + 4.0028130570135545e-06, + 4.07254128731438e-06, + 3.978685981564922e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.388671875, + "loss_eval": 1.7206263542175293, + "epoch": 63 + }, + { + "hidden_norms": [ + 5312.6650390625, + 56690.29296875, + 446444.65625, + 811108.375, + 389126.15625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7693422453012317e-06, + 2.0976162318220304e-07, + 1.1542074673798197e-07, + 1.161635623248003e-07, + 1.1368263841404769e-07 + ], + "bp_grad_norms_F": [ + 0.00016044928634073585, + 8.682382031111047e-06, + 3.968462351622293e-06, + 4.03698095396976e-06, + 3.944758191209985e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3935546875, + "loss_eval": 1.708216667175293, + "epoch": 64 + }, + { + "hidden_norms": [ + 5315.3154296875, + 57172.39453125, + 452320.78125, + 819345.4375, + 392431.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.7417515866545727e-06, + 2.1362264135404985e-07, + 1.1589729354000156e-07, + 1.165334211350455e-07, + 1.1489947127074629e-07 + ], + "bp_grad_norms_F": [ + 0.00016101017536129802, + 8.694333700987045e-06, + 3.9719238884572405e-06, + 4.039454324811231e-06, + 3.947835011786083e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3916015625, + "loss_eval": 1.7132065296173096, + "epoch": 65 + }, + { + "hidden_norms": [ + 5323.32421875, + 57353.53515625, + 455451.03125, + 825786.625, + 393529.90625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7779890388046624e-06, + 2.1516311221603246e-07, + 1.1656365472845209e-07, + 1.1796725374324524e-07, + 1.1570150348916286e-07 + ], + "bp_grad_norms_F": [ + 0.00016156666970346123, + 8.733955837669782e-06, + 3.986176579928724e-06, + 4.05381206292077e-06, + 3.9624515011382755e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3994140625, + "loss_eval": 1.715019702911377, + "epoch": 66 + }, + { + "hidden_norms": [ + 5342.94140625, + 57836.46875, + 461806.90625, + 835003.3125, + 397621.53125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7782559754996328e-06, + 2.1394832572241285e-07, + 1.1512971553884199e-07, + 1.1638152841442206e-07, + 1.1455212955979732e-07 + ], + "bp_grad_norms_F": [ + 0.00016023094940464944, + 8.671009709360078e-06, + 3.967585598729784e-06, + 4.035073743580142e-06, + 3.945795015170006e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7059491872787476, + "epoch": 67 + }, + { + "hidden_norms": [ + 5353.94189453125, + 58288.83984375, + 465855.71875, + 840827.8125, + 399727.625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7943997338297777e-06, + 2.1217401524609159e-07, + 1.1551408363175142e-07, + 1.1611316352855283e-07, + 1.1411684397444333e-07 + ], + "bp_grad_norms_F": [ + 0.00015934662951622158, + 8.68945244292263e-06, + 3.9676901906204876e-06, + 4.034785888507031e-06, + 3.945680873584934e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.39453125, + "loss_eval": 1.703755259513855, + "epoch": 68 + }, + { + "hidden_norms": [ + 5350.173828125, + 58626.13671875, + 469388.5, + 847294.5, + 401525.625 + ], + "bp_grad_norms_per_sample_med": [ + 2.773014784906991e-06, + 2.1550022211158648e-07, + 1.1623347972999909e-07, + 1.1767290430952926e-07, + 1.1548346634526752e-07 + ], + "bp_grad_norms_F": [ + 0.00016030117694754153, + 8.702772902324796e-06, + 3.981078407377936e-06, + 4.047733909828821e-06, + 3.958340130338911e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3916015625, + "loss_eval": 1.7165981531143188, + "epoch": 69 + }, + { + "hidden_norms": [ + 5357.58251953125, + 58903.7734375, + 474182.15625, + 855194.375, + 404878.59375 + ], + "bp_grad_norms_per_sample_med": [ + 2.75364641311171e-06, + 2.1325861609966523e-07, + 1.1510206121556621e-07, + 1.1569208169248668e-07, + 1.1389116849613856e-07 + ], + "bp_grad_norms_F": [ + 0.00015995267312973738, + 8.656907994009089e-06, + 3.959937203035224e-06, + 4.026182978122961e-06, + 3.939108864869922e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3955078125, + "loss_eval": 1.7067822217941284, + "epoch": 70 + }, + { + "hidden_norms": [ + 5361.0703125, + 59035.59375, + 477104.5, + 859434.875, + 405244.875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7923097150051035e-06, + 2.1804021343996283e-07, + 1.1658453757945608e-07, + 1.1743448169454496e-07, + 1.1549956013823248e-07 + ], + "bp_grad_norms_F": [ + 0.0001615561341168359, + 8.730263289180584e-06, + 3.989315700891893e-06, + 4.055812496517319e-06, + 3.967216798628215e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.392578125, + "loss_eval": 1.713646411895752, + "epoch": 71 + }, + { + "hidden_norms": [ + 5369.7529296875, + 59398.04296875, + 480994.0625, + 865578.875, + 407758.6875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7749495075113373e-06, + 2.139253751920478e-07, + 1.1538476485384308e-07, + 1.1588154080754975e-07, + 1.1468705451989081e-07 + ], + "bp_grad_norms_F": [ + 0.00016089060227386653, + 8.69345421961043e-06, + 3.971756996179465e-06, + 4.03762214773451e-06, + 3.950478458136786e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3896484375, + "loss_eval": 1.7055977582931519, + "epoch": 72 + }, + { + "hidden_norms": [ + 5376.67578125, + 59606.38671875, + 484413.75, + 871224.125, + 409605.40625 + ], + "bp_grad_norms_per_sample_med": [ + 2.767387286439771e-06, + 2.163243522090852e-07, + 1.1596397797575264e-07, + 1.1663173182796527e-07, + 1.1466888594213742e-07 + ], + "bp_grad_norms_F": [ + 0.0001625583681743592, + 8.740000339457765e-06, + 3.985041985288262e-06, + 4.0507725316274446e-06, + 3.964435109082842e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3896484375, + "loss_eval": 1.717661738395691, + "epoch": 73 + }, + { + "hidden_norms": [ + 5388.92626953125, + 60038.8828125, + 487315.0, + 875672.0625, + 411209.46875 + ], + "bp_grad_norms_per_sample_med": [ + 2.811367039612378e-06, + 2.1376251879701158e-07, + 1.150508310843179e-07, + 1.1646184105984503e-07, + 1.1464238269809357e-07 + ], + "bp_grad_norms_F": [ + 0.0001601450494490564, + 8.67134895088384e-06, + 3.971680598624516e-06, + 4.03764806833351e-06, + 3.951014605263481e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.38671875, + "loss_eval": 1.7057151794433594, + "epoch": 74 + }, + { + "hidden_norms": [ + 5394.13818359375, + 60238.7265625, + 490408.5625, + 880235.0625, + 412592.1875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7481701181386597e-06, + 2.1436494535009842e-07, + 1.1508839747875754e-07, + 1.1683697209718957e-07, + 1.148769968040142e-07 + ], + "bp_grad_norms_F": [ + 0.00016096947365440428, + 8.67969538376201e-06, + 3.976166681241011e-06, + 4.041281044919742e-06, + 3.95562074118061e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3974609375, + "loss_eval": 1.711783528327942, + "epoch": 75 + }, + { + "hidden_norms": [ + 5398.15234375, + 60386.79296875, + 492903.0625, + 883714.5, + 413466.03125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7468756798043614e-06, + 2.142960227047297e-07, + 1.155566522470508e-07, + 1.1617837003541354e-07, + 1.1447124137475839e-07 + ], + "bp_grad_norms_F": [ + 0.00016124852118082345, + 8.686849469086155e-06, + 3.9795741031412035e-06, + 4.044950401294045e-06, + 3.958904471801361e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3955078125, + "loss_eval": 1.7077192068099976, + "epoch": 76 + }, + { + "hidden_norms": [ + 5399.38623046875, + 60673.9140625, + 495671.34375, + 887343.3125, + 414498.4375 + ], + "bp_grad_norms_per_sample_med": [ + 2.782978071991238e-06, + 2.1490254198397452e-07, + 1.1598574900517633e-07, + 1.167711403127214e-07, + 1.1515145814655625e-07 + ], + "bp_grad_norms_F": [ + 0.00016076312749646604, + 8.698333658685442e-06, + 3.980411747761536e-06, + 4.046264621138107e-06, + 3.960503818234429e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3896484375, + "loss_eval": 1.7069586515426636, + "epoch": 77 + }, + { + "hidden_norms": [ + 5401.99755859375, + 60780.171875, + 498870.40625, + 892185.3125, + 416521.0625 + ], + "bp_grad_norms_per_sample_med": [ + 2.731095946728601e-06, + 2.1313489639851468e-07, + 1.1489591145164013e-07, + 1.1583144754467867e-07, + 1.1378151754115606e-07 + ], + "bp_grad_norms_F": [ + 0.00016048294492065907, + 8.671476280142087e-06, + 3.968764303863281e-06, + 4.033439381601056e-06, + 3.948562607547501e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.388671875, + "loss_eval": 1.7046585083007812, + "epoch": 78 + }, + { + "hidden_norms": [ + 5396.2353515625, + 60906.8125, + 499556.1875, + 893389.6875, + 416091.625 + ], + "bp_grad_norms_per_sample_med": [ + 2.8349218155199196e-06, + 2.165559180866694e-07, + 1.1532758037446911e-07, + 1.1579567171793315e-07, + 1.1431712465537203e-07 + ], + "bp_grad_norms_F": [ + 0.00016091841098386794, + 8.715818694327027e-06, + 3.983707301813411e-06, + 4.049661583849229e-06, + 3.963775725424057e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.39453125, + "loss_eval": 1.7074486017227173, + "epoch": 79 + }, + { + "hidden_norms": [ + 5399.12646484375, + 60870.21484375, + 502091.5625, + 896890.0625, + 417516.5625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7684259293891955e-06, + 2.148178452898719e-07, + 1.1549953882195041e-07, + 1.1610666916794798e-07, + 1.1443260916621512e-07 + ], + "bp_grad_norms_F": [ + 0.00016129721188917756, + 8.707292181497905e-06, + 3.980841484008124e-06, + 4.045855348522309e-06, + 3.9603528421139345e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.390625, + "loss_eval": 1.706810474395752, + "epoch": 80 + }, + { + "hidden_norms": [ + 5394.28564453125, + 61078.3671875, + 504476.65625, + 900378.125, + 418670.8125 + ], + "bp_grad_norms_per_sample_med": [ + 2.764037617453141e-06, + 2.1426544094538258e-07, + 1.156425071258127e-07, + 1.1587813730784546e-07, + 1.145299108884501e-07 + ], + "bp_grad_norms_F": [ + 0.00016113216406665742, + 8.712745511729736e-06, + 3.979288521804847e-06, + 4.0438499127049e-06, + 3.9589867810718715e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3896484375, + "loss_eval": 1.7053430080413818, + "epoch": 81 + }, + { + "hidden_norms": [ + 5396.7236328125, + 61213.38671875, + 505729.4375, + 902413.125, + 419251.0625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7847922865475994e-06, + 2.1385373827342846e-07, + 1.1590607584821555e-07, + 1.167506624710768e-07, + 1.1480997130774995e-07 + ], + "bp_grad_norms_F": [ + 0.0001612855412531644, + 8.721244739717804e-06, + 3.984357590525178e-06, + 4.048785740451422e-06, + 3.963945800933288e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.390625, + "loss_eval": 1.708754062652588, + "epoch": 82 + }, + { + "hidden_norms": [ + 5401.74169921875, + 61391.25, + 507562.5, + 904882.1875, + 420061.125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7846790544572286e-06, + 2.140303649866837e-07, + 1.1582537240428792e-07, + 1.1669516197798657e-07, + 1.1512172903849205e-07 + ], + "bp_grad_norms_F": [ + 0.00016096761100925505, + 8.707896085979883e-06, + 3.9824740269978065e-06, + 4.0467593862558715e-06, + 3.962396021961467e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7056825160980225, + "epoch": 83 + }, + { + "hidden_norms": [ + 5407.85205078125, + 61435.578125, + 508690.6875, + 906681.875, + 420568.9375 + ], + "bp_grad_norms_per_sample_med": [ + 2.766970737866359e-06, + 2.144422381888944e-07, + 1.157119697836606e-07, + 1.1730713112001467e-07, + 1.1475398054017205e-07 + ], + "bp_grad_norms_F": [ + 0.00016140809748321772, + 8.720307960174978e-06, + 3.985259354521986e-06, + 4.050050392834237e-06, + 3.965534688177286e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.390625, + "loss_eval": 1.7068425416946411, + "epoch": 84 + }, + { + "hidden_norms": [ + 5412.962890625, + 61492.68359375, + 510179.25, + 908609.25, + 421252.96875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7769999633164844e-06, + 2.1622201984428102e-07, + 1.1603597727116721e-07, + 1.1669756361243344e-07, + 1.1481289163839392e-07 + ], + "bp_grad_norms_F": [ + 0.00016168547153938562, + 8.720241567061748e-06, + 3.984777777077397e-06, + 4.049422386742663e-06, + 3.9649389691476244e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.38671875, + "loss_eval": 1.7068109512329102, + "epoch": 85 + }, + { + "hidden_norms": [ + 5414.86083984375, + 61660.16015625, + 511083.3125, + 910132.875, + 421357.09375 + ], + "bp_grad_norms_per_sample_med": [ + 2.7625901566352695e-06, + 2.1562310337230883e-07, + 1.1591524184950686e-07, + 1.168542453910959e-07, + 1.1494233120856734e-07 + ], + "bp_grad_norms_F": [ + 0.00016218819655478, + 8.743301805225201e-06, + 3.990852292190539e-06, + 4.055550562043209e-06, + 3.9708543226879556e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.384765625, + "loss_eval": 1.7097513675689697, + "epoch": 86 + }, + { + "hidden_norms": [ + 5414.11181640625, + 61679.67578125, + 512268.53125, + 911841.3125, + 422135.65625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7821745334222214e-06, + 2.1437830355353071e-07, + 1.1559337309563489e-07, + 1.1630524454631086e-07, + 1.143072410059176e-07 + ], + "bp_grad_norms_F": [ + 0.00016158135258592665, + 8.71670272317715e-06, + 3.983236638305243e-06, + 4.047654329042416e-06, + 3.9634205677430145e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3916015625, + "loss_eval": 1.7057619094848633, + "epoch": 87 + }, + { + "hidden_norms": [ + 5415.7666015625, + 61667.71875, + 513312.21875, + 913202.4375, + 422493.96875 + ], + "bp_grad_norms_per_sample_med": [ + 2.759925337159075e-06, + 2.1446679454584228e-07, + 1.1589692405777896e-07, + 1.1621393980476569e-07, + 1.1463799864941393e-07 + ], + "bp_grad_norms_F": [ + 0.000161813193699345, + 8.719586730876472e-06, + 3.9842125261202455e-06, + 4.0484619603375904e-06, + 3.964251391153084e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.390625, + "loss_eval": 1.7056890726089478, + "epoch": 88 + }, + { + "hidden_norms": [ + 5416.599609375, + 61688.796875, + 513735.6875, + 914162.125, + 422800.5625 + ], + "bp_grad_norms_per_sample_med": [ + 2.7784999474533834e-06, + 2.1510695091819798e-07, + 1.1558491763707934e-07, + 1.1671390609535592e-07, + 1.1512633335541977e-07 + ], + "bp_grad_norms_F": [ + 0.0001624061696929857, + 8.740545126784127e-06, + 3.989640845247777e-06, + 4.053715656482382e-06, + 3.969642875745194e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7097570896148682, + "epoch": 89 + }, + { + "hidden_norms": [ + 5416.76220703125, + 61798.24609375, + 514785.84375, + 915175.75, + 423199.09375 + ], + "bp_grad_norms_per_sample_med": [ + 2.777203462756006e-06, + 2.1360766311318002e-07, + 1.1558247337006833e-07, + 1.1610516992277553e-07, + 1.1466264027149009e-07 + ], + "bp_grad_norms_F": [ + 0.0001616168738109991, + 8.719413926883135e-06, + 3.9822580220061354e-06, + 4.046389676659601e-06, + 3.9626197576581035e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3916015625, + "loss_eval": 1.7034153938293457, + "epoch": 90 + }, + { + "hidden_norms": [ + 5416.92138671875, + 61928.12109375, + 515030.59375, + 915798.25, + 423164.4375 + ], + "bp_grad_norms_per_sample_med": [ + 2.810946853060159e-06, + 2.1559939966664388e-07, + 1.1640541686119832e-07, + 1.1669366983824148e-07, + 1.1499378160806373e-07 + ], + "bp_grad_norms_F": [ + 0.00016196168144233525, + 8.733930371818133e-06, + 3.986880528827896e-06, + 4.051325959153473e-06, + 3.9673618630331475e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3857421875, + "loss_eval": 1.7049140930175781, + "epoch": 91 + }, + { + "hidden_norms": [ + 5416.93212890625, + 61895.34765625, + 515480.125, + 916358.0, + 423425.4375 + ], + "bp_grad_norms_per_sample_med": [ + 2.8099400424252963e-06, + 2.1475410960647423e-07, + 1.1618925555012538e-07, + 1.1643356145896178e-07, + 1.1480153716547647e-07 + ], + "bp_grad_norms_F": [ + 0.00016178778605535626, + 8.72767577675404e-06, + 3.985679995821556e-06, + 4.050090865348466e-06, + 3.966247277276125e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7039738893508911, + "epoch": 92 + }, + { + "hidden_norms": [ + 5417.095703125, + 61845.4921875, + 515914.6875, + 916804.125, + 423511.625 + ], + "bp_grad_norms_per_sample_med": [ + 2.805000349326292e-06, + 2.15853873442029e-07, + 1.1573133917863743e-07, + 1.1623403395333298e-07, + 1.146071184621178e-07 + ], + "bp_grad_norms_F": [ + 0.00016200476966332644, + 8.730704394110944e-06, + 3.986714546044823e-06, + 4.050946245115483e-06, + 3.967099928559037e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3896484375, + "loss_eval": 1.7049956321716309, + "epoch": 93 + }, + { + "hidden_norms": [ + 5417.3349609375, + 61879.95703125, + 516017.53125, + 916914.5625, + 423434.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.7787407361756777e-06, + 2.167610944070475e-07, + 1.1583406234194626e-07, + 1.1677065714366108e-07, + 1.1465835569879346e-07 + ], + "bp_grad_norms_F": [ + 0.0001623090065550059, + 8.742457794141956e-06, + 3.991137873526895e-06, + 4.055534191138577e-06, + 3.971431851823581e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7075328826904297, + "epoch": 94 + }, + { + "hidden_norms": [ + 5417.50390625, + 61889.82421875, + 516312.4375, + 917429.0, + 423711.03125 + ], + "bp_grad_norms_per_sample_med": [ + 2.7708026664186036e-06, + 2.1539200645293022e-07, + 1.1580210923511913e-07, + 1.16502334890356e-07, + 1.1404062405517834e-07 + ], + "bp_grad_norms_F": [ + 0.00016205437714233994, + 8.73019962455146e-06, + 3.986566753155785e-06, + 4.050732059113216e-06, + 3.966889835282927e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.388671875, + "loss_eval": 1.7053842544555664, + "epoch": 95 + }, + { + "hidden_norms": [ + 5417.48828125, + 61898.47265625, + 516375.0, + 917465.6875, + 423663.46875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7983871859760256e-06, + 2.1556444096404448e-07, + 1.160928064791733e-07, + 1.1642453046079027e-07, + 1.1440795333328424e-07 + ], + "bp_grad_norms_F": [ + 0.00016201405378524214, + 8.732341484574135e-06, + 3.987765467172721e-06, + 4.052003077958943e-06, + 3.9681326597929e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7055914402008057, + "epoch": 96 + }, + { + "hidden_norms": [ + 5417.54931640625, + 61916.09375, + 516515.78125, + 917698.75, + 423749.71875 + ], + "bp_grad_norms_per_sample_med": [ + 2.7831354145746445e-06, + 2.1518340531656577e-07, + 1.1582258707676374e-07, + 1.1653285980628425e-07, + 1.1448688042037247e-07 + ], + "bp_grad_norms_F": [ + 0.00016204272105824202, + 8.731909474590793e-06, + 3.987126092397375e-06, + 4.051275027450174e-06, + 3.967459178966237e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3896484375, + "loss_eval": 1.7053790092468262, + "epoch": 97 + }, + { + "hidden_norms": [ + 5417.61865234375, + 61911.2734375, + 516535.4375, + 917715.875, + 423733.46875 + ], + "bp_grad_norms_per_sample_med": [ + 2.784623802654096e-06, + 2.1553401552409923e-07, + 1.157067259782707e-07, + 1.1653578724235558e-07, + 1.1444880243516309e-07 + ], + "bp_grad_norms_F": [ + 0.0001621013943804428, + 8.73380577104399e-06, + 3.987797754234634e-06, + 4.05199125452782e-06, + 3.968138116761111e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3876953125, + "loss_eval": 1.7057509422302246, + "epoch": 98 + }, + { + "hidden_norms": [ + 5417.64111328125, + 61917.359375, + 516576.09375, + 917756.125, + 423741.78125 + ], + "bp_grad_norms_per_sample_med": [ + 2.785410288197454e-06, + 2.1554964746428595e-07, + 1.1583354364574916e-07, + 1.1650187303757775e-07, + 1.145084596032575e-07 + ], + "bp_grad_norms_F": [ + 0.00016210223839152604, + 8.733919457881711e-06, + 3.987840045738267e-06, + 4.052033091284102e-06, + 3.968175860791234e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.388671875, + "loss_eval": 1.7057793140411377, + "epoch": 99 + }, + { + "hidden_norms": [ + 5417.64697265625, + 61917.6640625, + 516580.8125, + 917765.6875, + 423747.84375 + ], + "bp_grad_norms_per_sample_med": [ + 2.786067398119485e-06, + 2.1562047436418652e-07, + 1.1590604742650612e-07, + 1.1655521348075126e-07, + 1.1442210023915322e-07 + ], + "bp_grad_norms_F": [ + 0.00016209435125347227, + 8.73375483934069e-06, + 3.987807303929003e-06, + 4.0519980757380836e-06, + 3.968141299992567e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.388671875, + "loss_eval": 1.705754280090332, + "epoch": 100 + } + ], + "seed": 42, + "depth": 4, + "d_hidden": 256 +} \ No newline at end of file diff --git a/results/snapshot_evolution_v2/snapshot_fa_s42.json b/results/snapshot_evolution_v2/snapshot_fa_s42.json new file mode 100644 index 0000000..277acec --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_fa_s42.json @@ -0,0 +1,2734 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": NaN, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 1156.72998046875, + 7932.5859375, + 11656.220703125, + 13101.765625, + 12094.2197265625 + ], + "bp_grad_norms_per_sample_med": [ + 1.5287704400179791e-06, + 8.219874985115894e-07, + 8.303726986014226e-07, + 8.411634553340264e-07, + 8.074007382674608e-07 + ], + "bp_grad_norms_F": [ + 0.0005889489548280835, + 0.0001249020715476945, + 0.00010261647548759356, + 8.311456622323021e-05, + 6.362409476423636e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2431640625, + "loss_eval": 2.0429816246032715, + "epoch": 1 + }, + { + "hidden_norms": [ + 2267.652099609375, + 33227.19921875, + 62863.03515625, + 73248.0546875, + 64100.21875 + ], + "bp_grad_norms_per_sample_med": [ + 6.826750791333325e-07, + 1.582481274908787e-07, + 1.5909284911685972e-07, + 1.6235998145930353e-07, + 1.57003455569793e-07 + ], + "bp_grad_norms_F": [ + 9.194230369757861e-05, + 3.062757241423242e-05, + 2.5034905775100924e-05, + 1.2339382010395639e-05, + 1.1088715837104246e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.234375, + "loss_eval": 2.053070068359375, + "epoch": 2 + }, + { + "hidden_norms": [ + 3317.195556640625, + 69574.59375, + 208893.703125, + 272473.75, + 236858.453125 + ], + "bp_grad_norms_per_sample_med": [ + 5.585509370575892e-07, + 5.853191709093153e-08, + 5.772180244889569e-08, + 5.9099026117337417e-08, + 5.743537911939711e-08 + ], + "bp_grad_norms_F": [ + 5.4304215154843405e-05, + 1.798659286578186e-05, + 6.792580734327203e-06, + 5.748081548517803e-06, + 5.4292308959702495e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2529296875, + "loss_eval": 2.109177350997925, + "epoch": 3 + }, + { + "hidden_norms": [ + 4279.80322265625, + 131147.296875, + 524522.6875, + 669556.125, + 582199.5 + ], + "bp_grad_norms_per_sample_med": [ + 4.5417544924930553e-07, + 2.7819011094720736e-08, + 2.7284025705398562e-08, + 2.7924896173203706e-08, + 2.717020919362767e-08 + ], + "bp_grad_norms_F": [ + 2.7083517124992795e-05, + 3.1135298286244506e-06, + 2.188051212215214e-06, + 1.643483983571059e-06, + 1.5356297353719128e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2314453125, + "loss_eval": 2.1304922103881836, + "epoch": 4 + }, + { + "hidden_norms": [ + 5095.1298828125, + 222828.6875, + 891649.1875, + 1124229.75, + 978070.3125 + ], + "bp_grad_norms_per_sample_med": [ + 3.9661114215050475e-07, + 1.7936926610673254e-08, + 1.787710601774961e-08, + 1.8164961090860743e-08, + 1.7773361449258118e-08 + ], + "bp_grad_norms_F": [ + 2.5229386665159836e-05, + 1.7291312133238534e-06, + 8.046768016356509e-07, + 6.81868698393373e-07, + 6.581432785424113e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2275390625, + "loss_eval": 2.1189823150634766, + "epoch": 5 + }, + { + "hidden_norms": [ + 5762.8369140625, + 345252.125, + 1352057.25, + 1685390.25, + 1472510.375 + ], + "bp_grad_norms_per_sample_med": [ + 3.5811123666462663e-07, + 1.2679316263586315e-08, + 1.2558022177699968e-08, + 1.2735733356805667e-08, + 1.2553626582700872e-08 + ], + "bp_grad_norms_F": [ + 1.9819366571027786e-05, + 7.985001957422355e-07, + 4.666244706186262e-07, + 4.659337093926297e-07, + 4.531105162186577e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2314453125, + "loss_eval": 2.1147799491882324, + "epoch": 6 + }, + { + "hidden_norms": [ + 6342.46337890625, + 489436.21875, + 1846600.125, + 2298539.25, + 2010095.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.2295056939801725e-07, + 9.47152134500584e-09, + 9.449903082270339e-09, + 9.579181003971371e-09, + 9.398083200551355e-09 + ], + "bp_grad_norms_F": [ + 1.761323437676765e-05, + 3.5219920846429886e-07, + 3.464733993041591e-07, + 3.515923765462503e-07, + 3.4331398524045653e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.263671875, + "loss_eval": 2.0468926429748535, + "epoch": 7 + }, + { + "hidden_norms": [ + 6895.3232421875, + 642604.125, + 2340199.25, + 2912852.0, + 2551695.75 + ], + "bp_grad_norms_per_sample_med": [ + 3.2115181625158584e-07, + 8.011411978259275e-09, + 8.093356207439228e-09, + 8.185297772911326e-09, + 8.036058929405954e-09 + ], + "bp_grad_norms_F": [ + 1.6510130080860108e-05, + 2.8924068828928284e-07, + 2.88436524442659e-07, + 2.9188095140852965e-07, + 2.860562631212815e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2373046875, + "loss_eval": 2.0705394744873047, + "epoch": 8 + }, + { + "hidden_norms": [ + 7418.32666015625, + 802952.8125, + 2905706.5, + 3629847.25, + 3176127.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9990744110364176e-07, + 6.746414982217175e-09, + 6.801009533319302e-09, + 6.844500521907548e-09, + 6.780156436292373e-09 + ], + "bp_grad_norms_F": [ + 1.5715995687060058e-05, + 2.419061502223485e-07, + 2.416737459043361e-07, + 2.441595654545381e-07, + 2.39673738633428e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.271484375, + "loss_eval": 2.03157901763916, + "epoch": 9 + }, + { + "hidden_norms": [ + 8026.80126953125, + 964342.4375, + 3455197.75, + 4322591.0, + 3777789.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.9810524893036927e-07, + 5.931947377746383e-09, + 5.9767870652649435e-09, + 6.012730313642578e-09, + 5.922320855944463e-09 + ], + "bp_grad_norms_F": [ + 1.546428757137619e-05, + 2.1311132059054216e-07, + 2.1318879817044945e-07, + 2.1529912430651166e-07, + 2.115393868962201e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2421875, + "loss_eval": 2.029039144515991, + "epoch": 10 + }, + { + "hidden_norms": [ + 8568.4677734375, + 1146051.75, + 4149878.75, + 5211595.5, + 4551772.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.77834743656058e-07, + 5.156825633179096e-09, + 5.185044393840599e-09, + 5.243859568793141e-09, + 5.148059312176656e-09 + ], + "bp_grad_norms_F": [ + 1.4489689419860952e-05, + 1.8374593935277517e-07, + 1.8364994502917398e-07, + 1.8539546431384224e-07, + 1.8235705567803961e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.279296875, + "loss_eval": 2.015061855316162, + "epoch": 11 + }, + { + "hidden_norms": [ + 9099.6689453125, + 1306440.25, + 4712579.5, + 5930700.5, + 5167806.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.789404618397384e-07, + 4.740023484828271e-09, + 4.688871069191691e-09, + 4.722021884617789e-09, + 4.664129082954105e-09 + ], + "bp_grad_norms_F": [ + 1.440922096662689e-05, + 1.6886964715467911e-07, + 1.6845007166921278e-07, + 1.6997903173887607e-07, + 1.673002003599322e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.279296875, + "loss_eval": 2.0080716609954834, + "epoch": 12 + }, + { + "hidden_norms": [ + 9619.3310546875, + 1468314.25, + 5278606.0, + 6647205.0, + 5776389.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.678217470020172e-07, + 4.431488953571261e-09, + 4.461886859985498e-09, + 4.481298443437254e-09, + 4.434627776106481e-09 + ], + "bp_grad_norms_F": [ + 1.4280021787271835e-05, + 1.5716064183379785e-07, + 1.5650925888621714e-07, + 1.5793726504398364e-07, + 1.5547414022876183e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.294921875, + "loss_eval": 2.003105401992798, + "epoch": 13 + }, + { + "hidden_norms": [ + 10185.365234375, + 1637280.875, + 5941891.0, + 7477497.0, + 6482495.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.580181046596408e-07, + 4.108497098087582e-09, + 4.027958855346014e-09, + 4.0670666834330405e-09, + 4.01310229491969e-09 + ], + "bp_grad_norms_F": [ + 1.3607143955596257e-05, + 1.4447114438098652e-07, + 1.4335948606003512e-07, + 1.4459322983384482e-07, + 1.424295135166176e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2841796875, + "loss_eval": 1.9895731210708618, + "epoch": 14 + }, + { + "hidden_norms": [ + 10773.4443359375, + 1777185.125, + 6485962.5, + 8158632.5, + 7057802.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.536919225804013e-07, + 3.8119583045670424e-09, + 3.815232130222057e-09, + 3.836773565524254e-09, + 3.790971536687948e-09 + ], + "bp_grad_norms_F": [ + 1.3741724615101703e-05, + 1.3785883368200302e-07, + 1.3661090747518756e-07, + 1.3781669849777245e-07, + 1.3573732360327995e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.263671875, + "loss_eval": 2.0124382972717285, + "epoch": 15 + }, + { + "hidden_norms": [ + 11403.58984375, + 1931677.0, + 7089585.5, + 8906384.0, + 7683122.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.446777500608732e-07, + 3.674859083702131e-09, + 3.648833679648078e-09, + 3.6761997890266684e-09, + 3.624884392650074e-09 + ], + "bp_grad_norms_F": [ + 1.3561247214965988e-05, + 1.2985380237751087e-07, + 1.2829688955662277e-07, + 1.294151275033073e-07, + 1.2746555455578346e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.26953125, + "loss_eval": 2.0030646324157715, + "epoch": 16 + }, + { + "hidden_norms": [ + 12115.1162109375, + 2091857.0, + 7735447.5, + 9727085.0, + 8371443.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.378987460360804e-07, + 3.4695852857424825e-09, + 3.42812689346772e-09, + 3.4526042025362358e-09, + 3.40047856539627e-09 + ], + "bp_grad_norms_F": [ + 1.3279566701385193e-05, + 1.2257437731477694e-07, + 1.2078584177288576e-07, + 1.2181956776657898e-07, + 1.1999593141354126e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2939453125, + "loss_eval": 1.9935777187347412, + "epoch": 17 + }, + { + "hidden_norms": [ + 12755.7646484375, + 2248501.0, + 8338276.5, + 10490721.0, + 8991669.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.3127104498144035e-07, + 3.35100103221464e-09, + 3.3095433060736923e-09, + 3.326423581029303e-09, + 3.2682878625678313e-09 + ], + "bp_grad_norms_F": [ + 1.3015700460528024e-05, + 1.1814677947086238e-07, + 1.1589928305966168e-07, + 1.1685516199122503e-07, + 1.1511789210771894e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2900390625, + "loss_eval": 1.9912320375442505, + "epoch": 18 + }, + { + "hidden_norms": [ + 13395.4189453125, + 2393670.0, + 8949124.0, + 11235038.0, + 9603954.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.2520477216403378e-07, + 3.2867890631393948e-09, + 3.2246825210080488e-09, + 3.250592239822936e-09, + 3.201830800492189e-09 + ], + "bp_grad_norms_F": [ + 1.3049841072643176e-05, + 1.1301781910333375e-07, + 1.1090982354744483e-07, + 1.1187000836798688e-07, + 1.101881252907333e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2626953125, + "loss_eval": 2.0112197399139404, + "epoch": 19 + }, + { + "hidden_norms": [ + 14034.6982421875, + 2529761.5, + 9576616.0, + 12035853.0, + 10258897.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.1533313088184514e-07, + 3.174721152632287e-09, + 3.1246687459685063e-09, + 3.149874805430386e-09, + 3.09314329705046e-09 + ], + "bp_grad_norms_F": [ + 1.26855793496361e-05, + 1.0948959072720754e-07, + 1.0680034279175743e-07, + 1.0768705749342189e-07, + 1.0610038714276016e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.25, + "loss_eval": 2.0056447982788086, + "epoch": 20 + }, + { + "hidden_norms": [ + 14717.9462890625, + 2650771.25, + 10157696.0, + 12784758.0, + 10849881.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.086567434389508e-07, + 2.999795301050767e-09, + 2.966421552841325e-09, + 2.9786708655166194e-09, + 2.947827537624903e-09 + ], + "bp_grad_norms_F": [ + 1.2321271242399234e-05, + 1.0535904237940485e-07, + 1.0280631101977633e-07, + 1.0365675251478024e-07, + 1.021143916091205e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.294921875, + "loss_eval": 1.9869788885116577, + "epoch": 21 + }, + { + "hidden_norms": [ + 15327.8466796875, + 2777500.75, + 10776735.0, + 13573723.0, + 11474654.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.0232576503076416e-07, + 2.9384910060770153e-09, + 2.867603710043909e-09, + 2.8935454032819052e-09, + 2.8441446975335793e-09 + ], + "bp_grad_norms_F": [ + 1.231426631420618e-05, + 1.0333050681765599e-07, + 1.0039466502576033e-07, + 1.0124550442469626e-07, + 9.972216474807283e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2939453125, + "loss_eval": 1.9892809391021729, + "epoch": 22 + }, + { + "hidden_norms": [ + 15945.8837890625, + 2878910.75, + 11304857.0, + 14241028.0, + 11994238.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.0171727044271393e-07, + 2.9479860774728195e-09, + 2.8580404709543927e-09, + 2.8716116151628057e-09, + 2.8270419338838337e-09 + ], + "bp_grad_norms_F": [ + 1.2025901924062055e-05, + 1.0096052704966496e-07, + 9.789676624905042e-08, + 9.872773176766714e-08, + 9.722123195388122e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2802734375, + "loss_eval": 1.9858973026275635, + "epoch": 23 + }, + { + "hidden_norms": [ + 16595.853515625, + 3002464.5, + 11949546.0, + 15061732.0, + 12646630.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.9120048477816454e-07, + 2.8694004949869623e-09, + 2.772703400211185e-09, + 2.777924779095997e-09, + 2.7492945697815685e-09 + ], + "bp_grad_norms_F": [ + 1.2024025636492297e-05, + 9.894926478182242e-08, + 9.581360416177631e-08, + 9.663772715384766e-08, + 9.51538083882042e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.296875, + "loss_eval": 1.9969089031219482, + "epoch": 24 + }, + { + "hidden_norms": [ + 17227.1640625, + 3125553.25, + 12574712.0, + 15844785.0, + 13247150.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8941717883080855e-07, + 2.8377846739147117e-09, + 2.7375035571708395e-09, + 2.7606503749666444e-09, + 2.7206534802814986e-09 + ], + "bp_grad_norms_F": [ + 1.153391167463269e-05, + 9.671435208247203e-08, + 9.34372863525823e-08, + 9.424089597587226e-08, + 9.280081059159784e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.294921875, + "loss_eval": 1.9766383171081543, + "epoch": 25 + }, + { + "hidden_norms": [ + 17808.20703125, + 3256055.25, + 13319775.0, + 16758460.0, + 13956453.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8628608700055338e-07, + 2.7554525328099544e-09, + 2.625358597185823e-09, + 2.6348250248275917e-09, + 2.614828797931068e-09 + ], + "bp_grad_norms_F": [ + 1.0964491593767889e-05, + 9.419229485274627e-08, + 9.09606185928169e-08, + 9.175563775443152e-08, + 9.03681396380307e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2919921875, + "loss_eval": 1.9645390510559082, + "epoch": 26 + }, + { + "hidden_norms": [ + 18401.28125, + 3393640.75, + 14088409.0, + 17726368.0, + 14707189.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7694672749257734e-07, + 2.722393421805691e-09, + 2.634128470901942e-09, + 2.6627771099185793e-09, + 2.6215960513553682e-09 + ], + "bp_grad_norms_F": [ + 1.1054430615331512e-05, + 9.26544814205954e-08, + 8.924564554035896e-08, + 9.002578593708677e-08, + 8.865336553753878e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2861328125, + "loss_eval": 1.974367618560791, + "epoch": 27 + }, + { + "hidden_norms": [ + 18936.51953125, + 3515726.25, + 14734875.0, + 18530786.0, + 15301454.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7923295558830432e-07, + 2.6605673220103654e-09, + 2.530292642077825e-09, + 2.5396913461150916e-09, + 2.517351882502794e-09 + ], + "bp_grad_norms_F": [ + 1.1157896551594604e-05, + 9.233546904852119e-08, + 8.888883229474231e-08, + 8.968125086994405e-08, + 8.831575115664236e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2841796875, + "loss_eval": 1.986099362373352, + "epoch": 28 + }, + { + "hidden_norms": [ + 19457.962890625, + 3664789.5, + 15342228.0, + 19308666.0, + 15894652.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7488744674665213e-07, + 2.6636790551037848e-09, + 2.4992619085395518e-09, + 2.507181573463413e-09, + 2.486318262384657e-09 + ], + "bp_grad_norms_F": [ + 1.092042657546699e-05, + 9.157383118463258e-08, + 8.810303597783786e-08, + 8.888122238204232e-08, + 8.75455583582152e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9868172407150269, + "epoch": 29 + }, + { + "hidden_norms": [ + 19933.78515625, + 3775119.25, + 16017107.0, + 20154288.0, + 16541561.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.715164188453855e-07, + 2.5937807457410145e-09, + 2.4676627408126706e-09, + 2.4873916260048645e-09, + 2.4605657511500567e-09 + ], + "bp_grad_norms_F": [ + 1.0760413715615869e-05, + 9.029215419786851e-08, + 8.696353148707203e-08, + 8.772182269467521e-08, + 8.64171596504093e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.291015625, + "loss_eval": 1.9754526615142822, + "epoch": 30 + }, + { + "hidden_norms": [ + 20432.466796875, + 3910461.25, + 16712518.0, + 21021696.0, + 17196572.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.710603356741558e-07, + 2.6387678708772455e-09, + 2.524718212271182e-09, + 2.5378650292395832e-09, + 2.5052109275947032e-09 + ], + "bp_grad_norms_F": [ + 1.0587626093183644e-05, + 8.93876332952459e-08, + 8.59824282883892e-08, + 8.675493745613494e-08, + 8.546451368829366e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3076171875, + "loss_eval": 1.9657469987869263, + "epoch": 31 + }, + { + "hidden_norms": [ + 20875.439453125, + 4054334.0, + 17463474.0, + 21948092.0, + 17887228.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.729485461510194e-07, + 2.6252673368531987e-09, + 2.4720219204965588e-09, + 2.491059358789016e-09, + 2.4621127359125694e-09 + ], + "bp_grad_norms_F": [ + 1.0830392966454383e-05, + 8.912193294463577e-08, + 8.547249308321625e-08, + 8.626851411008829e-08, + 8.495522507701025e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.31640625, + "loss_eval": 1.9752991199493408, + "epoch": 32 + }, + { + "hidden_norms": [ + 21372.0234375, + 4181554.25, + 18179600.0, + 22866024.0, + 18562826.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6644050049308134e-07, + 2.5652076018900516e-09, + 2.4415069965755265e-09, + 2.4562532008332028e-09, + 2.423905742787724e-09 + ], + "bp_grad_norms_F": [ + 1.0476498573552817e-05, + 8.780278903941507e-08, + 8.420673225373321e-08, + 8.501019266304866e-08, + 8.373319104748589e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.9647243022918701, + "epoch": 33 + }, + { + "hidden_norms": [ + 21698.390625, + 4323451.5, + 18873394.0, + 23742746.0, + 19211736.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6982900774564769e-07, + 2.6139097553112833e-09, + 2.4535891096633122e-09, + 2.465766257842006e-09, + 2.4349082750063644e-09 + ], + "bp_grad_norms_F": [ + 1.0547244528424926e-05, + 8.761546865798664e-08, + 8.380350635661671e-08, + 8.460440881208342e-08, + 8.332586531878405e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.9688763618469238, + "epoch": 34 + }, + { + "hidden_norms": [ + 22000.6484375, + 4419910.5, + 19288578.0, + 24275390.0, + 19571482.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6632812105399353e-07, + 2.5976403250638214e-09, + 2.4608304283191273e-09, + 2.4786184216196716e-09, + 2.4511619400868767e-09 + ], + "bp_grad_norms_F": [ + 1.0402384759800043e-05, + 8.75945431744185e-08, + 8.378519567031617e-08, + 8.458554390244899e-08, + 8.331597456390227e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.962469458580017, + "epoch": 35 + }, + { + "hidden_norms": [ + 22332.140625, + 4505425.5, + 19876824.0, + 24999434.0, + 20098762.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.673159886195208e-07, + 2.5706452522200607e-09, + 2.4236175288905315e-09, + 2.4205843995872556e-09, + 2.4001298726261666e-09 + ], + "bp_grad_norms_F": [ + 1.0201652912655845e-05, + 8.668673245892933e-08, + 8.301810083821692e-08, + 8.384706973174616e-08, + 8.257533323785538e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3046875, + "loss_eval": 1.9482183456420898, + "epoch": 36 + }, + { + "hidden_norms": [ + 22704.90625, + 4601120.5, + 20416742.0, + 25650594.0, + 20558608.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6260217705621471e-07, + 2.501829188261695e-09, + 2.37497355115579e-09, + 2.379827890308661e-09, + 2.364261231235787e-09 + ], + "bp_grad_norms_F": [ + 1.0307686352462042e-05, + 8.687224806180893e-08, + 8.317324073914278e-08, + 8.40014422465174e-08, + 8.273995177887628e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.306640625, + "loss_eval": 1.9718880653381348, + "epoch": 37 + }, + { + "hidden_norms": [ + 22953.462890625, + 4708118.5, + 21018216.0, + 26396430.0, + 21081344.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6642815126033383e-07, + 2.5344910614677474e-09, + 2.3881991939589398e-09, + 2.393568676595237e-09, + 2.366601137282487e-09 + ], + "bp_grad_norms_F": [ + 1.0291260878148023e-05, + 8.597661604881068e-08, + 8.222435354809932e-08, + 8.30701907261755e-08, + 8.179645050176987e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3173828125, + "loss_eval": 1.9656648635864258, + "epoch": 38 + }, + { + "hidden_norms": [ + 23329.68359375, + 4813138.0, + 21547542.0, + 27050624.0, + 21536360.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6755477361130033e-07, + 2.5133575221047977e-09, + 2.3339741250794077e-09, + 2.3630628565030065e-09, + 2.3331871989995534e-09 + ], + "bp_grad_norms_F": [ + 1.0207740160694811e-05, + 8.593145395252577e-08, + 8.217772773377874e-08, + 8.303662468733819e-08, + 8.176558452532845e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3076171875, + "loss_eval": 1.9581431150436401, + "epoch": 39 + }, + { + "hidden_norms": [ + 23598.361328125, + 4903029.0, + 22069792.0, + 27713646.0, + 21984984.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6272531411232194e-07, + 2.4648321161890863e-09, + 2.360529327560812e-09, + 2.364856310776986e-09, + 2.3259458803437383e-09 + ], + "bp_grad_norms_F": [ + 1.0116659723280463e-05, + 8.537404028174933e-08, + 8.159113207284463e-08, + 8.246142613188567e-08, + 8.120937167177544e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3212890625, + "loss_eval": 1.9615185260772705, + "epoch": 40 + }, + { + "hidden_norms": [ + 23904.275390625, + 5004298.0, + 22611816.0, + 28369744.0, + 22444866.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6563248550482967e-07, + 2.5165425299178423e-09, + 2.3475779098447447e-09, + 2.3561286255358027e-09, + 2.3397561665916555e-09 + ], + "bp_grad_norms_F": [ + 1.0093037417391315e-05, + 8.496893855181042e-08, + 8.129408968216012e-08, + 8.217033098389948e-08, + 8.091691228173659e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3056640625, + "loss_eval": 1.9596519470214844, + "epoch": 41 + }, + { + "hidden_norms": [ + 24124.95703125, + 5079679.0, + 23056108.0, + 28905466.0, + 22810520.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.650763863381144e-07, + 2.5150639348936465e-09, + 2.375127650111608e-09, + 2.3864086262648243e-09, + 2.3595001508169844e-09 + ], + "bp_grad_norms_F": [ + 1.0080430001835339e-05, + 8.473855928059493e-08, + 8.099364379177132e-08, + 8.18785963474511e-08, + 8.06336757364079e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3251953125, + "loss_eval": 1.9462497234344482, + "epoch": 42 + }, + { + "hidden_norms": [ + 24350.154296875, + 5170977.5, + 23526890.0, + 29466298.0, + 23191828.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6226854882006592e-07, + 2.5123039204544284e-09, + 2.381558061870237e-09, + 2.391710607341224e-09, + 2.3734676446451886e-09 + ], + "bp_grad_norms_F": [ + 1.0192407899012323e-05, + 8.457134015316115e-08, + 8.096912296196024e-08, + 8.18817795789073e-08, + 8.06216249316094e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.950229287147522, + "epoch": 43 + }, + { + "hidden_norms": [ + 24543.87890625, + 5230886.0, + 23931748.0, + 29937192.0, + 23499106.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6538373870389478e-07, + 2.4975805867910594e-09, + 2.3630661871720804e-09, + 2.3725827968945623e-09, + 2.3566677498365607e-09 + ], + "bp_grad_norms_F": [ + 1.0082419976242818e-05, + 8.452050792584487e-08, + 8.1015215869229e-08, + 8.194035672204336e-08, + 8.06845363854336e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.30078125, + "loss_eval": 1.9453504085540771, + "epoch": 44 + }, + { + "hidden_norms": [ + 24711.091796875, + 5298309.0, + 24318082.0, + 30413608.0, + 23808788.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6054062257353507e-07, + 2.4891384509118097e-09, + 2.358970574434238e-09, + 2.368707230360201e-09, + 2.3476884880579973e-09 + ], + "bp_grad_norms_F": [ + 1.0053097867057659e-05, + 8.462841805112475e-08, + 8.112137095395155e-08, + 8.206667700960679e-08, + 8.080490943029872e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3076171875, + "loss_eval": 1.9472556114196777, + "epoch": 45 + }, + { + "hidden_norms": [ + 24881.759765625, + 5378830.0, + 24836314.0, + 31031698.0, + 24231208.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.623594982902432e-07, + 2.4946655852176036e-09, + 2.3718913499948258e-09, + 2.3750907907071905e-09, + 2.3478305966051494e-09 + ], + "bp_grad_norms_F": [ + 1.012617394735571e-05, + 8.473565316080567e-08, + 8.116323613194254e-08, + 8.212452939915238e-08, + 8.085635272436775e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3125, + "loss_eval": 1.9553910493850708, + "epoch": 46 + }, + { + "hidden_norms": [ + 25032.86328125, + 5446721.0, + 25258438.0, + 31534450.0, + 24555236.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.632960788811033e-07, + 2.470913029739563e-09, + 2.316862923734675e-09, + 2.3169177687520914e-09, + 2.3029997908707855e-09 + ], + "bp_grad_norms_F": [ + 9.900480108626653e-06, + 8.452943944803337e-08, + 8.106712812150363e-08, + 8.2038923210348e-08, + 8.077390845073751e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.9489891529083252, + "epoch": 47 + }, + { + "hidden_norms": [ + 25306.201171875, + 5468743.5, + 25525060.0, + 31867246.0, + 24722362.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5847486167785974e-07, + 2.4746471538605874e-09, + 2.3425053008452323e-09, + 2.3598758502885175e-09, + 2.3311046426499615e-09 + ], + "bp_grad_norms_F": [ + 9.7980091595673e-06, + 8.43976621922593e-08, + 8.096849057892541e-08, + 8.195242884312393e-08, + 8.069165602364592e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3134765625, + "loss_eval": 1.9313395023345947, + "epoch": 48 + }, + { + "hidden_norms": [ + 25419.810546875, + 5521521.5, + 25869234.0, + 32269302.0, + 24978000.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6377224199004559e-07, + 2.4982107493798367e-09, + 2.3510355884326373e-09, + 2.359785478134313e-09, + 2.3393140757832498e-09 + ], + "bp_grad_norms_F": [ + 1.003210672934074e-05, + 8.464159151344575e-08, + 8.12287339613249e-08, + 8.224073155815859e-08, + 8.095251047279817e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3095703125, + "loss_eval": 1.94147527217865, + "epoch": 49 + }, + { + "hidden_norms": [ + 25543.001953125, + 5573999.0, + 26298990.0, + 32786014.0, + 25316304.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.593823384382631e-07, + 2.512666297249666e-09, + 2.392667397543846e-09, + 2.4054993552624637e-09, + 2.386617126148849e-09 + ], + "bp_grad_norms_F": [ + 1.0020607987826224e-05, + 8.429628906014841e-08, + 8.090298564411569e-08, + 8.193208600459911e-08, + 8.064517231787249e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9412651062011719, + "epoch": 50 + }, + { + "hidden_norms": [ + 25755.05859375, + 5633394.5, + 26712786.0, + 33270568.0, + 25632750.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.615333218296655e-07, + 2.483285133081381e-09, + 2.346244309947565e-09, + 2.3569415308344333e-09, + 2.342600557980745e-09 + ], + "bp_grad_norms_F": [ + 9.841775863606017e-06, + 8.406106388747503e-08, + 8.07588094176026e-08, + 8.180128219237304e-08, + 8.051125632846379e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3193359375, + "loss_eval": 1.9356749057769775, + "epoch": 51 + }, + { + "hidden_norms": [ + 25838.6875, + 5676516.5, + 26956640.0, + 33554564.0, + 25797852.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5953406773405732e-07, + 2.4927520048123597e-09, + 2.379676899977312e-09, + 2.3930151193951588e-09, + 2.37515118683973e-09 + ], + "bp_grad_norms_F": [ + 1.0000761903938837e-05, + 8.431718612200712e-08, + 8.108807492135384e-08, + 8.215462798943918e-08, + 8.085050495765245e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.322265625, + "loss_eval": 1.9513205289840698, + "epoch": 52 + }, + { + "hidden_norms": [ + 25925.244140625, + 5739893.0, + 27348932.0, + 34049508.0, + 26115016.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5941535025376652e-07, + 2.4419115618457e-09, + 2.335727167235291e-09, + 2.3481498967470316e-09, + 2.335213800108704e-09 + ], + "bp_grad_norms_F": [ + 9.962137482943945e-06, + 8.399173623274692e-08, + 8.08289613019042e-08, + 8.190350797576684e-08, + 8.060307266077871e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3173828125, + "loss_eval": 1.9443122148513794, + "epoch": 53 + }, + { + "hidden_norms": [ + 26078.8125, + 5808761.5, + 27799278.0, + 34615776.0, + 26499736.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5867621527831943e-07, + 2.4137036813698387e-09, + 2.31744068379669e-09, + 2.327602111051874e-09, + 2.313133462550354e-09 + ], + "bp_grad_norms_F": [ + 9.748204320203513e-06, + 8.347069524461403e-08, + 8.032785814293675e-08, + 8.14167648854891e-08, + 8.011366503524187e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.314453125, + "loss_eval": 1.9361423254013062, + "epoch": 54 + }, + { + "hidden_norms": [ + 26192.453125, + 5875144.0, + 28166196.0, + 35073324.0, + 26791154.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5812705100870517e-07, + 2.4364927853071094e-09, + 2.339390015038134e-09, + 2.3421220518571317e-09, + 2.328011117214146e-09 + ], + "bp_grad_norms_F": [ + 9.899279575620312e-06, + 8.359175751593284e-08, + 8.043829780035594e-08, + 8.154502495472116e-08, + 8.023434361348336e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.306640625, + "loss_eval": 1.940393090248108, + "epoch": 55 + }, + { + "hidden_norms": [ + 26281.6796875, + 5935011.0, + 28625862.0, + 35638648.0, + 27180628.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6062698193763936e-07, + 2.4364579243041362e-09, + 2.3309267849214166e-09, + 2.3373505353418977e-09, + 2.3235424695400297e-09 + ], + "bp_grad_norms_F": [ + 9.917155693983659e-06, + 8.292303022017222e-08, + 7.976373694873473e-08, + 8.087503999831824e-08, + 7.955991776498195e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.945765495300293, + "epoch": 56 + }, + { + "hidden_norms": [ + 26394.865234375, + 5988690.5, + 28944822.0, + 36062032.0, + 27426714.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6303006589168945e-07, + 2.4247555074907723e-09, + 2.309517688203755e-09, + 2.3198174492478074e-09, + 2.3075219512946887e-09 + ], + "bp_grad_norms_F": [ + 1.0007075616158545e-05, + 8.301859821813196e-08, + 7.986342609456187e-08, + 8.099387827087412e-08, + 7.966451676111319e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.9433667659759521, + "epoch": 57 + }, + { + "hidden_norms": [ + 26515.357421875, + 6051740.5, + 29293128.0, + 36499980.0, + 27690768.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5923862406452827e-07, + 2.3941215676615e-09, + 2.28924412759568e-09, + 2.2969097734915067e-09, + 2.280708066848547e-09 + ], + "bp_grad_norms_F": [ + 9.82554138317937e-06, + 8.282027863515395e-08, + 7.976368721074323e-08, + 8.090249536962801e-08, + 7.957222436516531e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.306640625, + "loss_eval": 1.944448709487915, + "epoch": 58 + }, + { + "hidden_norms": [ + 26621.947265625, + 6089471.5, + 29639332.0, + 36907412.0, + 27955134.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5679145803915162e-07, + 2.3988511177464034e-09, + 2.303158996852517e-09, + 2.3152970651807436e-09, + 2.2871571303539895e-09 + ], + "bp_grad_norms_F": [ + 9.731273166835308e-06, + 8.24191062065438e-08, + 7.936159107657659e-08, + 8.050036370832458e-08, + 7.917343225471996e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3125, + "loss_eval": 1.9350972175598145, + "epoch": 59 + }, + { + "hidden_norms": [ + 26731.64453125, + 6146909.5, + 30036422.0, + 37405476.0, + 28295768.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5779031059537374e-07, + 2.4025526013105036e-09, + 2.3019863792939077e-09, + 2.3154580475193143e-09, + 2.293559120403188e-09 + ], + "bp_grad_norms_F": [ + 9.80158438323997e-06, + 8.19560526110763e-08, + 7.889645559089331e-08, + 8.003749485396838e-08, + 7.871490481647925e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.328125, + "loss_eval": 1.941221833229065, + "epoch": 60 + }, + { + "hidden_norms": [ + 26842.380859375, + 6189510.0, + 30305302.0, + 37746040.0, + 28515236.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5621530735643319e-07, + 2.3939163984465495e-09, + 2.3025825690581314e-09, + 2.3148469807665606e-09, + 2.2962292067774115e-09 + ], + "bp_grad_norms_F": [ + 9.731598765938543e-06, + 8.167720011442725e-08, + 7.863504691840717e-08, + 7.977818938798009e-08, + 7.845925864558012e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3408203125, + "loss_eval": 1.9333854913711548, + "epoch": 61 + }, + { + "hidden_norms": [ + 26940.765625, + 6243737.5, + 30559802.0, + 38046748.0, + 28709922.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5672847553105385e-07, + 2.3640371882294176e-09, + 2.2657933307357325e-09, + 2.2837092217287136e-09, + 2.2615944672566e-09 + ], + "bp_grad_norms_F": [ + 9.668071470514406e-06, + 8.165712017671467e-08, + 7.869160612017367e-08, + 7.984421301898692e-08, + 7.851971872696595e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3203125, + "loss_eval": 1.9349033832550049, + "epoch": 62 + }, + { + "hidden_norms": [ + 27024.9140625, + 6285780.0, + 30783454.0, + 38328276.0, + 28883832.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5834399391678744e-07, + 2.3645019275875256e-09, + 2.2709001346044033e-09, + 2.2806179167389473e-09, + 2.2639952135250496e-09 + ], + "bp_grad_norms_F": [ + 9.799305189517327e-06, + 8.167254605950802e-08, + 7.873082097376027e-08, + 7.989201833424886e-08, + 7.856029071717785e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.31640625, + "loss_eval": 1.9409070014953613, + "epoch": 63 + }, + { + "hidden_norms": [ + 27131.298828125, + 6330564.0, + 31012118.0, + 38625700.0, + 29050708.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.588112752415327e-07, + 2.403508059245496e-09, + 2.2917150399592856e-09, + 2.3033945861783423e-09, + 2.2864310444958846e-09 + ], + "bp_grad_norms_F": [ + 9.54241204453865e-06, + 8.120213124129805e-08, + 7.823086889402475e-08, + 7.938096047155341e-08, + 7.805995494436502e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3388671875, + "loss_eval": 1.9211525917053223, + "epoch": 64 + }, + { + "hidden_norms": [ + 27208.25, + 6368866.0, + 31290472.0, + 38967492.0, + 29272872.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5740459957669373e-07, + 2.3837900542389434e-09, + 2.284773703564724e-09, + 2.298153001234482e-09, + 2.2881960770604337e-09 + ], + "bp_grad_norms_F": [ + 9.658318958827294e-06, + 8.104061777203242e-08, + 7.810449886846982e-08, + 7.925908818151584e-08, + 7.793548206791456e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.341796875, + "loss_eval": 1.9278589487075806, + "epoch": 65 + }, + { + "hidden_norms": [ + 27276.62890625, + 6418036.5, + 31545874.0, + 39283716.0, + 29477138.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5503043471198907e-07, + 2.357751327508595e-09, + 2.2688111389612686e-09, + 2.2810615618595875e-09, + 2.2629353946257424e-09 + ], + "bp_grad_norms_F": [ + 9.6196936283377e-06, + 8.082280089638516e-08, + 7.795324563630857e-08, + 7.91092062968346e-08, + 7.778949395742529e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33984375, + "loss_eval": 1.9305698871612549, + "epoch": 66 + }, + { + "hidden_norms": [ + 27340.607421875, + 6465153.0, + 31796498.0, + 39598816.0, + 29679376.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5558319432784629e-07, + 2.3627866330144798e-09, + 2.2779722552712656e-09, + 2.2912376440586968e-09, + 2.2693087409209056e-09 + ], + "bp_grad_norms_F": [ + 9.68782387644751e-06, + 8.066198375900058e-08, + 7.781451927257876e-08, + 7.897661191691441e-08, + 7.765357423750174e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3173828125, + "loss_eval": 1.9328408241271973, + "epoch": 67 + }, + { + "hidden_norms": [ + 27396.21484375, + 6507270.5, + 32041844.0, + 39890444.0, + 29881876.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5313091239477217e-07, + 2.336748128328736e-09, + 2.2449873071650472e-09, + 2.2587733905510277e-09, + 2.237245722014336e-09 + ], + "bp_grad_norms_F": [ + 9.509177289146464e-06, + 8.020302288969106e-08, + 7.739499352510393e-08, + 7.854830386122558e-08, + 7.723401296289012e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.9248214960098267, + "epoch": 68 + }, + { + "hidden_norms": [ + 27461.697265625, + 6534744.5, + 32295470.0, + 40216712.0, + 30089670.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5820302223801264e-07, + 2.3342023869332706e-09, + 2.2277899525136036e-09, + 2.237228180490547e-09, + 2.2202666372095337e-09 + ], + "bp_grad_norms_F": [ + 9.662662705522962e-06, + 8.017656227821135e-08, + 7.73198536307973e-08, + 7.847864225141166e-08, + 7.715301109101347e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9348523616790771, + "epoch": 69 + }, + { + "hidden_norms": [ + 27519.265625, + 6576646.0, + 32533798.0, + 40497036.0, + 30273994.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5546247311704064e-07, + 2.332068760324546e-09, + 2.2422437240265936e-09, + 2.259832765361125e-09, + 2.2382042885737974e-09 + ], + "bp_grad_norms_F": [ + 9.630303793528583e-06, + 7.993662620719988e-08, + 7.707911464649442e-08, + 7.823470582479786e-08, + 7.691809855714382e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3212890625, + "loss_eval": 1.9298650026321411, + "epoch": 70 + }, + { + "hidden_norms": [ + 27578.833984375, + 6611492.0, + 32783444.0, + 40806224.0, + 30475316.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5486573090583988e-07, + 2.310989177800593e-09, + 2.214788796806033e-09, + 2.2242498953772838e-09, + 2.209040284029129e-09 + ], + "bp_grad_norms_F": [ + 9.58504097070545e-06, + 7.973878268785484e-08, + 7.692549530702308e-08, + 7.808419866250915e-08, + 7.67675771840004e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.314453125, + "loss_eval": 1.9349405765533447, + "epoch": 71 + }, + { + "hidden_norms": [ + 27637.01953125, + 6652277.0, + 32940606.0, + 41021348.0, + 30603354.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5176895828972192e-07, + 2.309274771405967e-09, + 2.2196366966653613e-09, + 2.2291524182094236e-09, + 2.212444005778025e-09 + ], + "bp_grad_norms_F": [ + 9.506617061560974e-06, + 7.949277147645262e-08, + 7.665874335316403e-08, + 7.781166289078101e-08, + 7.6499844681166e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9272165298461914, + "epoch": 72 + }, + { + "hidden_norms": [ + 27665.341796875, + 6675607.5, + 33128100.0, + 41256448.0, + 30754874.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.570084151580886e-07, + 2.2943660304974856e-09, + 2.2026656054663363e-09, + 2.2121668941110784e-09, + 2.1966797270067673e-09 + ], + "bp_grad_norms_F": [ + 9.71559165918734e-06, + 7.9600532387758e-08, + 7.679192037812754e-08, + 7.795681966626944e-08, + 7.663498990950757e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.941681146621704, + "epoch": 73 + }, + { + "hidden_norms": [ + 27715.794921875, + 6709802.5, + 33331388.0, + 41504024.0, + 30915288.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5387240637210198e-07, + 2.3100528157016242e-09, + 2.2238448860179005e-09, + 2.2321375858780357e-09, + 2.2150188350167355e-09 + ], + "bp_grad_norms_F": [ + 9.473335921938997e-06, + 7.898351128687864e-08, + 7.616839781121598e-08, + 7.73214452465254e-08, + 7.601196472251104e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33203125, + "loss_eval": 1.9246938228607178, + "epoch": 74 + }, + { + "hidden_norms": [ + 27766.177734375, + 6726091.5, + 33455028.0, + 41663816.0, + 31007976.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5595279023727926e-07, + 2.298697898694968e-09, + 2.2091579676697393e-09, + 2.215150729512061e-09, + 2.1983310727335947e-09 + ], + "bp_grad_norms_F": [ + 9.587340173311532e-06, + 7.91313112813441e-08, + 7.627861009495973e-08, + 7.743443575236597e-08, + 7.611913588334573e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3232421875, + "loss_eval": 1.931347370147705, + "epoch": 75 + }, + { + "hidden_norms": [ + 27818.396484375, + 6749941.5, + 33562528.0, + 41806788.0, + 31089946.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.542799026310604e-07, + 2.3069177679246877e-09, + 2.2149184708553094e-09, + 2.2274431188407107e-09, + 2.2138819666395193e-09 + ], + "bp_grad_norms_F": [ + 9.57066185947042e-06, + 7.899650000808833e-08, + 7.612889874053508e-08, + 7.72842909668725e-08, + 7.59681810791335e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.328125, + "loss_eval": 1.9290614128112793, + "epoch": 76 + }, + { + "hidden_norms": [ + 27874.181640625, + 6776020.5, + 33686440.0, + 41956108.0, + 31183962.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5547591658560123e-07, + 2.2904955709890373e-09, + 2.199639581590418e-09, + 2.2111712461025945e-09, + 2.1966135577144996e-09 + ], + "bp_grad_norms_F": [ + 9.538461199554149e-06, + 7.882318442398173e-08, + 7.600280582664709e-08, + 7.715882333059199e-08, + 7.58423581714851e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3369140625, + "loss_eval": 1.9268429279327393, + "epoch": 77 + }, + { + "hidden_norms": [ + 27928.552734375, + 6790532.0, + 33797660.0, + 42095308.0, + 31270040.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5469180425498053e-07, + 2.3010513494625684e-09, + 2.2103030516973377e-09, + 2.2237711672090654e-09, + 2.206205884647261e-09 + ], + "bp_grad_norms_F": [ + 9.510661584499758e-06, + 7.866238149745186e-08, + 7.584375794067455e-08, + 7.699873805222524e-08, + 7.568271342961452e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3291015625, + "loss_eval": 1.9229360818862915, + "epoch": 78 + }, + { + "hidden_norms": [ + 27959.18359375, + 6814900.0, + 33951204.0, + 42283796.0, + 31402056.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5280090792657575e-07, + 2.2722823622700616e-09, + 2.182985348042621e-09, + 2.195454484876791e-09, + 2.1783830295163398e-09 + ], + "bp_grad_norms_F": [ + 9.445489922654815e-06, + 7.852113270701011e-08, + 7.573528648663341e-08, + 7.688608150147047e-08, + 7.557830628002193e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3232421875, + "loss_eval": 1.9262363910675049, + "epoch": 79 + }, + { + "hidden_norms": [ + 27969.6171875, + 6828402.0, + 34031784.0, + 42376960.0, + 31453510.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5404552300424257e-07, + 2.2810822120078456e-09, + 2.1932544669311937e-09, + 2.216228756068972e-09, + 2.193953241302893e-09 + ], + "bp_grad_norms_F": [ + 9.498375220573507e-06, + 7.844284510838406e-08, + 7.562837112118359e-08, + 7.677955693452532e-08, + 7.546795188773103e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.330078125, + "loss_eval": 1.925222396850586, + "epoch": 80 + }, + { + "hidden_norms": [ + 27976.40625, + 6839237.5, + 34096948.0, + 42451852.0, + 31495834.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5588855717396655e-07, + 2.290766465407046e-09, + 2.2075170580393433e-09, + 2.2167860880273338e-09, + 2.1972801356184846e-09 + ], + "bp_grad_norms_F": [ + 9.528901500743814e-06, + 7.844620597552421e-08, + 7.561048676052451e-08, + 7.67637402532273e-08, + 7.544804248027503e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3427734375, + "loss_eval": 1.9254777431488037, + "epoch": 81 + }, + { + "hidden_norms": [ + 28004.76953125, + 6848695.0, + 34154160.0, + 42523512.0, + 31536314.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.562642069075082e-07, + 2.289735068217169e-09, + 2.2051671599854217e-09, + 2.2135104860154797e-09, + 2.188419445658951e-09 + ], + "bp_grad_norms_F": [ + 9.512452379567549e-06, + 7.840634452804807e-08, + 7.557503778343744e-08, + 7.672917234913257e-08, + 7.541159163793054e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.341796875, + "loss_eval": 1.9253835678100586, + "epoch": 82 + }, + { + "hidden_norms": [ + 28036.138671875, + 6859844.5, + 34231564.0, + 42620400.0, + 31595422.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5447380974364933e-07, + 2.2824857559555767e-09, + 2.1902821778496673e-09, + 2.2037338620606306e-09, + 2.183933034416441e-09 + ], + "bp_grad_norms_F": [ + 9.456872248847503e-06, + 7.838458770947909e-08, + 7.556796077778927e-08, + 7.67221948194674e-08, + 7.540831603591869e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.333984375, + "loss_eval": 1.9241688251495361, + "epoch": 83 + }, + { + "hidden_norms": [ + 28063.341796875, + 6866642.0, + 34298612.0, + 42705280.0, + 31647722.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.550155843688117e-07, + 2.281024480410565e-09, + 2.1895063540000592e-09, + 2.20287676988562e-09, + 2.1853003850935693e-09 + ], + "bp_grad_norms_F": [ + 9.501630302111153e-06, + 7.833479287455702e-08, + 7.55063354063168e-08, + 7.666048418286664e-08, + 7.534579538059916e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.333984375, + "loss_eval": 1.9253199100494385, + "epoch": 84 + }, + { + "hidden_norms": [ + 28090.240234375, + 6875769.0, + 34361584.0, + 42782612.0, + 31697334.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.536338629648526e-07, + 2.267983800763318e-09, + 2.1772310621059887e-09, + 2.1934687399749464e-09, + 2.1765453883659802e-09 + ], + "bp_grad_norms_F": [ + 9.536663128528744e-06, + 7.836315774056857e-08, + 7.554304914947352e-08, + 7.669789425790441e-08, + 7.538390178751797e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3203125, + "loss_eval": 1.9292113780975342, + "epoch": 85 + }, + { + "hidden_norms": [ + 28114.236328125, + 6884728.0, + 34407252.0, + 42840440.0, + 31732750.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5464524949493352e-07, + 2.280014399502761e-09, + 2.1917956338768363e-09, + 2.2101085406234233e-09, + 2.1894293045221502e-09 + ], + "bp_grad_norms_F": [ + 9.505700290901586e-06, + 7.817885716576711e-08, + 7.534623591709533e-08, + 7.650118760693658e-08, + 7.518445244159011e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3310546875, + "loss_eval": 1.9261689186096191, + "epoch": 86 + }, + { + "hidden_norms": [ + 28132.669921875, + 6893751.5, + 34460884.0, + 42910656.0, + 31780534.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5502969574754388e-07, + 2.2780193287275097e-09, + 2.1857382570544814e-09, + 2.200839510635433e-09, + 2.1766897173591815e-09 + ], + "bp_grad_norms_F": [ + 9.460140972805675e-06, + 7.810618996018093e-08, + 7.528173284754303e-08, + 7.643409105639876e-08, + 7.512058886049999e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.333984375, + "loss_eval": 1.9239721298217773, + "epoch": 87 + }, + { + "hidden_norms": [ + 28148.599609375, + 6899411.0, + 34495884.0, + 42954048.0, + 31804918.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5502014605317527e-07, + 2.2734785165567928e-09, + 2.191139492069283e-09, + 2.201265170143074e-09, + 2.182727776300908e-09 + ], + "bp_grad_norms_F": [ + 9.466436495131347e-06, + 7.804617752071863e-08, + 7.521869349602639e-08, + 7.63711227591557e-08, + 7.50560502638109e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3369140625, + "loss_eval": 1.9230663776397705, + "epoch": 88 + }, + { + "hidden_norms": [ + 28162.9609375, + 6901370.5, + 34523684.0, + 42989220.0, + 31824814.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5575578515836241e-07, + 2.2783777087198587e-09, + 2.1914692283075965e-09, + 2.19572404702717e-09, + 2.1778470138400507e-09 + ], + "bp_grad_norms_F": [ + 9.514466910331976e-06, + 7.809557445170867e-08, + 7.525108713934969e-08, + 7.640503696393353e-08, + 7.508738519845792e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3447265625, + "loss_eval": 1.9263484477996826, + "epoch": 89 + }, + { + "hidden_norms": [ + 28175.54296875, + 6907143.0, + 34559816.0, + 43035484.0, + 31854504.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5354446247783926e-07, + 2.272713128803616e-09, + 2.1856987331148048e-09, + 2.2020374412790034e-09, + 2.1765065305601183e-09 + ], + "bp_grad_norms_F": [ + 9.444916940992698e-06, + 7.799643242378806e-08, + 7.51774322793608e-08, + 7.632959864167788e-08, + 7.50167856722328e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3349609375, + "loss_eval": 1.9226629734039307, + "epoch": 90 + }, + { + "hidden_norms": [ + 28185.98046875, + 6908239.0, + 34575728.0, + 43054472.0, + 31863434.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5382977380795637e-07, + 2.274502586274707e-09, + 2.1870079081054428e-09, + 2.1993444843104726e-09, + 2.181675506918168e-09 + ], + "bp_grad_norms_F": [ + 9.480510016146582e-06, + 7.80089948193563e-08, + 7.51953308508746e-08, + 7.635033938413471e-08, + 7.503523846708049e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3359375, + "loss_eval": 1.92463219165802, + "epoch": 91 + }, + { + "hidden_norms": [ + 28195.05078125, + 6911853.0, + 34606972.0, + 43094588.0, + 31890320.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5355996652033355e-07, + 2.2723862791451666e-09, + 2.1887525125663387e-09, + 2.1977624165003817e-09, + 2.1820119044946296e-09 + ], + "bp_grad_norms_F": [ + 9.450015568290837e-06, + 7.795882339678428e-08, + 7.514577760048269e-08, + 7.629873266523646e-08, + 7.498609022604796e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3388671875, + "loss_eval": 1.9231452941894531, + "epoch": 92 + }, + { + "hidden_norms": [ + 28202.009765625, + 6911585.0, + 34614424.0, + 43102544.0, + 31893396.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5335498915192147e-07, + 2.273481403136657e-09, + 2.18971196730422e-09, + 2.201623994224633e-09, + 2.179575853133997e-09 + ], + "bp_grad_norms_F": [ + 9.466421943216119e-06, + 7.796668910486915e-08, + 7.514941557928978e-08, + 7.630385567836129e-08, + 7.498929477378624e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3349609375, + "loss_eval": 1.9242045879364014, + "epoch": 93 + }, + { + "hidden_norms": [ + 28207.30078125, + 6912594.5, + 34624228.0, + 43114124.0, + 31900214.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.541789487191636e-07, + 2.26694063520938e-09, + 2.1774959613196643e-09, + 2.1911708003585773e-09, + 2.177005020698175e-09 + ], + "bp_grad_norms_F": [ + 9.48972228798084e-06, + 7.800251466960617e-08, + 7.518539746342867e-08, + 7.634076126805667e-08, + 7.502466559117238e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3349609375, + "loss_eval": 1.9264299869537354, + "epoch": 94 + }, + { + "hidden_norms": [ + 28210.744140625, + 6914176.5, + 34633372.0, + 43125584.0, + 31907212.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5396986441373883e-07, + 2.2685893164009485e-09, + 2.182473091139059e-09, + 2.2001969135487798e-09, + 2.1797674776280473e-09 + ], + "bp_grad_norms_F": [ + 9.470595614402555e-06, + 7.796354850597709e-08, + 7.514324096291602e-08, + 7.629726184177343e-08, + 7.498252330151445e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3388671875, + "loss_eval": 1.9243674278259277, + "epoch": 95 + }, + { + "hidden_norms": [ + 28213.134765625, + 6914654.0, + 34637116.0, + 43129968.0, + 31909774.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5392139118830528e-07, + 2.2676351907335857e-09, + 2.181399949563456e-09, + 2.194956438827944e-09, + 2.1772521563434566e-09 + ], + "bp_grad_norms_F": [ + 9.468548341828864e-06, + 7.796590040243245e-08, + 7.514832134347671e-08, + 7.630251985801806e-08, + 7.498784526660529e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33984375, + "loss_eval": 1.9245264530181885, + "epoch": 96 + }, + { + "hidden_norms": [ + 28214.392578125, + 6914571.0, + 34637992.0, + 43130936.0, + 31909692.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5425968058480066e-07, + 2.2704826907471443e-09, + 2.18207008018112e-09, + 2.1958874718563948e-09, + 2.177970914729599e-09 + ], + "bp_grad_norms_F": [ + 9.473776117374655e-06, + 7.796563039619286e-08, + 7.514674393860332e-08, + 7.63012906190852e-08, + 7.498606890976589e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9245213270187378, + "epoch": 97 + }, + { + "hidden_norms": [ + 28215.587890625, + 6915082.0, + 34641648.0, + 43135608.0, + 31912816.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5412730647312856e-07, + 2.2691615253478403e-09, + 2.181160807523952e-09, + 2.1947776929209795e-09, + 2.1773913783107446e-09 + ], + "bp_grad_norms_F": [ + 9.472671081312e-06, + 7.796593592956924e-08, + 7.514773869843339e-08, + 7.630221432464168e-08, + 7.498719867271575e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9246418476104736, + "epoch": 98 + }, + { + "hidden_norms": [ + 28216.130859375, + 6915161.5, + 34642452.0, + 43136600.0, + 31913348.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5420548038491688e-07, + 2.2695016976825855e-09, + 2.1805732774993203e-09, + 2.1951678252918327e-09, + 2.1776345171531375e-09 + ], + "bp_grad_norms_F": [ + 9.474650141783059e-06, + 7.796723622277568e-08, + 7.514872635283609e-08, + 7.63033014550274e-08, + 7.498815079998167e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9247386455535889, + "epoch": 99 + }, + { + "hidden_norms": [ + 28216.1875, + 6915194.0, + 34642580.0, + 43136768.0, + 31913448.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5419134058447526e-07, + 2.2693393830763853e-09, + 2.180579494748258e-09, + 2.194876502770171e-09, + 2.1777446512771803e-09 + ], + "bp_grad_norms_F": [ + 9.474156286159996e-06, + 7.796705148166438e-08, + 7.51486410877078e-08, + 7.630320908447175e-08, + 7.498806553485338e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9247117042541504, + "epoch": 100 + } + ], + "seed": 42, + "depth": 4, + "d_hidden": 256 +} \ No newline at end of file diff --git a/results/snapshot_evolution_v3_fa.log b/results/snapshot_evolution_v3_fa.log new file mode 100644 index 0000000..cde8c3e --- /dev/null +++ b/results/snapshot_evolution_v3_fa.log @@ -0,0 +1 @@ +device=cuda:0, depth=4, d_hidden=256, epochs=100, seed=42 diff --git a/results/snapshot_exploit/snapshot_L4_d256_s42.json b/results/snapshot_exploit/snapshot_L4_d256_s42.json new file mode 100644 index 0000000..45860f7 --- /dev/null +++ b/results/snapshot_exploit/snapshot_L4_d256_s42.json @@ -0,0 +1,209 @@ +{ + "config": { + "L": 4, + "d": 256, + "seed": 42, + "lr_update": 0.001, + "estimator_epochs": 100 + }, + "credit_quality": { + "dfa": { + "gamma": 0.008470005544950254, + "rho": -0.022525018197484314, + "nudge": -2.3932622525535407e-05 + }, + "scalar_cb": { + "gamma": 0.12223921716213226, + "rho": 0.09000759199261665, + "nudge": -0.00036903251748299226 + }, + "vec_eT_M4": { + "gamma": 0.37760399281978607, + "rho": 0.41141805797815323, + "nudge": -0.0013705549063161016 + }, + "oracle_bp": { + "gamma": 1.0, + "rho": 0.9979714304208755, + "nudge": -0.0031722619314678013 + } + }, + "exploitability": { + "dfa": { + "gamma": 0.008470005544950254, + "rho": -0.022525018197484314, + "nudge": -2.3932622525535407e-05, + "loss_before": 1.1802499413490295, + "loss_after_1step": 1.1798909544944762, + "delta_loss_1step": -0.00035898685455326707, + "delta_acc_1step": 0.002343749999999978 + }, + "scalar_cb": { + "gamma": 0.12223921716213226, + "rho": 0.09000759199261665, + "nudge": -0.00036903251748299226, + "loss_before": 1.1802499413490295, + "loss_after_1step": 1.1835142850875855, + "delta_loss_1step": 0.003264343738555997, + "delta_acc_1step": 0.0007812499999999556 + }, + "vec_eT_M4": { + "gamma": 0.37760399281978607, + "rho": 0.41141805797815323, + "nudge": -0.0013705549063161016, + "loss_before": 1.1802499413490295, + "loss_after_1step": 1.1832772016525268, + "delta_loss_1step": 0.0030272603034973145, + "delta_acc_1step": -0.0031250000000000444 + }, + "oracle_bp": { + "gamma": 1.0, + "rho": 0.9979714304208755, + "nudge": -0.0031722619314678013, + "loss_before": 1.1802499413490295, + "loss_after_1step": 1.1796290874481201, + "delta_loss_1step": -0.0006208539009093794, + "delta_acc_1step": 0.005468750000000022 + } + }, + "rollout": { + "dfa": { + "1": { + "loss": 1.1801316797733308, + "acc": 0.61328125, + "delta_loss": -0.00011826157569871931, + "delta_acc": 0.6109375 + }, + "5": { + "loss": 1.18045933842659, + "acc": 0.615625, + "delta_loss": 0.00020939707756051362, + "delta_acc": 0.61328125 + }, + "20": { + "loss": 1.1795716643333436, + "acc": 0.61171875, + "delta_loss": -0.0006782770156859019, + "delta_acc": 0.609375 + } + }, + "scalar_cb": { + "1": { + "loss": 1.1848249435424805, + "acc": 0.6125, + "delta_loss": 0.004575002193450972, + "delta_acc": 0.6117187500000001 + }, + "5": { + "loss": 1.222687977552414, + "acc": 0.60234375, + "delta_loss": 0.04243803620338449, + "delta_acc": 0.6015625 + }, + "20": { + "loss": 1.584816002845764, + "acc": 0.5546875, + "delta_loss": 0.4045660614967346, + "delta_acc": 0.55390625 + } + }, + "vec_eT_M4": { + "1": { + "loss": 1.1844943702220916, + "acc": 0.6015625, + "delta_loss": 0.004244428873062089, + "delta_acc": 0.6046875 + }, + "5": { + "loss": 1.2300199925899507, + "acc": 0.590625, + "delta_loss": 0.049770051240921154, + "delta_acc": 0.59375 + }, + "20": { + "loss": 1.4517351746559144, + "acc": 0.54296875, + "delta_loss": 0.2714852333068849, + "delta_acc": 0.54609375 + } + }, + "oracle_bp": { + "1": { + "loss": 1.180982232093811, + "acc": 0.61328125, + "delta_loss": 0.0007322907447815385, + "delta_acc": 0.6078125 + }, + "5": { + "loss": 1.1867272675037384, + "acc": 0.61796875, + "delta_loss": 0.006477326154708862, + "delta_acc": 0.6124999999999999 + }, + "20": { + "loss": 1.2059795916080476, + "acc": 0.6171875, + "delta_loss": 0.025729650259018078, + "delta_acc": 0.61171875 + } + } + }, + "layer_ablation": { + "dfa": { + "last_1": { + "delta_loss": 7.04765319825551e-05, + "loss": 1.180320417881012 + }, + "last_2": { + "delta_loss": 0.0005654990673065186, + "loss": 1.180815440416336 + }, + "all": { + "delta_loss": 0.0015505015850068027, + "loss": 1.1818004429340363 + } + }, + "scalar_cb": { + "last_1": { + "delta_loss": 0.008096528053283647, + "loss": 1.1883464694023131 + }, + "last_2": { + "delta_loss": 0.01775211691856393, + "loss": 1.1980020582675934 + }, + "all": { + "delta_loss": 0.04727613925933838, + "loss": 1.2275260806083679 + } + }, + "vec_eT_M4": { + "last_1": { + "delta_loss": 0.006879746913909912, + "loss": 1.1871296882629394 + }, + "last_2": { + "delta_loss": 0.014995932579040527, + "loss": 1.19524587392807 + }, + "all": { + "delta_loss": 0.05422646403312692, + "loss": 1.2344764053821564 + } + }, + "oracle_bp": { + "last_1": { + "delta_loss": 0.0035166800022126132, + "loss": 1.183766621351242 + }, + "last_2": { + "delta_loss": 0.004922467470169112, + "loss": 1.1851724088191986 + }, + "all": { + "delta_loss": 0.0027257800102233887, + "loss": 1.1829757213592529 + } + } + } +} \ No newline at end of file diff --git a/results/snapshot_fa_canonical_all.log b/results/snapshot_fa_canonical_all.log new file mode 100644 index 0000000..7a66940 --- /dev/null +++ b/results/snapshot_fa_canonical_all.log @@ -0,0 +1,142 @@ +=== 1/3 ResMLP FA (canonical) === +FA snapshot: depth=4, d=256, seed=42, epochs=100 + [FA] Ep 0: ||h||_med=[8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652] acc=0.1152 + [FA] Ep 1: ||h_L||=8.484e+03 ||g_2||=1.154e-06 acc=0.2773 + [FA] Ep 2: ||h_L||=1.961e+04 ||g_2||=5.770e-07 acc=0.2959 + [FA] Ep 3: ||h_L||=3.031e+04 ||g_2||=4.175e-07 acc=0.3203 + [FA] Ep 4: ||h_L||=3.890e+04 ||g_2||=3.522e-07 acc=0.3115 + [FA] Ep 5: ||h_L||=4.764e+04 ||g_2||=3.066e-07 acc=0.3223 + [FA] Ep 6: ||h_L||=5.458e+04 ||g_2||=2.801e-07 acc=0.3242 + [FA] Ep 7: ||h_L||=6.159e+04 ||g_2||=2.620e-07 acc=0.3398 + [FA] Ep 8: ||h_L||=6.776e+04 ||g_2||=2.510e-07 acc=0.3496 + [FA] Ep 9: ||h_L||=7.371e+04 ||g_2||=2.415e-07 acc=0.3672 + [FA] Ep 10: ||h_L||=7.970e+04 ||g_2||=2.302e-07 acc=0.3506 + [FA] Ep 11: ||h_L||=8.513e+04 ||g_2||=2.265e-07 acc=0.3750 + [FA] Ep 12: ||h_L||=9.072e+04 ||g_2||=2.184e-07 acc=0.3496 + [FA] Ep 13: ||h_L||=9.391e+04 ||g_2||=2.200e-07 acc=0.3447 + [FA] Ep 14: ||h_L||=9.711e+04 ||g_2||=2.167e-07 acc=0.3447 + [FA] Ep 15: ||h_L||=9.915e+04 ||g_2||=2.183e-07 acc=0.3496 + [FA] Ep 16: ||h_L||=1.013e+05 ||g_2||=2.130e-07 acc=0.3604 + [FA] Ep 17: ||h_L||=1.023e+05 ||g_2||=2.147e-07 acc=0.3623 + [FA] Ep 18: ||h_L||=1.038e+05 ||g_2||=2.151e-07 acc=0.3516 + [FA] Ep 19: ||h_L||=1.051e+05 ||g_2||=2.150e-07 acc=0.3477 + [FA] Ep 20: ||h_L||=1.068e+05 ||g_2||=2.130e-07 acc=0.3682 + [FA] Ep 21: ||h_L||=1.080e+05 ||g_2||=2.173e-07 acc=0.3604 + [FA] Ep 22: ||h_L||=1.099e+05 ||g_2||=2.133e-07 acc=0.3799 + [FA] Ep 23: ||h_L||=1.122e+05 ||g_2||=2.119e-07 acc=0.3496 + [FA] Ep 24: ||h_L||=1.155e+05 ||g_2||=2.079e-07 acc=0.3643 + [FA] Ep 25: ||h_L||=1.192e+05 ||g_2||=2.050e-07 acc=0.3594 + [FA] Ep 26: ||h_L||=1.243e+05 ||g_2||=1.992e-07 acc=0.3613 + [FA] Ep 27: ||h_L||=1.305e+05 ||g_2||=1.947e-07 acc=0.3574 + [FA] Ep 28: ||h_L||=1.388e+05 ||g_2||=1.869e-07 acc=0.3740 + [FA] Ep 29: ||h_L||=1.463e+05 ||g_2||=1.812e-07 acc=0.3867 + [FA] Ep 30: ||h_L||=1.568e+05 ||g_2||=1.740e-07 acc=0.3564 + [FA] Ep 31: ||h_L||=1.663e+05 ||g_2||=1.677e-07 acc=0.3652 + [FA] Ep 32: ||h_L||=1.780e+05 ||g_2||=1.608e-07 acc=0.3818 + [FA] Ep 33: ||h_L||=1.873e+05 ||g_2||=1.557e-07 acc=0.3809 + [FA] Ep 34: ||h_L||=1.973e+05 ||g_2||=1.512e-07 acc=0.3867 + [FA] Ep 35: ||h_L||=2.072e+05 ||g_2||=1.483e-07 acc=0.3750 + [FA] Ep 36: ||h_L||=2.177e+05 ||g_2||=1.445e-07 acc=0.3779 + [FA] Ep 37: ||h_L||=2.258e+05 ||g_2||=1.415e-07 acc=0.3818 + [FA] Ep 38: ||h_L||=2.350e+05 ||g_2||=1.410e-07 acc=0.3760 + [FA] Ep 39: ||h_L||=2.449e+05 ||g_2||=1.378e-07 acc=0.3809 + [FA] Ep 40: ||h_L||=2.519e+05 ||g_2||=1.334e-07 acc=0.3789 + [FA] Ep 41: ||h_L||=2.611e+05 ||g_2||=1.349e-07 acc=0.3760 + [FA] Ep 42: ||h_L||=2.705e+05 ||g_2||=1.312e-07 acc=0.3887 + [FA] Ep 43: ||h_L||=2.789e+05 ||g_2||=1.283e-07 acc=0.3867 + [FA] Ep 44: ||h_L||=2.878e+05 ||g_2||=1.250e-07 acc=0.3770 + [FA] Ep 45: ||h_L||=2.938e+05 ||g_2||=1.252e-07 acc=0.3770 + [FA] Ep 46: ||h_L||=3.013e+05 ||g_2||=1.242e-07 acc=0.3906 + [FA] Ep 47: ||h_L||=3.072e+05 ||g_2||=1.237e-07 acc=0.3848 + [FA] Ep 48: ||h_L||=3.146e+05 ||g_2||=1.222e-07 acc=0.3750 + [FA] Ep 49: ||h_L||=3.232e+05 ||g_2||=1.189e-07 acc=0.3877 + [FA] Ep 50: ||h_L||=3.302e+05 ||g_2||=1.192e-07 acc=0.3877 + [FA] Ep 51: ||h_L||=3.345e+05 ||g_2||=1.187e-07 acc=0.3955 + [FA] Ep 52: ||h_L||=3.407e+05 ||g_2||=1.183e-07 acc=0.3877 + [FA] Ep 53: ||h_L||=3.467e+05 ||g_2||=1.170e-07 acc=0.3945 + [FA] Ep 54: ||h_L||=3.505e+05 ||g_2||=1.182e-07 acc=0.3838 + [FA] Ep 55: ||h_L||=3.582e+05 ||g_2||=1.160e-07 acc=0.3867 + [FA] Ep 56: ||h_L||=3.617e+05 ||g_2||=1.164e-07 acc=0.3906 + [FA] Ep 57: ||h_L||=3.672e+05 ||g_2||=1.159e-07 acc=0.3838 + [FA] Ep 58: ||h_L||=3.684e+05 ||g_2||=1.181e-07 acc=0.3828 + [FA] Ep 59: ||h_L||=3.725e+05 ||g_2||=1.175e-07 acc=0.3740 + [FA] Ep 60: ||h_L||=3.774e+05 ||g_2||=1.150e-07 acc=0.3926 + [FA] Ep 61: ||h_L||=3.792e+05 ||g_2||=1.161e-07 acc=0.3838 + [FA] Ep 62: ||h_L||=3.823e+05 ||g_2||=1.163e-07 acc=0.3799 + [FA] Ep 63: ||h_L||=3.856e+05 ||g_2||=1.175e-07 acc=0.3887 + [FA] Ep 64: ||h_L||=3.891e+05 ||g_2||=1.154e-07 acc=0.3936 + [FA] Ep 65: ||h_L||=3.924e+05 ||g_2||=1.159e-07 acc=0.3916 + [FA] Ep 66: ||h_L||=3.935e+05 ||g_2||=1.166e-07 acc=0.3994 + [FA] Ep 67: ||h_L||=3.976e+05 ||g_2||=1.151e-07 acc=0.3877 + [FA] Ep 68: ||h_L||=3.997e+05 ||g_2||=1.155e-07 acc=0.3945 + [FA] Ep 69: ||h_L||=4.015e+05 ||g_2||=1.162e-07 acc=0.3916 + [FA] Ep 70: ||h_L||=4.049e+05 ||g_2||=1.151e-07 acc=0.3955 + [FA] Ep 71: ||h_L||=4.052e+05 ||g_2||=1.166e-07 acc=0.3926 + [FA] Ep 72: ||h_L||=4.078e+05 ||g_2||=1.154e-07 acc=0.3896 + [FA] Ep 73: ||h_L||=4.096e+05 ||g_2||=1.160e-07 acc=0.3896 + [FA] Ep 74: ||h_L||=4.112e+05 ||g_2||=1.151e-07 acc=0.3867 + [FA] Ep 75: ||h_L||=4.126e+05 ||g_2||=1.151e-07 acc=0.3975 + [FA] Ep 76: ||h_L||=4.135e+05 ||g_2||=1.156e-07 acc=0.3955 + [FA] Ep 77: ||h_L||=4.145e+05 ||g_2||=1.160e-07 acc=0.3896 + [FA] Ep 78: ||h_L||=4.165e+05 ||g_2||=1.149e-07 acc=0.3887 + [FA] Ep 79: ||h_L||=4.161e+05 ||g_2||=1.153e-07 acc=0.3945 + [FA] Ep 80: ||h_L||=4.175e+05 ||g_2||=1.155e-07 acc=0.3906 + [FA] Ep 81: ||h_L||=4.187e+05 ||g_2||=1.156e-07 acc=0.3896 + [FA] Ep 82: ||h_L||=4.193e+05 ||g_2||=1.159e-07 acc=0.3906 + [FA] Ep 83: ||h_L||=4.201e+05 ||g_2||=1.158e-07 acc=0.3877 + [FA] Ep 84: ||h_L||=4.206e+05 ||g_2||=1.157e-07 acc=0.3906 + [FA] Ep 85: ||h_L||=4.213e+05 ||g_2||=1.160e-07 acc=0.3867 + [FA] Ep 86: ||h_L||=4.214e+05 ||g_2||=1.159e-07 acc=0.3848 + [FA] Ep 87: ||h_L||=4.221e+05 ||g_2||=1.156e-07 acc=0.3916 + [FA] Ep 88: ||h_L||=4.225e+05 ||g_2||=1.159e-07 acc=0.3906 + [FA] Ep 89: ||h_L||=4.228e+05 ||g_2||=1.156e-07 acc=0.3877 + [FA] Ep 90: ||h_L||=4.232e+05 ||g_2||=1.156e-07 acc=0.3916 + [FA] Ep 91: ||h_L||=4.232e+05 ||g_2||=1.164e-07 acc=0.3857 + [FA] Ep 92: ||h_L||=4.234e+05 ||g_2||=1.162e-07 acc=0.3877 + [FA] Ep 93: ||h_L||=4.235e+05 ||g_2||=1.157e-07 acc=0.3896 + [FA] Ep 94: ||h_L||=4.234e+05 ||g_2||=1.158e-07 acc=0.3877 + [FA] Ep 95: ||h_L||=4.237e+05 ||g_2||=1.158e-07 acc=0.3887 + [FA] Ep 96: ||h_L||=4.237e+05 ||g_2||=1.161e-07 acc=0.3877 + [FA] Ep 97: ||h_L||=4.237e+05 ||g_2||=1.158e-07 acc=0.3896 + [FA] Ep 98: ||h_L||=4.237e+05 ||g_2||=1.157e-07 acc=0.3877 + [FA] Ep 99: ||h_L||=4.237e+05 ||g_2||=1.158e-07 acc=0.3887 + [FA] Ep 100: ||h_L||=4.237e+05 ||g_2||=1.159e-07 acc=0.3887 +Saved: results/snapshot_evolution_v2/snapshot_fa_canonical_s42.json +=== 2/3 StudentNet FA (canonical) === +StudentNet FA: alpha=1.0, L=4, d=128, seed=42 + [FA] Ep 0: acc=0.0845 + [FA] Ep 1: ||h_L||=1.230e+01 ||g||=3.496e-04 acc=0.5270 + [FA] Ep 5: ||h_L||=3.658e+01 ||g||=2.665e-04 acc=0.7070 + [FA] Ep 10: ||h_L||=7.605e+01 ||g||=1.848e-04 acc=0.6585 + [FA] Ep 15: ||h_L||=1.489e+02 ||g||=2.047e-04 acc=0.6110 + [FA] Ep 20: ||h_L||=3.292e+02 ||g||=2.434e-04 acc=0.5745 + [FA] Ep 25: ||h_L||=5.442e+02 ||g||=2.650e-04 acc=0.4685 + [FA] Ep 30: ||h_L||=7.710e+02 ||g||=3.195e-04 acc=0.3240 + [FA] Ep 35: ||h_L||=9.629e+02 ||g||=3.131e-04 acc=0.3775 + [FA] Ep 40: ||h_L||=1.124e+03 ||g||=3.087e-04 acc=0.3395 + [FA] Ep 45: ||h_L||=1.252e+03 ||g||=3.134e-04 acc=0.3360 + [FA] Ep 50: ||h_L||=1.350e+03 ||g||=3.060e-04 acc=0.3360 + [FA] Ep 55: ||h_L||=1.425e+03 ||g||=2.972e-04 acc=0.3530 + [FA] Ep 60: ||h_L||=1.478e+03 ||g||=3.112e-04 acc=0.3150 + [FA] Ep 65: ||h_L||=1.512e+03 ||g||=3.082e-04 acc=0.3430 + [FA] Ep 70: ||h_L||=1.531e+03 ||g||=3.000e-04 acc=0.3520 + [FA] Ep 75: ||h_L||=1.539e+03 ||g||=3.030e-04 acc=0.3560 + [FA] Ep 80: ||h_L||=1.540e+03 ||g||=3.003e-04 acc=0.3595 +Saved: results/snapshot_synth_v1/snapshot_fa_canonical_s42.json +=== 3/3 ViT FA (canonical) === + [FA-vit] Ep 0: acc=0.1230 + [FA-vit] Ep 1: ||h_L||=1.626e+03 ||g_L||=5.029e-07 acc=0.2500 + [FA-vit] Ep 5: ||h_L||=4.490e+04 ||g_L||=2.834e-08 acc=0.2373 + [FA-vit] Ep 10: ||h_L||=2.109e+05 ||g_L||=5.916e-09 acc=0.2021 + [FA-vit] Ep 15: ||h_L||=7.814e+05 ||g_L||=1.013e-09 acc=0.1924 + [FA-vit] Ep 20: ||h_L||=3.356e+06 ||g_L||=2.481e-10 acc=0.1729 + [FA-vit] Ep 25: ||h_L||=8.750e+06 ||g_L||=1.192e-10 acc=0.1582 + [FA-vit] Ep 30: ||h_L||=1.587e+07 ||g_L||=7.185e-11 acc=0.1650 + [FA-vit] Ep 35: ||h_L||=2.381e+07 ||g_L||=5.271e-11 acc=0.1582 + [FA-vit] Ep 40: ||h_L||=2.944e+07 ||g_L||=4.898e-11 acc=0.1758 + [FA-vit] Ep 45: ||h_L||=3.222e+07 ||g_L||=4.930e-11 acc=0.1641 + [FA-vit] Ep 50: ||h_L||=3.331e+07 ||g_L||=5.144e-11 acc=0.1592 + [FA-vit] Ep 55: ||h_L||=3.378e+07 ||g_L||=4.934e-11 acc=0.1553 + [FA-vit] Ep 60: ||h_L||=3.376e+07 ||g_L||=5.086e-11 acc=0.1631 +Saved: results/snapshot_vit_v1/snapshot_fa_canonical_s42.json +=== ALL DONE === diff --git a/results/snapshot_fa_canonical_noln.log b/results/snapshot_fa_canonical_noln.log new file mode 100644 index 0000000..3390416 --- /dev/null +++ b/results/snapshot_fa_canonical_noln.log @@ -0,0 +1,13 @@ + [FA] Ep 0: acc=0.1123 + [FA] Ep 1: ||h_L||=2.126e+03 ||g_L||=6.794e-04 acc=0.1953 + [FA] Ep 10: ||h_L||=3.026e+04 ||g_L||=7.023e-04 acc=0.1904 + [FA] Ep 20: ||h_L||=3.009e+05 ||g_L||=7.148e-04 acc=0.1924 + [FA] Ep 30: ||h_L||=7.488e+05 ||g_L||=7.095e-04 acc=0.1592 + [FA] Ep 40: ||h_L||=1.504e+06 ||g_L||=7.357e-04 acc=0.1328 + [FA] Ep 50: ||h_L||=2.461e+06 ||g_L||=7.304e-04 acc=0.1523 + [FA] Ep 60: ||h_L||=3.371e+06 ||g_L||=6.871e-04 acc=0.2373 + [FA] Ep 70: ||h_L||=4.105e+06 ||g_L||=6.944e-04 acc=0.2305 + [FA] Ep 80: ||h_L||=4.452e+06 ||g_L||=6.829e-04 acc=0.2529 + [FA] Ep 90: ||h_L||=4.530e+06 ||g_L||=6.455e-04 acc=0.2852 + [FA] Ep 100: ||h_L||=4.532e+06 ||g_L||=6.448e-04 acc=0.2949 +Saved: results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json diff --git a/results/snapshot_fa_crossarch.log b/results/snapshot_fa_crossarch.log new file mode 100644 index 0000000..1b57c54 --- /dev/null +++ b/results/snapshot_fa_crossarch.log @@ -0,0 +1,28 @@ + [FA-vit] Ep 0: acc=0.1230 + [FA-vit] Ep 1: ||h_L||=9.189e+03 ||g_L||=1.397e-07 acc=0.1924 + [FA-vit] Ep 5: ||h_L||=8.370e+04 ||g_L||=1.345e-08 acc=0.1748 + [FA-vit] Ep 10: ||h_L||=3.438e+05 ||g_L||=2.922e-09 acc=0.1523 + [FA-vit] Ep 15: ||h_L||=6.607e+05 ||g_L||=1.928e-09 acc=0.1475 + [FA-vit] Ep 20: ||h_L||=2.780e+06 ||g_L||=6.684e-10 acc=0.1299 + [FA-vit] Ep 25: ||h_L||=3.569e+06 ||g_L||=6.848e-10 acc=0.1445 + [FA-vit] Ep 30: ||h_L||=2.385e+06 ||g_L||=4.479e-10 acc=0.1475 + [FA-vit] Ep 35: ||h_L||=4.374e+06 ||g_L||=1.958e-10 acc=0.1670 + [FA-vit] Ep 40: ||h_L||=2.694e+06 ||g_L||=4.407e-10 acc=0.1182 + [FA-vit] Ep 45: ||h_L||=7.187e+06 ||g_L||=2.039e-10 acc=0.1143 + [FA-vit] Ep 50: ||h_L||=8.005e+06 ||g_L||=1.980e-10 acc=0.1123 + [FA-vit] Ep 55: ||h_L||=8.736e+06 ||g_L||=1.914e-10 acc=0.1123 + [FA-vit] Ep 60: ||h_L||=8.772e+06 ||g_L||=1.910e-10 acc=0.1133 +Saved: results/snapshot_vit_v1/snapshot_fa_vit_s42.json + [FA] Ep 0: acc=0.1123 + [FA] Ep 1: ||h_L||=2.126e+03 ||g_L||=6.794e-04 acc=0.1953 + [FA] Ep 10: ||h_L||=3.026e+04 ||g_L||=7.023e-04 acc=0.1904 + [FA] Ep 20: ||h_L||=3.009e+05 ||g_L||=7.148e-04 acc=0.1924 + [FA] Ep 30: ||h_L||=7.488e+05 ||g_L||=7.095e-04 acc=0.1592 + [FA] Ep 40: ||h_L||=1.504e+06 ||g_L||=7.357e-04 acc=0.1328 + [FA] Ep 50: ||h_L||=2.461e+06 ||g_L||=7.304e-04 acc=0.1523 + [FA] Ep 60: ||h_L||=3.371e+06 ||g_L||=6.871e-04 acc=0.2373 + [FA] Ep 70: ||h_L||=4.105e+06 ||g_L||=6.944e-04 acc=0.2305 + [FA] Ep 80: ||h_L||=4.452e+06 ||g_L||=6.829e-04 acc=0.2529 + [FA] Ep 90: ||h_L||=4.530e+06 ||g_L||=6.455e-04 acc=0.2852 + [FA] Ep 100: ||h_L||=4.532e+06 ||g_L||=6.448e-04 acc=0.2949 +Saved: results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json diff --git a/results/snapshot_fa_evolution.log b/results/snapshot_fa_evolution.log new file mode 100644 index 0000000..de11218 --- /dev/null +++ b/results/snapshot_fa_evolution.log @@ -0,0 +1,103 @@ +FA snapshot: depth=4, d=256, seed=42, epochs=100 + [FA] Ep 0: ||h||_med=[8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652] acc=0.1152 + [FA] Ep 1: ||h_L||=1.209e+04 ||g_2||=8.304e-07 acc=0.2432 + [FA] Ep 2: ||h_L||=6.410e+04 ||g_2||=1.591e-07 acc=0.2344 + [FA] Ep 3: ||h_L||=2.369e+05 ||g_2||=5.772e-08 acc=0.2529 + [FA] Ep 4: ||h_L||=5.822e+05 ||g_2||=2.728e-08 acc=0.2314 + [FA] Ep 5: ||h_L||=9.781e+05 ||g_2||=1.788e-08 acc=0.2275 + [FA] Ep 6: ||h_L||=1.473e+06 ||g_2||=1.256e-08 acc=0.2314 + [FA] Ep 7: ||h_L||=2.010e+06 ||g_2||=9.450e-09 acc=0.2637 + [FA] Ep 8: ||h_L||=2.552e+06 ||g_2||=8.093e-09 acc=0.2373 + [FA] Ep 9: ||h_L||=3.176e+06 ||g_2||=6.801e-09 acc=0.2715 + [FA] Ep 10: ||h_L||=3.778e+06 ||g_2||=5.977e-09 acc=0.2422 + [FA] Ep 11: ||h_L||=4.552e+06 ||g_2||=5.185e-09 acc=0.2793 + [FA] Ep 12: ||h_L||=5.168e+06 ||g_2||=4.689e-09 acc=0.2793 + [FA] Ep 13: ||h_L||=5.776e+06 ||g_2||=4.462e-09 acc=0.2949 + [FA] Ep 14: ||h_L||=6.482e+06 ||g_2||=4.028e-09 acc=0.2842 + [FA] Ep 15: ||h_L||=7.058e+06 ||g_2||=3.815e-09 acc=0.2637 + [FA] Ep 16: ||h_L||=7.683e+06 ||g_2||=3.649e-09 acc=0.2695 + [FA] Ep 17: ||h_L||=8.371e+06 ||g_2||=3.428e-09 acc=0.2939 + [FA] Ep 18: ||h_L||=8.992e+06 ||g_2||=3.310e-09 acc=0.2900 + [FA] Ep 19: ||h_L||=9.604e+06 ||g_2||=3.225e-09 acc=0.2627 + [FA] Ep 20: ||h_L||=1.026e+07 ||g_2||=3.125e-09 acc=0.2500 + [FA] Ep 21: ||h_L||=1.085e+07 ||g_2||=2.966e-09 acc=0.2949 + [FA] Ep 22: ||h_L||=1.147e+07 ||g_2||=2.868e-09 acc=0.2939 + [FA] Ep 23: ||h_L||=1.199e+07 ||g_2||=2.858e-09 acc=0.2803 + [FA] Ep 24: ||h_L||=1.265e+07 ||g_2||=2.773e-09 acc=0.2969 + [FA] Ep 25: ||h_L||=1.325e+07 ||g_2||=2.738e-09 acc=0.2949 + [FA] Ep 26: ||h_L||=1.396e+07 ||g_2||=2.625e-09 acc=0.2920 + [FA] Ep 27: ||h_L||=1.471e+07 ||g_2||=2.634e-09 acc=0.2861 + [FA] Ep 28: ||h_L||=1.530e+07 ||g_2||=2.530e-09 acc=0.2842 + [FA] Ep 29: ||h_L||=1.589e+07 ||g_2||=2.499e-09 acc=0.3242 + [FA] Ep 30: ||h_L||=1.654e+07 ||g_2||=2.468e-09 acc=0.2910 + [FA] Ep 31: ||h_L||=1.720e+07 ||g_2||=2.525e-09 acc=0.3076 + [FA] Ep 32: ||h_L||=1.789e+07 ||g_2||=2.472e-09 acc=0.3164 + [FA] Ep 33: ||h_L||=1.856e+07 ||g_2||=2.442e-09 acc=0.3184 + [FA] Ep 34: ||h_L||=1.921e+07 ||g_2||=2.454e-09 acc=0.3115 + [FA] Ep 35: ||h_L||=1.957e+07 ||g_2||=2.461e-09 acc=0.3115 + [FA] Ep 36: ||h_L||=2.010e+07 ||g_2||=2.424e-09 acc=0.3047 + [FA] Ep 37: ||h_L||=2.056e+07 ||g_2||=2.375e-09 acc=0.3066 + [FA] Ep 38: ||h_L||=2.108e+07 ||g_2||=2.388e-09 acc=0.3174 + [FA] Ep 39: ||h_L||=2.154e+07 ||g_2||=2.334e-09 acc=0.3076 + [FA] Ep 40: ||h_L||=2.198e+07 ||g_2||=2.361e-09 acc=0.3213 + [FA] Ep 41: ||h_L||=2.244e+07 ||g_2||=2.348e-09 acc=0.3057 + [FA] Ep 42: ||h_L||=2.281e+07 ||g_2||=2.375e-09 acc=0.3252 + [FA] Ep 43: ||h_L||=2.319e+07 ||g_2||=2.382e-09 acc=0.3184 + [FA] Ep 44: ||h_L||=2.350e+07 ||g_2||=2.363e-09 acc=0.3008 + [FA] Ep 45: ||h_L||=2.381e+07 ||g_2||=2.359e-09 acc=0.3076 + [FA] Ep 46: ||h_L||=2.423e+07 ||g_2||=2.372e-09 acc=0.3125 + [FA] Ep 47: ||h_L||=2.456e+07 ||g_2||=2.317e-09 acc=0.3115 + [FA] Ep 48: ||h_L||=2.472e+07 ||g_2||=2.343e-09 acc=0.3135 + [FA] Ep 49: ||h_L||=2.498e+07 ||g_2||=2.351e-09 acc=0.3096 + [FA] Ep 50: ||h_L||=2.532e+07 ||g_2||=2.393e-09 acc=0.3242 + [FA] Ep 51: ||h_L||=2.563e+07 ||g_2||=2.346e-09 acc=0.3193 + [FA] Ep 52: ||h_L||=2.580e+07 ||g_2||=2.380e-09 acc=0.3223 + [FA] Ep 53: ||h_L||=2.612e+07 ||g_2||=2.336e-09 acc=0.3174 + [FA] Ep 54: ||h_L||=2.650e+07 ||g_2||=2.317e-09 acc=0.3145 + [FA] Ep 55: ||h_L||=2.679e+07 ||g_2||=2.339e-09 acc=0.3066 + [FA] Ep 56: ||h_L||=2.718e+07 ||g_2||=2.331e-09 acc=0.3184 + [FA] Ep 57: ||h_L||=2.743e+07 ||g_2||=2.310e-09 acc=0.3115 + [FA] Ep 58: ||h_L||=2.769e+07 ||g_2||=2.289e-09 acc=0.3066 + [FA] Ep 59: ||h_L||=2.796e+07 ||g_2||=2.303e-09 acc=0.3125 + [FA] Ep 60: ||h_L||=2.830e+07 ||g_2||=2.302e-09 acc=0.3281 + [FA] Ep 61: ||h_L||=2.852e+07 ||g_2||=2.303e-09 acc=0.3408 + [FA] Ep 62: ||h_L||=2.871e+07 ||g_2||=2.266e-09 acc=0.3203 + [FA] Ep 63: ||h_L||=2.888e+07 ||g_2||=2.271e-09 acc=0.3164 + [FA] Ep 64: ||h_L||=2.905e+07 ||g_2||=2.292e-09 acc=0.3389 + [FA] Ep 65: ||h_L||=2.927e+07 ||g_2||=2.285e-09 acc=0.3418 + [FA] Ep 66: ||h_L||=2.948e+07 ||g_2||=2.269e-09 acc=0.3398 + [FA] Ep 67: ||h_L||=2.968e+07 ||g_2||=2.278e-09 acc=0.3174 + [FA] Ep 68: ||h_L||=2.988e+07 ||g_2||=2.245e-09 acc=0.3184 + [FA] Ep 69: ||h_L||=3.009e+07 ||g_2||=2.228e-09 acc=0.3242 + [FA] Ep 70: ||h_L||=3.027e+07 ||g_2||=2.242e-09 acc=0.3213 + [FA] Ep 71: ||h_L||=3.048e+07 ||g_2||=2.215e-09 acc=0.3145 + [FA] Ep 72: ||h_L||=3.060e+07 ||g_2||=2.220e-09 acc=0.3242 + [FA] Ep 73: ||h_L||=3.075e+07 ||g_2||=2.203e-09 acc=0.3115 + [FA] Ep 74: ||h_L||=3.092e+07 ||g_2||=2.224e-09 acc=0.3320 + [FA] Ep 75: ||h_L||=3.101e+07 ||g_2||=2.209e-09 acc=0.3232 + [FA] Ep 76: ||h_L||=3.109e+07 ||g_2||=2.215e-09 acc=0.3281 + [FA] Ep 77: ||h_L||=3.118e+07 ||g_2||=2.200e-09 acc=0.3369 + [FA] Ep 78: ||h_L||=3.127e+07 ||g_2||=2.210e-09 acc=0.3291 + [FA] Ep 79: ||h_L||=3.140e+07 ||g_2||=2.183e-09 acc=0.3232 + [FA] Ep 80: ||h_L||=3.145e+07 ||g_2||=2.193e-09 acc=0.3301 + [FA] Ep 81: ||h_L||=3.150e+07 ||g_2||=2.208e-09 acc=0.3428 + [FA] Ep 82: ||h_L||=3.154e+07 ||g_2||=2.205e-09 acc=0.3418 + [FA] Ep 83: ||h_L||=3.160e+07 ||g_2||=2.190e-09 acc=0.3340 + [FA] Ep 84: ||h_L||=3.165e+07 ||g_2||=2.190e-09 acc=0.3340 + [FA] Ep 85: ||h_L||=3.170e+07 ||g_2||=2.177e-09 acc=0.3203 + [FA] Ep 86: ||h_L||=3.173e+07 ||g_2||=2.192e-09 acc=0.3311 + [FA] Ep 87: ||h_L||=3.178e+07 ||g_2||=2.186e-09 acc=0.3340 + [FA] Ep 88: ||h_L||=3.180e+07 ||g_2||=2.191e-09 acc=0.3369 + [FA] Ep 89: ||h_L||=3.182e+07 ||g_2||=2.191e-09 acc=0.3447 + [FA] Ep 90: ||h_L||=3.185e+07 ||g_2||=2.186e-09 acc=0.3350 + [FA] Ep 91: ||h_L||=3.186e+07 ||g_2||=2.187e-09 acc=0.3359 + [FA] Ep 92: ||h_L||=3.189e+07 ||g_2||=2.189e-09 acc=0.3389 + [FA] Ep 93: ||h_L||=3.189e+07 ||g_2||=2.190e-09 acc=0.3350 + [FA] Ep 94: ||h_L||=3.190e+07 ||g_2||=2.177e-09 acc=0.3350 + [FA] Ep 95: ||h_L||=3.191e+07 ||g_2||=2.182e-09 acc=0.3389 + [FA] Ep 96: ||h_L||=3.191e+07 ||g_2||=2.181e-09 acc=0.3398 + [FA] Ep 97: ||h_L||=3.191e+07 ||g_2||=2.182e-09 acc=0.3379 + [FA] Ep 98: ||h_L||=3.191e+07 ||g_2||=2.181e-09 acc=0.3379 + [FA] Ep 99: ||h_L||=3.191e+07 ||g_2||=2.181e-09 acc=0.3379 + [FA] Ep 100: ||h_L||=3.191e+07 ||g_2||=2.181e-09 acc=0.3379 +Saved: results/snapshot_evolution_v2/snapshot_fa_s42.json diff --git a/results/snapshot_fa_studentnet_vit.log b/results/snapshot_fa_studentnet_vit.log new file mode 100644 index 0000000..0570253 --- /dev/null +++ b/results/snapshot_fa_studentnet_vit.log @@ -0,0 +1,37 @@ +=== StudentNet FA === +StudentNet FA: alpha=1.0, L=4, d=128, seed=42 + [FA] Ep 0: acc=0.0845 + [FA] Ep 1: ||h_L||=1.231e+01 ||g||=3.495e-04 acc=0.5265 + [FA] Ep 5: ||h_L||=4.041e+01 ||g||=2.552e-04 acc=0.6975 + [FA] Ep 10: ||h_L||=8.444e+01 ||g||=1.786e-04 acc=0.6390 + [FA] Ep 15: ||h_L||=1.890e+02 ||g||=2.161e-04 acc=0.5950 + [FA] Ep 20: ||h_L||=2.788e+02 ||g||=2.619e-04 acc=0.5395 + [FA] Ep 25: ||h_L||=4.329e+02 ||g||=2.602e-04 acc=0.5250 + [FA] Ep 30: ||h_L||=6.099e+02 ||g||=2.943e-04 acc=0.4955 + [FA] Ep 35: ||h_L||=7.748e+02 ||g||=3.192e-04 acc=0.4345 + [FA] Ep 40: ||h_L||=9.199e+02 ||g||=3.218e-04 acc=0.3900 + [FA] Ep 45: ||h_L||=1.035e+03 ||g||=3.294e-04 acc=0.3930 + [FA] Ep 50: ||h_L||=1.131e+03 ||g||=3.222e-04 acc=0.3930 + [FA] Ep 55: ||h_L||=1.207e+03 ||g||=3.115e-04 acc=0.3980 + [FA] Ep 60: ||h_L||=1.263e+03 ||g||=3.292e-04 acc=0.3780 + [FA] Ep 65: ||h_L||=1.300e+03 ||g||=3.133e-04 acc=0.4165 + [FA] Ep 70: ||h_L||=1.321e+03 ||g||=3.109e-04 acc=0.3970 + [FA] Ep 75: ||h_L||=1.329e+03 ||g||=3.141e-04 acc=0.4005 + [FA] Ep 80: ||h_L||=1.330e+03 ||g||=3.108e-04 acc=0.4140 +Saved: results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json +=== ViT FA === + [FA-vit] Ep 0: acc=0.1230 + [FA-vit] Ep 1: ||h_L||=9.136e+03 ||g_L||=1.402e-07 acc=0.1963 + [FA-vit] Ep 5: ||h_L||=6.324e+04 ||g_L||=4.792e-08 acc=0.1289 + [FA-vit] Ep 10: ||h_L||=4.361e+05 ||g_L||=3.547e-09 acc=0.1982 + [FA-vit] Ep 15: ||h_L||=7.800e+05 ||g_L||=1.709e-09 acc=0.2012 + [FA-vit] Ep 20: ||h_L||=5.439e+05 ||g_L||=2.660e-09 acc=0.0889 + [FA-vit] Ep 25: ||h_L||=1.547e+07 ||g_L||=7.764e-11 acc=0.1797 + [FA-vit] Ep 30: ||h_L||=3.427e+07 ||g_L||=3.899e-11 acc=0.1748 + [FA-vit] Ep 35: ||h_L||=1.976e+06 ||g_L||=9.433e-10 acc=0.1035 + [FA-vit] Ep 40: ||h_L||=2.438e+06 ||g_L||=8.750e-10 acc=0.1084 + [FA-vit] Ep 45: ||h_L||=2.888e+06 ||g_L||=9.925e-10 acc=0.1064 + [FA-vit] Ep 50: ||h_L||=3.180e+06 ||g_L||=9.062e-10 acc=0.1113 + [FA-vit] Ep 55: ||h_L||=3.312e+06 ||g_L||=9.031e-10 acc=0.1182 + [FA-vit] Ep 60: ||h_L||=3.335e+06 ||g_L||=9.009e-10 acc=0.1172 +Saved: results/snapshot_vit_v1/snapshot_fa_vit_s42.json diff --git a/results/snapshot_no_outln_v1/run_s123.log b/results/snapshot_no_outln_v1/run_s123.log new file mode 100644 index 0000000..a946d6d --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s123.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=123 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.791e+00 ||g||=5.394e-04 acc=0.1016 + [BP-noLN] Ep 1: ||h_L||=3.456e+01 ||g||=1.382e-04 acc=0.4355 + [BP-noLN] Ep 5: ||h_L||=5.193e+01 ||g||=9.721e-05 acc=0.5049 + [BP-noLN] Ep 10: ||h_L||=6.115e+01 ||g||=8.778e-05 acc=0.5430 + [BP-noLN] Ep 15: ||h_L||=6.668e+01 ||g||=8.387e-05 acc=0.5586 + [BP-noLN] Ep 20: ||h_L||=6.880e+01 ||g||=8.997e-05 acc=0.5176 + [BP-noLN] Ep 25: ||h_L||=7.092e+01 ||g||=8.184e-05 acc=0.5850 + [BP-noLN] Ep 30: ||h_L||=7.285e+01 ||g||=7.960e-05 acc=0.5693 + [BP-noLN] Ep 35: ||h_L||=7.522e+01 ||g||=8.247e-05 acc=0.5869 + [BP-noLN] Ep 40: ||h_L||=7.551e+01 ||g||=8.186e-05 acc=0.6201 + [BP-noLN] Ep 45: ||h_L||=7.421e+01 ||g||=8.565e-05 acc=0.5918 + [BP-noLN] Ep 50: ||h_L||=7.473e+01 ||g||=9.094e-05 acc=0.5840 + [BP-noLN] Ep 55: ||h_L||=7.556e+01 ||g||=8.896e-05 acc=0.6143 + [BP-noLN] Ep 60: ||h_L||=7.545e+01 ||g||=9.015e-05 acc=0.6396 + [BP-noLN] Ep 65: ||h_L||=7.509e+01 ||g||=9.009e-05 acc=0.6455 + [BP-noLN] Ep 70: ||h_L||=7.466e+01 ||g||=9.170e-05 acc=0.6230 + [BP-noLN] Ep 75: ||h_L||=7.410e+01 ||g||=1.030e-04 acc=0.6455 + [BP-noLN] Ep 80: ||h_L||=7.313e+01 ||g||=1.043e-04 acc=0.6309 + [BP-noLN] Ep 85: ||h_L||=7.275e+01 ||g||=1.035e-04 acc=0.6396 + [BP-noLN] Ep 90: ||h_L||=7.262e+01 ||g||=1.079e-04 acc=0.6445 + [BP-noLN] Ep 95: ||h_L||=7.256e+01 ||g||=1.087e-04 acc=0.6377 + [BP-noLN] Ep 100: ||h_L||=7.248e+01 ||g||=1.082e-04 acc=0.6396 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.791e+00 ||g||=5.394e-04 acc=0.1016 + [DFA-noLN] Ep 1: ||h_L||=1.231e+03 ||g||=6.461e-04 acc=0.2129 γ=0.0130 + [DFA-noLN] Ep 5: ||h_L||=1.290e+04 ||g||=7.423e-04 acc=0.2080 γ=-0.0053 + [DFA-noLN] Ep 10: ||h_L||=6.970e+04 ||g||=7.399e-04 acc=0.2031 γ=-0.0038 + [DFA-noLN] Ep 15: ||h_L||=2.144e+05 ||g||=7.383e-04 acc=0.1807 γ=0.0158 + [DFA-noLN] Ep 20: ||h_L||=5.289e+05 ||g||=7.379e-04 acc=0.2295 γ=0.0205 + [DFA-noLN] Ep 25: ||h_L||=1.047e+06 ||g||=7.582e-04 acc=0.1729 γ=-0.0056 + [DFA-noLN] Ep 30: ||h_L||=1.809e+06 ||g||=7.676e-04 acc=0.1934 γ=0.0171 + [DFA-noLN] Ep 35: ||h_L||=2.741e+06 ||g||=7.757e-04 acc=0.1504 γ=0.0181 + [DFA-noLN] Ep 40: ||h_L||=3.868e+06 ||g||=7.547e-04 acc=0.1377 γ=0.0036 + [DFA-noLN] Ep 45: ||h_L||=5.087e+06 ||g||=7.677e-04 acc=0.2246 γ=0.0148 + [DFA-noLN] Ep 50: ||h_L||=6.378e+06 ||g||=7.632e-04 acc=0.2002 γ=-0.0010 + [DFA-noLN] Ep 55: ||h_L||=7.652e+06 ||g||=7.547e-04 acc=0.0908 γ=0.0198 + [DFA-noLN] Ep 60: ||h_L||=8.786e+06 ||g||=7.196e-04 acc=0.1670 γ=0.0255 + [DFA-noLN] Ep 65: ||h_L||=9.795e+06 ||g||=7.598e-04 acc=0.1699 γ=0.0191 + [DFA-noLN] Ep 70: ||h_L||=1.063e+07 ||g||=7.313e-04 acc=0.2422 γ=0.0235 + [DFA-noLN] Ep 75: ||h_L||=1.127e+07 ||g||=7.316e-04 acc=0.2490 γ=0.0445 + [DFA-noLN] Ep 80: ||h_L||=1.173e+07 ||g||=7.425e-04 acc=0.1904 γ=0.0283 + [DFA-noLN] Ep 85: ||h_L||=1.203e+07 ||g||=7.233e-04 acc=0.2500 γ=0.0402 + [DFA-noLN] Ep 90: ||h_L||=1.216e+07 ||g||=7.064e-04 acc=0.3096 γ=0.0335 + [DFA-noLN] Ep 95: ||h_L||=1.218e+07 ||g||=7.087e-04 acc=0.2920 γ=0.0295 + [DFA-noLN] Ep 100: ||h_L||=1.218e+07 ||g||=7.086e-04 acc=0.3135 γ=0.0273 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s123.json diff --git a/results/snapshot_no_outln_v1/run_s42.log b/results/snapshot_no_outln_v1/run_s42.log new file mode 100644 index 0000000..81d2970 --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s42.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=42 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.893e+00 ||g||=5.483e-04 acc=0.1123 + [BP-noLN] Ep 1: ||h_L||=3.310e+01 ||g||=1.421e-04 acc=0.4229 + [BP-noLN] Ep 5: ||h_L||=5.238e+01 ||g||=9.984e-05 acc=0.5010 + [BP-noLN] Ep 10: ||h_L||=6.111e+01 ||g||=8.972e-05 acc=0.5518 + [BP-noLN] Ep 15: ||h_L||=6.640e+01 ||g||=8.892e-05 acc=0.5195 + [BP-noLN] Ep 20: ||h_L||=6.977e+01 ||g||=8.730e-05 acc=0.5488 + [BP-noLN] Ep 25: ||h_L||=7.080e+01 ||g||=8.598e-05 acc=0.5547 + [BP-noLN] Ep 30: ||h_L||=7.441e+01 ||g||=8.621e-05 acc=0.5723 + [BP-noLN] Ep 35: ||h_L||=7.537e+01 ||g||=7.991e-05 acc=0.6025 + [BP-noLN] Ep 40: ||h_L||=7.552e+01 ||g||=8.747e-05 acc=0.5859 + [BP-noLN] Ep 45: ||h_L||=7.571e+01 ||g||=8.227e-05 acc=0.5918 + [BP-noLN] Ep 50: ||h_L||=7.514e+01 ||g||=9.716e-05 acc=0.5811 + [BP-noLN] Ep 55: ||h_L||=7.693e+01 ||g||=9.600e-05 acc=0.6006 + [BP-noLN] Ep 60: ||h_L||=7.581e+01 ||g||=9.903e-05 acc=0.6113 + [BP-noLN] Ep 65: ||h_L||=7.549e+01 ||g||=1.009e-04 acc=0.6221 + [BP-noLN] Ep 70: ||h_L||=7.530e+01 ||g||=1.088e-04 acc=0.6074 + [BP-noLN] Ep 75: ||h_L||=7.454e+01 ||g||=1.082e-04 acc=0.6143 + [BP-noLN] Ep 80: ||h_L||=7.426e+01 ||g||=1.162e-04 acc=0.6123 + [BP-noLN] Ep 85: ||h_L||=7.353e+01 ||g||=1.161e-04 acc=0.6084 + [BP-noLN] Ep 90: ||h_L||=7.339e+01 ||g||=1.168e-04 acc=0.6123 + [BP-noLN] Ep 95: ||h_L||=7.308e+01 ||g||=1.164e-04 acc=0.6143 + [BP-noLN] Ep 100: ||h_L||=7.297e+01 ||g||=1.158e-04 acc=0.6162 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.893e+00 ||g||=5.483e-04 acc=0.1123 + [DFA-noLN] Ep 1: ||h_L||=1.560e+03 ||g||=6.859e-04 acc=0.1494 γ=0.0084 + [DFA-noLN] Ep 5: ||h_L||=1.050e+04 ||g||=7.522e-04 acc=0.1748 γ=-0.0063 + [DFA-noLN] Ep 10: ||h_L||=2.200e+04 ||g||=7.641e-04 acc=0.1445 γ=-0.0167 + [DFA-noLN] Ep 15: ||h_L||=1.004e+05 ||g||=7.608e-04 acc=0.1738 γ=-0.0118 + [DFA-noLN] Ep 20: ||h_L||=3.150e+05 ||g||=7.782e-04 acc=0.2070 γ=0.0027 + [DFA-noLN] Ep 25: ||h_L||=6.817e+05 ||g||=7.884e-04 acc=0.1572 γ=0.0340 + [DFA-noLN] Ep 30: ||h_L||=1.298e+06 ||g||=7.771e-04 acc=0.1299 γ=0.0393 + [DFA-noLN] Ep 35: ||h_L||=2.143e+06 ||g||=7.980e-04 acc=0.0996 γ=0.0196 + [DFA-noLN] Ep 40: ||h_L||=3.180e+06 ||g||=7.691e-04 acc=0.1016 γ=-0.0085 + [DFA-noLN] Ep 45: ||h_L||=4.347e+06 ||g||=7.934e-04 acc=0.1582 γ=0.0262 + [DFA-noLN] Ep 50: ||h_L||=5.552e+06 ||g||=7.869e-04 acc=0.2197 γ=0.0165 + [DFA-noLN] Ep 55: ||h_L||=6.742e+06 ||g||=7.851e-04 acc=0.1885 γ=0.0046 + [DFA-noLN] Ep 60: ||h_L||=7.801e+06 ||g||=7.600e-04 acc=0.1572 γ=0.0045 + [DFA-noLN] Ep 65: ||h_L||=8.775e+06 ||g||=7.795e-04 acc=0.2031 γ=0.0088 + [DFA-noLN] Ep 70: ||h_L||=9.556e+06 ||g||=7.968e-04 acc=0.1836 γ=0.0093 + [DFA-noLN] Ep 75: ||h_L||=1.016e+07 ||g||=7.656e-04 acc=0.2490 γ=0.0168 + [DFA-noLN] Ep 80: ||h_L||=1.064e+07 ||g||=7.633e-04 acc=0.2764 γ=0.0198 + [DFA-noLN] Ep 85: ||h_L||=1.095e+07 ||g||=7.466e-04 acc=0.2773 γ=0.0195 + [DFA-noLN] Ep 90: ||h_L||=1.107e+07 ||g||=7.453e-04 acc=0.2695 γ=0.0131 + [DFA-noLN] Ep 95: ||h_L||=1.113e+07 ||g||=7.446e-04 acc=0.3105 γ=0.0146 + [DFA-noLN] Ep 100: ||h_L||=1.113e+07 ||g||=7.392e-04 acc=0.3320 γ=0.0164 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s42.json diff --git a/results/snapshot_no_outln_v1/run_s456.log b/results/snapshot_no_outln_v1/run_s456.log new file mode 100644 index 0000000..a0a3bd0 --- /dev/null +++ b/results/snapshot_no_outln_v1/run_s456.log @@ -0,0 +1,51 @@ +NO-OUT_LN VARIANT: depth=4, d_hidden=256, epochs=100, seed=456 + +=== BP training (NO out_ln) === + [BP-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918 + [BP-noLN] Ep 1: ||h_L||=3.410e+01 ||g||=1.500e-04 acc=0.4365 + [BP-noLN] Ep 5: ||h_L||=5.250e+01 ||g||=1.052e-04 acc=0.4961 + [BP-noLN] Ep 10: ||h_L||=6.330e+01 ||g||=8.751e-05 acc=0.5596 + [BP-noLN] Ep 15: ||h_L||=6.619e+01 ||g||=8.857e-05 acc=0.5215 + [BP-noLN] Ep 20: ||h_L||=7.009e+01 ||g||=8.610e-05 acc=0.5420 + [BP-noLN] Ep 25: ||h_L||=7.285e+01 ||g||=8.470e-05 acc=0.5723 + [BP-noLN] Ep 30: ||h_L||=7.493e+01 ||g||=8.152e-05 acc=0.5938 + [BP-noLN] Ep 35: ||h_L||=7.640e+01 ||g||=7.781e-05 acc=0.6074 + [BP-noLN] Ep 40: ||h_L||=7.799e+01 ||g||=8.443e-05 acc=0.5938 + [BP-noLN] Ep 45: ||h_L||=7.734e+01 ||g||=7.914e-05 acc=0.6143 + [BP-noLN] Ep 50: ||h_L||=7.667e+01 ||g||=8.950e-05 acc=0.5996 + [BP-noLN] Ep 55: ||h_L||=7.591e+01 ||g||=9.021e-05 acc=0.6201 + [BP-noLN] Ep 60: ||h_L||=7.667e+01 ||g||=8.730e-05 acc=0.6338 + [BP-noLN] Ep 65: ||h_L||=7.629e+01 ||g||=9.670e-05 acc=0.6230 + [BP-noLN] Ep 70: ||h_L||=7.612e+01 ||g||=9.637e-05 acc=0.6260 + [BP-noLN] Ep 75: ||h_L||=7.544e+01 ||g||=9.639e-05 acc=0.6338 + [BP-noLN] Ep 80: ||h_L||=7.434e+01 ||g||=9.999e-05 acc=0.6455 + [BP-noLN] Ep 85: ||h_L||=7.429e+01 ||g||=1.013e-04 acc=0.6348 + [BP-noLN] Ep 90: ||h_L||=7.381e+01 ||g||=1.076e-04 acc=0.6348 + [BP-noLN] Ep 95: ||h_L||=7.380e+01 ||g||=1.084e-04 acc=0.6436 + [BP-noLN] Ep 100: ||h_L||=7.373e+01 ||g||=1.088e-04 acc=0.6465 + +=== DFA training (NO out_ln) === + [DFA-noLN] Ep 0: ||h_L||=8.890e+00 ||g||=5.542e-04 acc=0.0918 + [DFA-noLN] Ep 1: ||h_L||=1.507e+03 ||g||=6.424e-04 acc=0.2246 γ=0.0136 + [DFA-noLN] Ep 5: ||h_L||=1.140e+04 ||g||=7.475e-04 acc=0.2314 γ=-0.0000 + [DFA-noLN] Ep 10: ||h_L||=2.845e+04 ||g||=7.444e-04 acc=0.1895 γ=-0.0067 + [DFA-noLN] Ep 15: ||h_L||=8.676e+04 ||g||=7.381e-04 acc=0.2549 γ=0.0039 + [DFA-noLN] Ep 20: ||h_L||=2.707e+05 ||g||=7.761e-04 acc=0.1670 γ=0.0171 + [DFA-noLN] Ep 25: ||h_L||=6.628e+05 ||g||=7.894e-04 acc=0.1992 γ=0.0390 + [DFA-noLN] Ep 30: ||h_L||=1.245e+06 ||g||=7.944e-04 acc=0.1963 γ=0.0162 + [DFA-noLN] Ep 35: ||h_L||=2.131e+06 ||g||=8.014e-04 acc=0.1904 γ=0.0128 + [DFA-noLN] Ep 40: ||h_L||=3.242e+06 ||g||=7.965e-04 acc=0.1855 γ=0.0227 + [DFA-noLN] Ep 45: ||h_L||=4.568e+06 ||g||=8.172e-04 acc=0.1807 γ=0.0340 + [DFA-noLN] Ep 50: ||h_L||=6.031e+06 ||g||=8.070e-04 acc=0.1133 γ=0.0064 + [DFA-noLN] Ep 55: ||h_L||=7.447e+06 ||g||=7.821e-04 acc=0.1924 γ=0.0273 + [DFA-noLN] Ep 60: ||h_L||=8.862e+06 ||g||=8.033e-04 acc=0.1650 γ=0.0210 + [DFA-noLN] Ep 65: ||h_L||=1.008e+07 ||g||=8.274e-04 acc=0.1533 γ=0.0124 + [DFA-noLN] Ep 70: ||h_L||=1.111e+07 ||g||=7.999e-04 acc=0.2148 γ=0.0337 + [DFA-noLN] Ep 75: ||h_L||=1.197e+07 ||g||=7.703e-04 acc=0.1953 γ=0.0403 + [DFA-noLN] Ep 80: ||h_L||=1.256e+07 ||g||=7.954e-04 acc=0.1445 γ=-0.0076 + [DFA-noLN] Ep 85: ||h_L||=1.292e+07 ||g||=7.205e-04 acc=0.2607 γ=0.0257 + [DFA-noLN] Ep 90: ||h_L||=1.306e+07 ||g||=7.565e-04 acc=0.2402 γ=0.0119 + [DFA-noLN] Ep 95: ||h_L||=1.310e+07 ||g||=7.185e-04 acc=0.3164 γ=0.0157 + [DFA-noLN] Ep 100: ||h_L||=1.310e+07 ||g||=7.178e-04 acc=0.3359 γ=0.0173 + +Saved results/snapshot_no_outln_v1/snapshot_noLN_s456.json diff --git a/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json new file mode 100644 index 0000000..7e5cb37 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json @@ -0,0 +1,1824 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "acc_eval": 0.1123046875, + "epoch": 0 + }, + { + "hidden_norms": [ + 736.34716796875, + 1637.1044921875, + 2033.1922607421875, + 2161.380859375, + 2126.18505859375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0006836718530394137, + 0.0006813183426856995, + 0.0006814387743361294, + 0.0006832550279796124, + 0.0006794488872401416 + ], + "acc_eval": 0.1953125, + "epoch": 1 + }, + { + "hidden_norms": [ + 1106.3868408203125, + 2963.552001953125, + 4087.33837890625, + 4421.4921875, + 4265.1083984375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007476353785023093, + 0.0007440777844749391, + 0.0007443943759426475, + 0.0007477496401406825, + 0.0007366884965449572 + ], + "acc_eval": 0.1044921875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1371.9425048828125, + 4214.05078125, + 6238.47265625, + 6697.2333984375, + 6399.22314453125 + ], + "bp_grad_norms_per_sample_med": [ + 0.000730870058760047, + 0.00072717375587672, + 0.0007270713686011732, + 0.0007290731882676482, + 0.0007233614451251924 + ], + "acc_eval": 0.1943359375, + "epoch": 3 + }, + { + "hidden_norms": [ + 1574.7962646484375, + 4805.0556640625, + 7044.64599609375, + 7593.78955078125, + 7215.32763671875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007098641362972558, + 0.0007034889422357082, + 0.0007031699060462415, + 0.0007120345253497362, + 0.000694308546371758 + ], + "acc_eval": 0.2451171875, + "epoch": 4 + }, + { + "hidden_norms": [ + 1726.088623046875, + 6184.34521484375, + 9521.791015625, + 10387.7236328125, + 9721.431640625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007400272879749537, + 0.0007343650795519352, + 0.0007334973197430372, + 0.0007343514007516205, + 0.0007319966680370271 + ], + "acc_eval": 0.212890625, + "epoch": 5 + }, + { + "hidden_norms": [ + 1902.689697265625, + 7697.52197265625, + 12328.0595703125, + 13597.1787109375, + 12504.158203125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007165716378949583, + 0.0007126733544282615, + 0.0007124089752323925, + 0.0007126083364710212, + 0.0007107863784767687 + ], + "acc_eval": 0.15625, + "epoch": 6 + }, + { + "hidden_norms": [ + 2069.750244140625, + 10379.2958984375, + 16444.7421875, + 18267.94921875, + 16595.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007099996437318623, + 0.0007088935235515237, + 0.0007090346189215779, + 0.000710709486156702, + 0.0007023006328381598 + ], + "acc_eval": 0.154296875, + "epoch": 7 + }, + { + "hidden_norms": [ + 2226.40673828125, + 12703.916015625, + 20184.30859375, + 22453.73828125, + 20183.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.00072157580871135, + 0.0007210742915049195, + 0.0007212630589492619, + 0.0007244180305860937, + 0.0007163899717852473 + ], + "acc_eval": 0.2236328125, + "epoch": 8 + }, + { + "hidden_norms": [ + 2289.455078125, + 15611.2138671875, + 24559.412109375, + 27336.787109375, + 24451.6796875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007243232685141265, + 0.0007221215637400746, + 0.0007219284889288247, + 0.0007259267731569707, + 0.0007173537742346525 + ], + "acc_eval": 0.169921875, + "epoch": 9 + }, + { + "hidden_norms": [ + 2396.09814453125, + 19678.587890625, + 30417.08203125, + 34140.70703125, + 30261.052734375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007124242256395519, + 0.0007074667955748737, + 0.0007074963650666177, + 0.0007131542661227286, + 0.0007022957433946431 + ], + "acc_eval": 0.1904296875, + "epoch": 10 + }, + { + "hidden_norms": [ + 2467.864013671875, + 24019.642578125, + 41156.921875, + 46706.38671875, + 41256.71484375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007333463290706277, + 0.0007277126424014568, + 0.0007268521003425121, + 0.000731462670955807, + 0.0007225224399007857 + ], + "acc_eval": 0.169921875, + "epoch": 11 + }, + { + "hidden_norms": [ + 2518.561767578125, + 28957.451171875, + 55737.69140625, + 64112.609375, + 56246.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007202349370345473, + 0.0007073598098941147, + 0.0007049349951557815, + 0.0007059182389639318, + 0.0007044971571303904 + ], + "acc_eval": 0.1513671875, + "epoch": 12 + }, + { + "hidden_norms": [ + 2614.843994140625, + 34279.15625, + 74158.109375, + 86073.96875, + 75187.59375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007299556746147573, + 0.0007100331713445485, + 0.0007101728115230799, + 0.0007166104041971266, + 0.0007030466804280877 + ], + "acc_eval": 0.24609375, + "epoch": 13 + }, + { + "hidden_norms": [ + 2697.871337890625, + 41263.5390625, + 96222.8984375, + 112901.9765625, + 98551.3046875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007336065755225718, + 0.0007151410100050271, + 0.0007150733144953847, + 0.0007166287978179753, + 0.0007151660392992198 + ], + "acc_eval": 0.134765625, + "epoch": 14 + }, + { + "hidden_norms": [ + 2815.983154296875, + 53842.3828125, + 126185.5625, + 149526.796875, + 130144.4765625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007365003693848848, + 0.0007177364313974977, + 0.0007168670417740941, + 0.000717108603566885, + 0.0007130720769055188 + ], + "acc_eval": 0.150390625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2928.448974609375, + 65162.98046875, + 153909.296875, + 184005.875, + 159483.03125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007613440393470228, + 0.000720723532140255, + 0.000720796815585345, + 0.0007208258030004799, + 0.0007211563643068075 + ], + "acc_eval": 0.166015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 2970.975341796875, + 76176.9609375, + 179093.75, + 216167.875, + 186723.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007602480472996831, + 0.0007191941258497536, + 0.0007163456757552922, + 0.0007164765265770257, + 0.0007142137037590146 + ], + "acc_eval": 0.1796875, + "epoch": 17 + }, + { + "hidden_norms": [ + 3078.336181640625, + 91839.40625, + 215980.015625, + 263515.15625, + 227071.515625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007584959384985268, + 0.0007150565506890416, + 0.0007151922909542918, + 0.000715585716534406, + 0.0007152389152906835 + ], + "acc_eval": 0.1767578125, + "epoch": 18 + }, + { + "hidden_norms": [ + 3202.803466796875, + 104358.6875, + 248325.390625, + 305395.84375, + 262365.46875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007867171661928296, + 0.0007155268103815615, + 0.0007155817584134638, + 0.0007157608633860946, + 0.0007155768107622862 + ], + "acc_eval": 0.138671875, + "epoch": 19 + }, + { + "hidden_norms": [ + 3282.27490234375, + 117747.359375, + 284217.3125, + 351018.15625, + 300903.65625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007691550417803228, + 0.0007147297146730125, + 0.0007147309370338917, + 0.0007150261080823839, + 0.0007147534633986652 + ], + "acc_eval": 0.1923828125, + "epoch": 20 + }, + { + "hidden_norms": [ + 3394.945556640625, + 129443.9765625, + 317078.65625, + 393509.375, + 336658.40625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008442914695478976, + 0.0007179519161581993, + 0.0007190873729996383, + 0.000723545381333679, + 0.0007175213540904224 + ], + "acc_eval": 0.1376953125, + "epoch": 21 + }, + { + "hidden_norms": [ + 3484.2763671875, + 140426.171875, + 355086.84375, + 443148.09375, + 378501.53125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007702927687205374, + 0.0006826652679592371, + 0.0006794629734940827, + 0.0006826536264270544, + 0.0006794703076593578 + ], + "acc_eval": 0.19140625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3529.414306640625, + 153612.265625, + 393522.9375, + 493183.03125, + 421284.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008731107809580863, + 0.0007047304534353316, + 0.0007038630428723991, + 0.000708943116478622, + 0.000701444165315479 + ], + "acc_eval": 0.16796875, + "epoch": 23 + }, + { + "hidden_norms": [ + 3604.90283203125, + 165405.75, + 423586.46875, + 533219.375, + 454992.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008110221242532134, + 0.0006812610663473606, + 0.0006812110659666359, + 0.0006817537359893322, + 0.0006813214858993888 + ], + "acc_eval": 0.20703125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3761.85400390625, + 178944.296875, + 464984.875, + 587869.375, + 501438.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008038324886001647, + 0.0006578225293196738, + 0.0006502956384792924, + 0.000664222112391144, + 0.0006502254982478917 + ], + "acc_eval": 0.240234375, + "epoch": 25 + }, + { + "hidden_norms": [ + 3818.5869140625, + 193167.4375, + 505599.375, + 643764.4375, + 550033.3125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007956585614010692, + 0.0007038708426989615, + 0.0007025190279819071, + 0.0007078333292156458, + 0.0006988184759393334 + ], + "acc_eval": 0.185546875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3924.1787109375, + 207801.1875, + 548741.125, + 701043.0625, + 599520.4375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009222823427990079, + 0.000673642847687006, + 0.0006724554114043713, + 0.0006726986612193286, + 0.0006725445855408907 + ], + "acc_eval": 0.216796875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4061.806884765625, + 222595.921875, + 590807.5, + 755718.75, + 646775.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008092334610410035, + 0.0007093537133187056, + 0.0007078479393385351, + 0.0007069098646752536, + 0.0007029378321021795 + ], + "acc_eval": 0.2158203125, + "epoch": 28 + }, + { + "hidden_norms": [ + 4216.11083984375, + 237549.296875, + 636429.5625, + 816954.9375, + 699524.9375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008620031294412911, + 0.0007326522027142346, + 0.00072627910412848, + 0.000725903722923249, + 0.0007269763154909015 + ], + "acc_eval": 0.1533203125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4319.05029296875, + 251667.5, + 681409.75, + 874567.9375, + 748820.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008448463049717247, + 0.0007160686072893441, + 0.000714016379788518, + 0.0007141274982132018, + 0.0007095346227288246 + ], + "acc_eval": 0.1591796875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4387.8330078125, + 268470.375, + 733153.125, + 943456.375, + 808793.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009849616326391697, + 0.0007160623208619654, + 0.0007154300110414624, + 0.0007152247708290815, + 0.0007160453242249787 + ], + "acc_eval": 0.1884765625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4495.54638671875, + 291274.59375, + 806698.75, + 1039374.875, + 892062.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008646573405712843, + 0.000731874315533787, + 0.0007177238585427403, + 0.0007205329020507634, + 0.0007192457560449839 + ], + "acc_eval": 0.17578125, + "epoch": 32 + }, + { + "hidden_norms": [ + 4596.96337890625, + 305228.46875, + 848072.5625, + 1092268.625, + 937583.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009474663529545069, + 0.0007221641135402024, + 0.000721680698916316, + 0.0007284134044311941, + 0.0007212713244371116 + ], + "acc_eval": 0.171875, + "epoch": 33 + }, + { + "hidden_norms": [ + 4724.111328125, + 321366.5, + 891238.9375, + 1149886.25, + 987910.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009131877450272441, + 0.0007397676818072796, + 0.0007398735033348203, + 0.0007397927111014724, + 0.0007406016811728477 + ], + "acc_eval": 0.125, + "epoch": 34 + }, + { + "hidden_norms": [ + 4865.970703125, + 344027.15625, + 946722.0625, + 1219714.625, + 1049445.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001010064734145999, + 0.0007341124583035707, + 0.0007336883572861552, + 0.0007345521007664502, + 0.0007338698487728834 + ], + "acc_eval": 0.119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5003.3857421875, + 373410.21875, + 1026535.0625, + 1321456.25, + 1139824.625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010555180488154292, + 0.0007112861494533718, + 0.0007111895247362554, + 0.0007112334715202451, + 0.000711193191818893 + ], + "acc_eval": 0.1591796875, + "epoch": 36 + }, + { + "hidden_norms": [ + 5121.19287109375, + 405646.9375, + 1111111.125, + 1430716.625, + 1237074.375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010308363707736135, + 0.0007563655963167548, + 0.0007560031372122467, + 0.000755665882024914, + 0.0007561628590337932 + ], + "acc_eval": 0.134765625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5212.7294921875, + 434054.15625, + 1180238.125, + 1518019.875, + 1314350.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001035128254443407, + 0.0007314062095247209, + 0.0007304889149963856, + 0.0007291524088941514, + 0.0007313747191801667 + ], + "acc_eval": 0.140625, + "epoch": 38 + }, + { + "hidden_norms": [ + 5322.74951171875, + 462000.6875, + 1248006.75, + 1606243.125, + 1392563.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009023830061778426, + 0.000720554031431675, + 0.0007195135112851858, + 0.0007197313825599849, + 0.0007196948863565922 + ], + "acc_eval": 0.1708984375, + "epoch": 39 + }, + { + "hidden_norms": [ + 5453.89111328125, + 498941.0625, + 1343521.0, + 1731177.375, + 1504101.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010444134240970016, + 0.0007362678297795355, + 0.0007352089160121977, + 0.0007340405718423426, + 0.0007357052527368069 + ], + "acc_eval": 0.1328125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5515.6982421875, + 529817.75, + 1409505.625, + 1816151.0, + 1580539.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011280628386884928, + 0.0007231750059872866, + 0.0007211649208329618, + 0.000721275107935071, + 0.0007212632917799056 + ], + "acc_eval": 0.1611328125, + "epoch": 41 + }, + { + "hidden_norms": [ + 5617.26513671875, + 567492.4375, + 1498097.5, + 1931607.875, + 1684206.875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010544253746047616, + 0.0007354306289926171, + 0.0007348860381171107, + 0.0007349851075559855, + 0.0007350810337811708 + ], + "acc_eval": 0.1416015625, + "epoch": 42 + }, + { + "hidden_norms": [ + 5740.7978515625, + 596215.625, + 1561745.25, + 2014107.25, + 1758526.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010764201870188117, + 0.0007244387525133789, + 0.000723967794328928, + 0.000724096957128495, + 0.0007241644198074937 + ], + "acc_eval": 0.19921875, + "epoch": 43 + }, + { + "hidden_norms": [ + 5808.19677734375, + 630780.3125, + 1636034.875, + 2109305.75, + 1845552.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010526466649025679, + 0.0007206913433037698, + 0.0007207048474811018, + 0.0007211468764580786, + 0.0007207895396277308 + ], + "acc_eval": 0.173828125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5868.3583984375, + 673578.625, + 1729325.25, + 2227518.0, + 1953361.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009479392319917679, + 0.0007091389270499349, + 0.0007090644794516265, + 0.0007082624360918999, + 0.0007085782708600163 + ], + "acc_eval": 0.1923828125, + "epoch": 45 + }, + { + "hidden_norms": [ + 5953.82421875, + 720273.0, + 1840695.5, + 2372038.0, + 2084658.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0014002618845552206, + 0.0007315247785300016, + 0.0007256051758304238, + 0.0007254919619299471, + 0.000725599646102637 + ], + "acc_eval": 0.17578125, + "epoch": 46 + }, + { + "hidden_norms": [ + 6054.7861328125, + 758000.6875, + 1930354.375, + 2488163.75, + 2190582.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001109408913180232, + 0.0007018125616014004, + 0.0007016566814854741, + 0.000701890152413398, + 0.0007018494652584195 + ], + "acc_eval": 0.203125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6155.0859375, + 790443.0, + 2009565.875, + 2590829.25, + 2285268.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010253023356199265, + 0.0007347314967773855, + 0.0007304528844542801, + 0.0007322027231566608, + 0.0007312395609915257 + ], + "acc_eval": 0.154296875, + "epoch": 48 + }, + { + "hidden_norms": [ + 6216.64453125, + 830678.125, + 2088773.5, + 2691122.0, + 2376731.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010403504129499197, + 0.0006902964669279754, + 0.0006906419876031578, + 0.0006905900663696229, + 0.0006906461785547435 + ], + "acc_eval": 0.1591796875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6252.98486328125, + 867790.1875, + 2159729.75, + 2781409.5, + 2460902.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011370684951543808, + 0.0007390088285319507, + 0.0007305812323465943, + 0.0007310720975510776, + 0.0007304322207346559 + ], + "acc_eval": 0.15234375, + "epoch": 50 + }, + { + "hidden_norms": [ + 6294.51611328125, + 897267.5625, + 2218282.5, + 2858224.75, + 2530432.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0013790406519547105, + 0.0007320911972783506, + 0.0007304649334400892, + 0.0007293879170902073, + 0.0007303770980797708 + ], + "acc_eval": 0.1591796875, + "epoch": 51 + }, + { + "hidden_norms": [ + 6312.2314453125, + 935570.375, + 2299086.0, + 2963619.0, + 2627515.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000999285257421434, + 0.0007227054447866976, + 0.0007246703025884926, + 0.0007245387532748282, + 0.0007243558065965772 + ], + "acc_eval": 0.20703125, + "epoch": 52 + }, + { + "hidden_norms": [ + 6387.30322265625, + 977101.125, + 2387243.0, + 3077676.25, + 2733147.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001396833686158061, + 0.0007110408041626215, + 0.0007093287422321737, + 0.000708233390469104, + 0.0007085108081810176 + ], + "acc_eval": 0.1787109375, + "epoch": 53 + }, + { + "hidden_norms": [ + 6406.59033203125, + 1011753.1875, + 2450391.25, + 3158275.0, + 2807055.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0012408416951075196, + 0.0007304692408069968, + 0.000724659999832511, + 0.0007247650064527988, + 0.0007249858463183045 + ], + "acc_eval": 0.130859375, + "epoch": 54 + }, + { + "hidden_norms": [ + 6396.32080078125, + 1051044.375, + 2521085.5, + 3249326.75, + 2890642.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010854896390810609, + 0.0006957638543099165, + 0.0006896257400512695, + 0.0006964386557228863, + 0.0006897017010487616 + ], + "acc_eval": 0.234375, + "epoch": 55 + }, + { + "hidden_norms": [ + 6413.91357421875, + 1083474.5, + 2597945.5, + 3348271.5, + 2981405.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.00098806235473603, + 0.000719150179065764, + 0.0007170068565756083, + 0.0007178731029853225, + 0.0007173708290793002 + ], + "acc_eval": 0.205078125, + "epoch": 56 + }, + { + "hidden_norms": [ + 6406.4228515625, + 1124429.875, + 2675529.5, + 3447474.25, + 3073241.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001149638439528644, + 0.0007225789595395327, + 0.0007212197524495423, + 0.0007210947806015611, + 0.0007211659685708582 + ], + "acc_eval": 0.1494140625, + "epoch": 57 + }, + { + "hidden_norms": [ + 6443.423828125, + 1166184.375, + 2758561.25, + 3551879.75, + 3171214.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001115654013119638, + 0.000685695675201714, + 0.0006846366450190544, + 0.0006861463189125061, + 0.0006862673326395452 + ], + "acc_eval": 0.2490234375, + "epoch": 58 + }, + { + "hidden_norms": [ + 6477.5, + 1208826.0, + 2842194.75, + 3654862.0, + 3267617.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.000923235435038805, + 0.0006659153732471168, + 0.0006642267107963562, + 0.0006722065154463053, + 0.000664416525978595 + ], + "acc_eval": 0.2353515625, + "epoch": 59 + }, + { + "hidden_norms": [ + 6486.1689453125, + 1249377.0, + 2928293.75, + 3765881.75, + 3370835.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008846685523167253, + 0.0006866253679618239, + 0.000686973100528121, + 0.0006869880016893148, + 0.0006870955694466829 + ], + "acc_eval": 0.2373046875, + "epoch": 60 + }, + { + "hidden_norms": [ + 6499.3720703125, + 1291233.25, + 3012714.75, + 3873429.75, + 3471234.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009820004925131798, + 0.0007174524944275618, + 0.0007178467349149287, + 0.0007176626822911203, + 0.0007174718775786459 + ], + "acc_eval": 0.216796875, + "epoch": 61 + }, + { + "hidden_norms": [ + 6486.14404296875, + 1327247.75, + 3088322.75, + 3971415.75, + 3562299.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010241338750347495, + 0.0007171124452725053, + 0.0007174332858994603, + 0.0007172181503847241, + 0.0007169945747591555 + ], + "acc_eval": 0.18359375, + "epoch": 62 + }, + { + "hidden_norms": [ + 6455.17236328125, + 1355067.375, + 3142698.25, + 4041006.5, + 3627490.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009781530825421214, + 0.0007034538430161774, + 0.000703376077581197, + 0.0007118352805264294, + 0.0007080681971274316 + ], + "acc_eval": 0.189453125, + "epoch": 63 + }, + { + "hidden_norms": [ + 6454.62841796875, + 1384795.75, + 3199654.0, + 4114095.75, + 3696468.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009227422997355461, + 0.0007023688522167504, + 0.0007012909045442939, + 0.0007004260551184416, + 0.0007006779196672142 + ], + "acc_eval": 0.21484375, + "epoch": 64 + }, + { + "hidden_norms": [ + 6451.345703125, + 1420232.75, + 3260116.5, + 4190244.25, + 3768354.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008870494784787297, + 0.0007146014831960201, + 0.0007149986922740936, + 0.0007148014265112579, + 0.0007145918207243085 + ], + "acc_eval": 0.197265625, + "epoch": 65 + }, + { + "hidden_norms": [ + 6445.890625, + 1448264.875, + 3319505.0, + 4267505.0, + 3840047.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010003555798903108, + 0.0007171350298449397, + 0.0007168895681388676, + 0.0007169176824390888, + 0.0007170233875513077 + ], + "acc_eval": 0.1591796875, + "epoch": 66 + }, + { + "hidden_norms": [ + 6440.8212890625, + 1478082.75, + 3376291.25, + 4340727.0, + 3909334.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009646597318351269, + 0.0007130720769055188, + 0.0007134011830203235, + 0.0007131980964913964, + 0.0007129770237952471 + ], + "acc_eval": 0.171875, + "epoch": 67 + }, + { + "hidden_norms": [ + 6398.03955078125, + 1508487.5, + 3436526.25, + 4417271.5, + 3981251.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009445869363844395, + 0.0007122856914065778, + 0.0007126569980755448, + 0.0007124742260202765, + 0.0007122504175640643 + ], + "acc_eval": 0.189453125, + "epoch": 68 + }, + { + "hidden_norms": [ + 6389.02392578125, + 1530834.625, + 3480246.5, + 4471170.0, + 4032576.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009853171650320292, + 0.0006874292739666998, + 0.0006876476109027863, + 0.0006881517474539578, + 0.0006880395230837166 + ], + "acc_eval": 0.1904296875, + "epoch": 69 + }, + { + "hidden_norms": [ + 6338.54443359375, + 1561198.875, + 3541681.5, + 4548099.0, + 4105499.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009333671187050641, + 0.0006952910916879773, + 0.0006947650690563023, + 0.0006940987077541649, + 0.0006943742628209293 + ], + "acc_eval": 0.23046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 6280.18603515625, + 1585008.0, + 3589125.25, + 4608667.0, + 4162480.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009699579677544534, + 0.0007101434166543186, + 0.0007104446412995458, + 0.000710242718923837, + 0.0007100136135704815 + ], + "acc_eval": 0.146484375, + "epoch": 71 + }, + { + "hidden_norms": [ + 6252.455078125, + 1608187.875, + 3635014.75, + 4667478.5, + 4218253.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008955001248978078, + 0.0006863236776553094, + 0.0006864941096864641, + 0.000687020889017731, + 0.0006868807831779122 + ], + "acc_eval": 0.2431640625, + "epoch": 72 + }, + { + "hidden_norms": [ + 6201.6845703125, + 1619508.875, + 3661275.25, + 4700652.0, + 4249921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009069991065189242, + 0.0006539999740198255, + 0.0006531713879667222, + 0.0006594359292648733, + 0.000653320224955678 + ], + "acc_eval": 0.2216796875, + "epoch": 73 + }, + { + "hidden_norms": [ + 6182.8115234375, + 1632587.875, + 3679586.25, + 4722070.5, + 4271567.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009595821611583233, + 0.0007079984061419964, + 0.0007082773372530937, + 0.0007081056828610599, + 0.000707884959410876 + ], + "acc_eval": 0.193359375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6153.7392578125, + 1653576.875, + 3722935.0, + 4776921.0, + 4323508.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008598894928582013, + 0.0007073319284245372, + 0.0007075938628986478, + 0.0007074539898894727, + 0.0007072555599734187 + ], + "acc_eval": 0.201171875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6135.21240234375, + 1667474.375, + 3750912.75, + 4812450.5, + 4357575.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009454588289372623, + 0.0007068001432344317, + 0.0007069715647958219, + 0.0007067638216540217, + 0.0007065933896228671 + ], + "acc_eval": 0.2158203125, + "epoch": 76 + }, + { + "hidden_norms": [ + 6085.7109375, + 1679251.75, + 3774334.5, + 4840148.5, + 4384792.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008410231093876064, + 0.0006843701121397316, + 0.0006845371681265533, + 0.00068506138632074, + 0.0006849151104688644 + ], + "acc_eval": 0.2578125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6042.693359375, + 1685705.5, + 3787479.75, + 4856211.0, + 4400193.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008572259685024619, + 0.0006840305286459625, + 0.0006841861759312451, + 0.0006847094628028572, + 0.0006845552125014365 + ], + "acc_eval": 0.2568359375, + "epoch": 78 + }, + { + "hidden_norms": [ + 6003.5390625, + 1702685.5, + 3813174.5, + 4888481.0, + 4430612.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008342780056409538, + 0.0006777377566322684, + 0.0006779460818506777, + 0.0006789933540858328, + 0.0006781259435229003 + ], + "acc_eval": 0.2685546875, + "epoch": 79 + }, + { + "hidden_norms": [ + 5948.60107421875, + 1714243.125, + 3830846.5, + 4910337.5, + 4451921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008218465954996645, + 0.0006832804065197706, + 0.0006831764476373792, + 0.0006826326716691256, + 0.0006829035119153559 + ], + "acc_eval": 0.2529296875, + "epoch": 80 + }, + { + "hidden_norms": [ + 5881.8525390625, + 1718113.375, + 3838036.5, + 4920025.5, + 4461931.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007958809728734195, + 0.000677398347761482, + 0.0006775528891012073, + 0.0006775871734134853, + 0.0006777321686968207 + ], + "acc_eval": 0.2548828125, + "epoch": 81 + }, + { + "hidden_norms": [ + 5816.7880859375, + 1723461.25, + 3850904.75, + 4936806.0, + 4478473.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008361428044736385, + 0.0006769691244699061, + 0.0006771331536583602, + 0.0006771665066480637, + 0.0006773129571229219 + ], + "acc_eval": 0.251953125, + "epoch": 82 + }, + { + "hidden_norms": [ + 5760.41845703125, + 1732135.25, + 3859576.0, + 4947171.0, + 4488986.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008036325452849269, + 0.0006821549613960087, + 0.0006806753808632493, + 0.0006799713592045009, + 0.0006802318384870887 + ], + "acc_eval": 0.2490234375, + "epoch": 83 + }, + { + "hidden_norms": [ + 5710.22998046875, + 1740014.25, + 3871992.25, + 4962337.5, + 4503463.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008278922759927809, + 0.0006754198693670332, + 0.000675307004712522, + 0.0006768241291865706, + 0.0006769676692783833 + ], + "acc_eval": 0.26171875, + "epoch": 84 + }, + { + "hidden_norms": [ + 5685.73828125, + 1745863.25, + 3880256.75, + 4973639.5, + 4514457.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008255501161329448, + 0.0006466225022450089, + 0.0006466452032327652, + 0.0006467151688411832, + 0.0006467655766755342 + ], + "acc_eval": 0.283203125, + "epoch": 85 + }, + { + "hidden_norms": [ + 5637.498046875, + 1743128.375, + 3879796.5, + 4973009.0, + 4514424.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008148956694640219, + 0.0006465681362897158, + 0.0006463592289946973, + 0.0006491504609584808, + 0.0006464755861088634 + ], + "acc_eval": 0.2587890625, + "epoch": 86 + }, + { + "hidden_norms": [ + 5601.87744140625, + 1741859.375, + 3884447.75, + 4978445.5, + 4518886.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008254973217844963, + 0.0006783050484955311, + 0.0006774527719244361, + 0.0006768335006199777, + 0.0006770920008420944 + ], + "acc_eval": 0.298828125, + "epoch": 87 + }, + { + "hidden_norms": [ + 5587.505859375, + 1748285.875, + 3887730.5, + 4982144.0, + 4523151.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008113561780191958, + 0.0006764904828742146, + 0.000676542054861784, + 0.0006762324483133852, + 0.0006764894351363182 + ], + "acc_eval": 0.2734375, + "epoch": 88 + }, + { + "hidden_norms": [ + 5553.013671875, + 1748456.75, + 3890722.0, + 4986538.5, + 4527315.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007909060223028064, + 0.0006763285491615534, + 0.0006762049742974341, + 0.0006756742368452251, + 0.000675930583383888 + ], + "acc_eval": 0.2861328125, + "epoch": 89 + }, + { + "hidden_norms": [ + 5524.611328125, + 1748210.0, + 3893003.75, + 4989732.5, + 4530436.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000797618820797652, + 0.0006453269743360579, + 0.0006453663809224963, + 0.0006454290705733001, + 0.0006454723770730197 + ], + "acc_eval": 0.28515625, + "epoch": 90 + }, + { + "hidden_norms": [ + 5506.21923828125, + 1750958.0, + 3894639.5, + 4992073.0, + 4532399.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007834367570467293, + 0.0006762953125871718, + 0.0006754640489816666, + 0.0006748714949935675, + 0.0006751226610504091 + ], + "acc_eval": 0.2939453125, + "epoch": 91 + }, + { + "hidden_norms": [ + 5485.10791015625, + 1747546.25, + 3895030.0, + 4992480.5, + 4532805.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007779909064993262, + 0.0006450997898355126, + 0.0006451247027143836, + 0.0006455867551267147, + 0.0006452234229072928 + ], + "acc_eval": 0.2890625, + "epoch": 92 + }, + { + "hidden_norms": [ + 5464.07763671875, + 1749313.125, + 3894610.75, + 4991684.0, + 4532270.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008090221090242267, + 0.0006661301013082266, + 0.0006646219990216196, + 0.0006726695573888719, + 0.0006649038987234235 + ], + "acc_eval": 0.283203125, + "epoch": 93 + }, + { + "hidden_norms": [ + 5451.2841796875, + 1749389.0, + 3894315.25, + 4990837.5, + 4531011.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007907215040177107, + 0.0006448677740991116, + 0.0006448915228247643, + 0.0006451430963352323, + 0.0006449950742535293 + ], + "acc_eval": 0.2958984375, + "epoch": 94 + }, + { + "hidden_norms": [ + 5437.77099609375, + 1750653.125, + 3895251.75, + 4992303.0, + 4532441.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007774807745590806, + 0.000676269584801048, + 0.0006763145211152732, + 0.0006763775018043816, + 0.000676501716952771 + ], + "acc_eval": 0.2763671875, + "epoch": 95 + }, + { + "hidden_norms": [ + 5427.34619140625, + 1751408.875, + 3894547.75, + 4991554.5, + 4532145.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797307334840298, + 0.000664835621137172, + 0.0006642266525886953, + 0.000671364541631192, + 0.0006645115208812058 + ], + "acc_eval": 0.296875, + "epoch": 96 + }, + { + "hidden_norms": [ + 5420.30615234375, + 1751757.5, + 3894027.5, + 4991042.0, + 4531674.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797667058184743, + 0.0006446840125136077, + 0.0006447113119065762, + 0.0006447701598517597, + 0.0006448116037063301 + ], + "acc_eval": 0.2939453125, + "epoch": 97 + }, + { + "hidden_norms": [ + 5416.81396484375, + 1751629.625, + 3893959.25, + 4991021.5, + 4531639.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007706825854256749, + 0.0006446407060138881, + 0.0006406756583601236, + 0.0006447536870837212, + 0.0006393496878445148 + ], + "acc_eval": 0.306640625, + "epoch": 98 + }, + { + "hidden_norms": [ + 5415.3095703125, + 1751552.75, + 3893897.0, + 4990973.0, + 4531587.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007776900893077254, + 0.0006458400748670101, + 0.0006446869228966534, + 0.0006466003833338618, + 0.0006447876221500337 + ], + "acc_eval": 0.2978515625, + "epoch": 99 + }, + { + "hidden_norms": [ + 5414.92822265625, + 1751530.25, + 3893876.5, + 4990954.0, + 4531568.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007761479937471449, + 0.0006465426995418966, + 0.0006446881452575326, + 0.0006466349004767835, + 0.0006447875639423728 + ], + "acc_eval": 0.294921875, + "epoch": 100 + } + ], + "arch": "resmlp_noln", + "seed": 42 +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json new file mode 100644 index 0000000..7e5cb37 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json @@ -0,0 +1,1824 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "acc_eval": 0.1123046875, + "epoch": 0 + }, + { + "hidden_norms": [ + 736.34716796875, + 1637.1044921875, + 2033.1922607421875, + 2161.380859375, + 2126.18505859375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0006836718530394137, + 0.0006813183426856995, + 0.0006814387743361294, + 0.0006832550279796124, + 0.0006794488872401416 + ], + "acc_eval": 0.1953125, + "epoch": 1 + }, + { + "hidden_norms": [ + 1106.3868408203125, + 2963.552001953125, + 4087.33837890625, + 4421.4921875, + 4265.1083984375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007476353785023093, + 0.0007440777844749391, + 0.0007443943759426475, + 0.0007477496401406825, + 0.0007366884965449572 + ], + "acc_eval": 0.1044921875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1371.9425048828125, + 4214.05078125, + 6238.47265625, + 6697.2333984375, + 6399.22314453125 + ], + "bp_grad_norms_per_sample_med": [ + 0.000730870058760047, + 0.00072717375587672, + 0.0007270713686011732, + 0.0007290731882676482, + 0.0007233614451251924 + ], + "acc_eval": 0.1943359375, + "epoch": 3 + }, + { + "hidden_norms": [ + 1574.7962646484375, + 4805.0556640625, + 7044.64599609375, + 7593.78955078125, + 7215.32763671875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007098641362972558, + 0.0007034889422357082, + 0.0007031699060462415, + 0.0007120345253497362, + 0.000694308546371758 + ], + "acc_eval": 0.2451171875, + "epoch": 4 + }, + { + "hidden_norms": [ + 1726.088623046875, + 6184.34521484375, + 9521.791015625, + 10387.7236328125, + 9721.431640625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007400272879749537, + 0.0007343650795519352, + 0.0007334973197430372, + 0.0007343514007516205, + 0.0007319966680370271 + ], + "acc_eval": 0.212890625, + "epoch": 5 + }, + { + "hidden_norms": [ + 1902.689697265625, + 7697.52197265625, + 12328.0595703125, + 13597.1787109375, + 12504.158203125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007165716378949583, + 0.0007126733544282615, + 0.0007124089752323925, + 0.0007126083364710212, + 0.0007107863784767687 + ], + "acc_eval": 0.15625, + "epoch": 6 + }, + { + "hidden_norms": [ + 2069.750244140625, + 10379.2958984375, + 16444.7421875, + 18267.94921875, + 16595.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007099996437318623, + 0.0007088935235515237, + 0.0007090346189215779, + 0.000710709486156702, + 0.0007023006328381598 + ], + "acc_eval": 0.154296875, + "epoch": 7 + }, + { + "hidden_norms": [ + 2226.40673828125, + 12703.916015625, + 20184.30859375, + 22453.73828125, + 20183.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.00072157580871135, + 0.0007210742915049195, + 0.0007212630589492619, + 0.0007244180305860937, + 0.0007163899717852473 + ], + "acc_eval": 0.2236328125, + "epoch": 8 + }, + { + "hidden_norms": [ + 2289.455078125, + 15611.2138671875, + 24559.412109375, + 27336.787109375, + 24451.6796875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007243232685141265, + 0.0007221215637400746, + 0.0007219284889288247, + 0.0007259267731569707, + 0.0007173537742346525 + ], + "acc_eval": 0.169921875, + "epoch": 9 + }, + { + "hidden_norms": [ + 2396.09814453125, + 19678.587890625, + 30417.08203125, + 34140.70703125, + 30261.052734375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007124242256395519, + 0.0007074667955748737, + 0.0007074963650666177, + 0.0007131542661227286, + 0.0007022957433946431 + ], + "acc_eval": 0.1904296875, + "epoch": 10 + }, + { + "hidden_norms": [ + 2467.864013671875, + 24019.642578125, + 41156.921875, + 46706.38671875, + 41256.71484375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007333463290706277, + 0.0007277126424014568, + 0.0007268521003425121, + 0.000731462670955807, + 0.0007225224399007857 + ], + "acc_eval": 0.169921875, + "epoch": 11 + }, + { + "hidden_norms": [ + 2518.561767578125, + 28957.451171875, + 55737.69140625, + 64112.609375, + 56246.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007202349370345473, + 0.0007073598098941147, + 0.0007049349951557815, + 0.0007059182389639318, + 0.0007044971571303904 + ], + "acc_eval": 0.1513671875, + "epoch": 12 + }, + { + "hidden_norms": [ + 2614.843994140625, + 34279.15625, + 74158.109375, + 86073.96875, + 75187.59375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007299556746147573, + 0.0007100331713445485, + 0.0007101728115230799, + 0.0007166104041971266, + 0.0007030466804280877 + ], + "acc_eval": 0.24609375, + "epoch": 13 + }, + { + "hidden_norms": [ + 2697.871337890625, + 41263.5390625, + 96222.8984375, + 112901.9765625, + 98551.3046875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007336065755225718, + 0.0007151410100050271, + 0.0007150733144953847, + 0.0007166287978179753, + 0.0007151660392992198 + ], + "acc_eval": 0.134765625, + "epoch": 14 + }, + { + "hidden_norms": [ + 2815.983154296875, + 53842.3828125, + 126185.5625, + 149526.796875, + 130144.4765625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007365003693848848, + 0.0007177364313974977, + 0.0007168670417740941, + 0.000717108603566885, + 0.0007130720769055188 + ], + "acc_eval": 0.150390625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2928.448974609375, + 65162.98046875, + 153909.296875, + 184005.875, + 159483.03125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007613440393470228, + 0.000720723532140255, + 0.000720796815585345, + 0.0007208258030004799, + 0.0007211563643068075 + ], + "acc_eval": 0.166015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 2970.975341796875, + 76176.9609375, + 179093.75, + 216167.875, + 186723.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007602480472996831, + 0.0007191941258497536, + 0.0007163456757552922, + 0.0007164765265770257, + 0.0007142137037590146 + ], + "acc_eval": 0.1796875, + "epoch": 17 + }, + { + "hidden_norms": [ + 3078.336181640625, + 91839.40625, + 215980.015625, + 263515.15625, + 227071.515625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007584959384985268, + 0.0007150565506890416, + 0.0007151922909542918, + 0.000715585716534406, + 0.0007152389152906835 + ], + "acc_eval": 0.1767578125, + "epoch": 18 + }, + { + "hidden_norms": [ + 3202.803466796875, + 104358.6875, + 248325.390625, + 305395.84375, + 262365.46875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007867171661928296, + 0.0007155268103815615, + 0.0007155817584134638, + 0.0007157608633860946, + 0.0007155768107622862 + ], + "acc_eval": 0.138671875, + "epoch": 19 + }, + { + "hidden_norms": [ + 3282.27490234375, + 117747.359375, + 284217.3125, + 351018.15625, + 300903.65625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007691550417803228, + 0.0007147297146730125, + 0.0007147309370338917, + 0.0007150261080823839, + 0.0007147534633986652 + ], + "acc_eval": 0.1923828125, + "epoch": 20 + }, + { + "hidden_norms": [ + 3394.945556640625, + 129443.9765625, + 317078.65625, + 393509.375, + 336658.40625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008442914695478976, + 0.0007179519161581993, + 0.0007190873729996383, + 0.000723545381333679, + 0.0007175213540904224 + ], + "acc_eval": 0.1376953125, + "epoch": 21 + }, + { + "hidden_norms": [ + 3484.2763671875, + 140426.171875, + 355086.84375, + 443148.09375, + 378501.53125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007702927687205374, + 0.0006826652679592371, + 0.0006794629734940827, + 0.0006826536264270544, + 0.0006794703076593578 + ], + "acc_eval": 0.19140625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3529.414306640625, + 153612.265625, + 393522.9375, + 493183.03125, + 421284.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008731107809580863, + 0.0007047304534353316, + 0.0007038630428723991, + 0.000708943116478622, + 0.000701444165315479 + ], + "acc_eval": 0.16796875, + "epoch": 23 + }, + { + "hidden_norms": [ + 3604.90283203125, + 165405.75, + 423586.46875, + 533219.375, + 454992.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008110221242532134, + 0.0006812610663473606, + 0.0006812110659666359, + 0.0006817537359893322, + 0.0006813214858993888 + ], + "acc_eval": 0.20703125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3761.85400390625, + 178944.296875, + 464984.875, + 587869.375, + 501438.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008038324886001647, + 0.0006578225293196738, + 0.0006502956384792924, + 0.000664222112391144, + 0.0006502254982478917 + ], + "acc_eval": 0.240234375, + "epoch": 25 + }, + { + "hidden_norms": [ + 3818.5869140625, + 193167.4375, + 505599.375, + 643764.4375, + 550033.3125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007956585614010692, + 0.0007038708426989615, + 0.0007025190279819071, + 0.0007078333292156458, + 0.0006988184759393334 + ], + "acc_eval": 0.185546875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3924.1787109375, + 207801.1875, + 548741.125, + 701043.0625, + 599520.4375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009222823427990079, + 0.000673642847687006, + 0.0006724554114043713, + 0.0006726986612193286, + 0.0006725445855408907 + ], + "acc_eval": 0.216796875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4061.806884765625, + 222595.921875, + 590807.5, + 755718.75, + 646775.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008092334610410035, + 0.0007093537133187056, + 0.0007078479393385351, + 0.0007069098646752536, + 0.0007029378321021795 + ], + "acc_eval": 0.2158203125, + "epoch": 28 + }, + { + "hidden_norms": [ + 4216.11083984375, + 237549.296875, + 636429.5625, + 816954.9375, + 699524.9375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008620031294412911, + 0.0007326522027142346, + 0.00072627910412848, + 0.000725903722923249, + 0.0007269763154909015 + ], + "acc_eval": 0.1533203125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4319.05029296875, + 251667.5, + 681409.75, + 874567.9375, + 748820.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008448463049717247, + 0.0007160686072893441, + 0.000714016379788518, + 0.0007141274982132018, + 0.0007095346227288246 + ], + "acc_eval": 0.1591796875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4387.8330078125, + 268470.375, + 733153.125, + 943456.375, + 808793.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009849616326391697, + 0.0007160623208619654, + 0.0007154300110414624, + 0.0007152247708290815, + 0.0007160453242249787 + ], + "acc_eval": 0.1884765625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4495.54638671875, + 291274.59375, + 806698.75, + 1039374.875, + 892062.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008646573405712843, + 0.000731874315533787, + 0.0007177238585427403, + 0.0007205329020507634, + 0.0007192457560449839 + ], + "acc_eval": 0.17578125, + "epoch": 32 + }, + { + "hidden_norms": [ + 4596.96337890625, + 305228.46875, + 848072.5625, + 1092268.625, + 937583.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009474663529545069, + 0.0007221641135402024, + 0.000721680698916316, + 0.0007284134044311941, + 0.0007212713244371116 + ], + "acc_eval": 0.171875, + "epoch": 33 + }, + { + "hidden_norms": [ + 4724.111328125, + 321366.5, + 891238.9375, + 1149886.25, + 987910.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009131877450272441, + 0.0007397676818072796, + 0.0007398735033348203, + 0.0007397927111014724, + 0.0007406016811728477 + ], + "acc_eval": 0.125, + "epoch": 34 + }, + { + "hidden_norms": [ + 4865.970703125, + 344027.15625, + 946722.0625, + 1219714.625, + 1049445.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001010064734145999, + 0.0007341124583035707, + 0.0007336883572861552, + 0.0007345521007664502, + 0.0007338698487728834 + ], + "acc_eval": 0.119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5003.3857421875, + 373410.21875, + 1026535.0625, + 1321456.25, + 1139824.625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010555180488154292, + 0.0007112861494533718, + 0.0007111895247362554, + 0.0007112334715202451, + 0.000711193191818893 + ], + "acc_eval": 0.1591796875, + "epoch": 36 + }, + { + "hidden_norms": [ + 5121.19287109375, + 405646.9375, + 1111111.125, + 1430716.625, + 1237074.375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010308363707736135, + 0.0007563655963167548, + 0.0007560031372122467, + 0.000755665882024914, + 0.0007561628590337932 + ], + "acc_eval": 0.134765625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5212.7294921875, + 434054.15625, + 1180238.125, + 1518019.875, + 1314350.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001035128254443407, + 0.0007314062095247209, + 0.0007304889149963856, + 0.0007291524088941514, + 0.0007313747191801667 + ], + "acc_eval": 0.140625, + "epoch": 38 + }, + { + "hidden_norms": [ + 5322.74951171875, + 462000.6875, + 1248006.75, + 1606243.125, + 1392563.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009023830061778426, + 0.000720554031431675, + 0.0007195135112851858, + 0.0007197313825599849, + 0.0007196948863565922 + ], + "acc_eval": 0.1708984375, + "epoch": 39 + }, + { + "hidden_norms": [ + 5453.89111328125, + 498941.0625, + 1343521.0, + 1731177.375, + 1504101.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010444134240970016, + 0.0007362678297795355, + 0.0007352089160121977, + 0.0007340405718423426, + 0.0007357052527368069 + ], + "acc_eval": 0.1328125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5515.6982421875, + 529817.75, + 1409505.625, + 1816151.0, + 1580539.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011280628386884928, + 0.0007231750059872866, + 0.0007211649208329618, + 0.000721275107935071, + 0.0007212632917799056 + ], + "acc_eval": 0.1611328125, + "epoch": 41 + }, + { + "hidden_norms": [ + 5617.26513671875, + 567492.4375, + 1498097.5, + 1931607.875, + 1684206.875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010544253746047616, + 0.0007354306289926171, + 0.0007348860381171107, + 0.0007349851075559855, + 0.0007350810337811708 + ], + "acc_eval": 0.1416015625, + "epoch": 42 + }, + { + "hidden_norms": [ + 5740.7978515625, + 596215.625, + 1561745.25, + 2014107.25, + 1758526.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010764201870188117, + 0.0007244387525133789, + 0.000723967794328928, + 0.000724096957128495, + 0.0007241644198074937 + ], + "acc_eval": 0.19921875, + "epoch": 43 + }, + { + "hidden_norms": [ + 5808.19677734375, + 630780.3125, + 1636034.875, + 2109305.75, + 1845552.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010526466649025679, + 0.0007206913433037698, + 0.0007207048474811018, + 0.0007211468764580786, + 0.0007207895396277308 + ], + "acc_eval": 0.173828125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5868.3583984375, + 673578.625, + 1729325.25, + 2227518.0, + 1953361.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009479392319917679, + 0.0007091389270499349, + 0.0007090644794516265, + 0.0007082624360918999, + 0.0007085782708600163 + ], + "acc_eval": 0.1923828125, + "epoch": 45 + }, + { + "hidden_norms": [ + 5953.82421875, + 720273.0, + 1840695.5, + 2372038.0, + 2084658.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0014002618845552206, + 0.0007315247785300016, + 0.0007256051758304238, + 0.0007254919619299471, + 0.000725599646102637 + ], + "acc_eval": 0.17578125, + "epoch": 46 + }, + { + "hidden_norms": [ + 6054.7861328125, + 758000.6875, + 1930354.375, + 2488163.75, + 2190582.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001109408913180232, + 0.0007018125616014004, + 0.0007016566814854741, + 0.000701890152413398, + 0.0007018494652584195 + ], + "acc_eval": 0.203125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6155.0859375, + 790443.0, + 2009565.875, + 2590829.25, + 2285268.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010253023356199265, + 0.0007347314967773855, + 0.0007304528844542801, + 0.0007322027231566608, + 0.0007312395609915257 + ], + "acc_eval": 0.154296875, + "epoch": 48 + }, + { + "hidden_norms": [ + 6216.64453125, + 830678.125, + 2088773.5, + 2691122.0, + 2376731.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010403504129499197, + 0.0006902964669279754, + 0.0006906419876031578, + 0.0006905900663696229, + 0.0006906461785547435 + ], + "acc_eval": 0.1591796875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6252.98486328125, + 867790.1875, + 2159729.75, + 2781409.5, + 2460902.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011370684951543808, + 0.0007390088285319507, + 0.0007305812323465943, + 0.0007310720975510776, + 0.0007304322207346559 + ], + "acc_eval": 0.15234375, + "epoch": 50 + }, + { + "hidden_norms": [ + 6294.51611328125, + 897267.5625, + 2218282.5, + 2858224.75, + 2530432.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0013790406519547105, + 0.0007320911972783506, + 0.0007304649334400892, + 0.0007293879170902073, + 0.0007303770980797708 + ], + "acc_eval": 0.1591796875, + "epoch": 51 + }, + { + "hidden_norms": [ + 6312.2314453125, + 935570.375, + 2299086.0, + 2963619.0, + 2627515.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000999285257421434, + 0.0007227054447866976, + 0.0007246703025884926, + 0.0007245387532748282, + 0.0007243558065965772 + ], + "acc_eval": 0.20703125, + "epoch": 52 + }, + { + "hidden_norms": [ + 6387.30322265625, + 977101.125, + 2387243.0, + 3077676.25, + 2733147.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001396833686158061, + 0.0007110408041626215, + 0.0007093287422321737, + 0.000708233390469104, + 0.0007085108081810176 + ], + "acc_eval": 0.1787109375, + "epoch": 53 + }, + { + "hidden_norms": [ + 6406.59033203125, + 1011753.1875, + 2450391.25, + 3158275.0, + 2807055.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0012408416951075196, + 0.0007304692408069968, + 0.000724659999832511, + 0.0007247650064527988, + 0.0007249858463183045 + ], + "acc_eval": 0.130859375, + "epoch": 54 + }, + { + "hidden_norms": [ + 6396.32080078125, + 1051044.375, + 2521085.5, + 3249326.75, + 2890642.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010854896390810609, + 0.0006957638543099165, + 0.0006896257400512695, + 0.0006964386557228863, + 0.0006897017010487616 + ], + "acc_eval": 0.234375, + "epoch": 55 + }, + { + "hidden_norms": [ + 6413.91357421875, + 1083474.5, + 2597945.5, + 3348271.5, + 2981405.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.00098806235473603, + 0.000719150179065764, + 0.0007170068565756083, + 0.0007178731029853225, + 0.0007173708290793002 + ], + "acc_eval": 0.205078125, + "epoch": 56 + }, + { + "hidden_norms": [ + 6406.4228515625, + 1124429.875, + 2675529.5, + 3447474.25, + 3073241.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001149638439528644, + 0.0007225789595395327, + 0.0007212197524495423, + 0.0007210947806015611, + 0.0007211659685708582 + ], + "acc_eval": 0.1494140625, + "epoch": 57 + }, + { + "hidden_norms": [ + 6443.423828125, + 1166184.375, + 2758561.25, + 3551879.75, + 3171214.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001115654013119638, + 0.000685695675201714, + 0.0006846366450190544, + 0.0006861463189125061, + 0.0006862673326395452 + ], + "acc_eval": 0.2490234375, + "epoch": 58 + }, + { + "hidden_norms": [ + 6477.5, + 1208826.0, + 2842194.75, + 3654862.0, + 3267617.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.000923235435038805, + 0.0006659153732471168, + 0.0006642267107963562, + 0.0006722065154463053, + 0.000664416525978595 + ], + "acc_eval": 0.2353515625, + "epoch": 59 + }, + { + "hidden_norms": [ + 6486.1689453125, + 1249377.0, + 2928293.75, + 3765881.75, + 3370835.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008846685523167253, + 0.0006866253679618239, + 0.000686973100528121, + 0.0006869880016893148, + 0.0006870955694466829 + ], + "acc_eval": 0.2373046875, + "epoch": 60 + }, + { + "hidden_norms": [ + 6499.3720703125, + 1291233.25, + 3012714.75, + 3873429.75, + 3471234.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009820004925131798, + 0.0007174524944275618, + 0.0007178467349149287, + 0.0007176626822911203, + 0.0007174718775786459 + ], + "acc_eval": 0.216796875, + "epoch": 61 + }, + { + "hidden_norms": [ + 6486.14404296875, + 1327247.75, + 3088322.75, + 3971415.75, + 3562299.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010241338750347495, + 0.0007171124452725053, + 0.0007174332858994603, + 0.0007172181503847241, + 0.0007169945747591555 + ], + "acc_eval": 0.18359375, + "epoch": 62 + }, + { + "hidden_norms": [ + 6455.17236328125, + 1355067.375, + 3142698.25, + 4041006.5, + 3627490.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009781530825421214, + 0.0007034538430161774, + 0.000703376077581197, + 0.0007118352805264294, + 0.0007080681971274316 + ], + "acc_eval": 0.189453125, + "epoch": 63 + }, + { + "hidden_norms": [ + 6454.62841796875, + 1384795.75, + 3199654.0, + 4114095.75, + 3696468.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009227422997355461, + 0.0007023688522167504, + 0.0007012909045442939, + 0.0007004260551184416, + 0.0007006779196672142 + ], + "acc_eval": 0.21484375, + "epoch": 64 + }, + { + "hidden_norms": [ + 6451.345703125, + 1420232.75, + 3260116.5, + 4190244.25, + 3768354.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008870494784787297, + 0.0007146014831960201, + 0.0007149986922740936, + 0.0007148014265112579, + 0.0007145918207243085 + ], + "acc_eval": 0.197265625, + "epoch": 65 + }, + { + "hidden_norms": [ + 6445.890625, + 1448264.875, + 3319505.0, + 4267505.0, + 3840047.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010003555798903108, + 0.0007171350298449397, + 0.0007168895681388676, + 0.0007169176824390888, + 0.0007170233875513077 + ], + "acc_eval": 0.1591796875, + "epoch": 66 + }, + { + "hidden_norms": [ + 6440.8212890625, + 1478082.75, + 3376291.25, + 4340727.0, + 3909334.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009646597318351269, + 0.0007130720769055188, + 0.0007134011830203235, + 0.0007131980964913964, + 0.0007129770237952471 + ], + "acc_eval": 0.171875, + "epoch": 67 + }, + { + "hidden_norms": [ + 6398.03955078125, + 1508487.5, + 3436526.25, + 4417271.5, + 3981251.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009445869363844395, + 0.0007122856914065778, + 0.0007126569980755448, + 0.0007124742260202765, + 0.0007122504175640643 + ], + "acc_eval": 0.189453125, + "epoch": 68 + }, + { + "hidden_norms": [ + 6389.02392578125, + 1530834.625, + 3480246.5, + 4471170.0, + 4032576.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009853171650320292, + 0.0006874292739666998, + 0.0006876476109027863, + 0.0006881517474539578, + 0.0006880395230837166 + ], + "acc_eval": 0.1904296875, + "epoch": 69 + }, + { + "hidden_norms": [ + 6338.54443359375, + 1561198.875, + 3541681.5, + 4548099.0, + 4105499.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009333671187050641, + 0.0006952910916879773, + 0.0006947650690563023, + 0.0006940987077541649, + 0.0006943742628209293 + ], + "acc_eval": 0.23046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 6280.18603515625, + 1585008.0, + 3589125.25, + 4608667.0, + 4162480.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009699579677544534, + 0.0007101434166543186, + 0.0007104446412995458, + 0.000710242718923837, + 0.0007100136135704815 + ], + "acc_eval": 0.146484375, + "epoch": 71 + }, + { + "hidden_norms": [ + 6252.455078125, + 1608187.875, + 3635014.75, + 4667478.5, + 4218253.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008955001248978078, + 0.0006863236776553094, + 0.0006864941096864641, + 0.000687020889017731, + 0.0006868807831779122 + ], + "acc_eval": 0.2431640625, + "epoch": 72 + }, + { + "hidden_norms": [ + 6201.6845703125, + 1619508.875, + 3661275.25, + 4700652.0, + 4249921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009069991065189242, + 0.0006539999740198255, + 0.0006531713879667222, + 0.0006594359292648733, + 0.000653320224955678 + ], + "acc_eval": 0.2216796875, + "epoch": 73 + }, + { + "hidden_norms": [ + 6182.8115234375, + 1632587.875, + 3679586.25, + 4722070.5, + 4271567.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009595821611583233, + 0.0007079984061419964, + 0.0007082773372530937, + 0.0007081056828610599, + 0.000707884959410876 + ], + "acc_eval": 0.193359375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6153.7392578125, + 1653576.875, + 3722935.0, + 4776921.0, + 4323508.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008598894928582013, + 0.0007073319284245372, + 0.0007075938628986478, + 0.0007074539898894727, + 0.0007072555599734187 + ], + "acc_eval": 0.201171875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6135.21240234375, + 1667474.375, + 3750912.75, + 4812450.5, + 4357575.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009454588289372623, + 0.0007068001432344317, + 0.0007069715647958219, + 0.0007067638216540217, + 0.0007065933896228671 + ], + "acc_eval": 0.2158203125, + "epoch": 76 + }, + { + "hidden_norms": [ + 6085.7109375, + 1679251.75, + 3774334.5, + 4840148.5, + 4384792.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008410231093876064, + 0.0006843701121397316, + 0.0006845371681265533, + 0.00068506138632074, + 0.0006849151104688644 + ], + "acc_eval": 0.2578125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6042.693359375, + 1685705.5, + 3787479.75, + 4856211.0, + 4400193.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008572259685024619, + 0.0006840305286459625, + 0.0006841861759312451, + 0.0006847094628028572, + 0.0006845552125014365 + ], + "acc_eval": 0.2568359375, + "epoch": 78 + }, + { + "hidden_norms": [ + 6003.5390625, + 1702685.5, + 3813174.5, + 4888481.0, + 4430612.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008342780056409538, + 0.0006777377566322684, + 0.0006779460818506777, + 0.0006789933540858328, + 0.0006781259435229003 + ], + "acc_eval": 0.2685546875, + "epoch": 79 + }, + { + "hidden_norms": [ + 5948.60107421875, + 1714243.125, + 3830846.5, + 4910337.5, + 4451921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008218465954996645, + 0.0006832804065197706, + 0.0006831764476373792, + 0.0006826326716691256, + 0.0006829035119153559 + ], + "acc_eval": 0.2529296875, + "epoch": 80 + }, + { + "hidden_norms": [ + 5881.8525390625, + 1718113.375, + 3838036.5, + 4920025.5, + 4461931.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007958809728734195, + 0.000677398347761482, + 0.0006775528891012073, + 0.0006775871734134853, + 0.0006777321686968207 + ], + "acc_eval": 0.2548828125, + "epoch": 81 + }, + { + "hidden_norms": [ + 5816.7880859375, + 1723461.25, + 3850904.75, + 4936806.0, + 4478473.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008361428044736385, + 0.0006769691244699061, + 0.0006771331536583602, + 0.0006771665066480637, + 0.0006773129571229219 + ], + "acc_eval": 0.251953125, + "epoch": 82 + }, + { + "hidden_norms": [ + 5760.41845703125, + 1732135.25, + 3859576.0, + 4947171.0, + 4488986.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008036325452849269, + 0.0006821549613960087, + 0.0006806753808632493, + 0.0006799713592045009, + 0.0006802318384870887 + ], + "acc_eval": 0.2490234375, + "epoch": 83 + }, + { + "hidden_norms": [ + 5710.22998046875, + 1740014.25, + 3871992.25, + 4962337.5, + 4503463.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008278922759927809, + 0.0006754198693670332, + 0.000675307004712522, + 0.0006768241291865706, + 0.0006769676692783833 + ], + "acc_eval": 0.26171875, + "epoch": 84 + }, + { + "hidden_norms": [ + 5685.73828125, + 1745863.25, + 3880256.75, + 4973639.5, + 4514457.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008255501161329448, + 0.0006466225022450089, + 0.0006466452032327652, + 0.0006467151688411832, + 0.0006467655766755342 + ], + "acc_eval": 0.283203125, + "epoch": 85 + }, + { + "hidden_norms": [ + 5637.498046875, + 1743128.375, + 3879796.5, + 4973009.0, + 4514424.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008148956694640219, + 0.0006465681362897158, + 0.0006463592289946973, + 0.0006491504609584808, + 0.0006464755861088634 + ], + "acc_eval": 0.2587890625, + "epoch": 86 + }, + { + "hidden_norms": [ + 5601.87744140625, + 1741859.375, + 3884447.75, + 4978445.5, + 4518886.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008254973217844963, + 0.0006783050484955311, + 0.0006774527719244361, + 0.0006768335006199777, + 0.0006770920008420944 + ], + "acc_eval": 0.298828125, + "epoch": 87 + }, + { + "hidden_norms": [ + 5587.505859375, + 1748285.875, + 3887730.5, + 4982144.0, + 4523151.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008113561780191958, + 0.0006764904828742146, + 0.000676542054861784, + 0.0006762324483133852, + 0.0006764894351363182 + ], + "acc_eval": 0.2734375, + "epoch": 88 + }, + { + "hidden_norms": [ + 5553.013671875, + 1748456.75, + 3890722.0, + 4986538.5, + 4527315.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007909060223028064, + 0.0006763285491615534, + 0.0006762049742974341, + 0.0006756742368452251, + 0.000675930583383888 + ], + "acc_eval": 0.2861328125, + "epoch": 89 + }, + { + "hidden_norms": [ + 5524.611328125, + 1748210.0, + 3893003.75, + 4989732.5, + 4530436.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000797618820797652, + 0.0006453269743360579, + 0.0006453663809224963, + 0.0006454290705733001, + 0.0006454723770730197 + ], + "acc_eval": 0.28515625, + "epoch": 90 + }, + { + "hidden_norms": [ + 5506.21923828125, + 1750958.0, + 3894639.5, + 4992073.0, + 4532399.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007834367570467293, + 0.0006762953125871718, + 0.0006754640489816666, + 0.0006748714949935675, + 0.0006751226610504091 + ], + "acc_eval": 0.2939453125, + "epoch": 91 + }, + { + "hidden_norms": [ + 5485.10791015625, + 1747546.25, + 3895030.0, + 4992480.5, + 4532805.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007779909064993262, + 0.0006450997898355126, + 0.0006451247027143836, + 0.0006455867551267147, + 0.0006452234229072928 + ], + "acc_eval": 0.2890625, + "epoch": 92 + }, + { + "hidden_norms": [ + 5464.07763671875, + 1749313.125, + 3894610.75, + 4991684.0, + 4532270.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008090221090242267, + 0.0006661301013082266, + 0.0006646219990216196, + 0.0006726695573888719, + 0.0006649038987234235 + ], + "acc_eval": 0.283203125, + "epoch": 93 + }, + { + "hidden_norms": [ + 5451.2841796875, + 1749389.0, + 3894315.25, + 4990837.5, + 4531011.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007907215040177107, + 0.0006448677740991116, + 0.0006448915228247643, + 0.0006451430963352323, + 0.0006449950742535293 + ], + "acc_eval": 0.2958984375, + "epoch": 94 + }, + { + "hidden_norms": [ + 5437.77099609375, + 1750653.125, + 3895251.75, + 4992303.0, + 4532441.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007774807745590806, + 0.000676269584801048, + 0.0006763145211152732, + 0.0006763775018043816, + 0.000676501716952771 + ], + "acc_eval": 0.2763671875, + "epoch": 95 + }, + { + "hidden_norms": [ + 5427.34619140625, + 1751408.875, + 3894547.75, + 4991554.5, + 4532145.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797307334840298, + 0.000664835621137172, + 0.0006642266525886953, + 0.000671364541631192, + 0.0006645115208812058 + ], + "acc_eval": 0.296875, + "epoch": 96 + }, + { + "hidden_norms": [ + 5420.30615234375, + 1751757.5, + 3894027.5, + 4991042.0, + 4531674.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797667058184743, + 0.0006446840125136077, + 0.0006447113119065762, + 0.0006447701598517597, + 0.0006448116037063301 + ], + "acc_eval": 0.2939453125, + "epoch": 97 + }, + { + "hidden_norms": [ + 5416.81396484375, + 1751629.625, + 3893959.25, + 4991021.5, + 4531639.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007706825854256749, + 0.0006446407060138881, + 0.0006406756583601236, + 0.0006447536870837212, + 0.0006393496878445148 + ], + "acc_eval": 0.306640625, + "epoch": 98 + }, + { + "hidden_norms": [ + 5415.3095703125, + 1751552.75, + 3893897.0, + 4990973.0, + 4531587.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007776900893077254, + 0.0006458400748670101, + 0.0006446869228966534, + 0.0006466003833338618, + 0.0006447876221500337 + ], + "acc_eval": 0.2978515625, + "epoch": 99 + }, + { + "hidden_norms": [ + 5414.92822265625, + 1751530.25, + 3893876.5, + 4990954.0, + 4531568.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007761479937471449, + 0.0006465426995418966, + 0.0006446881452575326, + 0.0006466349004767835, + 0.0006447875639423728 + ], + "acc_eval": 0.294921875, + "epoch": 100 + } + ], + "arch": "resmlp_noln", + "seed": 42 +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s123.json b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json new file mode 100644 index 0000000..f3f6392 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s123.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005465824506245553, + 0.0005437708459794521, + 0.0005393712199293077, + 0.0005331890424713492, + 0.0005310169071890414 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1015625, + "loss_eval": 2.3754236698150635, + "epoch": 0 + }, + { + "hidden_norms": [ + 40.83987808227539, + 37.75401306152344, + 36.1661376953125, + 34.91564178466797, + 34.55687713623047 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012231437722221017, + 0.00012846711615566164, + 0.00013815351121593267, + 0.00015655385504942387, + 0.0002070761693175882 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.435546875, + "loss_eval": 1.5918896198272705, + "epoch": 1 + }, + { + "hidden_norms": [ + 54.60358810424805, + 49.46598434448242, + 46.75371170043945, + 44.21198272705078, + 42.52875900268555 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010624218703014776, + 0.00011056899529648945, + 0.0001174700737465173, + 0.00012732982577290386, + 0.00015480577712878585 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4755859375, + "loss_eval": 1.464656114578247, + "epoch": 2 + }, + { + "hidden_norms": [ + 65.05919647216797, + 58.81830596923828, + 54.65021896362305, + 50.87609100341797, + 48.61247253417969 + ], + "bp_grad_per_sample_l2_med": [ + 9.24510313780047e-05, + 9.810000483412296e-05, + 0.00010529180872254074, + 0.00011547923350008205, + 0.00013095361646264791 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.509765625, + "loss_eval": 1.4144818782806396, + "epoch": 3 + }, + { + "hidden_norms": [ + 71.89185333251953, + 63.81675338745117, + 58.61539077758789, + 53.633819580078125, + 50.85374450683594 + ], + "bp_grad_per_sample_l2_med": [ + 9.624486119719222e-05, + 0.00010101673979079351, + 0.00010665278387023136, + 0.00011629729851847515, + 0.0001258883421542123 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5009765625, + "loss_eval": 1.4042909145355225, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.86115264892578, + 68.96236419677734, + 62.764793395996094, + 56.297122955322266, + 51.927825927734375 + ], + "bp_grad_per_sample_l2_med": [ + 8.636285201646388e-05, + 9.12561226869002e-05, + 9.721348760649562e-05, + 0.0001029788691084832, + 0.00010866572119994089 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5048828125, + "loss_eval": 1.362424373626709, + "epoch": 5 + }, + { + "hidden_norms": [ + 86.97894287109375, + 76.51913452148438, + 68.91358947753906, + 61.691619873046875, + 55.97148132324219 + ], + "bp_grad_per_sample_l2_med": [ + 8.555527165299281e-05, + 9.211624274030328e-05, + 9.770254109753296e-05, + 0.00010545850091148168, + 0.00011015798372682184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4990234375, + "loss_eval": 1.4210331439971924, + "epoch": 6 + }, + { + "hidden_norms": [ + 91.98681640625, + 80.48826599121094, + 72.19147491455078, + 63.2117919921875, + 57.618526458740234 + ], + "bp_grad_per_sample_l2_med": [ + 8.108472684398293e-05, + 8.69045325089246e-05, + 9.184813097817823e-05, + 9.785865404410288e-05, + 0.00010359002772020176 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.50390625, + "loss_eval": 1.395978569984436, + "epoch": 7 + }, + { + "hidden_norms": [ + 97.7012939453125, + 84.81765747070312, + 75.55701446533203, + 65.7588119506836, + 58.28969955444336 + ], + "bp_grad_per_sample_l2_med": [ + 8.22104630060494e-05, + 8.808301208773628e-05, + 9.288280853070319e-05, + 0.0001000006013782695, + 0.00010321019362891093 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.525390625, + "loss_eval": 1.3341916799545288, + "epoch": 8 + }, + { + "hidden_norms": [ + 102.29643249511719, + 88.3180923461914, + 78.02013397216797, + 67.14125061035156, + 59.45139694213867 + ], + "bp_grad_per_sample_l2_med": [ + 8.297000749735162e-05, + 8.909840107662603e-05, + 9.493192192167044e-05, + 0.00010043827933259308, + 0.00010197651863563806 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5166015625, + "loss_eval": 1.3378056287765503, + "epoch": 9 + }, + { + "hidden_norms": [ + 107.60400390625, + 93.19139862060547, + 81.3952407836914, + 70.16273498535156, + 61.15400314331055 + ], + "bp_grad_per_sample_l2_med": [ + 7.625297439517453e-05, + 8.249503298429772e-05, + 8.778223127592355e-05, + 9.526272333459929e-05, + 9.708418656373397e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.54296875, + "loss_eval": 1.3057411909103394, + "epoch": 10 + }, + { + "hidden_norms": [ + 111.52012634277344, + 95.61714935302734, + 83.3553695678711, + 70.52283477783203, + 61.52479553222656 + ], + "bp_grad_per_sample_l2_med": [ + 7.589814777020365e-05, + 8.213706314563751e-05, + 8.74441975611262e-05, + 9.462270099902526e-05, + 9.573540592100471e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5400390625, + "loss_eval": 1.2877662181854248, + "epoch": 11 + }, + { + "hidden_norms": [ + 116.06771850585938, + 99.79177856445312, + 86.30980682373047, + 72.20254516601562, + 62.78416442871094 + ], + "bp_grad_per_sample_l2_med": [ + 7.193555939011276e-05, + 7.673310028621927e-05, + 8.175434049917385e-05, + 8.827414421830326e-05, + 9.135493019130081e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5478515625, + "loss_eval": 1.2685296535491943, + "epoch": 12 + }, + { + "hidden_norms": [ + 119.3271484375, + 102.65406799316406, + 88.69587707519531, + 74.90689849853516, + 63.780494689941406 + ], + "bp_grad_per_sample_l2_med": [ + 7.618113158969209e-05, + 8.220612653531134e-05, + 8.806472760625184e-05, + 9.463543392485008e-05, + 9.703192336019129e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.54296875, + "loss_eval": 1.276496410369873, + "epoch": 13 + }, + { + "hidden_norms": [ + 123.31849670410156, + 105.7769775390625, + 90.95068359375, + 76.97051239013672, + 64.97062683105469 + ], + "bp_grad_per_sample_l2_med": [ + 7.194027421064675e-05, + 7.883367652539164e-05, + 8.381865336559713e-05, + 9.018390846904367e-05, + 8.924194844439626e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.552734375, + "loss_eval": 1.2604155540466309, + "epoch": 14 + }, + { + "hidden_norms": [ + 127.73625946044922, + 109.2970199584961, + 94.82887268066406, + 79.42200469970703, + 66.68120574951172 + ], + "bp_grad_per_sample_l2_med": [ + 7.26957805454731e-05, + 7.816226570867002e-05, + 8.386534318560734e-05, + 9.044967737281695e-05, + 9.091151150641963e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.2421667575836182, + "epoch": 15 + }, + { + "hidden_norms": [ + 129.39227294921875, + 110.16195678710938, + 95.65125274658203, + 79.63654327392578, + 66.4422836303711 + ], + "bp_grad_per_sample_l2_med": [ + 7.170928438426927e-05, + 7.703503069933504e-05, + 8.211386011680588e-05, + 8.873116166796535e-05, + 9.066827624337748e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2539770603179932, + "epoch": 16 + }, + { + "hidden_norms": [ + 132.24916076660156, + 113.025634765625, + 96.19522857666016, + 80.5164566040039, + 67.23816680908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.194816862465814e-05, + 7.835567521397024e-05, + 8.341929060406983e-05, + 8.761802746448666e-05, + 8.926806913223118e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5732421875, + "loss_eval": 1.2596629858016968, + "epoch": 17 + }, + { + "hidden_norms": [ + 136.37730407714844, + 116.11273956298828, + 98.82146453857422, + 81.83920288085938, + 67.72627258300781 + ], + "bp_grad_per_sample_l2_med": [ + 7.331569941015914e-05, + 7.95917512732558e-05, + 8.647916547488421e-05, + 9.198131010634825e-05, + 9.28269510040991e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53515625, + "loss_eval": 1.2714436054229736, + "epoch": 18 + }, + { + "hidden_norms": [ + 137.7354736328125, + 119.1905288696289, + 102.62776184082031, + 84.3735580444336, + 69.55421447753906 + ], + "bp_grad_per_sample_l2_med": [ + 7.105377881089225e-05, + 7.70094629842788e-05, + 8.26972391223535e-05, + 8.802180673228577e-05, + 8.82365129655227e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5498046875, + "loss_eval": 1.25264310836792, + "epoch": 19 + }, + { + "hidden_norms": [ + 139.01124572753906, + 119.05533599853516, + 101.28179168701172, + 83.50191497802734, + 68.7996826171875 + ], + "bp_grad_per_sample_l2_med": [ + 7.610249303979799e-05, + 8.31697034300305e-05, + 8.997280383482575e-05, + 9.514019620837644e-05, + 9.370686893817037e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.517578125, + "loss_eval": 1.2884626388549805, + "epoch": 20 + }, + { + "hidden_norms": [ + 142.8061981201172, + 121.41246795654297, + 104.47654724121094, + 86.13514709472656, + 70.62234497070312 + ], + "bp_grad_per_sample_l2_med": [ + 7.287831977009773e-05, + 7.990973244886845e-05, + 8.473258640151471e-05, + 9.054663678398356e-05, + 9.23949119169265e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5498046875, + "loss_eval": 1.2458946704864502, + "epoch": 21 + }, + { + "hidden_norms": [ + 145.03463745117188, + 124.42599487304688, + 105.64387512207031, + 87.60891723632812, + 71.11911010742188 + ], + "bp_grad_per_sample_l2_med": [ + 6.878219573991373e-05, + 7.463164365617558e-05, + 7.942628144519404e-05, + 8.418951620114967e-05, + 8.709819667274132e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5654296875, + "loss_eval": 1.2031928300857544, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.368896484375, + 124.08200073242188, + 106.14088439941406, + 87.3053970336914, + 70.22563171386719 + ], + "bp_grad_per_sample_l2_med": [ + 6.987902452237904e-05, + 7.564797124359757e-05, + 8.058137609623373e-05, + 8.513103239238262e-05, + 8.664488268550485e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5830078125, + "loss_eval": 1.2048817873001099, + "epoch": 23 + }, + { + "hidden_norms": [ + 149.82542419433594, + 127.8211898803711, + 109.31559753417969, + 88.96003723144531, + 71.56672668457031 + ], + "bp_grad_per_sample_l2_med": [ + 7.123420073185116e-05, + 7.683804142288864e-05, + 8.418370271101594e-05, + 8.922854613047093e-05, + 8.777298353379592e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5654296875, + "loss_eval": 1.2408947944641113, + "epoch": 24 + }, + { + "hidden_norms": [ + 151.1898193359375, + 128.61166381835938, + 110.0819320678711, + 89.33537292480469, + 70.91573333740234 + ], + "bp_grad_per_sample_l2_med": [ + 7.046251994324848e-05, + 7.593455666210502e-05, + 8.183503086911514e-05, + 8.78809587447904e-05, + 8.738410542719066e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5849609375, + "loss_eval": 1.2345162630081177, + "epoch": 25 + }, + { + "hidden_norms": [ + 153.0899200439453, + 130.6381072998047, + 110.78546905517578, + 90.43073272705078, + 72.28581237792969 + ], + "bp_grad_per_sample_l2_med": [ + 7.224789442261681e-05, + 7.864048529881984e-05, + 8.493732457282022e-05, + 9.218508785124868e-05, + 9.127514931606129e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.548828125, + "loss_eval": 1.234302282333374, + "epoch": 26 + }, + { + "hidden_norms": [ + 156.78964233398438, + 132.35365295410156, + 114.26016998291016, + 93.03483581542969, + 73.8830337524414 + ], + "bp_grad_per_sample_l2_med": [ + 7.004363578744233e-05, + 7.51781408325769e-05, + 8.189951768144965e-05, + 8.64862377056852e-05, + 8.457603689748794e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.226435661315918, + "epoch": 27 + }, + { + "hidden_norms": [ + 154.7094268798828, + 132.68295288085938, + 112.78950500488281, + 91.68452453613281, + 72.69532012939453 + ], + "bp_grad_per_sample_l2_med": [ + 6.871543155284598e-05, + 7.408537931041792e-05, + 7.912247383501381e-05, + 8.584219176555052e-05, + 8.712658018339425e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.186962604522705, + "epoch": 28 + }, + { + "hidden_norms": [ + 156.5343475341797, + 133.95303344726562, + 113.44208526611328, + 91.55599212646484, + 72.66578674316406 + ], + "bp_grad_per_sample_l2_med": [ + 6.697547360090539e-05, + 7.314077083719894e-05, + 7.949489372549579e-05, + 8.466470171697438e-05, + 8.366732799913734e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.1845954656600952, + "epoch": 29 + }, + { + "hidden_norms": [ + 158.63601684570312, + 134.8338165283203, + 115.27066802978516, + 93.78146362304688, + 72.8468017578125 + ], + "bp_grad_per_sample_l2_med": [ + 6.742558616679162e-05, + 7.408189412672073e-05, + 7.9598423326388e-05, + 8.415436604991555e-05, + 8.754149166634306e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.208282470703125, + "epoch": 30 + }, + { + "hidden_norms": [ + 158.21023559570312, + 136.07545471191406, + 116.15364837646484, + 93.98001098632812, + 73.68004608154297 + ], + "bp_grad_per_sample_l2_med": [ + 7.207741873571649e-05, + 7.860636833356693e-05, + 8.520736446371302e-05, + 9.168307587970048e-05, + 8.956313104135916e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.2018094062805176, + "epoch": 31 + }, + { + "hidden_norms": [ + 160.46771240234375, + 136.1265411376953, + 116.0124282836914, + 93.3584976196289, + 73.7890396118164 + ], + "bp_grad_per_sample_l2_med": [ + 7.191704207798466e-05, + 7.717879634583369e-05, + 8.299856563098729e-05, + 8.967710164142773e-05, + 8.699094178155065e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1889103651046753, + "epoch": 32 + }, + { + "hidden_norms": [ + 160.90545654296875, + 137.0214080810547, + 115.83223724365234, + 94.28914642333984, + 73.96448516845703 + ], + "bp_grad_per_sample_l2_med": [ + 7.10546228219755e-05, + 7.790922973072156e-05, + 8.321165660163388e-05, + 8.87274945853278e-05, + 8.640237501822412e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1516971588134766, + "epoch": 33 + }, + { + "hidden_norms": [ + 163.9844207763672, + 138.9420166015625, + 118.25187683105469, + 94.9247817993164, + 73.99342346191406 + ], + "bp_grad_per_sample_l2_med": [ + 7.05249622114934e-05, + 7.705103053012863e-05, + 8.39303684188053e-05, + 8.84484761627391e-05, + 8.569705096306279e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1713684797286987, + "epoch": 34 + }, + { + "hidden_norms": [ + 162.2567596435547, + 139.536376953125, + 118.07953643798828, + 96.10607147216797, + 75.22054290771484 + ], + "bp_grad_per_sample_l2_med": [ + 6.98907533660531e-05, + 7.564698171336204e-05, + 8.246934885391966e-05, + 8.673300180817023e-05, + 8.65447727846913e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1986680030822754, + "epoch": 35 + }, + { + "hidden_norms": [ + 163.85494995117188, + 140.6683807373047, + 120.20167541503906, + 96.79766845703125, + 74.6565933227539 + ], + "bp_grad_per_sample_l2_med": [ + 6.933045369805768e-05, + 7.555640331702307e-05, + 8.187161438399926e-05, + 8.634777623228729e-05, + 8.516138041159138e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58203125, + "loss_eval": 1.17092764377594, + "epoch": 36 + }, + { + "hidden_norms": [ + 163.91464233398438, + 141.8627166748047, + 120.35345458984375, + 96.861083984375, + 74.91275024414062 + ], + "bp_grad_per_sample_l2_med": [ + 6.821981514804065e-05, + 7.462653593393043e-05, + 7.9863122664392e-05, + 8.513165812473744e-05, + 8.408474968746305e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1603121757507324, + "epoch": 37 + }, + { + "hidden_norms": [ + 166.6566162109375, + 142.48072814941406, + 120.16492462158203, + 96.4870376586914, + 75.0911636352539 + ], + "bp_grad_per_sample_l2_med": [ + 6.862134614493698e-05, + 7.509759598178789e-05, + 8.221028838306665e-05, + 8.709747635293752e-05, + 8.625433838460594e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.163398027420044, + "epoch": 38 + }, + { + "hidden_norms": [ + 165.2766571044922, + 140.6273193359375, + 119.01939392089844, + 96.45698547363281, + 74.86931610107422 + ], + "bp_grad_per_sample_l2_med": [ + 6.741421384504065e-05, + 7.467559044016525e-05, + 8.113843068713322e-05, + 8.498551324009895e-05, + 8.365403482457623e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1174335479736328, + "epoch": 39 + }, + { + "hidden_norms": [ + 166.8720703125, + 141.94195556640625, + 119.73834228515625, + 96.83306884765625, + 75.50749206542969 + ], + "bp_grad_per_sample_l2_med": [ + 6.83375183143653e-05, + 7.506174733862281e-05, + 8.1863887317013e-05, + 8.717682067072019e-05, + 8.521847485098988e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.128427267074585, + "epoch": 40 + }, + { + "hidden_norms": [ + 166.10345458984375, + 140.8309783935547, + 119.59312438964844, + 96.5144271850586, + 75.01549530029297 + ], + "bp_grad_per_sample_l2_med": [ + 7.117655331967399e-05, + 7.808134250808507e-05, + 8.549879566999152e-05, + 9.121275070356205e-05, + 8.961764251580462e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1407405138015747, + "epoch": 41 + }, + { + "hidden_norms": [ + 168.5572052001953, + 144.19313049316406, + 121.29338836669922, + 98.18904113769531, + 75.74433898925781 + ], + "bp_grad_per_sample_l2_med": [ + 7.024689693935215e-05, + 7.835906581021845e-05, + 8.28477568575181e-05, + 8.988843183033168e-05, + 9.142952330876142e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.188612699508667, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.82464599609375, + 142.2963104248047, + 120.96216583251953, + 98.01409149169922, + 76.0032730102539 + ], + "bp_grad_per_sample_l2_med": [ + 7.296045077964664e-05, + 7.839543832233176e-05, + 8.31817596917972e-05, + 9.021619916893542e-05, + 8.68452261784114e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1675610542297363, + "epoch": 43 + }, + { + "hidden_norms": [ + 168.66015625, + 143.3383026123047, + 121.46915435791016, + 97.43902587890625, + 75.26473236083984 + ], + "bp_grad_per_sample_l2_med": [ + 7.207799353636801e-05, + 8.018259541131556e-05, + 8.563740993849933e-05, + 9.22580948099494e-05, + 9.03013497008942e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1672401428222656, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.55662536621094, + 142.82704162597656, + 120.73102569580078, + 96.30245971679688, + 74.20568084716797 + ], + "bp_grad_per_sample_l2_med": [ + 7.172006007749587e-05, + 7.97949469415471e-05, + 8.564699237467721e-05, + 9.092836262425408e-05, + 9.031151421368122e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1739519834518433, + "epoch": 45 + }, + { + "hidden_norms": [ + 169.05859375, + 143.376953125, + 122.22779083251953, + 98.1865234375, + 75.46460723876953 + ], + "bp_grad_per_sample_l2_med": [ + 7.164492853917181e-05, + 8.059864194365218e-05, + 8.811463339952752e-05, + 9.420064452569932e-05, + 9.068247891264036e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1654919385910034, + "epoch": 46 + }, + { + "hidden_norms": [ + 167.85174560546875, + 143.98324584960938, + 121.09931945800781, + 97.61621856689453, + 75.3441390991211 + ], + "bp_grad_per_sample_l2_med": [ + 7.121654198272154e-05, + 7.876066229073331e-05, + 8.58678831718862e-05, + 9.374372893944383e-05, + 8.886006980901584e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6015625, + "loss_eval": 1.1619040966033936, + "epoch": 47 + }, + { + "hidden_norms": [ + 169.16136169433594, + 144.1681671142578, + 121.65021514892578, + 97.65489959716797, + 75.40325927734375 + ], + "bp_grad_per_sample_l2_med": [ + 7.085441029630601e-05, + 7.872789865359664e-05, + 8.54654426802881e-05, + 9.159239561995491e-05, + 8.735150913707912e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1553215980529785, + "epoch": 48 + }, + { + "hidden_norms": [ + 170.07469177246094, + 144.21502685546875, + 122.42488098144531, + 97.60433959960938, + 75.30228424072266 + ], + "bp_grad_per_sample_l2_med": [ + 7.460799679392949e-05, + 8.310206612804905e-05, + 8.914316276786849e-05, + 9.709167352411896e-05, + 9.34089912334457e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5947265625, + "loss_eval": 1.1511603593826294, + "epoch": 49 + }, + { + "hidden_norms": [ + 169.58541870117188, + 143.38230895996094, + 121.96705627441406, + 97.77040100097656, + 74.732177734375 + ], + "bp_grad_per_sample_l2_med": [ + 7.605904102092609e-05, + 8.306169183924794e-05, + 9.093777771340683e-05, + 9.604891965864226e-05, + 9.101478644879535e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.583984375, + "loss_eval": 1.150202751159668, + "epoch": 50 + }, + { + "hidden_norms": [ + 169.28955078125, + 143.6193084716797, + 122.43891906738281, + 97.91162109375, + 75.27656555175781 + ], + "bp_grad_per_sample_l2_med": [ + 7.325071055674925e-05, + 8.037279621930793e-05, + 8.85110639501363e-05, + 9.169802797259763e-05, + 8.926681766752154e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.1172325611114502, + "epoch": 51 + }, + { + "hidden_norms": [ + 170.01052856445312, + 143.45779418945312, + 122.65426635742188, + 98.24798583984375, + 75.68919372558594 + ], + "bp_grad_per_sample_l2_med": [ + 7.252323121065274e-05, + 8.011860336409882e-05, + 8.620596781838685e-05, + 9.34487470658496e-05, + 9.04093321878463e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1147592067718506, + "epoch": 52 + }, + { + "hidden_norms": [ + 168.67430114746094, + 143.25802612304688, + 119.88789367675781, + 96.92530822753906, + 74.42180633544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.410924445139244e-05, + 8.137265831464902e-05, + 8.864435949362814e-05, + 9.472777310293168e-05, + 9.015527029987425e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.625, + "loss_eval": 1.1209393739700317, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.25973510742188, + 142.8248291015625, + 120.75433349609375, + 96.85049438476562, + 74.96371459960938 + ], + "bp_grad_per_sample_l2_med": [ + 7.351540989475325e-05, + 8.063198038144037e-05, + 8.647661161376163e-05, + 9.411892096977681e-05, + 9.352037159260362e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1025673151016235, + "epoch": 54 + }, + { + "hidden_norms": [ + 170.8097381591797, + 143.562744140625, + 121.1410903930664, + 97.70262145996094, + 75.55540466308594 + ], + "bp_grad_per_sample_l2_med": [ + 7.382583135040477e-05, + 8.104312291834503e-05, + 8.895712380763143e-05, + 9.191031131194904e-05, + 8.924967551138252e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1013734340667725, + "epoch": 55 + }, + { + "hidden_norms": [ + 169.41827392578125, + 143.60491943359375, + 119.79347229003906, + 96.5761947631836, + 74.94788360595703 + ], + "bp_grad_per_sample_l2_med": [ + 7.506331166950986e-05, + 8.308376709464937e-05, + 9.05599954421632e-05, + 9.552844858262688e-05, + 9.322594269178808e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1202704906463623, + "epoch": 56 + }, + { + "hidden_norms": [ + 169.0540008544922, + 144.03970336914062, + 121.87033081054688, + 98.80317687988281, + 76.42084503173828 + ], + "bp_grad_per_sample_l2_med": [ + 7.446128438459709e-05, + 8.153915405273438e-05, + 8.840708323987201e-05, + 9.388235048390925e-05, + 9.186066017718986e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.1205706596374512, + "epoch": 57 + }, + { + "hidden_norms": [ + 168.36595153808594, + 141.80178833007812, + 120.2418212890625, + 96.8748779296875, + 75.01248168945312 + ], + "bp_grad_per_sample_l2_med": [ + 7.731275400146842e-05, + 8.405288099311292e-05, + 9.186116949422285e-05, + 9.942329052137211e-05, + 9.51286856434308e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1108977794647217, + "epoch": 58 + }, + { + "hidden_norms": [ + 169.39569091796875, + 142.4537353515625, + 120.81804656982422, + 97.19158172607422, + 75.20236206054688 + ], + "bp_grad_per_sample_l2_med": [ + 7.883378566475585e-05, + 8.777670154813677e-05, + 9.416328248335049e-05, + 0.00010057339386548847, + 9.685986879048869e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1141078472137451, + "epoch": 59 + }, + { + "hidden_norms": [ + 169.97256469726562, + 143.7432098388672, + 121.0943832397461, + 97.53318786621094, + 75.44910430908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.617164374096319e-05, + 8.471525507047772e-05, + 9.014597890200093e-05, + 9.796666563488543e-05, + 9.110565588343889e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0869580507278442, + "epoch": 60 + }, + { + "hidden_norms": [ + 168.3030242919922, + 142.93931579589844, + 120.8933334350586, + 97.99317932128906, + 75.29071044921875 + ], + "bp_grad_per_sample_l2_med": [ + 7.692870713071898e-05, + 8.63347522681579e-05, + 9.28592708078213e-05, + 9.994371794164181e-05, + 9.114396380027756e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6357421875, + "loss_eval": 1.102014183998108, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.24777221679688, + 142.03550720214844, + 120.25982666015625, + 97.82561492919922, + 75.54430389404297 + ], + "bp_grad_per_sample_l2_med": [ + 7.734074461041018e-05, + 8.487069862894714e-05, + 9.25088970689103e-05, + 9.827558096731082e-05, + 9.154371218755841e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.0736993551254272, + "epoch": 62 + }, + { + "hidden_norms": [ + 168.08807373046875, + 142.24661254882812, + 119.9559555053711, + 96.72630310058594, + 74.6895523071289 + ], + "bp_grad_per_sample_l2_med": [ + 8.049221651162952e-05, + 8.925019210437313e-05, + 9.64810824370943e-05, + 0.00010555233166087419, + 9.567404049448669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.0822858810424805, + "epoch": 63 + }, + { + "hidden_norms": [ + 167.2539825439453, + 141.55946350097656, + 119.37681579589844, + 97.13011169433594, + 75.02286529541016 + ], + "bp_grad_per_sample_l2_med": [ + 7.919344352558255e-05, + 8.567116310587153e-05, + 9.377488458994776e-05, + 9.892786329146475e-05, + 9.566175140207633e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.1096018552780151, + "epoch": 64 + }, + { + "hidden_norms": [ + 168.11643981933594, + 142.01052856445312, + 119.23418426513672, + 96.38211059570312, + 75.08849334716797 + ], + "bp_grad_per_sample_l2_med": [ + 7.787172216922045e-05, + 8.574797539040446e-05, + 9.008680353872478e-05, + 9.943459735950455e-05, + 9.4872091722209e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.1080338954925537, + "epoch": 65 + }, + { + "hidden_norms": [ + 168.09153747558594, + 141.83984375, + 120.16891479492188, + 97.12582397460938, + 74.98177337646484 + ], + "bp_grad_per_sample_l2_med": [ + 7.894716691225767e-05, + 8.66493719513528e-05, + 9.518097795080394e-05, + 0.00010154353367397562, + 9.530662646284327e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1069355010986328, + "epoch": 66 + }, + { + "hidden_norms": [ + 167.35382080078125, + 142.33642578125, + 120.0411148071289, + 96.53257751464844, + 75.0328598022461 + ], + "bp_grad_per_sample_l2_med": [ + 7.973265019245446e-05, + 8.856245403876528e-05, + 9.601243800716475e-05, + 0.00010215263318968937, + 9.676075569586828e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.100548505783081, + "epoch": 67 + }, + { + "hidden_norms": [ + 167.418701171875, + 140.93800354003906, + 119.4802017211914, + 96.3717269897461, + 74.67574310302734 + ], + "bp_grad_per_sample_l2_med": [ + 8.022025576792657e-05, + 8.782520308159292e-05, + 9.638317715143785e-05, + 0.0001046421384671703, + 9.856691031018272e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1227837800979614, + "epoch": 68 + }, + { + "hidden_norms": [ + 166.9136962890625, + 140.45266723632812, + 119.06848907470703, + 95.9060287475586, + 74.79631042480469 + ], + "bp_grad_per_sample_l2_med": [ + 7.995362102519721e-05, + 8.583935414208099e-05, + 9.508246148470789e-05, + 0.00010096231562783942, + 9.634289017412812e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1006299257278442, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.4694366455078, + 139.69601440429688, + 117.53054809570312, + 95.05348205566406, + 74.65673065185547 + ], + "bp_grad_per_sample_l2_med": [ + 7.79753245296888e-05, + 8.487935701850802e-05, + 9.169900295091793e-05, + 9.879520075628534e-05, + 9.398034308105707e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.0988688468933105, + "epoch": 70 + }, + { + "hidden_norms": [ + 165.3974609375, + 139.54141235351562, + 117.3493881225586, + 94.9970474243164, + 74.31880187988281 + ], + "bp_grad_per_sample_l2_med": [ + 7.893131260061637e-05, + 8.71433803695254e-05, + 9.492320532444865e-05, + 0.00010128845315193757, + 9.578587196301669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6484375, + "loss_eval": 1.0860004425048828, + "epoch": 71 + }, + { + "hidden_norms": [ + 165.16651916503906, + 138.63233947753906, + 117.15692138671875, + 94.41555786132812, + 74.16561889648438 + ], + "bp_grad_per_sample_l2_med": [ + 8.611902012489736e-05, + 9.412867802893743e-05, + 0.0001005554513540119, + 0.00010507499246159568, + 0.00010004997602663934 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.0985480546951294, + "epoch": 72 + }, + { + "hidden_norms": [ + 166.48802185058594, + 139.67433166503906, + 117.13744354248047, + 94.41883087158203, + 74.25392150878906 + ], + "bp_grad_per_sample_l2_med": [ + 8.272679406218231e-05, + 9.101553587242961e-05, + 9.994471474783495e-05, + 0.00010372102406108752, + 9.65072977123782e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1026251316070557, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.66531372070312, + 138.62359619140625, + 117.72949981689453, + 95.40411376953125, + 74.5541763305664 + ], + "bp_grad_per_sample_l2_med": [ + 8.516917296219617e-05, + 9.385120938532054e-05, + 0.00010402742918813601, + 0.00010775420378195122, + 0.00010169474262511358 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6298828125, + "loss_eval": 1.1083872318267822, + "epoch": 74 + }, + { + "hidden_norms": [ + 164.67889404296875, + 138.3468017578125, + 116.61951446533203, + 93.94100952148438, + 74.09746551513672 + ], + "bp_grad_per_sample_l2_med": [ + 8.641117165097967e-05, + 9.53027411014773e-05, + 0.0001029834384098649, + 0.0001086485426640138, + 0.0001005055892164819 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.1155339479446411, + "epoch": 75 + }, + { + "hidden_norms": [ + 164.2607421875, + 138.0647735595703, + 116.18480682373047, + 93.95038604736328, + 73.88935089111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.567768963985145e-05, + 9.307480650022626e-05, + 9.939757728716359e-05, + 0.00010579575609881431, + 9.849719936028123e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.1126312017440796, + "epoch": 76 + }, + { + "hidden_norms": [ + 163.9792938232422, + 137.88185119628906, + 116.34628295898438, + 93.93537139892578, + 73.83805084228516 + ], + "bp_grad_per_sample_l2_med": [ + 8.795045869192109e-05, + 9.678495553089306e-05, + 0.00010362159082433209, + 0.0001105417322833091, + 0.00010525066318223253 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.110876202583313, + "epoch": 77 + }, + { + "hidden_norms": [ + 164.1384735107422, + 137.82691955566406, + 115.94445037841797, + 94.01095581054688, + 73.68436431884766 + ], + "bp_grad_per_sample_l2_med": [ + 8.610311488155276e-05, + 9.507987851975486e-05, + 0.00010208813182543963, + 0.00010807226499309763, + 0.00010176940850215033 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1176977157592773, + "epoch": 78 + }, + { + "hidden_norms": [ + 163.91049194335938, + 136.9142608642578, + 115.37925720214844, + 93.2219009399414, + 73.2654800415039 + ], + "bp_grad_per_sample_l2_med": [ + 8.745997183723375e-05, + 9.566589869791642e-05, + 0.00010251311323372647, + 0.00011129804624943063, + 0.0001056971013895236 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1140623092651367, + "epoch": 79 + }, + { + "hidden_norms": [ + 163.40182495117188, + 137.21026611328125, + 115.46720123291016, + 93.46426391601562, + 73.12786102294922 + ], + "bp_grad_per_sample_l2_med": [ + 8.96864221431315e-05, + 9.8639284260571e-05, + 0.0001043426527758129, + 0.00010869379184441641, + 0.00010685920278774574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.1114736795425415, + "epoch": 80 + }, + { + "hidden_norms": [ + 163.22100830078125, + 136.5157012939453, + 115.2002944946289, + 93.15667724609375, + 73.07371520996094 + ], + "bp_grad_per_sample_l2_med": [ + 8.870210876921192e-05, + 9.846940520219505e-05, + 0.0001080361835192889, + 0.0001128382355091162, + 0.00010244990698993206 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1125456094741821, + "epoch": 81 + }, + { + "hidden_norms": [ + 163.21449279785156, + 136.63999938964844, + 114.51496124267578, + 92.76043701171875, + 73.22138214111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.551862265449017e-05, + 9.3683076556772e-05, + 0.00010453341383254156, + 0.00010722207662183791, + 0.00010129058500751853 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.0996887683868408, + "epoch": 82 + }, + { + "hidden_norms": [ + 162.75770568847656, + 136.49710083007812, + 114.6112060546875, + 92.87682342529297, + 73.25039672851562 + ], + "bp_grad_per_sample_l2_med": [ + 8.870910096447915e-05, + 9.74184149526991e-05, + 0.00010446018859511241, + 0.00011418589565437287, + 0.00010412647679913789 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1063097715377808, + "epoch": 83 + }, + { + "hidden_norms": [ + 163.11697387695312, + 136.4162139892578, + 114.9229507446289, + 93.17060089111328, + 73.40281677246094 + ], + "bp_grad_per_sample_l2_med": [ + 8.790192077867687e-05, + 9.763163689058274e-05, + 0.00010599731467664242, + 0.00011016600910807028, + 0.00010507069964660332 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1009955406188965, + "epoch": 84 + }, + { + "hidden_norms": [ + 162.4318389892578, + 136.2643280029297, + 114.47940826416016, + 92.43824005126953, + 72.75123596191406 + ], + "bp_grad_per_sample_l2_med": [ + 8.680798055138439e-05, + 9.524248889647424e-05, + 0.00010346775525249541, + 0.00010771532106446102, + 0.00010157373617403209 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.106760025024414, + "epoch": 85 + }, + { + "hidden_norms": [ + 162.55992126464844, + 136.00660705566406, + 114.44908142089844, + 92.65226745605469, + 73.14122772216797 + ], + "bp_grad_per_sample_l2_med": [ + 8.55888138175942e-05, + 9.422176663065329e-05, + 0.00010130204464076087, + 0.0001082807284547016, + 0.00010286335600540042 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1080232858657837, + "epoch": 86 + }, + { + "hidden_norms": [ + 162.33607482910156, + 136.22657775878906, + 114.64276885986328, + 92.26687622070312, + 72.99312591552734 + ], + "bp_grad_per_sample_l2_med": [ + 9.005892934510484e-05, + 9.746963041834533e-05, + 0.00010383747576270252, + 0.00010905141971306875, + 0.00010293527157045901 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.0989083051681519, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.69874572753906, + 135.9654998779297, + 113.88583374023438, + 91.72888946533203, + 72.5824966430664 + ], + "bp_grad_per_sample_l2_med": [ + 9.02136744116433e-05, + 9.903020691126585e-05, + 0.0001059234855347313, + 0.00011399909999454394, + 0.00010543780081206933 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1039698123931885, + "epoch": 88 + }, + { + "hidden_norms": [ + 162.3827362060547, + 136.0760498046875, + 114.07840728759766, + 91.95870971679688, + 72.59473419189453 + ], + "bp_grad_per_sample_l2_med": [ + 9.043919999385253e-05, + 9.950586536433548e-05, + 0.00010800046584336087, + 0.00011628754145931453, + 0.00010360861051594839 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1007411479949951, + "epoch": 89 + }, + { + "hidden_norms": [ + 161.50054931640625, + 135.7166748046875, + 113.83382415771484, + 91.96630096435547, + 72.61833953857422 + ], + "bp_grad_per_sample_l2_med": [ + 9.075389243662357e-05, + 9.988105011871085e-05, + 0.00010788880899781361, + 0.00011431374150561169, + 0.00010596351057756692 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.64453125, + "loss_eval": 1.0992103815078735, + "epoch": 90 + }, + { + "hidden_norms": [ + 161.48770141601562, + 135.71417236328125, + 114.12840270996094, + 91.98160552978516, + 72.64606475830078 + ], + "bp_grad_per_sample_l2_med": [ + 9.050803782884032e-05, + 9.805837908061221e-05, + 0.00010800142626976594, + 0.00011649157386273146, + 0.00010660875705070794 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.1021543741226196, + "epoch": 91 + }, + { + "hidden_norms": [ + 162.0372314453125, + 135.4561767578125, + 114.00292205810547, + 91.83483123779297, + 72.68809509277344 + ], + "bp_grad_per_sample_l2_med": [ + 8.82204039953649e-05, + 9.769284224603325e-05, + 0.00010632916382746771, + 0.00011439422814873978, + 0.00010489066335139796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1001535654067993, + "epoch": 92 + }, + { + "hidden_norms": [ + 161.88534545898438, + 135.54629516601562, + 113.90684509277344, + 91.81143188476562, + 72.64588165283203 + ], + "bp_grad_per_sample_l2_med": [ + 9.120439790422097e-05, + 9.779920219443738e-05, + 0.00010798833682201803, + 0.00011447365250205621, + 0.00010797424329211935 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.0961315631866455, + "epoch": 93 + }, + { + "hidden_norms": [ + 162.06427001953125, + 135.49281311035156, + 113.69275665283203, + 91.76304626464844, + 72.4867935180664 + ], + "bp_grad_per_sample_l2_med": [ + 9.100054739974439e-05, + 9.935065463650972e-05, + 0.00010879126784857363, + 0.00011589765199460089, + 0.00010837834270205349 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.097299337387085, + "epoch": 94 + }, + { + "hidden_norms": [ + 162.06063842773438, + 135.57981872558594, + 113.76399230957031, + 91.94515991210938, + 72.56278991699219 + ], + "bp_grad_per_sample_l2_med": [ + 9.139141184277833e-05, + 9.897649579215795e-05, + 0.00010867504897760227, + 0.0001159063758677803, + 0.00010943930828943849 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6376953125, + "loss_eval": 1.0986907482147217, + "epoch": 95 + }, + { + "hidden_norms": [ + 161.8842315673828, + 135.4130859375, + 113.66045379638672, + 91.80276489257812, + 72.58989715576172 + ], + "bp_grad_per_sample_l2_med": [ + 9.080857125809416e-05, + 0.00010123007814399898, + 0.00010883246432058513, + 0.00011908033775398508, + 0.00010963032400468364 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0988240242004395, + "epoch": 96 + }, + { + "hidden_norms": [ + 161.86744689941406, + 135.38331604003906, + 113.66378784179688, + 91.70223236083984, + 72.4896240234375 + ], + "bp_grad_per_sample_l2_med": [ + 9.091695392271504e-05, + 0.00010080484207719564, + 0.00010940106585621834, + 0.00011762498616008088, + 0.00010917771578533575 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0987744331359863, + "epoch": 97 + }, + { + "hidden_norms": [ + 161.89633178710938, + 135.33140563964844, + 113.67347717285156, + 91.68895721435547, + 72.49469757080078 + ], + "bp_grad_per_sample_l2_med": [ + 9.099576709559187e-05, + 0.00010038664186140522, + 0.0001086170959752053, + 0.00011788319534389302, + 0.00010914496670011431 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0990701913833618, + "epoch": 98 + }, + { + "hidden_norms": [ + 161.9002227783203, + 135.33474731445312, + 113.68601989746094, + 91.69290924072266, + 72.48957061767578 + ], + "bp_grad_per_sample_l2_med": [ + 9.096309076994658e-05, + 0.00010059915803140029, + 0.00010838409070856869, + 0.00011784962407546118, + 0.00010893247235799208 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.098876953125, + "epoch": 99 + }, + { + "hidden_norms": [ + 161.8989715576172, + 135.33889770507812, + 113.69281768798828, + 91.6856689453125, + 72.48480224609375 + ], + "bp_grad_per_sample_l2_med": [ + 9.085259807761759e-05, + 0.00010061707871500403, + 0.00010823038610396907, + 0.00011745247320504859, + 0.00010919221676886082 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6396484375, + "loss_eval": 1.0987944602966309, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005465824506245553, + 0.0005437708459794521, + 0.0005393712199293077, + 0.0005331890424713492, + 0.0005310169071890414 + ], + "gamma_dfa": 0.007568402143078856, + "gamma_dfa_per_layer": [ + 0.002326551591977477, + 0.0009101498289965093, + -0.013218702748417854, + 0.04025560989975929 + ], + "acc_eval": 0.1015625, + "loss_eval": 2.3754236698150635, + "epoch": 0 + }, + { + "hidden_norms": [ + 536.5761108398438, + 845.265625, + 979.7896118164062, + 1192.0323486328125, + 1230.83935546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006465085316449404, + 0.0006462159799411893, + 0.0006460825679823756, + 0.0006459451396949589, + 0.0006460213917307556 + ], + "gamma_dfa": 0.013024769607000053, + "gamma_dfa_per_layer": [ + 0.035579413175582886, + -0.0025600260123610497, + -0.0014369464479386806, + 0.020516637712717056 + ], + "acc_eval": 0.212890625, + "loss_eval": 8.137651443481445, + "epoch": 1 + }, + { + "hidden_norms": [ + 886.7508544921875, + 1871.2640380859375, + 2198.631591796875, + 2689.22412109375, + 2904.254150390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007187994197010994, + 0.0007172312471084297, + 0.0007172476034611464, + 0.0007177897496148944, + 0.000717311049811542 + ], + "gamma_dfa": 0.004487544531002641, + "gamma_dfa_per_layer": [ + 0.04744107276201248, + -0.011962954886257648, + -0.02088175155222416, + 0.003353811800479889 + ], + "acc_eval": 0.203125, + "loss_eval": 16.637451171875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1117.1649169921875, + 3064.644775390625, + 3849.060546875, + 4987.09130859375, + 5690.720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000734492321498692, + 0.0007317167473956943, + 0.0007317643612623215, + 0.0007318624993786216, + 0.0007319750147871673 + ], + "gamma_dfa": 0.0065072893630713224, + "gamma_dfa_per_layer": [ + 0.0597357451915741, + -0.0063293795101344585, + -0.033218011260032654, + 0.0058408030308783054 + ], + "acc_eval": 0.224609375, + "loss_eval": 29.753459930419922, + "epoch": 3 + }, + { + "hidden_norms": [ + 1279.7017822265625, + 4015.093017578125, + 5594.23828125, + 7459.69091796875, + 8727.64453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007434640428982675, + 0.0007419881876558065, + 0.0007416673470288515, + 0.000741377065423876, + 0.0007413675775751472 + ], + "gamma_dfa": 0.0072651703376322985, + "gamma_dfa_per_layer": [ + 0.07467889785766602, + -0.02277005836367607, + -0.009787362068891525, + -0.013060796074569225 + ], + "acc_eval": 0.1640625, + "loss_eval": 54.22368621826172, + "epoch": 4 + }, + { + "hidden_norms": [ + 1399.06787109375, + 4862.35302734375, + 9250.7666015625, + 10789.8828125, + 12902.6591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007491935975849628, + 0.0007442779606208205, + 0.0007423132774420083, + 0.0007422835915349424, + 0.0007422153139486909 + ], + "gamma_dfa": -0.005301014054566622, + "gamma_dfa_per_layer": [ + 0.06516245007514954, + -0.03411812335252762, + -0.034175027161836624, + -0.01807335577905178 + ], + "acc_eval": 0.2080078125, + "loss_eval": 62.78772735595703, + "epoch": 5 + }, + { + "hidden_norms": [ + 1478.1070556640625, + 5865.33935546875, + 15407.5283203125, + 16717.609375, + 19284.30078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000746070989407599, + 0.0007320672739297152, + 0.0007320406148210168, + 0.0007324790931306779, + 0.0007322196033783257 + ], + "gamma_dfa": -0.0043716938234865665, + "gamma_dfa_per_layer": [ + 0.0889529138803482, + -0.03475068882107735, + -0.06096648424863815, + -0.010722516104578972 + ], + "acc_eval": 0.21875, + "loss_eval": 84.72342681884766, + "epoch": 6 + }, + { + "hidden_norms": [ + 1569.764892578125, + 7991.109375, + 22041.46484375, + 23657.2890625, + 27372.69140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007371728424914181, + 0.0007328476058319211, + 0.0007317248382605612, + 0.0007321859593503177, + 0.0007314819958992302 + ], + "gamma_dfa": -0.006586531409993768, + "gamma_dfa_per_layer": [ + 0.08020298182964325, + -0.038106564432382584, + -0.05412164330482483, + -0.014320899732410908 + ], + "acc_eval": 0.21484375, + "loss_eval": 87.40310668945312, + "epoch": 7 + }, + { + "hidden_norms": [ + 1649.8133544921875, + 12248.005859375, + 30825.916015625, + 32827.55078125, + 38153.3828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007630810141563416, + 0.0007434195140376687, + 0.0007433100836351514, + 0.0007435025763697922, + 0.0007434298167936504 + ], + "gamma_dfa": -0.0035092607140541077, + "gamma_dfa_per_layer": [ + 0.1012866348028183, + -0.029570601880550385, + -0.04660683125257492, + -0.039146244525909424 + ], + "acc_eval": 0.1708984375, + "loss_eval": 157.51614379882812, + "epoch": 8 + }, + { + "hidden_norms": [ + 1712.73193359375, + 20302.939453125, + 43360.37109375, + 46000.90234375, + 53154.84765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007849909015931189, + 0.0007540763472206891, + 0.0007541946833953261, + 0.0007542177918367088, + 0.0007542550447396934 + ], + "gamma_dfa": 0.006478439085185528, + "gamma_dfa_per_layer": [ + 0.1487787812948227, + -0.03583626449108124, + -0.0212298221886158, + -0.06579893827438354 + ], + "acc_eval": 0.138671875, + "loss_eval": 512.7744750976562, + "epoch": 9 + }, + { + "hidden_norms": [ + 1763.957763671875, + 29818.015625, + 57092.5546875, + 60514.234375, + 69695.1015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00080581457586959, + 0.0007400442264042795, + 0.0007398677407763898, + 0.0007363590411841869, + 0.0007358043803833425 + ], + "gamma_dfa": -0.003822646103799343, + "gamma_dfa_per_layer": [ + 0.1044168770313263, + -0.0318819060921669, + -0.054846249520778656, + -0.03297930583357811 + ], + "acc_eval": 0.203125, + "loss_eval": 288.6083984375, + "epoch": 10 + }, + { + "hidden_norms": [ + 1841.6363525390625, + 43646.69921875, + 76665.53125, + 80991.453125, + 91946.4765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008064995636232197, + 0.0007405033684335649, + 0.0007410499965772033, + 0.0007410682155750692, + 0.0007410107646137476 + ], + "gamma_dfa": -0.005903353448957205, + "gamma_dfa_per_layer": [ + 0.15344271063804626, + -0.06077828258275986, + -0.0893951952457428, + -0.02688264660537243 + ], + "acc_eval": 0.1630859375, + "loss_eval": 462.175537109375, + "epoch": 11 + }, + { + "hidden_norms": [ + 1938.4581298828125, + 63804.453125, + 101178.828125, + 106970.6171875, + 119676.0390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008472055778838694, + 0.0007312041707336903, + 0.0007307010819204152, + 0.0007308369968086481, + 0.000730738160200417 + ], + "gamma_dfa": 0.015948185697197914, + "gamma_dfa_per_layer": [ + 0.19398558139801025, + -0.05326637625694275, + -0.057601772248744965, + -0.019324690103530884 + ], + "acc_eval": 0.1572265625, + "loss_eval": 481.7687072753906, + "epoch": 12 + }, + { + "hidden_norms": [ + 2059.50390625, + 86267.453125, + 127668.078125, + 134690.953125, + 148832.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008536268142051995, + 0.0007572658942081034, + 0.0007572331232950091, + 0.0007572534959763288, + 0.0007572824251838028 + ], + "gamma_dfa": 0.007115887477993965, + "gamma_dfa_per_layer": [ + 0.19894848763942719, + -0.06199394166469574, + -0.04606857895851135, + -0.06242241710424423 + ], + "acc_eval": 0.162109375, + "loss_eval": 442.7697448730469, + "epoch": 13 + }, + { + "hidden_norms": [ + 2162.650390625, + 111971.2421875, + 158544.5, + 167081.546875, + 183230.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009137325105257332, + 0.0007456843741238117, + 0.0007456432213075459, + 0.0007455914164893329, + 0.0007455993909388781 + ], + "gamma_dfa": 0.008699490688741207, + "gamma_dfa_per_layer": [ + 0.22433382272720337, + -0.07114191353321075, + -0.07720339298248291, + -0.041190553456544876 + ], + "acc_eval": 0.16796875, + "loss_eval": 631.255859375, + "epoch": 14 + }, + { + "hidden_norms": [ + 2287.1767578125, + 140028.015625, + 188737.5625, + 197952.296875, + 214414.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000864461821038276, + 0.0007380775641649961, + 0.0007383264601230621, + 0.000738749688025564, + 0.0007389392121694982 + ], + "gamma_dfa": 0.01581217348575592, + "gamma_dfa_per_layer": [ + 0.21350334584712982, + -0.05864371731877327, + -0.039877790957689285, + -0.051733143627643585 + ], + "acc_eval": 0.1806640625, + "loss_eval": 720.0626220703125, + "epoch": 15 + }, + { + "hidden_norms": [ + 2390.364013671875, + 180786.796875, + 233030.703125, + 243522.09375, + 260648.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010889085242524743, + 0.0007420245674438775, + 0.0007420974434353411, + 0.0007420690963044763, + 0.0007420206675305963 + ], + "gamma_dfa": 0.01692677615210414, + "gamma_dfa_per_layer": [ + 0.22792349755764008, + -0.06613948941230774, + -0.0679212138056755, + -0.026155689731240273 + ], + "acc_eval": 0.1904296875, + "loss_eval": 1348.43115234375, + "epoch": 16 + }, + { + "hidden_norms": [ + 2525.60009765625, + 226341.015625, + 282575.21875, + 294521.5, + 313155.65625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010620173998177052, + 0.0007694299565628171, + 0.0007695311214774847, + 0.0007694744854234159, + 0.000769737409427762 + ], + "gamma_dfa": 0.012939120642840862, + "gamma_dfa_per_layer": [ + 0.24798060953617096, + -0.07888300716876984, + -0.03452270105481148, + -0.0828184187412262 + ], + "acc_eval": 0.1572265625, + "loss_eval": 1277.5867919921875, + "epoch": 17 + }, + { + "hidden_norms": [ + 2738.423828125, + 284434.5625, + 346282.90625, + 359909.125, + 379330.46875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009644942474551499, + 0.0007429496035911143, + 0.0007425086805596948, + 0.0007422671769745648, + 0.0007426248048432171 + ], + "gamma_dfa": 0.02641105931252241, + "gamma_dfa_per_layer": [ + 0.2637922763824463, + -0.06210581958293915, + -0.05640384927392006, + -0.039638370275497437 + ], + "acc_eval": 0.220703125, + "loss_eval": 802.8688354492188, + "epoch": 18 + }, + { + "hidden_norms": [ + 2890.100830078125, + 346858.71875, + 414202.09375, + 429987.3125, + 451374.3125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010854159481823444, + 0.0007560763042420149, + 0.0007561030797660351, + 0.0007562912651337683, + 0.0007561809034086764 + ], + "gamma_dfa": -0.006043614819645882, + "gamma_dfa_per_layer": [ + 0.18550744652748108, + -0.07387037575244904, + -0.0915735587477684, + -0.04423797130584717 + ], + "acc_eval": 0.0927734375, + "loss_eval": 2067.48974609375, + "epoch": 19 + }, + { + "hidden_norms": [ + 3048.9677734375, + 416326.4375, + 488715.9375, + 506779.0, + 528907.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001142722088843584, + 0.0007379497401416302, + 0.0007378923473879695, + 0.0007379662129096687, + 0.0007378893787972629 + ], + "gamma_dfa": 0.020490088500082493, + "gamma_dfa_per_layer": [ + 0.21813809871673584, + -0.053681232035160065, + -0.04219571128487587, + -0.040300801396369934 + ], + "acc_eval": 0.2294921875, + "loss_eval": 1929.7166748046875, + "epoch": 20 + }, + { + "hidden_norms": [ + 3216.734619140625, + 499057.0, + 577401.1875, + 597297.0, + 620542.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014556541573256254, + 0.0007413470884785056, + 0.0007413764833472669, + 0.0007412104168906808, + 0.0007420589681714773 + ], + "gamma_dfa": 0.03948488784953952, + "gamma_dfa_per_layer": [ + 0.27680304646492004, + -0.05157003924250603, + -0.039460550993680954, + -0.02783290483057499 + ], + "acc_eval": 0.1474609375, + "loss_eval": 2699.9052734375, + "epoch": 21 + }, + { + "hidden_norms": [ + 3342.216064453125, + 584495.625, + 665696.625, + 687533.1875, + 710813.9375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001884044730104506, + 0.0007584495469927788, + 0.0007583577535115182, + 0.0007583281840197742, + 0.0007583273691125214 + ], + "gamma_dfa": 0.004080784507095814, + "gamma_dfa_per_layer": [ + 0.1770291030406952, + -0.056366197764873505, + -0.057933274656534195, + -0.046406492590904236 + ], + "acc_eval": 0.2373046875, + "loss_eval": 1742.9925537109375, + "epoch": 22 + }, + { + "hidden_norms": [ + 3566.038818359375, + 674756.3125, + 760463.3125, + 784571.125, + 808618.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.001965342788025737, + 0.0007340435404330492, + 0.0007341310847550631, + 0.0007343373727053404, + 0.0007337987190112472 + ], + "gamma_dfa": 0.030578704085201025, + "gamma_dfa_per_layer": [ + 0.24771088361740112, + -0.05749209225177765, + -0.04569869861006737, + -0.022205276414752007 + ], + "acc_eval": 0.1611328125, + "loss_eval": 2397.3916015625, + "epoch": 23 + }, + { + "hidden_norms": [ + 3779.54296875, + 786509.5, + 877152.1875, + 903987.8125, + 928449.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016364307375624776, + 0.0007935749599710107, + 0.000793365528807044, + 0.0007934189052321017, + 0.0007935216999612749 + ], + "gamma_dfa": 0.01740677817724645, + "gamma_dfa_per_layer": [ + 0.2701166570186615, + -0.0851234570145607, + 0.004913746379315853, + -0.12027983367443085 + ], + "acc_eval": 0.12109375, + "loss_eval": 4908.0458984375, + "epoch": 24 + }, + { + "hidden_norms": [ + 3969.119873046875, + 900145.9375, + 993945.75, + 1023047.9375, + 1047156.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012235429603606462, + 0.0007582573452964425, + 0.0007582195685245097, + 0.000758210604544729, + 0.0007582050748169422 + ], + "gamma_dfa": -0.005556041374802589, + "gamma_dfa_per_layer": [ + 0.2166597992181778, + -0.09299580752849579, + -0.09515514969825745, + -0.05073300749063492 + ], + "acc_eval": 0.1728515625, + "loss_eval": 3738.029541015625, + "epoch": 25 + }, + { + "hidden_norms": [ + 4167.24169921875, + 1027096.125, + 1126300.25, + 1158199.625, + 1183064.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015538743464276195, + 0.0007320540607906878, + 0.0007321767043322325, + 0.0007325086044147611, + 0.0007322292076423764 + ], + "gamma_dfa": 0.013890675269067287, + "gamma_dfa_per_layer": [ + 0.25793927907943726, + -0.09288333356380463, + -0.07571414113044739, + -0.03377910330891609 + ], + "acc_eval": 0.10546875, + "loss_eval": 6202.408203125, + "epoch": 26 + }, + { + "hidden_norms": [ + 4332.73046875, + 1157313.5, + 1261637.875, + 1297158.5, + 1323617.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015948566142469645, + 0.0007783056935295463, + 0.00077825813787058, + 0.0007782406755723059, + 0.0007781987660564482 + ], + "gamma_dfa": 0.02306488621979952, + "gamma_dfa_per_layer": [ + 0.2585013508796692, + -0.07491485029459, + -0.058371271938085556, + -0.03295568376779556 + ], + "acc_eval": 0.208984375, + "loss_eval": 4646.37451171875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4508.3486328125, + 1310938.125, + 1421261.875, + 1460382.75, + 1487384.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001599438488483429, + 0.0007645513396710157, + 0.0007644708384759724, + 0.00076470518251881, + 0.0007645483710803092 + ], + "gamma_dfa": 0.017900947481393814, + "gamma_dfa_per_layer": [ + 0.24153774976730347, + -0.06473007053136826, + -0.06562119722366333, + -0.039582692086696625 + ], + "acc_eval": 0.173828125, + "loss_eval": 5292.640625, + "epoch": 28 + }, + { + "hidden_norms": [ + 4729.70556640625, + 1458380.25, + 1572980.125, + 1615003.0, + 1642261.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014249716186895967, + 0.0007341640302911401, + 0.00073421117849648, + 0.0007345581543631852, + 0.0007344211917370558 + ], + "gamma_dfa": 0.03120402991771698, + "gamma_dfa_per_layer": [ + 0.2725849747657776, + -0.07284568250179291, + -0.05128118395805359, + -0.02364198863506317 + ], + "acc_eval": 0.17578125, + "loss_eval": 4871.27001953125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4886.33984375, + 1617197.25, + 1735577.625, + 1780813.375, + 1808887.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018187292153015733, + 0.0007682304712943733, + 0.0007675564847886562, + 0.0007677674293518066, + 0.0007678233087062836 + ], + "gamma_dfa": 0.017138252966105938, + "gamma_dfa_per_layer": [ + 0.2494080811738968, + -0.08018361777067184, + -0.027287419885396957, + -0.07338403165340424 + ], + "acc_eval": 0.193359375, + "loss_eval": 3960.6728515625, + "epoch": 30 + }, + { + "hidden_norms": [ + 5119.7841796875, + 1765219.5, + 1886735.375, + 1934213.125, + 1961976.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022127064876258373, + 0.000754481996409595, + 0.0007539362413808703, + 0.0007542265811935067, + 0.0007539446814917028 + ], + "gamma_dfa": 0.0332237659022212, + "gamma_dfa_per_layer": [ + 0.30639636516571045, + -0.08304375410079956, + -0.06092921271920204, + -0.029528334736824036 + ], + "acc_eval": 0.193359375, + "loss_eval": 4306.7734375, + "epoch": 31 + }, + { + "hidden_norms": [ + 5354.88720703125, + 1941186.125, + 2066860.125, + 2117348.25, + 2144884.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013304626336321235, + 0.0007719467394053936, + 0.0007719435379840434, + 0.0007721700239926577, + 0.0007720825960859656 + ], + "gamma_dfa": 0.01764332875609398, + "gamma_dfa_per_layer": [ + 0.2670303285121918, + -0.07338991016149521, + -0.05201137810945511, + -0.07105572521686554 + ], + "acc_eval": 0.1845703125, + "loss_eval": 4018.3662109375, + "epoch": 32 + }, + { + "hidden_norms": [ + 5519.78759765625, + 2116056.25, + 2246081.5, + 2300078.25, + 2327378.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016995095647871494, + 0.0007534062024205923, + 0.0007532716845162213, + 0.0007533822790719569, + 0.0007532139425165951 + ], + "gamma_dfa": 0.021287068724632263, + "gamma_dfa_per_layer": [ + 0.2717400789260864, + -0.08038187026977539, + -0.05876553803682327, + -0.04744439572095871 + ], + "acc_eval": 0.216796875, + "loss_eval": 6509.134765625, + "epoch": 33 + }, + { + "hidden_norms": [ + 5700.9130859375, + 2317603.75, + 2452612.5, + 2509779.5, + 2537064.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001880816649645567, + 0.0007947525009512901, + 0.0007945421966724098, + 0.0007944482495076954, + 0.0007949797436594963 + ], + "gamma_dfa": 0.02851281687617302, + "gamma_dfa_per_layer": [ + 0.2822743058204651, + -0.08248982578516006, + -0.05187612026929855, + -0.03385709226131439 + ], + "acc_eval": 0.1337890625, + "loss_eval": 8231.9248046875, + "epoch": 34 + }, + { + "hidden_norms": [ + 5855.8310546875, + 2515524.75, + 2653569.0, + 2713748.5, + 2740903.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018560283351689577, + 0.0007757823332212865, + 0.0007757038110867143, + 0.0007756180129945278, + 0.0007759004947729409 + ], + "gamma_dfa": 0.018099953944329172, + "gamma_dfa_per_layer": [ + 0.2729976773262024, + -0.08800812810659409, + -0.002550901612266898, + -0.11003883183002472 + ], + "acc_eval": 0.150390625, + "loss_eval": 7247.7216796875, + "epoch": 35 + }, + { + "hidden_norms": [ + 6036.9033203125, + 2711563.0, + 2854179.0, + 2918077.75, + 2945814.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001862754113972187, + 0.0007525583496317267, + 0.0007525330875068903, + 0.0007526627741754055, + 0.0007525623659603298 + ], + "gamma_dfa": 0.02487885858863592, + "gamma_dfa_per_layer": [ + 0.29685819149017334, + -0.08635345101356506, + -0.056181322783231735, + -0.054807983338832855 + ], + "acc_eval": 0.1435546875, + "loss_eval": 7513.36376953125, + "epoch": 36 + }, + { + "hidden_norms": [ + 6188.01611328125, + 2906995.5, + 3054202.25, + 3121279.0, + 3149996.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013340733712539077, + 0.0007529910071752965, + 0.0007524905377067626, + 0.0007527912384830415, + 0.0007525555556640029 + ], + "gamma_dfa": 0.027058321982622147, + "gamma_dfa_per_layer": [ + 0.25763267278671265, + -0.06575162708759308, + -0.04412994533777237, + -0.03951781243085861 + ], + "acc_eval": 0.2431640625, + "loss_eval": 12329.697265625, + "epoch": 37 + }, + { + "hidden_norms": [ + 6390.7060546875, + 3133419.5, + 3288636.0, + 3360502.75, + 3390539.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014776778407394886, + 0.0007607035804539919, + 0.0007607110310345888, + 0.0007606975850649178, + 0.000760715629439801 + ], + "gamma_dfa": 0.022189474664628506, + "gamma_dfa_per_layer": [ + 0.2616554796695709, + -0.07128072530031204, + -0.06259018927812576, + -0.039026666432619095 + ], + "acc_eval": 0.173828125, + "loss_eval": 6832.28955078125, + "epoch": 38 + }, + { + "hidden_norms": [ + 6548.68115234375, + 3356773.75, + 3517968.25, + 3593598.5, + 3624375.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002129003871232271, + 0.0007741872104816139, + 0.000774160900618881, + 0.0007743749301880598, + 0.0007743173046037555 + ], + "gamma_dfa": 0.034090133383870125, + "gamma_dfa_per_layer": [ + 0.3182219862937927, + -0.08398662507534027, + -0.06546281278133392, + -0.03241201490163803 + ], + "acc_eval": 0.1904296875, + "loss_eval": 5371.0859375, + "epoch": 39 + }, + { + "hidden_norms": [ + 6723.9697265625, + 3592963.25, + 3757696.25, + 3837777.75, + 3868088.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018772021867334843, + 0.0007547365385107696, + 0.0007547002169303596, + 0.0007546909037046134, + 0.000754650856833905 + ], + "gamma_dfa": 0.003609549254179001, + "gamma_dfa_per_layer": [ + 0.282962441444397, + -0.10840916633605957, + -0.10053665935993195, + -0.05957841873168945 + ], + "acc_eval": 0.1376953125, + "loss_eval": 8650.76953125, + "epoch": 40 + }, + { + "hidden_norms": [ + 6887.81005859375, + 3829273.5, + 3999416.75, + 4084005.5, + 4113581.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020062020048499107, + 0.0007521071238443255, + 0.0007519447826780379, + 0.0007520412327721715, + 0.0007518909987993538 + ], + "gamma_dfa": 0.01951257325708866, + "gamma_dfa_per_layer": [ + 0.2743881344795227, + -0.08543786406517029, + -0.05402272939682007, + -0.056877247989177704 + ], + "acc_eval": 0.1796875, + "loss_eval": 15509.98828125, + "epoch": 41 + }, + { + "hidden_norms": [ + 7027.42626953125, + 4050130.5, + 4223340.0, + 4310667.5, + 4340882.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016777552664279938, + 0.0007508718408644199, + 0.0007508369744755328, + 0.0007509454735554755, + 0.0007508718408644199 + ], + "gamma_dfa": 0.02786387037485838, + "gamma_dfa_per_layer": [ + 0.2803051769733429, + -0.07360324263572693, + -0.04823639243841171, + -0.04701006039977074 + ], + "acc_eval": 0.2275390625, + "loss_eval": 7618.71533203125, + "epoch": 42 + }, + { + "hidden_norms": [ + 7157.845703125, + 4292685.0, + 4471049.5, + 4562175.0, + 4591811.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016224944265559316, + 0.0007538175559602678, + 0.0007538740755990148, + 0.0007538648205809295, + 0.0007538393838331103 + ], + "gamma_dfa": 0.0053657907992601395, + "gamma_dfa_per_layer": [ + 0.26428842544555664, + -0.10051027685403824, + -0.08806045353412628, + -0.05425453186035156 + ], + "acc_eval": 0.166015625, + "loss_eval": 7869.64111328125, + "epoch": 43 + }, + { + "hidden_norms": [ + 7275.4365234375, + 4532040.5, + 4714971.5, + 4809776.0, + 4839258.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002823092043399811, + 0.0007887987303547561, + 0.0007888769032433629, + 0.0007889135158620775, + 0.0007889300468377769 + ], + "gamma_dfa": 0.008974121417850256, + "gamma_dfa_per_layer": [ + 0.25932246446609497, + -0.10199789702892303, + 0.012336602434515953, + -0.13376468420028687 + ], + "acc_eval": 0.091796875, + "loss_eval": 19789.41796875, + "epoch": 44 + }, + { + "hidden_norms": [ + 7393.93212890625, + 4772152.5, + 4958566.0, + 5058113.0, + 5086560.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019131727749481797, + 0.0007677456014789641, + 0.0007676532259210944, + 0.000767527730204165, + 0.0007678664987906814 + ], + "gamma_dfa": 0.014807725325226784, + "gamma_dfa_per_layer": [ + 0.23344306647777557, + -0.08349616825580597, + -0.0560825914144516, + -0.03463340550661087 + ], + "acc_eval": 0.224609375, + "loss_eval": 12636.65625, + "epoch": 45 + }, + { + "hidden_norms": [ + 7527.99462890625, + 5048336.0, + 5239027.5, + 5342244.0, + 5370085.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018555351998656988, + 0.000769329781178385, + 0.0007686647586524487, + 0.0007689501508139074, + 0.0007690390921197832 + ], + "gamma_dfa": 0.004876136779785156, + "gamma_dfa_per_layer": [ + 0.21739649772644043, + -0.08506827056407928, + -0.03674054145812988, + -0.07608313858509064 + ], + "acc_eval": 0.232421875, + "loss_eval": 12248.12109375, + "epoch": 46 + }, + { + "hidden_norms": [ + 7638.85693359375, + 5287113.0, + 5479795.0, + 5586404.5, + 5613225.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0025236238725483418, + 0.0007688805344514549, + 0.000768228666856885, + 0.0007684807060286403, + 0.0007685597520321608 + ], + "gamma_dfa": -0.006854387931525707, + "gamma_dfa_per_layer": [ + 0.17993390560150146, + -0.08751687407493591, + -0.030272338539361954, + -0.08956224471330643 + ], + "acc_eval": 0.1796875, + "loss_eval": 18537.177734375, + "epoch": 47 + }, + { + "hidden_norms": [ + 7754.390625, + 5527426.0, + 5724221.0, + 5833576.5, + 5860100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020714402198791504, + 0.0007631001644767821, + 0.0007630567415617406, + 0.0007630541222169995, + 0.0007631017942912877 + ], + "gamma_dfa": 0.02875693328678608, + "gamma_dfa_per_layer": [ + 0.29564130306243896, + -0.08437579870223999, + -0.050235565751791, + -0.04600220546126366 + ], + "acc_eval": 0.208984375, + "loss_eval": 10527.2578125, + "epoch": 48 + }, + { + "hidden_norms": [ + 7888.46923828125, + 5787159.5, + 5987915.0, + 6101035.0, + 6127097.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0026283818297088146, + 0.0007835617288947105, + 0.0007836156873963773, + 0.000783648225478828, + 0.0007836673175916076 + ], + "gamma_dfa": 0.011204172391444445, + "gamma_dfa_per_layer": [ + 0.26796066761016846, + -0.10181419551372528, + 0.010023357346653938, + -0.13135313987731934 + ], + "acc_eval": 0.0966796875, + "loss_eval": 15481.84375, + "epoch": 49 + }, + { + "hidden_norms": [ + 7975.13671875, + 6029198.0, + 6234359.5, + 6352162.0, + 6377873.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001740386476740241, + 0.0007632866618223488, + 0.0007632256019860506, + 0.0007631148328073323, + 0.0007634586072526872 + ], + "gamma_dfa": -0.000985240563750267, + "gamma_dfa_per_layer": [ + 0.20569762587547302, + -0.0866088718175888, + -0.04746733605861664, + -0.07556238025426865 + ], + "acc_eval": 0.2001953125, + "loss_eval": 12020.572265625, + "epoch": 50 + }, + { + "hidden_norms": [ + 8109.23095703125, + 6280213.0, + 6488845.5, + 6610432.5, + 6636101.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018630403792485595, + 0.0007671525236219168, + 0.000766951881814748, + 0.0007671291241422296, + 0.0007672281353734434 + ], + "gamma_dfa": -0.0027379142120480537, + "gamma_dfa_per_layer": [ + 0.22697225213050842, + -0.10085368156433105, + -0.059774767607450485, + -0.0772954598069191 + ], + "acc_eval": 0.13671875, + "loss_eval": 12490.904296875, + "epoch": 51 + }, + { + "hidden_norms": [ + 8223.3388671875, + 6520398.5, + 6731145.5, + 6855487.0, + 6880542.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020134998485445976, + 0.0007573508773930371, + 0.0007573754992336035, + 0.0007574421470053494, + 0.0007576147909276187 + ], + "gamma_dfa": 0.00887075625360012, + "gamma_dfa_per_layer": [ + 0.260132372379303, + -0.08125708997249603, + -0.07711100578308105, + -0.06628125160932541 + ], + "acc_eval": 0.12890625, + "loss_eval": 13286.50390625, + "epoch": 52 + }, + { + "hidden_norms": [ + 8317.2099609375, + 6773551.0, + 6990263.5, + 7117609.5, + 7143509.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016349060460925102, + 0.000744542689062655, + 0.0007445236551575363, + 0.000744638848118484, + 0.0007445821538567543 + ], + "gamma_dfa": 0.036132486537098885, + "gamma_dfa_per_layer": [ + 0.35822737216949463, + -0.09246134012937546, + -0.05995674431324005, + -0.06127934157848358 + ], + "acc_eval": 0.1318359375, + "loss_eval": 12961.923828125, + "epoch": 53 + }, + { + "hidden_norms": [ + 8396.16015625, + 7036334.0, + 7256480.5, + 7388541.0, + 7414023.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016424244968220592, + 0.0007655483204871416, + 0.0007653584470972419, + 0.0007655261433683336, + 0.0007656112429685891 + ], + "gamma_dfa": 0.00855250470340252, + "gamma_dfa_per_layer": [ + 0.31318342685699463, + -0.11486171185970306, + -0.07210143655538559, + -0.0920102596282959 + ], + "acc_eval": 0.0986328125, + "loss_eval": 14289.1396484375, + "epoch": 54 + }, + { + "hidden_norms": [ + 8425.91796875, + 7268265.0, + 7491250.5, + 7626377.5, + 7651502.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014321975177153945, + 0.0007547372952103615, + 0.0007547161658294499, + 0.0007547704153694212, + 0.000754979089833796 + ], + "gamma_dfa": 0.019777772948145866, + "gamma_dfa_per_layer": [ + 0.3146383762359619, + -0.0827077254652977, + -0.0876566469669342, + -0.06516291201114655 + ], + "acc_eval": 0.0908203125, + "loss_eval": 12761.185546875, + "epoch": 55 + }, + { + "hidden_norms": [ + 8519.505859375, + 7514964.5, + 7741589.0, + 7880037.0, + 7905207.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017787133110687137, + 0.0007505406392738223, + 0.0007507357513532043, + 0.0007507326663471758, + 0.0007507237605750561 + ], + "gamma_dfa": -0.012186199426651001, + "gamma_dfa_per_layer": [ + 0.2306034117937088, + -0.11392365396022797, + -0.1025918573141098, + -0.06283269822597504 + ], + "acc_eval": 0.1455078125, + "loss_eval": 8573.3310546875, + "epoch": 56 + }, + { + "hidden_norms": [ + 8575.814453125, + 7701015.5, + 7930432.0, + 8070523.0, + 8095346.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013273135991767049, + 0.0007214294746518135, + 0.0007213159115053713, + 0.0007215962978079915, + 0.0007215975201688707 + ], + "gamma_dfa": 0.02046024613082409, + "gamma_dfa_per_layer": [ + 0.2830252945423126, + -0.09345690906047821, + -0.06962529569864273, + -0.038102105259895325 + ], + "acc_eval": 0.1923828125, + "loss_eval": 6201.162109375, + "epoch": 57 + }, + { + "hidden_norms": [ + 8635.1220703125, + 7939687.0, + 8172801.5, + 8315327.5, + 8340462.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002125338651239872, + 0.0007551790331490338, + 0.0007551065064035356, + 0.0007549694273620844, + 0.000755314074922353 + ], + "gamma_dfa": 0.019076894968748093, + "gamma_dfa_per_layer": [ + 0.25508445501327515, + -0.07673472911119461, + -0.04303552210330963, + -0.059006623923778534 + ], + "acc_eval": 0.1865234375, + "loss_eval": 12055.595703125, + "epoch": 58 + }, + { + "hidden_norms": [ + 8706.6689453125, + 8158003.0, + 8394169.0, + 8539798.0, + 8565165.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001350156613625586, + 0.0007560249068774283, + 0.0007559725781902671, + 0.0007558663492091, + 0.0007561935926787555 + ], + "gamma_dfa": 0.028152598068118095, + "gamma_dfa_per_layer": [ + 0.28580546379089355, + -0.08475945889949799, + -0.05238167941570282, + -0.03605393320322037 + ], + "acc_eval": 0.220703125, + "loss_eval": 12085.9541015625, + "epoch": 59 + }, + { + "hidden_norms": [ + 8758.453125, + 8374766.0, + 8613513.0, + 8761622.0, + 8786363.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002377285622060299, + 0.0007197813247330487, + 0.0007195555372163653, + 0.0007198317907750607, + 0.000719684932846576 + ], + "gamma_dfa": 0.025455349124968052, + "gamma_dfa_per_layer": [ + 0.27419814467430115, + -0.08699844777584076, + -0.04594934359192848, + -0.0394289568066597 + ], + "acc_eval": 0.1669921875, + "loss_eval": 13302.744140625, + "epoch": 60 + }, + { + "hidden_norms": [ + 8795.5654296875, + 8572136.0, + 8812910.0, + 8963599.0, + 8987706.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015984047204256058, + 0.0007187420851550996, + 0.0007185072172433138, + 0.000718816474545747, + 0.000718718278221786 + ], + "gamma_dfa": 0.020128127187490463, + "gamma_dfa_per_layer": [ + 0.3066103458404541, + -0.1022094339132309, + -0.07834567129611969, + -0.04554273188114166 + ], + "acc_eval": 0.1181640625, + "loss_eval": 6553.7236328125, + "epoch": 61 + }, + { + "hidden_norms": [ + 8811.46875, + 8766653.0, + 9009529.0, + 9162389.0, + 9185680.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019123096717521548, + 0.0007724921451881528, + 0.0007725215400569141, + 0.0007725482573732734, + 0.0007725649629719555 + ], + "gamma_dfa": 0.03271363768726587, + "gamma_dfa_per_layer": [ + 0.2947639226913452, + -0.08735189586877823, + -0.04557036980986595, + -0.030987106263637543 + ], + "acc_eval": 0.18359375, + "loss_eval": 11607.7158203125, + "epoch": 62 + }, + { + "hidden_norms": [ + 8860.6220703125, + 8977001.0, + 9224122.0, + 9379773.0, + 9402851.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013403806369751692, + 0.0007685344316996634, + 0.0007685531745664775, + 0.0007685986929573119, + 0.0007685821619816124 + ], + "gamma_dfa": 0.020242065889760852, + "gamma_dfa_per_layer": [ + 0.30239802598953247, + -0.09480112791061401, + -0.014634584076702595, + -0.11199405044317245 + ], + "acc_eval": 0.1337890625, + "loss_eval": 9788.81640625, + "epoch": 63 + }, + { + "hidden_norms": [ + 8904.9482421875, + 9185937.0, + 9436793.0, + 9595000.0, + 9618183.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012845145538449287, + 0.0007421535556204617, + 0.0007421503541991115, + 0.0007421293412335217, + 0.0007421668851748109 + ], + "gamma_dfa": 0.02229973580688238, + "gamma_dfa_per_layer": [ + 0.2927352786064148, + -0.08628389239311218, + -0.060364432632923126, + -0.05688801035284996 + ], + "acc_eval": 0.1728515625, + "loss_eval": 8114.20458984375, + "epoch": 64 + }, + { + "hidden_norms": [ + 8892.296875, + 9356716.0, + 9611136.0, + 9771064.0, + 9794530.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001351315644569695, + 0.0007599962409585714, + 0.0007597811054438353, + 0.0007599799428135157, + 0.0007600505487062037 + ], + "gamma_dfa": 0.019069598987698555, + "gamma_dfa_per_layer": [ + 0.29072487354278564, + -0.0944916158914566, + -0.05359811335802078, + -0.06635674834251404 + ], + "acc_eval": 0.169921875, + "loss_eval": 8773.3408203125, + "epoch": 65 + }, + { + "hidden_norms": [ + 8905.83984375, + 9511506.0, + 9766884.0, + 9928659.0, + 9951002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017338081961497664, + 0.0007696599350310862, + 0.0007696837419643998, + 0.0007697126129642129, + 0.0007697291439399123 + ], + "gamma_dfa": 0.028427925892174244, + "gamma_dfa_per_layer": [ + 0.3319295644760132, + -0.09938425570726395, + 0.004324089735746384, + -0.12315769493579865 + ], + "acc_eval": 0.1142578125, + "loss_eval": 12823.435546875, + "epoch": 66 + }, + { + "hidden_norms": [ + 8944.53125, + 9692436.0, + 9950194.0, + 10113948.0, + 10136307.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017030658200383186, + 0.000714489258825779, + 0.0007141575333662331, + 0.0007145405979827046, + 0.0007144163828343153 + ], + "gamma_dfa": 0.055724941194057465, + "gamma_dfa_per_layer": [ + 0.3514706492424011, + -0.07685236632823944, + -0.031716104596853256, + -0.020002413541078568 + ], + "acc_eval": 0.18359375, + "loss_eval": 10412.890625, + "epoch": 67 + }, + { + "hidden_norms": [ + 8926.98828125, + 9838798.0, + 10099141.0, + 10264565.0, + 10286604.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015448650810867548, + 0.0007684402517043054, + 0.0007684584707021713, + 0.0007684882148168981, + 0.0007685049204155803 + ], + "gamma_dfa": 0.032529132440686226, + "gamma_dfa_per_layer": [ + 0.3082513213157654, + -0.0888272076845169, + -0.032446227967739105, + -0.056861355900764465 + ], + "acc_eval": 0.19921875, + "loss_eval": 8345.18359375, + "epoch": 68 + }, + { + "hidden_norms": [ + 8903.689453125, + 10005445.0, + 10266980.0, + 10434005.0, + 10454617.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017746278317645192, + 0.0007130402373149991, + 0.0007127230055630207, + 0.0007131076999939978, + 0.0007130174781195819 + ], + "gamma_dfa": 0.05443635303527117, + "gamma_dfa_per_layer": [ + 0.35508570075035095, + -0.08241431415081024, + -0.03841204196214676, + -0.01651393249630928 + ], + "acc_eval": 0.140625, + "loss_eval": 7877.36181640625, + "epoch": 69 + }, + { + "hidden_norms": [ + 8910.42578125, + 10173785.0, + 10439506.0, + 10609011.0, + 10630571.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011222161119803786, + 0.0007312637171708047, + 0.0007313191890716553, + 0.0007313672685995698, + 0.0007313768728636205 + ], + "gamma_dfa": 0.023520448245108128, + "gamma_dfa_per_layer": [ + 0.29335978627204895, + -0.08935706317424774, + -0.06947942078113556, + -0.04044150933623314 + ], + "acc_eval": 0.2421875, + "loss_eval": 5653.23388671875, + "epoch": 70 + }, + { + "hidden_norms": [ + 8876.2041015625, + 10317365.0, + 10586095.0, + 10757344.0, + 10779691.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011208312353119254, + 0.0007571111200377345, + 0.0007568965083919466, + 0.0007570943562313914, + 0.0007571595488116145 + ], + "gamma_dfa": 0.025294490158557892, + "gamma_dfa_per_layer": [ + 0.331506609916687, + -0.09467847645282745, + -0.06287634372711182, + -0.07277382910251617 + ], + "acc_eval": 0.1884765625, + "loss_eval": 3869.094970703125, + "epoch": 71 + }, + { + "hidden_norms": [ + 8852.7001953125, + 10449657.0, + 10719980.0, + 10891483.0, + 10913594.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001109768869355321, + 0.0007331773522309959, + 0.0007331601809710264, + 0.0007332302629947662, + 0.0007332285749725997 + ], + "gamma_dfa": 0.03539558406919241, + "gamma_dfa_per_layer": [ + 0.3268349766731262, + -0.08062416315078735, + -0.055393531918525696, + -0.04923494532704353 + ], + "acc_eval": 0.2353515625, + "loss_eval": 7111.935546875, + "epoch": 72 + }, + { + "hidden_norms": [ + 8827.3955078125, + 10582167.0, + 10855077.0, + 11028114.0, + 11050690.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001240618177689612, + 0.0007623998681083322, + 0.0007624404970556498, + 0.0007624777499586344, + 0.0007624629070051014 + ], + "gamma_dfa": 0.03839550958946347, + "gamma_dfa_per_layer": [ + 0.36802345514297485, + -0.09764832258224487, + -0.0042990874499082565, + -0.11249400675296783 + ], + "acc_eval": 0.1357421875, + "loss_eval": 6752.0322265625, + "epoch": 73 + }, + { + "hidden_norms": [ + 8814.1962890625, + 10696667.0, + 10971925.0, + 11146316.0, + 11168931.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001309843035414815, + 0.0007403214112855494, + 0.0007405314245261252, + 0.0007405264186672866, + 0.0007405087817460299 + ], + "gamma_dfa": 0.038134077563881874, + "gamma_dfa_per_layer": [ + 0.3364037275314331, + -0.08192241191864014, + -0.03633008152246475, + -0.06561492383480072 + ], + "acc_eval": 0.212890625, + "loss_eval": 6998.021484375, + "epoch": 74 + }, + { + "hidden_norms": [ + 8779.0400390625, + 10798076.0, + 11075004.0, + 11250115.0, + 11272600.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011087025050073862, + 0.0007316112169064581, + 0.0007316232076846063, + 0.0007316932315006852, + 0.00073169672396034 + ], + "gamma_dfa": 0.04451032355427742, + "gamma_dfa_per_layer": [ + 0.34500744938850403, + -0.07661331444978714, + -0.04388073831796646, + -0.04647210240364075 + ], + "acc_eval": 0.2490234375, + "loss_eval": 3624.614013671875, + "epoch": 75 + }, + { + "hidden_norms": [ + 8751.8486328125, + 10906611.0, + 11185716.0, + 11362176.0, + 11384611.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001067605335265398, + 0.0007393756532110274, + 0.0007396025466732681, + 0.000739598530344665, + 0.000739583745598793 + ], + "gamma_dfa": 0.03648093156516552, + "gamma_dfa_per_layer": [ + 0.31906285881996155, + -0.07843812555074692, + -0.051880721002817154, + -0.0428202860057354 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2816.3427734375, + "epoch": 76 + }, + { + "hidden_norms": [ + 8743.0078125, + 10999747.0, + 11279813.0, + 11457343.0, + 11479737.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010900371707975864, + 0.0007332717068493366, + 0.0007332694949582219, + 0.0007332508685067296, + 0.0007332859677262604 + ], + "gamma_dfa": 0.03520212788134813, + "gamma_dfa_per_layer": [ + 0.3010096549987793, + -0.07223288714885712, + -0.05185239389538765, + -0.036115862429142 + ], + "acc_eval": 0.2451171875, + "loss_eval": 3747.66748046875, + "epoch": 77 + }, + { + "hidden_norms": [ + 8693.3349609375, + 11081850.0, + 11362476.0, + 11540274.0, + 11562006.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010161141399294138, + 0.0007433417486026883, + 0.0007432828424498439, + 0.000743163691367954, + 0.0007434578728862107 + ], + "gamma_dfa": 0.04203554056584835, + "gamma_dfa_per_layer": [ + 0.3622134029865265, + -0.08443501591682434, + -0.020812533795833588, + -0.08882369101047516 + ], + "acc_eval": 0.1953125, + "loss_eval": 3283.453125, + "epoch": 78 + }, + { + "hidden_norms": [ + 8679.0673828125, + 11176062.0, + 11458995.0, + 11637744.0, + 11660108.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010180213721469045, + 0.0007298000273294747, + 0.000729813240468502, + 0.0007298758719116449, + 0.0007298807031475008 + ], + "gamma_dfa": 0.03867925424128771, + "gamma_dfa_per_layer": [ + 0.3430703282356262, + -0.08001460134983063, + -0.05243712291121483, + -0.05590158700942993 + ], + "acc_eval": 0.22265625, + "loss_eval": 3249.233154296875, + "epoch": 79 + }, + { + "hidden_norms": [ + 8630.8896484375, + 11249126.0, + 11532709.0, + 11711592.0, + 11733760.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001043561496771872, + 0.0007425911608152092, + 0.0007425197982229292, + 0.0007423801580443978, + 0.000742721778806299 + ], + "gamma_dfa": 0.028339628130197525, + "gamma_dfa_per_layer": [ + 0.32279035449028015, + -0.09357395768165588, + -0.06377816200256348, + -0.05207972228527069 + ], + "acc_eval": 0.1904296875, + "loss_eval": 3085.4638671875, + "epoch": 80 + }, + { + "hidden_norms": [ + 8578.060546875, + 11304050.0, + 11589802.0, + 11769234.0, + 11792299.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000967628788203001, + 0.0007289479253813624, + 0.0007289598579518497, + 0.0007290169014595449, + 0.0007290222565643489 + ], + "gamma_dfa": 0.02121756039559841, + "gamma_dfa_per_layer": [ + 0.31049084663391113, + -0.09504136443138123, + -0.07916043698787689, + -0.05141880363225937 + ], + "acc_eval": 0.236328125, + "loss_eval": 1885.889404296875, + "epoch": 81 + }, + { + "hidden_norms": [ + 8522.4794921875, + 11393685.0, + 11680880.0, + 11860855.0, + 11883774.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010794082190841436, + 0.0007521919906139374, + 0.0007519960636273026, + 0.0007521732477471232, + 0.0007522284286096692 + ], + "gamma_dfa": 0.026587368920445442, + "gamma_dfa_per_layer": [ + 0.37745779752731323, + -0.11168865859508514, + -0.0728297159075737, + -0.08658994734287262 + ], + "acc_eval": 0.1220703125, + "loss_eval": 2588.15478515625, + "epoch": 82 + }, + { + "hidden_norms": [ + 8482.1484375, + 11447732.0, + 11736021.0, + 11916302.0, + 11939110.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009376976522617042, + 0.0007250583730638027, + 0.000724694284144789, + 0.0007250410853885114, + 0.0007250093622133136 + ], + "gamma_dfa": 0.0355191919952631, + "gamma_dfa_per_layer": [ + 0.31943440437316895, + -0.07911509275436401, + -0.0536213181912899, + -0.04462122544646263 + ], + "acc_eval": 0.2783203125, + "loss_eval": 1507.2919921875, + "epoch": 83 + }, + { + "hidden_norms": [ + 8430.1455078125, + 11492522.0, + 11781554.0, + 11962317.0, + 11985175.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009387033060193062, + 0.0007079826318658888, + 0.0007078545750118792, + 0.0007080811192281544, + 0.0007080849609337747 + ], + "gamma_dfa": 0.036465028300881386, + "gamma_dfa_per_layer": [ + 0.3066443204879761, + -0.07488954067230225, + -0.03129498288035393, + -0.05459968373179436 + ], + "acc_eval": 0.275390625, + "loss_eval": 1614.5029296875, + "epoch": 84 + }, + { + "hidden_norms": [ + 8369.6298828125, + 11532036.0, + 11821641.0, + 12002443.0, + 12025323.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009389162878505886, + 0.0007232772768475115, + 0.0007233347278088331, + 0.0007233632495626807, + 0.000723376520909369 + ], + "gamma_dfa": 0.040183850564062595, + "gamma_dfa_per_layer": [ + 0.34539365768432617, + -0.08373545110225677, + -0.05380668863654137, + -0.04711611568927765 + ], + "acc_eval": 0.25, + "loss_eval": 1501.9444580078125, + "epoch": 85 + }, + { + "hidden_norms": [ + 8319.4169921875, + 11569238.0, + 11860199.0, + 12041371.0, + 12064573.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009176665917038918, + 0.0007041870849207044, + 0.0007039242191240191, + 0.0007042758516035974, + 0.0007042170618660748 + ], + "gamma_dfa": 0.035514961928129196, + "gamma_dfa_per_layer": [ + 0.2879785895347595, + -0.07180146872997284, + -0.037917762994766235, + -0.03619951009750366 + ], + "acc_eval": 0.30859375, + "loss_eval": 1078.8165283203125, + "epoch": 86 + }, + { + "hidden_norms": [ + 8282.478515625, + 11596869.0, + 11888039.0, + 12069453.0, + 12092582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00098571612033993, + 0.000731602602172643, + 0.0007312855450436473, + 0.0007312477100640535, + 0.0007316134287975729 + ], + "gamma_dfa": 0.04066215269267559, + "gamma_dfa_per_layer": [ + 0.33381348848342896, + -0.08063024282455444, + -0.055662885308265686, + -0.034871749579906464 + ], + "acc_eval": 0.234375, + "loss_eval": 1841.648193359375, + "epoch": 87 + }, + { + "hidden_norms": [ + 8242.1005859375, + 11624052.0, + 11916218.0, + 12098548.0, + 12121911.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009184937225654721, + 0.0007233315263874829, + 0.000723001197911799, + 0.0007232833886519074, + 0.0007232468342408538 + ], + "gamma_dfa": 0.03233872726559639, + "gamma_dfa_per_layer": [ + 0.2990570068359375, + -0.07802218198776245, + -0.04814079403877258, + -0.04353912174701691 + ], + "acc_eval": 0.2890625, + "loss_eval": 980.395751953125, + "epoch": 88 + }, + { + "hidden_norms": [ + 8216.91796875, + 11647355.0, + 11939175.0, + 12121172.0, + 12144056.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008776114555075765, + 0.0007067625410854816, + 0.0007066249381750822, + 0.0007068619015626609, + 0.0007068667327985168 + ], + "gamma_dfa": 0.027417242527008057, + "gamma_dfa_per_layer": [ + 0.28433892130851746, + -0.07622525095939636, + -0.050822652876377106, + -0.04762204736471176 + ], + "acc_eval": 0.326171875, + "loss_eval": 776.0946044921875, + "epoch": 89 + }, + { + "hidden_norms": [ + 8169.76513671875, + 11658648.0, + 11950474.0, + 12132456.0, + 12155182.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008986471802927554, + 0.0007065801764838398, + 0.0007064181263558567, + 0.000706693041138351, + 0.0007066999096423388 + ], + "gamma_dfa": 0.03352018166333437, + "gamma_dfa_per_layer": [ + 0.296892374753952, + -0.07546264678239822, + -0.04814247041940689, + -0.03920653089880943 + ], + "acc_eval": 0.3095703125, + "loss_eval": 893.558349609375, + "epoch": 90 + }, + { + "hidden_norms": [ + 8142.11669921875, + 11667783.0, + 11959690.0, + 12141714.0, + 12164439.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009172433638013899, + 0.0007064292440190911, + 0.0007062776712700725, + 0.0007065359968692064, + 0.000706541701219976 + ], + "gamma_dfa": 0.03799809701740742, + "gamma_dfa_per_layer": [ + 0.31104975938796997, + -0.07753260433673859, + -0.04483959078788757, + -0.03668517619371414 + ], + "acc_eval": 0.2763671875, + "loss_eval": 918.902099609375, + "epoch": 91 + }, + { + "hidden_norms": [ + 8113.36474609375, + 11673688.0, + 11965558.0, + 12147558.0, + 12170198.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009179572225548327, + 0.0007257050601765513, + 0.0007257269462570548, + 0.0007257769466377795, + 0.0007257869001477957 + ], + "gamma_dfa": 0.03620104119181633, + "gamma_dfa_per_layer": [ + 0.3097808361053467, + -0.07722775638103485, + -0.0500766858458519, + -0.03767222911119461 + ], + "acc_eval": 0.2880859375, + "loss_eval": 1033.579833984375, + "epoch": 92 + }, + { + "hidden_norms": [ + 8085.35595703125, + 11678927.0, + 11970798.0, + 12152808.0, + 12175446.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008720594923943281, + 0.0007061808719299734, + 0.0007060291827656329, + 0.0007062855875119567, + 0.0007062909426167607 + ], + "gamma_dfa": 0.03221010882407427, + "gamma_dfa_per_layer": [ + 0.2895042598247528, + -0.07448285818099976, + -0.04004380851984024, + -0.04613715782761574 + ], + "acc_eval": 0.3046875, + "loss_eval": 827.44140625, + "epoch": 93 + }, + { + "hidden_norms": [ + 8072.322265625, + 11682684.0, + 11974490.0, + 12156499.0, + 12179080.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008837314089760184, + 0.0007061065407469869, + 0.0007059663184918463, + 0.00070620869519189, + 0.000706215447280556 + ], + "gamma_dfa": 0.026722624897956848, + "gamma_dfa_per_layer": [ + 0.28959959745407104, + -0.08210700005292892, + -0.05253326892852783, + -0.048068828880786896 + ], + "acc_eval": 0.291015625, + "loss_eval": 795.6766357421875, + "epoch": 94 + }, + { + "hidden_norms": [ + 8063.02001953125, + 11684947.0, + 11976758.0, + 12158785.0, + 12181362.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008943622815422714, + 0.0007086708792485297, + 0.0007086790283210576, + 0.0007087094127200544, + 0.0007087020785547793 + ], + "gamma_dfa": 0.02946585137397051, + "gamma_dfa_per_layer": [ + 0.29232603311538696, + -0.08056485652923584, + -0.05102770775556564, + -0.042870063334703445 + ], + "acc_eval": 0.2919921875, + "loss_eval": 839.8633422851562, + "epoch": 95 + }, + { + "hidden_norms": [ + 8055.40576171875, + 11685775.0, + 11977584.0, + 12159594.0, + 12182165.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008769903797656298, + 0.0007059753406792879, + 0.0007058423361741006, + 0.0007060715579427779, + 0.0007060769130475819 + ], + "gamma_dfa": 0.02765239030122757, + "gamma_dfa_per_layer": [ + 0.2855387032032013, + -0.07872132211923599, + -0.051525406539440155, + -0.04468241333961487 + ], + "acc_eval": 0.3115234375, + "loss_eval": 736.9282836914062, + "epoch": 96 + }, + { + "hidden_norms": [ + 8050.93310546875, + 11685670.0, + 11977453.0, + 12159452.0, + 12182004.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008705379441380501, + 0.0007085780380293727, + 0.0007085860124789178, + 0.0007086164550855756, + 0.0007086091791279614 + ], + "gamma_dfa": 0.026861276477575302, + "gamma_dfa_per_layer": [ + 0.2898082733154297, + -0.07899712026119232, + -0.046087510883808136, + -0.05727853626012802 + ], + "acc_eval": 0.302734375, + "loss_eval": 737.6731567382812, + "epoch": 97 + }, + { + "hidden_norms": [ + 8048.384765625, + 11685821.0, + 11977554.0, + 12159347.0, + 12182068.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008696588920429349, + 0.0007085675024427474, + 0.0007085754186846316, + 0.0007086056284606457, + 0.0007085986435413361 + ], + "gamma_dfa": 0.02852465771138668, + "gamma_dfa_per_layer": [ + 0.2933640480041504, + -0.07862062007188797, + -0.04777185618877411, + -0.05287294089794159 + ], + "acc_eval": 0.30859375, + "loss_eval": 716.3431396484375, + "epoch": 98 + }, + { + "hidden_norms": [ + 8047.294921875, + 11685550.0, + 11977281.0, + 12159072.0, + 12181796.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000868224713485688, + 0.0007059023482725024, + 0.0007057614857330918, + 0.0007060033385641873, + 0.0007060095085762441 + ], + "gamma_dfa": 0.026804575696587563, + "gamma_dfa_per_layer": [ + 0.2827316224575043, + -0.07767541706562042, + -0.051301658153533936, + -0.046536244451999664 + ], + "acc_eval": 0.32421875, + "loss_eval": 693.041259765625, + "epoch": 99 + }, + { + "hidden_norms": [ + 8047.01025390625, + 11685479.0, + 11977214.0, + 12159006.0, + 12181733.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008688519592396915, + 0.0007085604593157768, + 0.0007085682009346783, + 0.0007085984107106924, + 0.0007085916586220264 + ], + "gamma_dfa": 0.027284779585897923, + "gamma_dfa_per_layer": [ + 0.2883991003036499, + -0.07865853607654572, + -0.04951424151659012, + -0.05108720436692238 + ], + "acc_eval": 0.3134765625, + "loss_eval": 705.9644775390625, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s42.json b/results/snapshot_no_outln_v1/snapshot_noLN_s42.json new file mode 100644 index 0000000..6bf0a61 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s42.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1123046875, + "loss_eval": 2.3168468475341797, + "epoch": 0 + }, + { + "hidden_norms": [ + 39.5714225769043, + 36.241031646728516, + 34.50772476196289, + 33.32059097290039, + 33.10130310058594 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001264682796318084, + 0.00013185068382881582, + 0.0001420896005583927, + 0.00016605440760031343, + 0.0002204339689342305 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4228515625, + "loss_eval": 1.6010748147964478, + "epoch": 1 + }, + { + "hidden_norms": [ + 52.47050857543945, + 48.28652572631836, + 45.496219635009766, + 43.2078857421875, + 41.36874008178711 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010761933663161471, + 0.00011420303053455427, + 0.00012131234689150006, + 0.00013399586896412075, + 0.00016239506658166647 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.453125, + "loss_eval": 1.4937903881072998, + "epoch": 2 + }, + { + "hidden_norms": [ + 62.092323303222656, + 56.274635314941406, + 52.64373016357422, + 49.852622985839844, + 46.636131286621094 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010067893890663981, + 0.00010744533210527152, + 0.000112645146145951, + 0.00012268377759028226, + 0.00014184287283569574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.46484375, + "loss_eval": 1.495908498764038, + "epoch": 3 + }, + { + "hidden_norms": [ + 70.92781829833984, + 62.570072174072266, + 57.76173400878906, + 53.9067497253418, + 49.468414306640625 + ], + "bp_grad_per_sample_l2_med": [ + 9.065420454135165e-05, + 9.659545321483165e-05, + 0.00010056291648652405, + 0.00010604548879200593, + 0.0001232008944498375 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5048828125, + "loss_eval": 1.4103548526763916, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.77008056640625, + 68.82622528076172, + 62.881927490234375, + 57.43979263305664, + 52.381675720214844 + ], + "bp_grad_per_sample_l2_med": [ + 8.967184840003029e-05, + 9.561960905557498e-05, + 9.984008647734299e-05, + 0.0001043190059135668, + 0.00011724776413757354 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5009765625, + "loss_eval": 1.3900126218795776, + "epoch": 5 + }, + { + "hidden_norms": [ + 84.3420639038086, + 73.14466094970703, + 66.25099182128906, + 60.290985107421875, + 54.196815490722656 + ], + "bp_grad_per_sample_l2_med": [ + 8.548566984245554e-05, + 9.279063669964671e-05, + 9.806034358916804e-05, + 0.00010389943781774491, + 0.00011231016833335161 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.509765625, + "loss_eval": 1.3721935749053955, + "epoch": 6 + }, + { + "hidden_norms": [ + 91.67733764648438, + 79.67963409423828, + 70.7928466796875, + 63.614192962646484, + 56.76249694824219 + ], + "bp_grad_per_sample_l2_med": [ + 8.422173414146528e-05, + 9.07716530491598e-05, + 9.6989817393478e-05, + 0.00010211832704953849, + 0.00011144059681100771 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5166015625, + "loss_eval": 1.344391107559204, + "epoch": 7 + }, + { + "hidden_norms": [ + 96.60388946533203, + 83.8042221069336, + 74.53706359863281, + 66.99102020263672, + 58.020408630371094 + ], + "bp_grad_per_sample_l2_med": [ + 8.360752690350637e-05, + 9.003488958114758e-05, + 9.634223533794284e-05, + 0.00010073634621221572, + 0.00010698751430027187 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5185546875, + "loss_eval": 1.3327906131744385, + "epoch": 8 + }, + { + "hidden_norms": [ + 101.24382781982422, + 87.08720397949219, + 76.92607116699219, + 68.23351287841797, + 59.4285888671875 + ], + "bp_grad_per_sample_l2_med": [ + 8.019094821065664e-05, + 8.715572766959667e-05, + 9.189714910462499e-05, + 9.61213736445643e-05, + 0.00010296071559423581 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.533203125, + "loss_eval": 1.3403639793395996, + "epoch": 9 + }, + { + "hidden_norms": [ + 107.04126739501953, + 91.77833557128906, + 80.73109436035156, + 70.98918914794922, + 61.11309051513672 + ], + "bp_grad_per_sample_l2_med": [ + 7.710429053986445e-05, + 8.402510866289958e-05, + 8.972393698059022e-05, + 9.477136336499825e-05, + 9.921709715854377e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5517578125, + "loss_eval": 1.3021693229675293, + "epoch": 10 + }, + { + "hidden_norms": [ + 111.9730224609375, + 94.8844985961914, + 83.01356506347656, + 72.39442443847656, + 61.61451721191406 + ], + "bp_grad_per_sample_l2_med": [ + 7.266257307492197e-05, + 8.069563045864925e-05, + 8.615722617832944e-05, + 8.979514677776024e-05, + 9.45624997257255e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5458984375, + "loss_eval": 1.298128604888916, + "epoch": 11 + }, + { + "hidden_norms": [ + 116.69439697265625, + 99.29745483398438, + 84.83220672607422, + 72.58226013183594, + 61.799560546875 + ], + "bp_grad_per_sample_l2_med": [ + 7.808519876562059e-05, + 8.509745384799317e-05, + 9.162558853859082e-05, + 9.594277798896655e-05, + 0.00010088863200508058 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5361328125, + "loss_eval": 1.327142596244812, + "epoch": 12 + }, + { + "hidden_norms": [ + 118.57154083251953, + 100.65165710449219, + 86.92396545410156, + 75.52800750732422, + 63.40058898925781 + ], + "bp_grad_per_sample_l2_med": [ + 7.507520058425143e-05, + 8.161060395650566e-05, + 8.807337144389749e-05, + 9.307889558840543e-05, + 9.839278209256008e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.529296875, + "loss_eval": 1.301376223564148, + "epoch": 13 + }, + { + "hidden_norms": [ + 123.16495513916016, + 104.0947265625, + 90.54090118408203, + 79.24758911132812, + 66.25940704345703 + ], + "bp_grad_per_sample_l2_med": [ + 7.567028660560027e-05, + 8.223088661907241e-05, + 8.735521987546235e-05, + 9.217277693096548e-05, + 9.719380614114925e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2765182256698608, + "epoch": 14 + }, + { + "hidden_norms": [ + 126.89250946044922, + 107.54840087890625, + 93.0474853515625, + 79.41374206542969, + 66.3965835571289 + ], + "bp_grad_per_sample_l2_med": [ + 7.546511915279552e-05, + 8.2636863226071e-05, + 8.891599281923845e-05, + 9.294570190832019e-05, + 9.809954644879326e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.51953125, + "loss_eval": 1.300541877746582, + "epoch": 15 + }, + { + "hidden_norms": [ + 130.00201416015625, + 110.14152526855469, + 95.71183776855469, + 81.57356262207031, + 68.07804107666016 + ], + "bp_grad_per_sample_l2_med": [ + 7.271749927895144e-05, + 7.90783524280414e-05, + 8.341569628100842e-05, + 8.888234879123047e-05, + 9.289903391618282e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.253805160522461, + "epoch": 16 + }, + { + "hidden_norms": [ + 132.4821014404297, + 112.55132293701172, + 96.15247344970703, + 82.20439147949219, + 67.68408203125 + ], + "bp_grad_per_sample_l2_med": [ + 7.47043450246565e-05, + 8.161538426065817e-05, + 8.696810255059972e-05, + 9.05536362552084e-05, + 9.490203956374899e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5634765625, + "loss_eval": 1.2818918228149414, + "epoch": 17 + }, + { + "hidden_norms": [ + 136.31614685058594, + 116.76542663574219, + 100.04906463623047, + 85.71382141113281, + 70.02954864501953 + ], + "bp_grad_per_sample_l2_med": [ + 7.14207926648669e-05, + 7.859354082029313e-05, + 8.420498488703743e-05, + 8.882852853275836e-05, + 9.116062574321404e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5595703125, + "loss_eval": 1.2435299158096313, + "epoch": 18 + }, + { + "hidden_norms": [ + 138.36990356445312, + 117.38836669921875, + 101.75880432128906, + 86.79072570800781, + 70.66394805908203 + ], + "bp_grad_per_sample_l2_med": [ + 7.72569328546524e-05, + 8.451085159322247e-05, + 8.929366595111787e-05, + 9.467442578170449e-05, + 9.868820779956877e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53515625, + "loss_eval": 1.3142390251159668, + "epoch": 19 + }, + { + "hidden_norms": [ + 140.71449279785156, + 119.23265838623047, + 101.22541809082031, + 85.75491333007812, + 69.77205657958984 + ], + "bp_grad_per_sample_l2_med": [ + 7.5247859058436e-05, + 8.147219341481104e-05, + 8.72978416737169e-05, + 9.33377887122333e-05, + 9.715931082610041e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.548828125, + "loss_eval": 1.26747465133667, + "epoch": 20 + }, + { + "hidden_norms": [ + 143.37794494628906, + 121.56777954101562, + 105.97654724121094, + 90.9666748046875, + 72.01183319091797 + ], + "bp_grad_per_sample_l2_med": [ + 7.179555541370064e-05, + 7.918629125924781e-05, + 8.409017755184323e-05, + 8.838798385113478e-05, + 9.469009819440544e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.564453125, + "loss_eval": 1.2752306461334229, + "epoch": 21 + }, + { + "hidden_norms": [ + 144.44107055664062, + 122.94657135009766, + 106.18299102783203, + 89.72506713867188, + 71.56814575195312 + ], + "bp_grad_per_sample_l2_med": [ + 7.250273483805358e-05, + 7.833781273802742e-05, + 8.349631389137357e-05, + 8.67474009282887e-05, + 8.975700620794669e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.56640625, + "loss_eval": 1.214519739151001, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.68658447265625, + 123.7938232421875, + 107.63272857666016, + 91.90914154052734, + 72.97653198242188 + ], + "bp_grad_per_sample_l2_med": [ + 6.909506919328123e-05, + 7.67810779507272e-05, + 8.248597441706806e-05, + 8.500050898874179e-05, + 8.80209991009906e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.578125, + "loss_eval": 1.2490482330322266, + "epoch": 23 + }, + { + "hidden_norms": [ + 149.15159606933594, + 125.77446746826172, + 106.84111022949219, + 90.89909362792969, + 72.29488372802734 + ], + "bp_grad_per_sample_l2_med": [ + 7.051522698020563e-05, + 7.787953654769808e-05, + 8.355934551218525e-05, + 8.837382483761758e-05, + 9.125470387516543e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5634765625, + "loss_eval": 1.2157257795333862, + "epoch": 24 + }, + { + "hidden_norms": [ + 149.9364776611328, + 126.3508529663086, + 107.00386047363281, + 89.69956970214844, + 70.79742431640625 + ], + "bp_grad_per_sample_l2_med": [ + 7.40521791158244e-05, + 8.231549145421013e-05, + 8.598146814620122e-05, + 9.036294795805588e-05, + 9.211329597746953e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5546875, + "loss_eval": 1.2515935897827148, + "epoch": 25 + }, + { + "hidden_norms": [ + 152.33641052246094, + 127.60247039794922, + 109.31637573242188, + 91.78147888183594, + 71.85491180419922 + ], + "bp_grad_per_sample_l2_med": [ + 7.096086483215913e-05, + 7.774732512189075e-05, + 8.330845594173297e-05, + 8.756548049859703e-05, + 9.018366108648479e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.234102487564087, + "epoch": 26 + }, + { + "hidden_norms": [ + 154.90924072265625, + 129.49365234375, + 111.0758285522461, + 94.2232666015625, + 73.4395523071289 + ], + "bp_grad_per_sample_l2_med": [ + 7.217184611363336e-05, + 7.90508056525141e-05, + 8.487315790262073e-05, + 9.130351099884138e-05, + 9.386075544171035e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5693359375, + "loss_eval": 1.2473926544189453, + "epoch": 27 + }, + { + "hidden_norms": [ + 155.88226318359375, + 130.6912384033203, + 111.4398193359375, + 93.5534896850586, + 73.1227035522461 + ], + "bp_grad_per_sample_l2_med": [ + 7.115830521797761e-05, + 7.749604992568493e-05, + 8.24403905426152e-05, + 8.617334970040247e-05, + 8.857186185196042e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5625, + "loss_eval": 1.232407569885254, + "epoch": 28 + }, + { + "hidden_norms": [ + 155.35606384277344, + 131.03033447265625, + 112.69044494628906, + 95.1001968383789, + 74.01049041748047 + ], + "bp_grad_per_sample_l2_med": [ + 7.353001274168491e-05, + 8.054459613049403e-05, + 8.64928078954108e-05, + 8.998846897156909e-05, + 9.453124948777258e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.576171875, + "loss_eval": 1.2427477836608887, + "epoch": 29 + }, + { + "hidden_norms": [ + 157.87423706054688, + 132.91993713378906, + 114.23269653320312, + 96.04922485351562, + 74.40912628173828 + ], + "bp_grad_per_sample_l2_med": [ + 7.218361861305311e-05, + 8.000781963346526e-05, + 8.621480083093047e-05, + 9.079690062208101e-05, + 9.179109474644065e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.2170917987823486, + "epoch": 30 + }, + { + "hidden_norms": [ + 159.94407653808594, + 134.98342895507812, + 116.59188842773438, + 96.52700805664062, + 74.13409423828125 + ], + "bp_grad_per_sample_l2_med": [ + 6.996722368057817e-05, + 7.723316957708448e-05, + 8.291137055493891e-05, + 8.800445357337594e-05, + 8.874708146322519e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1662731170654297, + "epoch": 31 + }, + { + "hidden_norms": [ + 159.40000915527344, + 134.68307495117188, + 115.32740783691406, + 95.89759826660156, + 73.79962158203125 + ], + "bp_grad_per_sample_l2_med": [ + 7.17860457370989e-05, + 7.931615255074576e-05, + 8.509325562044978e-05, + 8.835212793201208e-05, + 9.002821025205776e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5732421875, + "loss_eval": 1.1779483556747437, + "epoch": 32 + }, + { + "hidden_norms": [ + 160.3310089111328, + 135.494140625, + 116.1007308959961, + 96.30546569824219, + 74.54843139648438 + ], + "bp_grad_per_sample_l2_med": [ + 6.925644993316382e-05, + 7.548897701781243e-05, + 8.256838918896392e-05, + 8.621955930721015e-05, + 8.84741239133291e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1561952829360962, + "epoch": 33 + }, + { + "hidden_norms": [ + 161.94854736328125, + 135.6446075439453, + 116.58970642089844, + 96.99983978271484, + 74.31636810302734 + ], + "bp_grad_per_sample_l2_med": [ + 7.260960410349071e-05, + 8.003232505870983e-05, + 8.696899749338627e-05, + 9.040992881637067e-05, + 9.149286051979288e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1946098804473877, + "epoch": 34 + }, + { + "hidden_norms": [ + 163.52120971679688, + 138.41390991210938, + 118.427490234375, + 98.19206237792969, + 75.36811828613281 + ], + "bp_grad_per_sample_l2_med": [ + 6.831327482359484e-05, + 7.447604730259627e-05, + 7.990537415025756e-05, + 8.471667388221249e-05, + 8.780926145846024e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.184380054473877, + "epoch": 35 + }, + { + "hidden_norms": [ + 164.48324584960938, + 138.1424102783203, + 118.34252166748047, + 98.4327621459961, + 75.36869049072266 + ], + "bp_grad_per_sample_l2_med": [ + 7.150783494580537e-05, + 7.926567923277617e-05, + 8.36653562146239e-05, + 8.762039215071127e-05, + 8.95786433829926e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.2110118865966797, + "epoch": 36 + }, + { + "hidden_norms": [ + 164.0553741455078, + 138.08517456054688, + 118.49005126953125, + 98.67227172851562, + 74.64473724365234 + ], + "bp_grad_per_sample_l2_med": [ + 7.029619155218825e-05, + 7.684711454203352e-05, + 8.26816976768896e-05, + 8.846465789247304e-05, + 9.003532613860443e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.1644396781921387, + "epoch": 37 + }, + { + "hidden_norms": [ + 165.32000732421875, + 138.64366149902344, + 119.2437515258789, + 99.25880432128906, + 75.45353698730469 + ], + "bp_grad_per_sample_l2_med": [ + 7.045984239084646e-05, + 7.836698205210268e-05, + 8.392294694203883e-05, + 8.778785559115931e-05, + 8.954900113167241e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.18137526512146, + "epoch": 38 + }, + { + "hidden_norms": [ + 164.7397918701172, + 138.3001251220703, + 117.6864242553711, + 97.29838562011719, + 73.79444122314453 + ], + "bp_grad_per_sample_l2_med": [ + 7.162813562899828e-05, + 7.83513969508931e-05, + 8.275063009932637e-05, + 8.855803025653586e-05, + 8.704853098606691e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.583984375, + "loss_eval": 1.1727752685546875, + "epoch": 39 + }, + { + "hidden_norms": [ + 166.1660919189453, + 138.93536376953125, + 118.51292419433594, + 97.88706970214844, + 75.51615905761719 + ], + "bp_grad_per_sample_l2_med": [ + 7.430704863509163e-05, + 8.242860349128023e-05, + 8.74657926033251e-05, + 9.10981761990115e-05, + 9.303457773057744e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1664979457855225, + "epoch": 40 + }, + { + "hidden_norms": [ + 167.8816375732422, + 140.1188201904297, + 119.77051544189453, + 99.83518981933594, + 75.69395446777344 + ], + "bp_grad_per_sample_l2_med": [ + 7.187369919847697e-05, + 7.945671677589417e-05, + 8.597246051067486e-05, + 8.931689808377996e-05, + 8.963213622337207e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.587890625, + "loss_eval": 1.19194757938385, + "epoch": 41 + }, + { + "hidden_norms": [ + 168.21185302734375, + 141.76817321777344, + 121.40872192382812, + 100.61127471923828, + 76.76028442382812 + ], + "bp_grad_per_sample_l2_med": [ + 7.174632628448308e-05, + 7.968613499542698e-05, + 8.514403452863917e-05, + 8.922909910324961e-05, + 9.091905667446554e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1679599285125732, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.2344207763672, + 140.6108856201172, + 120.0829849243164, + 99.8038330078125, + 76.13324737548828 + ], + "bp_grad_per_sample_l2_med": [ + 7.436795567627996e-05, + 8.090144547168165e-05, + 8.729894761927426e-05, + 9.00863014976494e-05, + 8.991207869257778e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.1705546379089355, + "epoch": 43 + }, + { + "hidden_norms": [ + 167.59393310546875, + 140.7035369873047, + 120.24620056152344, + 99.91508483886719, + 75.96212005615234 + ], + "bp_grad_per_sample_l2_med": [ + 7.446305971825495e-05, + 8.234894630732015e-05, + 8.821392111713067e-05, + 9.209391282638535e-05, + 9.261125524062663e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5791015625, + "loss_eval": 1.1846892833709717, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.69448852539062, + 141.26541137695312, + 121.04974365234375, + 100.46004486083984, + 75.70881652832031 + ], + "bp_grad_per_sample_l2_med": [ + 7.222096610348672e-05, + 7.875960727687925e-05, + 8.227298530982807e-05, + 8.841860108077526e-05, + 9.022892481880262e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1577212810516357, + "epoch": 45 + }, + { + "hidden_norms": [ + 169.7440185546875, + 142.39825439453125, + 121.89653778076172, + 100.77093505859375, + 76.56221008300781 + ], + "bp_grad_per_sample_l2_med": [ + 7.555038610007614e-05, + 8.296242594951764e-05, + 9.037082054419443e-05, + 9.527869406156242e-05, + 9.701496310299262e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.1768805980682373, + "epoch": 46 + }, + { + "hidden_norms": [ + 167.24928283691406, + 140.36639404296875, + 119.20468139648438, + 99.04094696044922, + 75.62102508544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.741156878182665e-05, + 8.454316412098706e-05, + 9.005220636026934e-05, + 9.321123798144981e-05, + 9.260981460101902e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.166186809539795, + "epoch": 47 + }, + { + "hidden_norms": [ + 170.72845458984375, + 142.466796875, + 120.5933837890625, + 100.26793670654297, + 76.15065002441406 + ], + "bp_grad_per_sample_l2_med": [ + 7.659869879717007e-05, + 8.334196172654629e-05, + 9.012148075271398e-05, + 9.564686479279771e-05, + 9.513212717138231e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1720219850540161, + "epoch": 48 + }, + { + "hidden_norms": [ + 169.83580017089844, + 141.82705688476562, + 121.11093139648438, + 100.64865112304688, + 76.17137145996094 + ], + "bp_grad_per_sample_l2_med": [ + 7.593600457767025e-05, + 8.458431693725288e-05, + 9.001771832117811e-05, + 9.566119115334004e-05, + 9.762388071976602e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.184555172920227, + "epoch": 49 + }, + { + "hidden_norms": [ + 168.68116760253906, + 141.1621856689453, + 119.57838439941406, + 98.55834197998047, + 75.13648223876953 + ], + "bp_grad_per_sample_l2_med": [ + 8.207417704397812e-05, + 9.170681732939556e-05, + 9.716026397654787e-05, + 0.0001007765022222884, + 0.0001005034864647314 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5810546875, + "loss_eval": 1.1981369256973267, + "epoch": 50 + }, + { + "hidden_norms": [ + 171.0980682373047, + 143.56202697753906, + 121.67494201660156, + 101.36307525634766, + 76.57723999023438 + ], + "bp_grad_per_sample_l2_med": [ + 7.634361099917442e-05, + 8.294743747683242e-05, + 8.85644112713635e-05, + 9.305671119363979e-05, + 9.303687693318352e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.1646153926849365, + "epoch": 51 + }, + { + "hidden_norms": [ + 170.58717346191406, + 143.18809509277344, + 120.9772720336914, + 100.8180923461914, + 77.12872314453125 + ], + "bp_grad_per_sample_l2_med": [ + 7.599191303597763e-05, + 8.41239161673002e-05, + 8.960344712249935e-05, + 9.63989004958421e-05, + 9.756541112437844e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1623225212097168, + "epoch": 52 + }, + { + "hidden_norms": [ + 169.49244689941406, + 142.66770935058594, + 122.00574493408203, + 101.84593963623047, + 77.40425109863281 + ], + "bp_grad_per_sample_l2_med": [ + 7.701734284637496e-05, + 8.374643221031874e-05, + 9.025474719237536e-05, + 9.504661284154281e-05, + 9.925573249347508e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59765625, + "loss_eval": 1.1574187278747559, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.3027801513672, + 143.11941528320312, + 120.9614486694336, + 101.5257797241211, + 77.17151641845703 + ], + "bp_grad_per_sample_l2_med": [ + 7.559885852970183e-05, + 8.217129652621225e-05, + 8.892706682672724e-05, + 9.235734614776447e-05, + 9.276533091906458e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6015625, + "loss_eval": 1.149141788482666, + "epoch": 54 + }, + { + "hidden_norms": [ + 168.70281982421875, + 141.82730102539062, + 120.2729263305664, + 99.75395965576172, + 76.92571258544922 + ], + "bp_grad_per_sample_l2_med": [ + 7.91895727161318e-05, + 8.787367551121861e-05, + 9.60014876909554e-05, + 0.0001018140246742405, + 9.86503655440174e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6005859375, + "loss_eval": 1.1657415628433228, + "epoch": 55 + }, + { + "hidden_norms": [ + 169.94361877441406, + 142.49684143066406, + 120.18767547607422, + 100.32206726074219, + 76.59700012207031 + ], + "bp_grad_per_sample_l2_med": [ + 7.673597428947687e-05, + 8.517439709976315e-05, + 9.201091597788036e-05, + 9.491065429756418e-05, + 9.497139399172738e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.170656442642212, + "epoch": 56 + }, + { + "hidden_norms": [ + 168.98934936523438, + 142.45361328125, + 120.9234848022461, + 101.12970733642578, + 76.8805160522461 + ], + "bp_grad_per_sample_l2_med": [ + 7.979186193551868e-05, + 8.849770529195666e-05, + 9.661864896770567e-05, + 0.00010212804772891104, + 9.96212984318845e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.153792142868042, + "epoch": 57 + }, + { + "hidden_norms": [ + 169.1288604736328, + 141.414306640625, + 119.56535339355469, + 99.89313507080078, + 76.44340515136719 + ], + "bp_grad_per_sample_l2_med": [ + 8.042863919399679e-05, + 8.848145080264658e-05, + 9.505209163762629e-05, + 0.00010096383630298078, + 9.844720625551417e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1363590955734253, + "epoch": 58 + }, + { + "hidden_norms": [ + 167.93479919433594, + 140.53518676757812, + 118.76004028320312, + 99.56035614013672, + 76.20387268066406 + ], + "bp_grad_per_sample_l2_med": [ + 8.038699888857082e-05, + 8.754427108215168e-05, + 9.549371316097677e-05, + 0.00010098952043335885, + 0.0001008743784041144 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.1666439771652222, + "epoch": 59 + }, + { + "hidden_norms": [ + 168.28646850585938, + 140.67718505859375, + 118.55599975585938, + 98.98268127441406, + 75.81230163574219 + ], + "bp_grad_per_sample_l2_med": [ + 8.297240128740668e-05, + 8.875853382050991e-05, + 9.902577585307881e-05, + 0.00010285823373124003, + 0.00010488184489076957 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1589187383651733, + "epoch": 60 + }, + { + "hidden_norms": [ + 168.05776977539062, + 140.5435791015625, + 119.5470962524414, + 99.72227478027344, + 76.00287628173828 + ], + "bp_grad_per_sample_l2_med": [ + 8.011830504983664e-05, + 8.830082515487447e-05, + 9.65106810326688e-05, + 0.00010251552885165438, + 0.00010001847840612754 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.615234375, + "loss_eval": 1.157954216003418, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.4709014892578, + 140.92843627929688, + 119.31693267822266, + 98.76548767089844, + 75.95777893066406 + ], + "bp_grad_per_sample_l2_med": [ + 8.56209808262065e-05, + 9.390609193360433e-05, + 0.00010086362453876063, + 0.00010554264736128971, + 0.00010187114821746945 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.147390365600586, + "epoch": 62 + }, + { + "hidden_norms": [ + 167.48707580566406, + 139.8479766845703, + 118.25393676757812, + 99.32323455810547, + 75.72100830078125 + ], + "bp_grad_per_sample_l2_med": [ + 8.738139877095819e-05, + 9.79254036792554e-05, + 0.00010459231998538598, + 0.00011052342597395182, + 0.00010695838136598468 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5966796875, + "loss_eval": 1.1785132884979248, + "epoch": 63 + }, + { + "hidden_norms": [ + 167.5928955078125, + 140.20948791503906, + 118.63544464111328, + 99.02739715576172, + 75.8176040649414 + ], + "bp_grad_per_sample_l2_med": [ + 8.539798727724701e-05, + 9.423612937098369e-05, + 0.00010523338278289884, + 0.00010897681931965053, + 0.00010739201388787478 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1509130001068115, + "epoch": 64 + }, + { + "hidden_norms": [ + 167.19003295898438, + 138.91221618652344, + 117.57588195800781, + 98.43026733398438, + 75.48680114746094 + ], + "bp_grad_per_sample_l2_med": [ + 8.238407463068143e-05, + 9.25329077290371e-05, + 0.00010089747956953943, + 0.00010575826308922842, + 0.00010581395326880738 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6220703125, + "loss_eval": 1.151381254196167, + "epoch": 65 + }, + { + "hidden_norms": [ + 165.7104034423828, + 138.99298095703125, + 117.33794403076172, + 98.08374786376953, + 75.52032470703125 + ], + "bp_grad_per_sample_l2_med": [ + 8.850001177052036e-05, + 9.699742804514244e-05, + 0.00010492365981917828, + 0.00011017896758858114, + 0.00010667099559213966 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.151253581047058, + "epoch": 66 + }, + { + "hidden_norms": [ + 165.87271118164062, + 138.727783203125, + 118.21571350097656, + 97.76729583740234, + 75.68400573730469 + ], + "bp_grad_per_sample_l2_med": [ + 9.00067898328416e-05, + 9.841559221968055e-05, + 0.00010505259706405923, + 0.00010942742665065452, + 0.00010504219244467095 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.60546875, + "loss_eval": 1.1535770893096924, + "epoch": 67 + }, + { + "hidden_norms": [ + 165.17666625976562, + 138.45004272460938, + 117.10303497314453, + 97.36707305908203, + 75.38941192626953 + ], + "bp_grad_per_sample_l2_med": [ + 8.911191252991557e-05, + 9.853249503066763e-05, + 0.00010691725765354931, + 0.00011312783317407593, + 0.0001101552988984622 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59765625, + "loss_eval": 1.1582581996917725, + "epoch": 68 + }, + { + "hidden_norms": [ + 165.94325256347656, + 138.6524200439453, + 117.50881958007812, + 97.7616958618164, + 75.20433807373047 + ], + "bp_grad_per_sample_l2_med": [ + 8.616734703537077e-05, + 9.347109880764037e-05, + 0.00010103159002028406, + 0.00010616267536533996, + 0.00010419132013339549 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.1453883647918701, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.7154541015625, + 138.506591796875, + 117.28874206542969, + 97.05110168457031, + 75.29759979248047 + ], + "bp_grad_per_sample_l2_med": [ + 8.980780694400892e-05, + 9.973136184271425e-05, + 0.00010883707000175491, + 0.00011757094762288034, + 0.00011409710714360699 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1474578380584717, + "epoch": 70 + }, + { + "hidden_norms": [ + 164.83221435546875, + 138.6868133544922, + 116.98916625976562, + 96.52086639404297, + 75.43351745605469 + ], + "bp_grad_per_sample_l2_med": [ + 8.988294575829059e-05, + 9.790070907911286e-05, + 0.00010740302968770266, + 0.00011267260560998693, + 0.0001108170035877265 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.143803358078003, + "epoch": 71 + }, + { + "hidden_norms": [ + 164.63592529296875, + 137.5937042236328, + 116.08668518066406, + 96.16253662109375, + 74.92699432373047 + ], + "bp_grad_per_sample_l2_med": [ + 9.160200715996325e-05, + 0.00010001687769545242, + 0.00010771892993943766, + 0.00011699824244715273, + 0.00011338551848893985 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.609375, + "loss_eval": 1.1410948038101196, + "epoch": 72 + }, + { + "hidden_norms": [ + 164.91123962402344, + 137.8173828125, + 116.79219818115234, + 96.76990509033203, + 74.76392364501953 + ], + "bp_grad_per_sample_l2_med": [ + 8.93947362783365e-05, + 9.948704246198758e-05, + 0.00010810969251906499, + 0.00011499693209771067, + 0.0001114657279686071 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.1341216564178467, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.64288330078125, + 137.3013153076172, + 116.4471206665039, + 96.7668228149414, + 74.69876861572266 + ], + "bp_grad_per_sample_l2_med": [ + 8.85727204149589e-05, + 9.913302346831188e-05, + 0.00011003073450410739, + 0.00011727867240551859, + 0.00011272053234279156 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1379802227020264, + "epoch": 74 + }, + { + "hidden_norms": [ + 163.62106323242188, + 137.2855682373047, + 115.62771606445312, + 95.8958969116211, + 74.53977966308594 + ], + "bp_grad_per_sample_l2_med": [ + 8.984863961813971e-05, + 9.98539908323437e-05, + 0.00010817578731803223, + 0.00011364965030224994, + 0.00011257777805440128 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.130206823348999, + "epoch": 75 + }, + { + "hidden_norms": [ + 164.09976196289062, + 137.23387145996094, + 116.05545043945312, + 96.66761016845703, + 75.32057189941406 + ], + "bp_grad_per_sample_l2_med": [ + 8.984812302514911e-05, + 9.734687773743644e-05, + 0.00010578137880656868, + 0.00011179807916050777, + 0.0001108815340558067 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1422557830810547, + "epoch": 76 + }, + { + "hidden_norms": [ + 162.94369506835938, + 136.59678649902344, + 115.43162536621094, + 95.96286010742188, + 74.39228057861328 + ], + "bp_grad_per_sample_l2_med": [ + 9.308777953265235e-05, + 0.00010392161493655294, + 0.00011047742736991495, + 0.00011820423969766125, + 0.00011209066724404693 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.1316850185394287, + "epoch": 77 + }, + { + "hidden_norms": [ + 163.14993286132812, + 136.48724365234375, + 115.7430648803711, + 96.20491790771484, + 74.71761322021484 + ], + "bp_grad_per_sample_l2_med": [ + 9.024026803672314e-05, + 0.00010025065421359614, + 0.00011008324509020895, + 0.00011521186388563365, + 0.00011174430255778134 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.1380174160003662, + "epoch": 78 + }, + { + "hidden_norms": [ + 163.56654357910156, + 136.04368591308594, + 114.58287048339844, + 95.99482727050781, + 74.26864624023438 + ], + "bp_grad_per_sample_l2_med": [ + 9.700806549517438e-05, + 0.0001051941653713584, + 0.00011597082630032673, + 0.0001224641309818253, + 0.00011469785385997966 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.1528915166854858, + "epoch": 79 + }, + { + "hidden_norms": [ + 162.7240753173828, + 135.9139862060547, + 114.86207580566406, + 95.29146575927734, + 74.25565338134766 + ], + "bp_grad_per_sample_l2_med": [ + 9.666816185927019e-05, + 0.0001055657266988419, + 0.00011615711264312267, + 0.00012476630217861384, + 0.00011797657498391345 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.1539390087127686, + "epoch": 80 + }, + { + "hidden_norms": [ + 162.158203125, + 135.1398468017578, + 114.53036499023438, + 94.93306732177734, + 73.95748901367188 + ], + "bp_grad_per_sample_l2_med": [ + 9.333287016488612e-05, + 0.0001032597865560092, + 0.00011410381557652727, + 0.00012122129555791616, + 0.00011711813567671925 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1506534814834595, + "epoch": 81 + }, + { + "hidden_norms": [ + 162.415283203125, + 135.51370239257812, + 114.56376647949219, + 94.92838287353516, + 74.06205749511719 + ], + "bp_grad_per_sample_l2_med": [ + 9.082158794626594e-05, + 0.00010185714199906215, + 0.00011048805754398927, + 0.00011587562767090276, + 0.0001120776214520447 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1497812271118164, + "epoch": 82 + }, + { + "hidden_norms": [ + 161.77337646484375, + 135.19717407226562, + 114.20987701416016, + 94.77679443359375, + 73.99730682373047 + ], + "bp_grad_per_sample_l2_med": [ + 9.745426359586418e-05, + 0.00010718397970777005, + 0.00011704466305673122, + 0.00012522070028353482, + 0.00012164646614110097 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.155759572982788, + "epoch": 83 + }, + { + "hidden_norms": [ + 161.48892211914062, + 135.2348175048828, + 114.12451171875, + 94.8083267211914, + 73.4517822265625 + ], + "bp_grad_per_sample_l2_med": [ + 9.549259266350418e-05, + 0.00010579569061519578, + 0.00011430429003667086, + 0.00012098137813154608, + 0.00011664297198876739 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.15834379196167, + "epoch": 84 + }, + { + "hidden_norms": [ + 161.6995849609375, + 135.2989959716797, + 114.2784194946289, + 94.69004821777344, + 73.529541015625 + ], + "bp_grad_per_sample_l2_med": [ + 9.579937614034861e-05, + 0.00010731106885941699, + 0.00011613505921559408, + 0.00012203569349367172, + 0.00011712868581525981 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6083984375, + "loss_eval": 1.1583144664764404, + "epoch": 85 + }, + { + "hidden_norms": [ + 161.00369262695312, + 134.7657012939453, + 114.10606384277344, + 94.362060546875, + 73.65673065185547 + ], + "bp_grad_per_sample_l2_med": [ + 9.818092075875029e-05, + 0.00010859747999347746, + 0.00011724254727596417, + 0.00012138402962591499, + 0.00011800935317296535 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1536951065063477, + "epoch": 86 + }, + { + "hidden_norms": [ + 161.0053253173828, + 134.59410095214844, + 113.69575500488281, + 94.29032135009766, + 73.46531677246094 + ], + "bp_grad_per_sample_l2_med": [ + 9.722611866891384e-05, + 0.00010765776823973283, + 0.0001188350870506838, + 0.00012322816473897547, + 0.00011940464901272207 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.15749192237854, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.33126831054688, + 134.94166564941406, + 113.90135955810547, + 94.50862884521484, + 73.39297485351562 + ], + "bp_grad_per_sample_l2_med": [ + 9.938049333868548e-05, + 0.0001076548287528567, + 0.00011934098438359797, + 0.00012375488586258143, + 0.00011877582437591627 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.61328125, + "loss_eval": 1.157106637954712, + "epoch": 88 + }, + { + "hidden_norms": [ + 161.05789184570312, + 134.59825134277344, + 113.87554931640625, + 94.37042999267578, + 73.5987548828125 + ], + "bp_grad_per_sample_l2_med": [ + 9.70072578638792e-05, + 0.00010533058957662433, + 0.00011765053932322189, + 0.00012162782513769343, + 0.00012223162048030645 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6171875, + "loss_eval": 1.1565823554992676, + "epoch": 89 + }, + { + "hidden_norms": [ + 160.39405822753906, + 134.43434143066406, + 113.540283203125, + 94.05237579345703, + 73.39077758789062 + ], + "bp_grad_per_sample_l2_med": [ + 9.608148684492335e-05, + 0.00010612589539960027, + 0.00011680866009555757, + 0.00012219352356623858, + 0.00011590561916818842 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.1539617776870728, + "epoch": 90 + }, + { + "hidden_norms": [ + 160.60440063476562, + 134.6214141845703, + 113.45699310302734, + 93.85929870605469, + 73.18849182128906 + ], + "bp_grad_per_sample_l2_med": [ + 9.81277771643363e-05, + 0.00010970587754854932, + 0.00011871931201312691, + 0.00012303274706937373, + 0.00011832414020318538 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.1519787311553955, + "epoch": 91 + }, + { + "hidden_norms": [ + 160.69932556152344, + 134.37420654296875, + 113.30387115478516, + 93.87930297851562, + 73.2369384765625 + ], + "bp_grad_per_sample_l2_med": [ + 9.748790762387216e-05, + 0.00010789754742290825, + 0.00011884274135809392, + 0.00012259349750820547, + 0.00012160756887169555 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1536774635314941, + "epoch": 92 + }, + { + "hidden_norms": [ + 160.83596801757812, + 134.3319854736328, + 113.4552230834961, + 94.0063705444336, + 73.16248321533203 + ], + "bp_grad_per_sample_l2_med": [ + 9.70613255049102e-05, + 0.00010844107600860298, + 0.0001184809225378558, + 0.00012342457193881273, + 0.00011970168998232111 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6220703125, + "loss_eval": 1.152658462524414, + "epoch": 93 + }, + { + "hidden_norms": [ + 160.8366241455078, + 134.48265075683594, + 113.25139617919922, + 93.83488464355469, + 73.08296203613281 + ], + "bp_grad_per_sample_l2_med": [ + 9.66933585004881e-05, + 0.00010815998393809423, + 0.00011774426093325019, + 0.0001224545994773507, + 0.00011890953464899212 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6181640625, + "loss_eval": 1.1551861763000488, + "epoch": 94 + }, + { + "hidden_norms": [ + 160.7191162109375, + 134.44659423828125, + 113.33219146728516, + 93.93790435791016, + 73.0753402709961 + ], + "bp_grad_per_sample_l2_med": [ + 9.675837645772845e-05, + 0.00010675707017071545, + 0.00011643637844827026, + 0.00012197842443129048, + 0.0001190306429634802 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.15492582321167, + "epoch": 95 + }, + { + "hidden_norms": [ + 160.51898193359375, + 134.29307556152344, + 113.27383422851562, + 94.04198455810547, + 73.003662109375 + ], + "bp_grad_per_sample_l2_med": [ + 9.737682557897642e-05, + 0.00010710594506235793, + 0.00011601457663346082, + 0.0001232696376973763, + 0.0001181336774607189 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1535921096801758, + "epoch": 96 + }, + { + "hidden_norms": [ + 160.5992431640625, + 134.43368530273438, + 113.30790710449219, + 94.0107192993164, + 73.01823425292969 + ], + "bp_grad_per_sample_l2_med": [ + 9.668481652624905e-05, + 0.00010705058230087161, + 0.0001163838169304654, + 0.0001232351060025394, + 0.00011791065480792895 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.615234375, + "loss_eval": 1.1539404392242432, + "epoch": 97 + }, + { + "hidden_norms": [ + 160.6013946533203, + 134.46824645996094, + 113.25690460205078, + 93.99237060546875, + 73.00788879394531 + ], + "bp_grad_per_sample_l2_med": [ + 9.74524809862487e-05, + 0.00010689684131648391, + 0.00011608003114815801, + 0.00012245487596374005, + 0.00011877176439156756 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.615234375, + "loss_eval": 1.1537361145019531, + "epoch": 98 + }, + { + "hidden_norms": [ + 160.6110076904297, + 134.44720458984375, + 113.29548645019531, + 93.96721649169922, + 72.96358489990234 + ], + "bp_grad_per_sample_l2_med": [ + 9.775274520507082e-05, + 0.00010722322622314095, + 0.00011578563862713054, + 0.00012414308730512857, + 0.00011851716408273205 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.1537935733795166, + "epoch": 99 + }, + { + "hidden_norms": [ + 160.61090087890625, + 134.45262145996094, + 113.2977066040039, + 93.9543685913086, + 72.96540069580078 + ], + "bp_grad_per_sample_l2_med": [ + 9.751630568644032e-05, + 0.00010700579878175631, + 0.00011575232201721519, + 0.0001240932324435562, + 0.00011847950372612104 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6162109375, + "loss_eval": 1.153747320175171, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "gamma_dfa": 0.008468771702609956, + "gamma_dfa_per_layer": [ + 0.0002397641073912382, + 0.021293632686138153, + -0.0031478723976761103, + 0.015489562414586544 + ], + "acc_eval": 0.1123046875, + "loss_eval": 2.3168468475341797, + "epoch": 0 + }, + { + "hidden_norms": [ + 481.5912780761719, + 951.0988159179688, + 1076.1094970703125, + 1320.2431640625, + 1560.1331787109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006860869470983744, + 0.000686013896483928, + 0.0006859428831376135, + 0.0006858126726001501, + 0.0006857643602415919 + ], + "gamma_dfa": 0.008383387292269617, + "gamma_dfa_per_layer": [ + 0.030579306185245514, + 0.012463560327887535, + -0.009617818519473076, + 0.00010850117541849613 + ], + "acc_eval": 0.1494140625, + "loss_eval": 6.441287040710449, + "epoch": 1 + }, + { + "hidden_norms": [ + 803.455322265625, + 1877.8646240234375, + 2352.25390625, + 2999.778564453125, + 3690.3037109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007094781612977386, + 0.0007074660388752818, + 0.0007073783199302852, + 0.0007076358306221664, + 0.0007076164474710822 + ], + "gamma_dfa": -0.002415801805909723, + "gamma_dfa_per_layer": [ + 0.04413381963968277, + -0.0021541656460613012, + -0.028202872723340988, + -0.023439988493919373 + ], + "acc_eval": 0.236328125, + "loss_eval": 9.331591606140137, + "epoch": 2 + }, + { + "hidden_norms": [ + 1023.6770629882812, + 2787.596923828125, + 3518.2734375, + 4732.96337890625, + 6139.98486328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007535111508332193, + 0.00075019511859864, + 0.0007504230597987771, + 0.0007509100250899792, + 0.0007509145070798695 + ], + "gamma_dfa": -0.004518487432505935, + "gamma_dfa_per_layer": [ + 0.049626171588897705, + -0.0017164160963147879, + -0.029111474752426147, + -0.03687223047018051 + ], + "acc_eval": 0.1943359375, + "loss_eval": 33.82752990722656, + "epoch": 3 + }, + { + "hidden_norms": [ + 1163.0250244140625, + 3340.40087890625, + 4668.20654296875, + 6551.25927734375, + 8839.166015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007571951719000936, + 0.0007542021339759231, + 0.0007538797217421234, + 0.0007539798971265554, + 0.0007538445643149316 + ], + "gamma_dfa": -0.0057786391116678715, + "gamma_dfa_per_layer": [ + 0.06502002477645874, + -0.02495962381362915, + -0.035328082740306854, + -0.02784687466919422 + ], + "acc_eval": 0.1875, + "loss_eval": 50.81904983520508, + "epoch": 4 + }, + { + "hidden_norms": [ + 1288.871337890625, + 3822.7880859375, + 5365.59130859375, + 7605.025390625, + 10502.0478515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007548240246251225, + 0.0007521823281422257, + 0.0007521542138420045, + 0.00075240881415084, + 0.0007523542735725641 + ], + "gamma_dfa": -0.006262022419832647, + "gamma_dfa_per_layer": [ + 0.0670417994260788, + -0.00757558410987258, + -0.044654928147792816, + -0.03985937684774399 + ], + "acc_eval": 0.1748046875, + "loss_eval": 41.77630615234375, + "epoch": 5 + }, + { + "hidden_norms": [ + 1393.3045654296875, + 4566.75341796875, + 6398.4619140625, + 9144.8193359375, + 12855.005859375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007480952190235257, + 0.0007420883048325777, + 0.0007418331224471331, + 0.0007423029164783657, + 0.0007423472707159817 + ], + "gamma_dfa": -0.012987596448510885, + "gamma_dfa_per_layer": [ + 0.07368794828653336, + -0.022242246195673943, + -0.04769526422023773, + -0.05570082366466522 + ], + "acc_eval": 0.2255859375, + "loss_eval": 34.67824172973633, + "epoch": 6 + }, + { + "hidden_norms": [ + 1492.14599609375, + 4914.71142578125, + 7309.0888671875, + 10380.2900390625, + 14994.3798828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007586176507174969, + 0.0007474496378563344, + 0.0007472135475836694, + 0.0007474484154954553, + 0.0007475449237972498 + ], + "gamma_dfa": -0.009481166722252965, + "gamma_dfa_per_layer": [ + 0.07966121286153793, + -0.014550731517374516, + -0.05317254737019539, + -0.04986260086297989 + ], + "acc_eval": 0.2265625, + "loss_eval": 47.53326416015625, + "epoch": 7 + }, + { + "hidden_norms": [ + 1561.8521728515625, + 5346.5771484375, + 8036.01171875, + 11400.638671875, + 16846.158203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007513429154641926, + 0.000743337906897068, + 0.0007433209684677422, + 0.0007435117149725556, + 0.0007433460559695959 + ], + "gamma_dfa": -0.020332499407231808, + "gamma_dfa_per_layer": [ + 0.07914174348115921, + -0.03499722480773926, + -0.0528150238096714, + -0.07265949249267578 + ], + "acc_eval": 0.203125, + "loss_eval": 44.3652458190918, + "epoch": 8 + }, + { + "hidden_norms": [ + 1634.708740234375, + 5771.3779296875, + 9056.50390625, + 14017.43359375, + 18666.166015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007612781482748687, + 0.000746309058740735, + 0.0007445007795467973, + 0.000742616830393672, + 0.000742737902328372 + ], + "gamma_dfa": -0.02017525304108858, + "gamma_dfa_per_layer": [ + 0.07873347401618958, + -0.0398627370595932, + -0.05772021412849426, + -0.061851534992456436 + ], + "acc_eval": 0.1962890625, + "loss_eval": 76.75175476074219, + "epoch": 9 + }, + { + "hidden_norms": [ + 1703.975830078125, + 6538.35400390625, + 10825.435546875, + 18506.091796875, + 22004.94140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007676634704694152, + 0.0007641310803592205, + 0.0007641207776032388, + 0.0007640842813998461, + 0.0007641611155122519 + ], + "gamma_dfa": -0.016695345751941204, + "gamma_dfa_per_layer": [ + 0.08918984234333038, + -0.029809486120939255, + -0.06516598165035248, + -0.06099575757980347 + ], + "acc_eval": 0.14453125, + "loss_eval": 82.11173248291016, + "epoch": 10 + }, + { + "hidden_norms": [ + 1742.7552490234375, + 10617.021484375, + 14353.39453125, + 26320.365234375, + 29618.58984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007739505381323397, + 0.0007467114483006299, + 0.0007445442606694996, + 0.0007397353765554726, + 0.0007397329318337142 + ], + "gamma_dfa": -0.01567553821951151, + "gamma_dfa_per_layer": [ + 0.08600987493991852, + -0.03431041166186333, + -0.056060850620269775, + -0.05834076553583145 + ], + "acc_eval": 0.1943359375, + "loss_eval": 223.91172790527344, + "epoch": 11 + }, + { + "hidden_norms": [ + 1824.1932373046875, + 15453.6865234375, + 18834.18359375, + 34960.33984375, + 37989.41796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007750834338366985, + 0.0007619780953973532, + 0.0007621922995895147, + 0.0007620578981004655, + 0.0007621044642291963 + ], + "gamma_dfa": -0.010786167811602354, + "gamma_dfa_per_layer": [ + 0.12150975316762924, + -0.02778821997344494, + -0.057943932712078094, + -0.07892227172851562 + ], + "acc_eval": 0.2236328125, + "loss_eval": 176.59576416015625, + "epoch": 12 + }, + { + "hidden_norms": [ + 1874.6923828125, + 24413.89453125, + 27520.30859375, + 49373.3984375, + 52416.24609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007790470262989402, + 0.0007622907287441194, + 0.0007622726843692362, + 0.0007622543489560485, + 0.0007623030105605721 + ], + "gamma_dfa": -0.014462455175817013, + "gamma_dfa_per_layer": [ + 0.12855470180511475, + -0.04145955294370651, + -0.05751717463135719, + -0.08742779493331909 + ], + "acc_eval": 0.1787109375, + "loss_eval": 262.8403625488281, + "epoch": 13 + }, + { + "hidden_norms": [ + 1946.8936767578125, + 36272.8125, + 40333.21875, + 69530.5, + 73388.2890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008108754991553724, + 0.0007635678630322218, + 0.0007621092372573912, + 0.0007623478886671364, + 0.0007624892168678343 + ], + "gamma_dfa": -0.0001736646518111229, + "gamma_dfa_per_layer": [ + 0.17327094078063965, + -0.03242593631148338, + -0.06580278277397156, + -0.0757368803024292 + ], + "acc_eval": 0.203125, + "loss_eval": 413.348876953125, + "epoch": 14 + }, + { + "hidden_norms": [ + 2032.87255859375, + 51780.58984375, + 56919.1484375, + 94829.1484375, + 100403.8828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008237292058765888, + 0.0007614542846567929, + 0.0007608170853927732, + 0.0007589491433463991, + 0.0007590141030959785 + ], + "gamma_dfa": -0.011795124970376492, + "gamma_dfa_per_layer": [ + 0.1382066011428833, + -0.05588943883776665, + -0.061218664050102234, + -0.06827899813652039 + ], + "acc_eval": 0.173828125, + "loss_eval": 476.64752197265625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2114.94287109375, + 69492.1875, + 75388.1796875, + 119789.3125, + 127585.7109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000832556514069438, + 0.0007537039346061647, + 0.000749573518987745, + 0.0007496002363041043, + 0.0007496204925701022 + ], + "gamma_dfa": 0.0006226245313882828, + "gamma_dfa_per_layer": [ + 0.18075576424598694, + -0.03305089473724365, + -0.06780679523944855, + -0.07740757614374161 + ], + "acc_eval": 0.1982421875, + "loss_eval": 537.6473388671875, + "epoch": 16 + }, + { + "hidden_norms": [ + 2253.870849609375, + 95625.234375, + 102645.28125, + 154236.78125, + 164149.109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008362202788703144, + 0.0007716236286796629, + 0.0007702361326664686, + 0.0007688606856390834, + 0.0007688601035624743 + ], + "gamma_dfa": 0.0006011892110109329, + "gamma_dfa_per_layer": [ + 0.16114464402198792, + -0.029663734138011932, + -0.06491248309612274, + -0.06416366994380951 + ], + "acc_eval": 0.1640625, + "loss_eval": 581.9083251953125, + "epoch": 17 + }, + { + "hidden_norms": [ + 2351.805419921875, + 125897.7421875, + 133955.1875, + 192500.78125, + 204528.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009331249166280031, + 0.0007676270324736834, + 0.000767629942856729, + 0.0007676497916691005, + 0.0007678864640183747 + ], + "gamma_dfa": 0.0174247776158154, + "gamma_dfa_per_layer": [ + 0.2389061450958252, + -0.028650319203734398, + -0.08226999640464783, + -0.058286719024181366 + ], + "acc_eval": 0.18359375, + "loss_eval": 913.2538452148438, + "epoch": 18 + }, + { + "hidden_norms": [ + 2513.170166015625, + 162182.9375, + 171449.59375, + 239781.78125, + 254673.765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010568156139925122, + 0.0007681881543248892, + 0.0007537052151747048, + 0.0007537882192991674, + 0.0007537372293882072 + ], + "gamma_dfa": -0.005793072283267975, + "gamma_dfa_per_layer": [ + 0.16605031490325928, + -0.03780411183834076, + -0.07320450246334076, + -0.07821398973464966 + ], + "acc_eval": 0.16796875, + "loss_eval": 1265.55859375, + "epoch": 19 + }, + { + "hidden_norms": [ + 2644.6826171875, + 207142.84375, + 218342.21875, + 296423.21875, + 314992.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011496657971292734, + 0.0007783269393257797, + 0.0007782486500218511, + 0.0007782430038787425, + 0.0007782124448567629 + ], + "gamma_dfa": 0.0026588989421725273, + "gamma_dfa_per_layer": [ + 0.23294636607170105, + -0.04264959320425987, + -0.083626389503479, + -0.09603478759527206 + ], + "acc_eval": 0.20703125, + "loss_eval": 1426.623046875, + "epoch": 20 + }, + { + "hidden_norms": [ + 2796.434814453125, + 252884.71875, + 265445.65625, + 352069.8125, + 373355.1875 + ], + "bp_grad_per_sample_l2_med": [ + 0.001035262132063508, + 0.0007528892601840198, + 0.0007526214467361569, + 0.0007527145207859576, + 0.0007528204005211592 + ], + "gamma_dfa": 0.006789525970816612, + "gamma_dfa_per_layer": [ + 0.22278103232383728, + -0.04876326024532318, + -0.07404369860887527, + -0.07281596958637238 + ], + "acc_eval": 0.1640625, + "loss_eval": 1487.587158203125, + "epoch": 21 + }, + { + "hidden_norms": [ + 2927.763671875, + 309847.03125, + 323644.75, + 419166.875, + 443365.71875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010502212680876255, + 0.0007627566810697317, + 0.0007627056329511106, + 0.000762629380915314, + 0.0007625716971233487 + ], + "gamma_dfa": 0.02364537864923477, + "gamma_dfa_per_layer": [ + 0.29678860306739807, + -0.041244715452194214, + -0.08115403354167938, + -0.07980833947658539 + ], + "acc_eval": 0.169921875, + "loss_eval": 920.2720947265625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3096.798583984375, + 369599.1875, + 385129.65625, + 491132.78125, + 518903.8125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001009905245155096, + 0.0007581011741422117, + 0.0007581054233014584, + 0.0007580683450214565, + 0.0007581928512081504 + ], + "gamma_dfa": 0.003264583647251129, + "gamma_dfa_per_layer": [ + 0.2218201905488968, + -0.04958157241344452, + -0.07964619994163513, + -0.07953408360481262 + ], + "acc_eval": 0.2001953125, + "loss_eval": 1496.309814453125, + "epoch": 23 + }, + { + "hidden_norms": [ + 3268.982666015625, + 428585.28125, + 445459.5625, + 561163.625, + 592376.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001033863751217723, + 0.0007647433667443693, + 0.0007646661251783371, + 0.0007653636857867241, + 0.0007653713691979647 + ], + "gamma_dfa": -0.0003395974636077881, + "gamma_dfa_per_layer": [ + 0.2477388083934784, + -0.05594494938850403, + -0.08699506521224976, + -0.10615718364715576 + ], + "acc_eval": 0.1669921875, + "loss_eval": 1579.9014892578125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3455.88134765625, + 503646.0, + 521880.0, + 646881.0, + 681678.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001110030454583466, + 0.000788405304774642, + 0.0007884047226980329, + 0.0007886688108555973, + 0.0007884959923103452 + ], + "gamma_dfa": 0.03397770132869482, + "gamma_dfa_per_layer": [ + 0.325829416513443, + -0.034700896590948105, + -0.09419499337673187, + -0.061022721230983734 + ], + "acc_eval": 0.1572265625, + "loss_eval": 3785.62744140625, + "epoch": 25 + }, + { + "hidden_norms": [ + 3642.92626953125, + 585772.8125, + 606436.25, + 744826.125, + 783648.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014668661169707775, + 0.0007638748502358794, + 0.000763841497246176, + 0.0007643977296538651, + 0.000764367519877851 + ], + "gamma_dfa": 0.01312381774187088, + "gamma_dfa_per_layer": [ + 0.23922428488731384, + -0.0393734946846962, + -0.07718683779239655, + -0.07016868144273758 + ], + "acc_eval": 0.232421875, + "loss_eval": 4151.03466796875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3766.637939453125, + 680946.4375, + 702914.3125, + 850315.25, + 892276.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012596967862918973, + 0.0007629106985405087, + 0.0007628659950569272, + 0.0007628875900991261, + 0.0007628927705809474 + ], + "gamma_dfa": 0.034322043880820274, + "gamma_dfa_per_layer": [ + 0.2786872386932373, + -0.04257660359144211, + -0.046638332307338715, + -0.052184127271175385 + ], + "acc_eval": 0.1396484375, + "loss_eval": 3629.718017578125, + "epoch": 27 + }, + { + "hidden_norms": [ + 3968.325927734375, + 788450.875, + 812297.0625, + 972239.1875, + 1018608.3125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001368838595226407, + 0.0007680156268179417, + 0.0007679847767576575, + 0.0007678329711779952, + 0.0007678261026740074 + ], + "gamma_dfa": -0.004100106656551361, + "gamma_dfa_per_layer": [ + 0.2793079614639282, + -0.07087238132953644, + -0.09966391324996948, + -0.12517209351062775 + ], + "acc_eval": 0.0908203125, + "loss_eval": 4779.9248046875, + "epoch": 28 + }, + { + "hidden_norms": [ + 4129.07666015625, + 894723.3125, + 920476.5, + 1091407.125, + 1142044.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012168982066214085, + 0.0007647873135283589, + 0.0007647885358892381, + 0.0007647658349014819, + 0.0007648474420420825 + ], + "gamma_dfa": 0.008089051581919193, + "gamma_dfa_per_layer": [ + 0.24180662631988525, + -0.05241226777434349, + -0.08961856365203857, + -0.06741958856582642 + ], + "acc_eval": 0.2158203125, + "loss_eval": 4783.03515625, + "epoch": 29 + }, + { + "hidden_norms": [ + 4306.06396484375, + 1029326.875, + 1057140.5, + 1242169.625, + 1298018.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011723857605829835, + 0.0007771517848595977, + 0.000777057372033596, + 0.0007771223317831755, + 0.0007771406089887023 + ], + "gamma_dfa": 0.039280178025364876, + "gamma_dfa_per_layer": [ + 0.3913160562515259, + -0.04802073538303375, + -0.09416519105434418, + -0.09200941771268845 + ], + "acc_eval": 0.1298828125, + "loss_eval": 3595.0546875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4460.63916015625, + 1158344.75, + 1187641.625, + 1385118.375, + 1445341.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001693590427748859, + 0.0007734080427326262, + 0.0007734334794804454, + 0.0007733569364063442, + 0.0007734467508271337 + ], + "gamma_dfa": 0.023572785779833794, + "gamma_dfa_per_layer": [ + 0.2822916507720947, + -0.054915353655815125, + -0.06488456577062607, + -0.06820058822631836 + ], + "acc_eval": 0.1728515625, + "loss_eval": 4587.541015625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4647.95556640625, + 1300320.625, + 1331227.625, + 1539845.25, + 1603645.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012949237134307623, + 0.0007672033389098942, + 0.000767192745115608, + 0.0007670199265703559, + 0.0007670176564715803 + ], + "gamma_dfa": 0.004104164429008961, + "gamma_dfa_per_layer": [ + 0.2596903145313263, + -0.053032513707876205, + -0.0918058454990387, + -0.09843529760837555 + ], + "acc_eval": 0.236328125, + "loss_eval": 3593.60400390625, + "epoch": 32 + }, + { + "hidden_norms": [ + 4817.267578125, + 1453979.25, + 1486502.375, + 1706268.875, + 1774371.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014480708632618189, + 0.0007800625753588974, + 0.000779640453401953, + 0.0007796672289259732, + 0.000779696914833039 + ], + "gamma_dfa": 0.02201501652598381, + "gamma_dfa_per_layer": [ + 0.310447633266449, + -0.051143430173397064, + -0.08497071266174316, + -0.0862734243273735 + ], + "acc_eval": 0.1708984375, + "loss_eval": 5472.59521484375, + "epoch": 33 + }, + { + "hidden_norms": [ + 4990.40625, + 1611329.25, + 1646018.625, + 1880434.25, + 1953768.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018194144358858466, + 0.000765332777518779, + 0.0007653048378415406, + 0.0007655462250113487, + 0.0007656100788153708 + ], + "gamma_dfa": 0.033283455297350883, + "gamma_dfa_per_layer": [ + 0.3083266317844391, + -0.04947835952043533, + -0.06329820305109024, + -0.06241624802350998 + ], + "acc_eval": 0.2021484375, + "loss_eval": 4069.216796875, + "epoch": 34 + }, + { + "hidden_norms": [ + 5174.12255859375, + 1781529.0, + 1818275.25, + 2064802.5, + 2142905.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015505037736147642, + 0.0007980199297890067, + 0.0007979664951562881, + 0.0007982755196280777, + 0.000798304914496839 + ], + "gamma_dfa": 0.019624613225460052, + "gamma_dfa_per_layer": [ + 0.3409179449081421, + -0.05889412760734558, + -0.10494701564311981, + -0.09857834875583649 + ], + "acc_eval": 0.099609375, + "loss_eval": 8309.7119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5347.279296875, + 1968104.0, + 2006811.625, + 2265948.5, + 2349278.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001387596596032381, + 0.0007817883160896599, + 0.0007816275465302169, + 0.000781797047238797, + 0.0007817737059667706 + ], + "gamma_dfa": 0.000422419048845768, + "gamma_dfa_per_layer": [ + 0.25772032141685486, + -0.06083279475569725, + -0.09708747267723083, + -0.0981103777885437 + ], + "acc_eval": 0.1689453125, + "loss_eval": 4254.474609375, + "epoch": 36 + }, + { + "hidden_norms": [ + 5501.59130859375, + 2140827.0, + 2181494.0, + 2452387.75, + 2540377.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001305495505221188, + 0.0007833651034161448, + 0.0007831369293853641, + 0.0007831998518668115, + 0.0007831742987036705 + ], + "gamma_dfa": 0.019166686572134495, + "gamma_dfa_per_layer": [ + 0.3015354871749878, + -0.04834163561463356, + -0.08644455671310425, + -0.090082548558712 + ], + "acc_eval": 0.2060546875, + "loss_eval": 7909.48291015625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5605.65625, + 2338654.5, + 2381249.75, + 2662644.5, + 2754823.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001968128141015768, + 0.0008015396306291223, + 0.0008015292696654797, + 0.0008016829378902912, + 0.0008016840438358486 + ], + "gamma_dfa": 0.01810804195702076, + "gamma_dfa_per_layer": [ + 0.352972149848938, + -0.05855761468410492, + -0.11013064533472061, + -0.11185172200202942 + ], + "acc_eval": 0.091796875, + "loss_eval": 9552.5458984375, + "epoch": 38 + }, + { + "hidden_norms": [ + 5776.4921875, + 2524649.5, + 2569209.25, + 2862403.25, + 2959360.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001521907513961196, + 0.0007685177261009812, + 0.0007685192977078259, + 0.0007685712771490216, + 0.0007685913005843759 + ], + "gamma_dfa": 0.006301743909716606, + "gamma_dfa_per_layer": [ + 0.3194616436958313, + -0.07331519573926926, + -0.09753184020519257, + -0.12340763211250305 + ], + "acc_eval": 0.123046875, + "loss_eval": 9288.3515625, + "epoch": 39 + }, + { + "hidden_norms": [ + 5893.2958984375, + 2719236.25, + 2766489.0, + 3076192.25, + 3179584.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.001874743727967143, + 0.0007690778584219515, + 0.0007690794300287962, + 0.000769136706367135, + 0.000769163656514138 + ], + "gamma_dfa": -0.008455535396933556, + "gamma_dfa_per_layer": [ + 0.27458086609840393, + -0.07574597001075745, + -0.10251512378454208, + -0.13014191389083862 + ], + "acc_eval": 0.1015625, + "loss_eval": 9500.7265625, + "epoch": 40 + }, + { + "hidden_norms": [ + 6037.26904296875, + 2917167.0, + 2966218.0, + 3287947.75, + 3395999.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015074120601639152, + 0.0007870618137530982, + 0.0007870634435676038, + 0.00078706128988415, + 0.0007870564586482942 + ], + "gamma_dfa": 0.003465494140982628, + "gamma_dfa_per_layer": [ + 0.23106470704078674, + -0.04510585218667984, + -0.1033426821231842, + -0.06875419616699219 + ], + "acc_eval": 0.1484375, + "loss_eval": 13665.34375, + "epoch": 41 + }, + { + "hidden_norms": [ + 6165.3271484375, + 3150321.25, + 3201845.5, + 3537869.5, + 3651609.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0038438383489847183, + 0.0007633256609551609, + 0.0007633093046024442, + 0.0007634069188497961, + 0.0007634120993316174 + ], + "gamma_dfa": 0.05023553688079119, + "gamma_dfa_per_layer": [ + 0.36768630146980286, + -0.05948590859770775, + -0.06263985484838486, + -0.0446183905005455 + ], + "acc_eval": 0.130859375, + "loss_eval": 15518.396484375, + "epoch": 42 + }, + { + "hidden_norms": [ + 6322.185546875, + 3356179.75, + 3409150.0, + 3756998.75, + 3874858.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017886407440528274, + 0.0007953053573146462, + 0.000795268511865288, + 0.0007953139720484614, + 0.0007953820750117302 + ], + "gamma_dfa": -0.004728740081191063, + "gamma_dfa_per_layer": [ + 0.26050812005996704, + -0.07150034606456757, + -0.10889407992362976, + -0.09902865439653397 + ], + "acc_eval": 0.1474609375, + "loss_eval": 13731.47265625, + "epoch": 43 + }, + { + "hidden_norms": [ + 6455.05615234375, + 3581075.75, + 3636212.25, + 3997916.75, + 4121800.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014103130670264363, + 0.0008020435925573111, + 0.0008020424866117537, + 0.0008023462723940611, + 0.0008024003473110497 + ], + "gamma_dfa": 0.03236876800656319, + "gamma_dfa_per_layer": [ + 0.3784361481666565, + -0.05973149091005325, + -0.09747618436813354, + -0.09175340086221695 + ], + "acc_eval": 0.1396484375, + "loss_eval": 8173.1318359375, + "epoch": 44 + }, + { + "hidden_norms": [ + 6596.92529296875, + 3790696.25, + 3847633.75, + 4219067.0, + 4346740.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001376444473862648, + 0.0007939717615954578, + 0.0007933968445286155, + 0.0007933415472507477, + 0.0007934658788144588 + ], + "gamma_dfa": 0.026161080226302147, + "gamma_dfa_per_layer": [ + 0.35278040170669556, + -0.07518108189105988, + -0.09520787000656128, + -0.07774712890386581 + ], + "acc_eval": 0.158203125, + "loss_eval": 10093.57421875, + "epoch": 45 + }, + { + "hidden_norms": [ + 6752.326171875, + 4013893.75, + 4072463.0, + 4456049.5, + 4588960.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016587942373007536, + 0.000801959540694952, + 0.0008019180968403816, + 0.0008022981346584857, + 0.0008023587288334966 + ], + "gamma_dfa": 0.0014634709805250168, + "gamma_dfa_per_layer": [ + 0.26356324553489685, + -0.05649265646934509, + -0.09903856366872787, + -0.10217814147472382 + ], + "acc_eval": 0.16796875, + "loss_eval": 11805.994140625, + "epoch": 46 + }, + { + "hidden_norms": [ + 6883.87158203125, + 4249640.0, + 4310267.0, + 4705052.0, + 4842379.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017551308264955878, + 0.0007804373744875193, + 0.0007804358028806746, + 0.0007804319611750543, + 0.0007804720080457628 + ], + "gamma_dfa": -0.00971926562488079, + "gamma_dfa_per_layer": [ + 0.23957225680351257, + -0.06951768696308136, + -0.09375166893005371, + -0.11517996340990067 + ], + "acc_eval": 0.16015625, + "loss_eval": 19465.8828125, + "epoch": 47 + }, + { + "hidden_norms": [ + 7004.37841796875, + 4461495.0, + 4523850.0, + 4930553.5, + 5072236.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015129564562812448, + 0.0007847726810723543, + 0.0007845073123462498, + 0.000784386123996228, + 0.0007843819330446422 + ], + "gamma_dfa": 0.0085066519677639, + "gamma_dfa_per_layer": [ + 0.2637098431587219, + -0.05605460703372955, + -0.08905251324176788, + -0.08457611501216888 + ], + "acc_eval": 0.2021484375, + "loss_eval": 7892.26611328125, + "epoch": 48 + }, + { + "hidden_norms": [ + 7112.80078125, + 4708139.0, + 4772392.0, + 5193498.0, + 5341091.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015166979283094406, + 0.0007669071783311665, + 0.0007669082842767239, + 0.0007670924533158541, + 0.0007671677158214152 + ], + "gamma_dfa": 0.015125783160328865, + "gamma_dfa_per_layer": [ + 0.2562488615512848, + -0.046804703772068024, + -0.08796676248311996, + -0.06097426265478134 + ], + "acc_eval": 0.2333984375, + "loss_eval": 8893.0791015625, + "epoch": 49 + }, + { + "hidden_norms": [ + 7200.81201171875, + 4906775.0, + 4972128.5, + 5401281.5, + 5552169.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015469590434804559, + 0.0007871663547120988, + 0.0007869182154536247, + 0.0007867610547691584, + 0.0007867159438319504 + ], + "gamma_dfa": 0.016506953164935112, + "gamma_dfa_per_layer": [ + 0.29171258211135864, + -0.05020506680011749, + -0.09062528610229492, + -0.08485441654920578 + ], + "acc_eval": 0.2197265625, + "loss_eval": 10566.345703125, + "epoch": 50 + }, + { + "hidden_norms": [ + 7296.0625, + 5134799.0, + 5202023.5, + 5643737.5, + 5799758.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018195129232481122, + 0.0007844618521630764, + 0.0007844566716812551, + 0.000784536823630333, + 0.000784553587436676 + ], + "gamma_dfa": 0.019483929499983788, + "gamma_dfa_per_layer": [ + 0.29106640815734863, + -0.05478575825691223, + -0.07833737879991531, + -0.08000755310058594 + ], + "acc_eval": 0.1650390625, + "loss_eval": 9639.78125, + "epoch": 51 + }, + { + "hidden_norms": [ + 7403.17138671875, + 5361356.5, + 5429682.0, + 5879784.5, + 6039432.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.002603700151666999, + 0.000755469489376992, + 0.0007554262992925942, + 0.0007555284537374973, + 0.0007555308402515948 + ], + "gamma_dfa": 0.05388479772955179, + "gamma_dfa_per_layer": [ + 0.3746236264705658, + -0.060121551156044006, + -0.06174459308385849, + -0.03721829131245613 + ], + "acc_eval": 0.1494140625, + "loss_eval": 12397.41015625, + "epoch": 52 + }, + { + "hidden_norms": [ + 7488.30126953125, + 5582023.0, + 5651748.5, + 6110668.5, + 6273320.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00202713580802083, + 0.0007801816100254655, + 0.000780182599555701, + 0.0007801790488883853, + 0.0007801697356626391 + ], + "gamma_dfa": 0.01045304723083973, + "gamma_dfa_per_layer": [ + 0.25068047642707825, + -0.06100655347108841, + -0.0828605443239212, + -0.06500118970870972 + ], + "acc_eval": 0.2138671875, + "loss_eval": 18765.955078125, + "epoch": 53 + }, + { + "hidden_norms": [ + 7561.47265625, + 5795100.5, + 5866105.0, + 6334896.0, + 6501444.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017575331730768085, + 0.0007978819194249809, + 0.0007978450739756227, + 0.000798230292275548, + 0.0007982761017046869 + ], + "gamma_dfa": 0.011411387473344803, + "gamma_dfa_per_layer": [ + 0.29157841205596924, + -0.05369853973388672, + -0.09859319031238556, + -0.09364113211631775 + ], + "acc_eval": 0.1875, + "loss_eval": 10589.0087890625, + "epoch": 54 + }, + { + "hidden_norms": [ + 7636.35595703125, + 6016687.0, + 6089686.0, + 6570658.5, + 6741688.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001416882500052452, + 0.0007854877039790154, + 0.0007851187838241458, + 0.0007847094675526023, + 0.0007846617372706532 + ], + "gamma_dfa": 0.004635758697986603, + "gamma_dfa_per_layer": [ + 0.2832094430923462, + -0.06018421798944473, + -0.10714054107666016, + -0.09734164923429489 + ], + "acc_eval": 0.1884765625, + "loss_eval": 11045.0107421875, + "epoch": 55 + }, + { + "hidden_norms": [ + 7700.8466796875, + 6215443.5, + 6289647.5, + 6780492.0, + 6955139.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017022350803017616, + 0.0007623002748005092, + 0.000762303126975894, + 0.000762506271712482, + 0.0007625941070728004 + ], + "gamma_dfa": 0.026831449940800667, + "gamma_dfa_per_layer": [ + 0.339847594499588, + -0.0706903263926506, + -0.0816052109003067, + -0.08022625744342804 + ], + "acc_eval": 0.154296875, + "loss_eval": 9215.373046875, + "epoch": 56 + }, + { + "hidden_norms": [ + 7773.85986328125, + 6413204.5, + 6488502.5, + 6988337.0, + 7166683.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013730988139286637, + 0.0007787180948071182, + 0.0007787116337567568, + 0.0007787745562382042, + 0.0007787866634316742 + ], + "gamma_dfa": 0.013194277882575989, + "gamma_dfa_per_layer": [ + 0.30715805292129517, + -0.0632064938545227, + -0.09261326491832733, + -0.09856118261814117 + ], + "acc_eval": 0.2236328125, + "loss_eval": 6176.3076171875, + "epoch": 57 + }, + { + "hidden_norms": [ + 7820.23388671875, + 6598801.0, + 6675650.0, + 7184845.0, + 7367520.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015506811905652285, + 0.000799653644207865, + 0.0007990750018507242, + 0.0007989082369022071, + 0.0007991326274350286 + ], + "gamma_dfa": 0.00773581862449646, + "gamma_dfa_per_layer": [ + 0.28355157375335693, + -0.054453425109386444, + -0.11499008536338806, + -0.08316478878259659 + ], + "acc_eval": 0.205078125, + "loss_eval": 7889.31005859375, + "epoch": 58 + }, + { + "hidden_norms": [ + 7864.2060546875, + 6797904.5, + 6876033.0, + 7392718.0, + 7578431.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020978215616196394, + 0.0007834822754375637, + 0.0007832171395421028, + 0.0007829645182937384, + 0.0007829380920156837 + ], + "gamma_dfa": 0.033629802986979485, + "gamma_dfa_per_layer": [ + 0.34407293796539307, + -0.05567466467618942, + -0.08536086976528168, + -0.06851819157600403 + ], + "acc_eval": 0.15625, + "loss_eval": 14391.9736328125, + "epoch": 59 + }, + { + "hidden_norms": [ + 7871.78173828125, + 7003051.0, + 7083124.0, + 7611188.0, + 7801170.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012560655595734715, + 0.0007599582313559949, + 0.0007599598611705005, + 0.0007601079414598644, + 0.0007601887919008732 + ], + "gamma_dfa": 0.004498079419136047, + "gamma_dfa_per_layer": [ + 0.32327917218208313, + -0.07260935008525848, + -0.10525670647621155, + -0.1274207979440689 + ], + "acc_eval": 0.1572265625, + "loss_eval": 7188.275390625, + "epoch": 60 + }, + { + "hidden_norms": [ + 7934.14794921875, + 7210797.0, + 7292245.5, + 7829288.0, + 8023057.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001343236886896193, + 0.0007599524687975645, + 0.0007598291267640889, + 0.0007597675430588424, + 0.0007598883821628988 + ], + "gamma_dfa": 0.02613817434757948, + "gamma_dfa_per_layer": [ + 0.3003483712673187, + -0.0427340604364872, + -0.09165668487548828, + -0.06140492856502533 + ], + "acc_eval": 0.259765625, + "loss_eval": 7055.94677734375, + "epoch": 61 + }, + { + "hidden_norms": [ + 7964.50244140625, + 7416797.0, + 7500505.0, + 8048676.5, + 8247824.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015083092730492353, + 0.0007851184927858412, + 0.0007850866531953216, + 0.0007850754773244262, + 0.0007851301343180239 + ], + "gamma_dfa": 0.027105171233415604, + "gamma_dfa_per_layer": [ + 0.37000784277915955, + -0.05895276367664337, + -0.10036876797676086, + -0.1022656261920929 + ], + "acc_eval": 0.166015625, + "loss_eval": 7052.08203125, + "epoch": 62 + }, + { + "hidden_norms": [ + 8006.1318359375, + 7588913.0, + 7673353.5, + 8229041.0, + 8431689.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014928504824638367, + 0.0007839660393074155, + 0.000783930707257241, + 0.0007839277386665344, + 0.0007839910103939474 + ], + "gamma_dfa": 0.018935419619083405, + "gamma_dfa_per_layer": [ + 0.3158775568008423, + -0.051478639245033264, + -0.09881415218114853, + -0.08984308689832687 + ], + "acc_eval": 0.2119140625, + "loss_eval": 6266.041015625, + "epoch": 63 + }, + { + "hidden_norms": [ + 8030.2109375, + 7754257.5, + 7839832.5, + 8400781.0, + 8605522.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012633835431188345, + 0.0007809567032381892, + 0.0007807457586750388, + 0.0007805972127243876, + 0.0007805809145793319 + ], + "gamma_dfa": 0.009956683963537216, + "gamma_dfa_per_layer": [ + 0.30735114216804504, + -0.06991781294345856, + -0.09387198090553284, + -0.10373461246490479 + ], + "acc_eval": 0.1806640625, + "loss_eval": 8467.8125, + "epoch": 64 + }, + { + "hidden_norms": [ + 8048.080078125, + 7913574.5, + 8000306.0, + 8567918.0, + 8775169.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001400441862642765, + 0.0007796542486175895, + 0.0007795418496243656, + 0.0007795065175741911, + 0.0007797059370204806 + ], + "gamma_dfa": 0.008816102519631386, + "gamma_dfa_per_layer": [ + 0.28880423307418823, + -0.05614739656448364, + -0.11088694632053375, + -0.0865054801106453 + ], + "acc_eval": 0.203125, + "loss_eval": 9558.021484375, + "epoch": 65 + }, + { + "hidden_norms": [ + 8067.34375, + 8070731.5, + 8158800.0, + 8733572.0, + 8943043.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014346289681270719, + 0.000756031135097146, + 0.0007560329977422953, + 0.0007561623933725059, + 0.0007562324753962457 + ], + "gamma_dfa": 0.009170351549983025, + "gamma_dfa_per_layer": [ + 0.3515056073665619, + -0.0781104564666748, + -0.10490105301141739, + -0.1318126916885376 + ], + "acc_eval": 0.1103515625, + "loss_eval": 11967.486328125, + "epoch": 66 + }, + { + "hidden_norms": [ + 8073.40283203125, + 8227977.0, + 8317204.5, + 8898513.0, + 9110756.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015745362034067512, + 0.0007811843534000218, + 0.000781158625613898, + 0.0007811560644768178, + 0.0007812076364643872 + ], + "gamma_dfa": 0.011113166809082031, + "gamma_dfa_per_layer": [ + 0.30191734433174133, + -0.05505914241075516, + -0.10382715612649918, + -0.09857837855815887 + ], + "acc_eval": 0.177734375, + "loss_eval": 7797.017578125, + "epoch": 67 + }, + { + "hidden_norms": [ + 8071.63623046875, + 8375112.0, + 8465576.0, + 9052592.0, + 9267093.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002133303554728627, + 0.0007824470521882176, + 0.0007822668994776905, + 0.0007822004845365882, + 0.0007824745844118297 + ], + "gamma_dfa": 0.03663862869143486, + "gamma_dfa_per_layer": [ + 0.34291785955429077, + -0.036236945539712906, + -0.10749906301498413, + -0.052627336233854294 + ], + "acc_eval": 0.1396484375, + "loss_eval": 11433.0302734375, + "epoch": 68 + }, + { + "hidden_norms": [ + 8084.59130859375, + 8523176.0, + 8614498.0, + 9207429.0, + 9424164.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001537870615720749, + 0.0007688916521146894, + 0.0007688923506066203, + 0.0007689034100621939, + 0.0007689160411246121 + ], + "gamma_dfa": 0.020611698739230633, + "gamma_dfa_per_layer": [ + 0.3258458971977234, + -0.053132835775613785, + -0.10754033923149109, + -0.08272592723369598 + ], + "acc_eval": 0.1787109375, + "loss_eval": 6151.634765625, + "epoch": 69 + }, + { + "hidden_norms": [ + 8098.82373046875, + 8648680.0, + 8741121.0, + 9338018.0, + 9556207.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014389777788892388, + 0.0007975181215442717, + 0.0007967942510731518, + 0.0007966712000779808, + 0.0007968792924657464 + ], + "gamma_dfa": 0.009284427389502525, + "gamma_dfa_per_layer": [ + 0.29391974210739136, + -0.058484748005867004, + -0.11177978664636612, + -0.08651749789714813 + ], + "acc_eval": 0.18359375, + "loss_eval": 5277.328125, + "epoch": 70 + }, + { + "hidden_norms": [ + 8113.7255859375, + 8773553.0, + 8866719.0, + 9469018.0, + 9689706.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00145814404822886, + 0.0007955037872307003, + 0.0007954062311910093, + 0.0007954093161970377, + 0.0007956796325743198 + ], + "gamma_dfa": 0.01389121450483799, + "gamma_dfa_per_layer": [ + 0.28217679262161255, + -0.058154717087745667, + -0.08273636549711227, + -0.08572085201740265 + ], + "acc_eval": 0.1923828125, + "loss_eval": 10207.12109375, + "epoch": 71 + }, + { + "hidden_norms": [ + 8063.9951171875, + 8889169.0, + 8984089.0, + 9593494.0, + 9817277.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011409161379560828, + 0.0007544065010733902, + 0.0007542934035882354, + 0.000754217617213726, + 0.0007543462561443448 + ], + "gamma_dfa": 0.018794666975736618, + "gamma_dfa_per_layer": [ + 0.2941493093967438, + -0.0533231720328331, + -0.09251905977725983, + -0.07312840968370438 + ], + "acc_eval": 0.2626953125, + "loss_eval": 4281.3994140625, + "epoch": 72 + }, + { + "hidden_norms": [ + 8021.80126953125, + 9019768.0, + 9115790.0, + 9730846.0, + 9956825.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012580875772982836, + 0.0007680498529225588, + 0.0007680428680032492, + 0.0007680479320697486, + 0.0007680551498197019 + ], + "gamma_dfa": 0.027317012660205364, + "gamma_dfa_per_layer": [ + 0.3265392780303955, + -0.04611017927527428, + -0.09342358261346817, + -0.0777374655008316 + ], + "acc_eval": 0.2275390625, + "loss_eval": 4907.6142578125, + "epoch": 73 + }, + { + "hidden_norms": [ + 7995.38916015625, + 9118244.0, + 9214531.0, + 9832139.0, + 10058956.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012337823864072561, + 0.0007691435748711228, + 0.000768946367315948, + 0.000768885191064328, + 0.0007689236663281918 + ], + "gamma_dfa": 0.012230871245265007, + "gamma_dfa_per_layer": [ + 0.2935040593147278, + -0.06186644732952118, + -0.09978199750185013, + -0.08293212950229645 + ], + "acc_eval": 0.2001953125, + "loss_eval": 7199.5888671875, + "epoch": 74 + }, + { + "hidden_norms": [ + 7966.3759765625, + 9213122.0, + 9310022.0, + 9931662.0, + 10160365.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011302486527711153, + 0.0007655700901523232, + 0.0007655754452571273, + 0.0007655742228962481, + 0.0007655934314243495 + ], + "gamma_dfa": 0.01679898425936699, + "gamma_dfa_per_layer": [ + 0.3025580048561096, + -0.05692540109157562, + -0.10290184617042542, + -0.07553482055664062 + ], + "acc_eval": 0.2490234375, + "loss_eval": 2667.806640625, + "epoch": 75 + }, + { + "hidden_norms": [ + 7937.92041015625, + 9292608.0, + 9390243.0, + 10015125.0, + 10244868.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011147550540044904, + 0.0007753095123916864, + 0.0007750216755084693, + 0.000774735352024436, + 0.0007747214986011386 + ], + "gamma_dfa": 0.027967805042862892, + "gamma_dfa_per_layer": [ + 0.3572651743888855, + -0.05705829709768295, + -0.09071685373783112, + -0.09761880338191986 + ], + "acc_eval": 0.1923828125, + "loss_eval": 3299.91259765625, + "epoch": 76 + }, + { + "hidden_norms": [ + 7904.56689453125, + 9393010.0, + 9491687.0, + 10122118.0, + 10354408.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00107352074701339, + 0.0007645431905984879, + 0.0007645484292879701, + 0.0007645472651347518, + 0.0007645685109309852 + ], + "gamma_dfa": 0.02625838667154312, + "gamma_dfa_per_layer": [ + 0.3598015606403351, + -0.06442467868328094, + -0.09077714383602142, + -0.09956619143486023 + ], + "acc_eval": 0.2119140625, + "loss_eval": 2758.64599609375, + "epoch": 77 + }, + { + "hidden_norms": [ + 7855.07861328125, + 9500690.0, + 9600497.0, + 10235757.0, + 10469660.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001235201139934361, + 0.0007838172605261207, + 0.000783789437264204, + 0.0007840599282644689, + 0.00078408676199615 + ], + "gamma_dfa": 0.02602401003241539, + "gamma_dfa_per_layer": [ + 0.35960710048675537, + -0.06299363076686859, + -0.10128454864025116, + -0.09123288094997406 + ], + "acc_eval": 0.1689453125, + "loss_eval": 4279.3154296875, + "epoch": 78 + }, + { + "hidden_norms": [ + 7826.134765625, + 9581674.0, + 9682195.0, + 10320423.0, + 10555402.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010469084372743964, + 0.0007737708510830998, + 0.0007735842373222113, + 0.0007734137470833957, + 0.0007734144455753267 + ], + "gamma_dfa": 0.024147922173142433, + "gamma_dfa_per_layer": [ + 0.37674999237060547, + -0.07557321339845657, + -0.09047992527484894, + -0.11410516500473022 + ], + "acc_eval": 0.1669921875, + "loss_eval": 3201.240966796875, + "epoch": 79 + }, + { + "hidden_norms": [ + 7779.2138671875, + 9660604.0, + 9761859.0, + 10404086.0, + 10640750.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010143390391021967, + 0.0007633482455275953, + 0.0007633481291122735, + 0.0007633698405697942, + 0.0007633839850313962 + ], + "gamma_dfa": 0.019840596243739128, + "gamma_dfa_per_layer": [ + 0.30444687604904175, + -0.049144186079502106, + -0.09650193899869919, + -0.07943836599588394 + ], + "acc_eval": 0.2763671875, + "loss_eval": 1991.417236328125, + "epoch": 80 + }, + { + "hidden_norms": [ + 7760.08642578125, + 9716882.0, + 9818513.0, + 10462903.0, + 10700433.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00105896289460361, + 0.0007729134522378445, + 0.0007727605989202857, + 0.0007726037292741239, + 0.000772611063439399 + ], + "gamma_dfa": 0.026730000041425228, + "gamma_dfa_per_layer": [ + 0.34768593311309814, + -0.056363869458436966, + -0.09562714397907257, + -0.0887749195098877 + ], + "acc_eval": 0.2177734375, + "loss_eval": 2112.26025390625, + "epoch": 81 + }, + { + "hidden_norms": [ + 7743.93798828125, + 9786243.0, + 9888395.0, + 10535762.0, + 10774483.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010133162140846252, + 0.0007726953481324017, + 0.0007724745664745569, + 0.0007722667651250958, + 0.0007722647860646248 + ], + "gamma_dfa": 0.019241390749812126, + "gamma_dfa_per_layer": [ + 0.3473237156867981, + -0.06556949764490128, + -0.10282130539417267, + -0.10196734964847565 + ], + "acc_eval": 0.193359375, + "loss_eval": 2962.46826171875, + "epoch": 82 + }, + { + "hidden_norms": [ + 7708.34033203125, + 9842047.0, + 9944650.0, + 10594529.0, + 10834219.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000999346375465393, + 0.0007619770476594567, + 0.0007619837997481227, + 0.0007619837415404618, + 0.0007620092947036028 + ], + "gamma_dfa": 0.019368495792150497, + "gamma_dfa_per_layer": [ + 0.3106932044029236, + -0.057876452803611755, + -0.09636038541793823, + -0.0789823830127716 + ], + "acc_eval": 0.2607421875, + "loss_eval": 1792.6400146484375, + "epoch": 83 + }, + { + "hidden_norms": [ + 7673.24560546875, + 9901470.0, + 10004649.0, + 10656950.0, + 10898699.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009565355721861124, + 0.0007485878886654973, + 0.0007484929519705474, + 0.000748424616176635, + 0.0007485424866899848 + ], + "gamma_dfa": 0.01748405210673809, + "gamma_dfa_per_layer": [ + 0.2931858003139496, + -0.05277211219072342, + -0.09270339459180832, + -0.07777408510446548 + ], + "acc_eval": 0.29296875, + "loss_eval": 974.1173095703125, + "epoch": 84 + }, + { + "hidden_norms": [ + 7628.22412109375, + 9951868.0, + 10055369.0, + 10709207.0, + 10951317.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000980330049060285, + 0.0007466387469321489, + 0.0007466417155228555, + 0.0007467885152436793, + 0.0007468488765880466 + ], + "gamma_dfa": 0.019473757594823837, + "gamma_dfa_per_layer": [ + 0.29309791326522827, + -0.05341349542140961, + -0.08986704051494598, + -0.07192234694957733 + ], + "acc_eval": 0.27734375, + "loss_eval": 1743.6519775390625, + "epoch": 85 + }, + { + "hidden_norms": [ + 7586.08837890625, + 9992418.0, + 10096238.0, + 10751557.0, + 10993641.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009816273814067245, + 0.0007609970052726567, + 0.000761001487262547, + 0.0007610011962242424, + 0.0007610262255184352 + ], + "gamma_dfa": 0.017493372783064842, + "gamma_dfa_per_layer": [ + 0.307644248008728, + -0.054675400257110596, + -0.09402725845575333, + -0.08896809816360474 + ], + "acc_eval": 0.2783203125, + "loss_eval": 986.1089477539062, + "epoch": 86 + }, + { + "hidden_norms": [ + 7546.07666015625, + 10019561.0, + 10123471.0, + 10779392.0, + 11021634.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010106659028679132, + 0.0007606986328028142, + 0.0007606985163874924, + 0.0007607255247421563, + 0.0007607414736412466 + ], + "gamma_dfa": 0.0189383989199996, + "gamma_dfa_per_layer": [ + 0.3057447671890259, + -0.05296015366911888, + -0.09528908133506775, + -0.08174193650484085 + ], + "acc_eval": 0.2412109375, + "loss_eval": 1453.539306640625, + "epoch": 87 + }, + { + "hidden_norms": [ + 7507.373046875, + 10034866.0, + 10138899.0, + 10794880.0, + 11037002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009441400761716068, + 0.0007457168539986014, + 0.0007457205792888999, + 0.0007458969485014677, + 0.0007459585904143751 + ], + "gamma_dfa": 0.016358308494091034, + "gamma_dfa_per_layer": [ + 0.29192131757736206, + -0.054730333387851715, + -0.08949868381023407, + -0.08225906640291214 + ], + "acc_eval": 0.2939453125, + "loss_eval": 889.3756103515625, + "epoch": 88 + }, + { + "hidden_norms": [ + 7475.10595703125, + 10059038.0, + 10163330.0, + 10820810.0, + 11063516.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009275015909224749, + 0.0007406340446323156, + 0.0007405761862173676, + 0.0007405940559692681, + 0.0007405842188745737 + ], + "gamma_dfa": 0.019343840889632702, + "gamma_dfa_per_layer": [ + 0.2714617848396301, + -0.049602191895246506, + -0.07989576458930969, + -0.06458846479654312 + ], + "acc_eval": 0.322265625, + "loss_eval": 778.108642578125, + "epoch": 89 + }, + { + "hidden_norms": [ + 7444.8466796875, + 10064810.0, + 10169219.0, + 10827134.0, + 11070129.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009403944713994861, + 0.000745263765566051, + 0.0007452677236869931, + 0.0007454471196979284, + 0.0007455073646269739 + ], + "gamma_dfa": 0.01310044713318348, + "gamma_dfa_per_layer": [ + 0.28572195768356323, + -0.054389551281929016, + -0.09277918189764023, + -0.08615143597126007 + ], + "acc_eval": 0.26953125, + "loss_eval": 932.53662109375, + "epoch": 90 + }, + { + "hidden_norms": [ + 7414.4970703125, + 10075394.0, + 10179775.0, + 10837778.0, + 11080979.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009539846796542406, + 0.0007622878183610737, + 0.0007622832781635225, + 0.0007622758857905865, + 0.0007622810662724078 + ], + "gamma_dfa": 0.02442830428481102, + "gamma_dfa_per_layer": [ + 0.34633398056030273, + -0.059510812163352966, + -0.09629844129085541, + -0.09281150996685028 + ], + "acc_eval": 0.228515625, + "loss_eval": 1020.4122924804688, + "epoch": 91 + }, + { + "hidden_norms": [ + 7385.740234375, + 10098198.0, + 10202575.0, + 10860396.0, + 11103300.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009258585050702095, + 0.0007462432840839028, + 0.0007461663917638361, + 0.000746095203794539, + 0.0007462148205377162 + ], + "gamma_dfa": 0.021881024353206158, + "gamma_dfa_per_layer": [ + 0.3117921054363251, + -0.0562119297683239, + -0.0811537504196167, + -0.08690232783555984 + ], + "acc_eval": 0.2783203125, + "loss_eval": 812.965576171875, + "epoch": 92 + }, + { + "hidden_norms": [ + 7372.93115234375, + 10112263.0, + 10216603.0, + 10874068.0, + 11116538.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009158457978628576, + 0.000744756544008851, + 0.0007447608513757586, + 0.0007449553813785315, + 0.0007450156263075769 + ], + "gamma_dfa": 0.018241400830447674, + "gamma_dfa_per_layer": [ + 0.27702248096466064, + -0.048618000000715256, + -0.0829005166888237, + -0.072538360953331 + ], + "acc_eval": 0.330078125, + "loss_eval": 675.6625366210938, + "epoch": 93 + }, + { + "hidden_norms": [ + 7363.2099609375, + 10119183.0, + 10223550.0, + 10881119.0, + 11123569.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009229940478689969, + 0.0007447171374224126, + 0.000744720280636102, + 0.0007448522374033928, + 0.000744906603358686 + ], + "gamma_dfa": 0.016729017719626427, + "gamma_dfa_per_layer": [ + 0.27939361333847046, + -0.048901431262493134, + -0.08870212733745575, + -0.07487398386001587 + ], + "acc_eval": 0.3251953125, + "loss_eval": 708.3804931640625, + "epoch": 94 + }, + { + "hidden_norms": [ + 7355.3544921875, + 10123197.0, + 10227558.0, + 10885026.0, + 11127411.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009278868092224002, + 0.0007445889641530812, + 0.0007445933879353106, + 0.0007447681855410337, + 0.0007448261021636426 + ], + "gamma_dfa": 0.014646172523498535, + "gamma_dfa_per_layer": [ + 0.28425437211990356, + -0.053754955530166626, + -0.08852015435695648, + -0.08339457213878632 + ], + "acc_eval": 0.310546875, + "loss_eval": 688.0819091796875, + "epoch": 95 + }, + { + "hidden_norms": [ + 7349.30078125, + 10126695.0, + 10231071.0, + 10888593.0, + 11130985.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000914200150873512, + 0.0007393965497612953, + 0.000739329494535923, + 0.0007393491105176508, + 0.0007393329287879169 + ], + "gamma_dfa": 0.01913625281304121, + "gamma_dfa_per_layer": [ + 0.26301705837249756, + -0.04846196621656418, + -0.07772514969110489, + -0.06028493121266365 + ], + "acc_eval": 0.3203125, + "loss_eval": 697.3836669921875, + "epoch": 96 + }, + { + "hidden_norms": [ + 7345.333984375, + 10127832.0, + 10232199.0, + 10889673.0, + 11132020.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009217644692398608, + 0.0007456630119122565, + 0.0007455685408785939, + 0.0007454968290403485, + 0.0007456148159690201 + ], + "gamma_dfa": 0.017519758082926273, + "gamma_dfa_per_layer": [ + 0.29056763648986816, + -0.05349243804812431, + -0.08799343556165695, + -0.0790027305483818 + ], + "acc_eval": 0.30859375, + "loss_eval": 661.5548095703125, + "epoch": 97 + }, + { + "hidden_norms": [ + 7343.10888671875, + 10128861.0, + 10233227.0, + 10890713.0, + 11133060.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009042566525749862, + 0.0007393184932880104, + 0.0007392505649477243, + 0.0007392706465907395, + 0.0007392524858005345 + ], + "gamma_dfa": 0.018206479027867317, + "gamma_dfa_per_layer": [ + 0.2680240869522095, + -0.047486238181591034, + -0.08014586567878723, + -0.06756606698036194 + ], + "acc_eval": 0.3388671875, + "loss_eval": 636.5595703125, + "epoch": 98 + }, + { + "hidden_norms": [ + 7342.0625, + 10129300.0, + 10233666.0, + 10891137.0, + 11133475.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009002314181998372, + 0.0007393373525701463, + 0.0007392485276795924, + 0.0007392755360342562, + 0.0007392438710667193 + ], + "gamma_dfa": 0.01726893801242113, + "gamma_dfa_per_layer": [ + 0.2736765742301941, + -0.05038469657301903, + -0.0817006528377533, + -0.07251547276973724 + ], + "acc_eval": 0.3330078125, + "loss_eval": 611.882080078125, + "epoch": 99 + }, + { + "hidden_norms": [ + 7341.77294921875, + 10129401.0, + 10233766.0, + 10891235.0, + 11133570.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009032402304001153, + 0.0007393273408524692, + 0.0007392435800284147, + 0.0007392680854536593, + 0.0007392411935143173 + ], + "gamma_dfa": 0.01641188934445381, + "gamma_dfa_per_layer": [ + 0.2728629410266876, + -0.05080822855234146, + -0.08297968655824661, + -0.0734274685382843 + ], + "acc_eval": 0.33203125, + "loss_eval": 625.6834106445312, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_no_outln_v1/snapshot_noLN_s456.json b/results/snapshot_no_outln_v1/snapshot_noLN_s456.json new file mode 100644 index 0000000..f490ffc --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_noLN_s456.json @@ -0,0 +1,4766 @@ +{ + "config": { + "output_dir": "results/snapshot_no_outln_v1", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 456, + "depth": 4, + "d_hidden": 256 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "architecture": "ResidualMLP_NoOutLN", + "bp_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005607507191598415, + 0.0005558764678426087, + 0.0005541853606700897, + 0.0005498801474459469, + 0.0005458085797727108 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.091796875, + "loss_eval": 2.3707523345947266, + "epoch": 0 + }, + { + "hidden_norms": [ + 40.06809616088867, + 37.16851043701172, + 35.97419738769531, + 34.98802185058594, + 34.09989547729492 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013246900925878435, + 0.00013836311700288206, + 0.00014998784172348678, + 0.00017555677914060652, + 0.0002279145992361009 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4365234375, + "loss_eval": 1.5941123962402344, + "epoch": 1 + }, + { + "hidden_norms": [ + 51.32597732543945, + 46.865997314453125, + 44.336944580078125, + 42.399295806884766, + 41.083709716796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010603138071019202, + 0.00011028712469851598, + 0.00011670063395285979, + 0.00013331198715604842, + 0.00016258291725534946 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4736328125, + "loss_eval": 1.4793150424957275, + "epoch": 2 + }, + { + "hidden_norms": [ + 62.084197998046875, + 56.17497253417969, + 52.24001693725586, + 48.81613540649414, + 45.96797561645508 + ], + "bp_grad_per_sample_l2_med": [ + 9.958917507901788e-05, + 0.00010542560630710796, + 0.00011132164945593104, + 0.00012339121894910932, + 0.00014191119407769293 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.48046875, + "loss_eval": 1.4157963991165161, + "epoch": 3 + }, + { + "hidden_norms": [ + 70.11115264892578, + 62.7204704284668, + 57.0128059387207, + 52.67961883544922, + 49.0619010925293 + ], + "bp_grad_per_sample_l2_med": [ + 9.119982860283926e-05, + 9.68000604189001e-05, + 0.0001028164042509161, + 0.0001113277321564965, + 0.00012708066788036376 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.529296875, + "loss_eval": 1.3824131488800049, + "epoch": 4 + }, + { + "hidden_norms": [ + 77.96520233154297, + 68.33187866210938, + 62.02028274536133, + 56.785953521728516, + 52.50190734863281 + ], + "bp_grad_per_sample_l2_med": [ + 9.251978190150112e-05, + 9.91317501757294e-05, + 0.00010523655510041863, + 0.00011500742402859032, + 0.00012610112025868148 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.49609375, + "loss_eval": 1.4219003915786743, + "epoch": 5 + }, + { + "hidden_norms": [ + 84.35594940185547, + 73.65497589111328, + 65.76171875, + 59.78555679321289, + 54.72732925415039 + ], + "bp_grad_per_sample_l2_med": [ + 8.53061064844951e-05, + 9.119947208091617e-05, + 9.546471119392663e-05, + 0.00010272912186337635, + 0.00011094262299593538 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5107421875, + "loss_eval": 1.3764042854309082, + "epoch": 6 + }, + { + "hidden_norms": [ + 90.34719848632812, + 78.86559295654297, + 69.58448028564453, + 62.62751388549805, + 56.49700164794922 + ], + "bp_grad_per_sample_l2_med": [ + 8.279601024696603e-05, + 8.869311568560079e-05, + 9.525373752694577e-05, + 0.00010276824468746781, + 0.00011047293082810938 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.521484375, + "loss_eval": 1.3063517808914185, + "epoch": 7 + }, + { + "hidden_norms": [ + 94.70899200439453, + 82.14017486572266, + 72.3757553100586, + 63.97325134277344, + 57.261043548583984 + ], + "bp_grad_per_sample_l2_med": [ + 8.42147201183252e-05, + 8.977072138804942e-05, + 9.571140253683552e-05, + 0.00010196219227509573, + 0.00010500354983378202 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.521484375, + "loss_eval": 1.3536221981048584, + "epoch": 8 + }, + { + "hidden_norms": [ + 101.69925689697266, + 87.86920928955078, + 77.13504791259766, + 68.15769958496094, + 60.63106918334961 + ], + "bp_grad_per_sample_l2_med": [ + 8.040699322009459e-05, + 8.682452607899904e-05, + 9.194648009724915e-05, + 9.875267278403044e-05, + 0.00010358950385125354 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.517578125, + "loss_eval": 1.3398748636245728, + "epoch": 9 + }, + { + "hidden_norms": [ + 106.84738159179688, + 92.9166259765625, + 81.7030029296875, + 71.8150863647461, + 63.29521179199219 + ], + "bp_grad_per_sample_l2_med": [ + 7.807361544109881e-05, + 8.290779078379273e-05, + 8.751150744501501e-05, + 9.41800099099055e-05, + 9.622493234928697e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5595703125, + "loss_eval": 1.3021488189697266, + "epoch": 10 + }, + { + "hidden_norms": [ + 110.62977600097656, + 96.08146667480469, + 83.02938842773438, + 71.82244873046875, + 62.47097396850586 + ], + "bp_grad_per_sample_l2_med": [ + 7.582613034173846e-05, + 8.177754352800548e-05, + 8.888287266017869e-05, + 9.501135355094448e-05, + 9.754132042871788e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.53125, + "loss_eval": 1.2963578701019287, + "epoch": 11 + }, + { + "hidden_norms": [ + 115.87433624267578, + 99.99412536621094, + 86.81661987304688, + 75.194580078125, + 65.24598693847656 + ], + "bp_grad_per_sample_l2_med": [ + 7.453945727320388e-05, + 7.999759691301733e-05, + 8.587146294303238e-05, + 9.281275561079383e-05, + 9.684430551715195e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.537109375, + "loss_eval": 1.300926685333252, + "epoch": 12 + }, + { + "hidden_norms": [ + 115.8588638305664, + 100.0324478149414, + 87.23123931884766, + 75.2608871459961, + 64.53407287597656 + ], + "bp_grad_per_sample_l2_med": [ + 7.783657201798633e-05, + 8.2304140960332e-05, + 8.792509470367804e-05, + 9.308305016020313e-05, + 9.498461440671235e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5302734375, + "loss_eval": 1.2952370643615723, + "epoch": 13 + }, + { + "hidden_norms": [ + 121.24994659423828, + 103.9144515991211, + 88.99864959716797, + 75.50836944580078, + 64.28103637695312 + ], + "bp_grad_per_sample_l2_med": [ + 7.956428453326225e-05, + 8.667269139550626e-05, + 9.291838068747893e-05, + 9.890568617265671e-05, + 0.00010031831334345043 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.537109375, + "loss_eval": 1.3034818172454834, + "epoch": 14 + }, + { + "hidden_norms": [ + 124.64612579345703, + 107.64379119873047, + 92.03299713134766, + 77.67626190185547, + 66.19109344482422 + ], + "bp_grad_per_sample_l2_med": [ + 7.466476381523535e-05, + 8.086472371360287e-05, + 8.857141801854596e-05, + 9.320858225692064e-05, + 9.685206168796867e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.521484375, + "loss_eval": 1.2701925039291382, + "epoch": 15 + }, + { + "hidden_norms": [ + 128.4908905029297, + 110.93827819824219, + 95.34327697753906, + 80.90787506103516, + 68.56732940673828 + ], + "bp_grad_per_sample_l2_med": [ + 7.461471977876499e-05, + 8.18013577372767e-05, + 8.659388549858704e-05, + 9.226851398125291e-05, + 9.443429007660598e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5537109375, + "loss_eval": 1.2619553804397583, + "epoch": 16 + }, + { + "hidden_norms": [ + 130.65846252441406, + 112.31464385986328, + 95.85350036621094, + 79.80601501464844, + 67.30303192138672 + ], + "bp_grad_per_sample_l2_med": [ + 7.368716615019366e-05, + 8.01649657660164e-05, + 8.653382974443957e-05, + 9.32966941036284e-05, + 9.312365727964789e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5576171875, + "loss_eval": 1.2436624765396118, + "epoch": 17 + }, + { + "hidden_norms": [ + 133.13165283203125, + 114.61791229248047, + 97.15895080566406, + 81.40515899658203, + 69.13287353515625 + ], + "bp_grad_per_sample_l2_med": [ + 7.137899228837341e-05, + 7.771244418108836e-05, + 8.332561264978722e-05, + 8.920324762584642e-05, + 8.9491848484613e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.56640625, + "loss_eval": 1.239585518836975, + "epoch": 18 + }, + { + "hidden_norms": [ + 136.59140014648438, + 117.42953491210938, + 99.51315307617188, + 83.76544189453125, + 69.16895294189453 + ], + "bp_grad_per_sample_l2_med": [ + 7.198385719675571e-05, + 7.928090053610504e-05, + 8.52016091812402e-05, + 9.1185538622085e-05, + 9.257275087293237e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5673828125, + "loss_eval": 1.2780827283859253, + "epoch": 19 + }, + { + "hidden_norms": [ + 139.33346557617188, + 119.61570739746094, + 102.05357360839844, + 85.16582489013672, + 70.09222412109375 + ], + "bp_grad_per_sample_l2_med": [ + 7.267932232934982e-05, + 7.949839346110821e-05, + 8.610116492491215e-05, + 9.125673386733979e-05, + 9.256677003577352e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5419921875, + "loss_eval": 1.2823748588562012, + "epoch": 20 + }, + { + "hidden_norms": [ + 141.82034301757812, + 122.27132415771484, + 103.36873626708984, + 86.49518585205078, + 71.40383911132812 + ], + "bp_grad_per_sample_l2_med": [ + 7.251821807585657e-05, + 7.807672955095768e-05, + 8.464990969514474e-05, + 8.788360719336197e-05, + 8.839634392643347e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.55859375, + "loss_eval": 1.2162373065948486, + "epoch": 21 + }, + { + "hidden_norms": [ + 144.1250762939453, + 123.32146453857422, + 105.33419036865234, + 87.95057678222656, + 71.54405975341797 + ], + "bp_grad_per_sample_l2_med": [ + 7.141266542021185e-05, + 7.827960507711396e-05, + 8.527522732038051e-05, + 9.162349306279793e-05, + 8.910013275453821e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5712890625, + "loss_eval": 1.2267348766326904, + "epoch": 22 + }, + { + "hidden_norms": [ + 145.35816955566406, + 123.92304229736328, + 106.45323944091797, + 89.38124084472656, + 72.80756378173828 + ], + "bp_grad_per_sample_l2_med": [ + 6.914530968060717e-05, + 7.74021100369282e-05, + 8.25833558337763e-05, + 8.843685645842925e-05, + 8.765731763560325e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615234375, + "loss_eval": 1.2464958429336548, + "epoch": 23 + }, + { + "hidden_norms": [ + 146.9630126953125, + 126.59661102294922, + 108.23934936523438, + 90.85575103759766, + 72.80107879638672 + ], + "bp_grad_per_sample_l2_med": [ + 7.045341044431552e-05, + 7.726218609604985e-05, + 8.23774971649982e-05, + 8.931937190936878e-05, + 9.00102750165388e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5556640625, + "loss_eval": 1.226228952407837, + "epoch": 24 + }, + { + "hidden_norms": [ + 150.7821044921875, + 129.61668395996094, + 108.98286437988281, + 89.68734741210938, + 72.85277557373047 + ], + "bp_grad_per_sample_l2_med": [ + 7.34334607841447e-05, + 7.900002674432471e-05, + 8.469617750961334e-05, + 8.900847751647234e-05, + 8.846351556712762e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.572265625, + "loss_eval": 1.2140324115753174, + "epoch": 25 + }, + { + "hidden_norms": [ + 151.44703674316406, + 129.4413604736328, + 110.14541625976562, + 91.28382110595703, + 74.19001770019531 + ], + "bp_grad_per_sample_l2_med": [ + 6.830286292824894e-05, + 7.440579793183133e-05, + 8.040962711675093e-05, + 8.615498518338427e-05, + 8.749076368985698e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5771484375, + "loss_eval": 1.2101829051971436, + "epoch": 26 + }, + { + "hidden_norms": [ + 153.631591796875, + 132.0617218017578, + 110.9275894165039, + 92.176513671875, + 73.5614242553711 + ], + "bp_grad_per_sample_l2_med": [ + 7.137414650060236e-05, + 7.97546817921102e-05, + 8.503787830704823e-05, + 9.110210521612316e-05, + 9.112519910559058e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5859375, + "loss_eval": 1.1954376697540283, + "epoch": 27 + }, + { + "hidden_norms": [ + 155.2130584716797, + 133.7564697265625, + 113.44039916992188, + 93.51616668701172, + 74.26422882080078 + ], + "bp_grad_per_sample_l2_med": [ + 7.436865416821092e-05, + 8.266629447462037e-05, + 8.722272468730807e-05, + 9.24940686672926e-05, + 9.228193084709346e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.568359375, + "loss_eval": 1.2368288040161133, + "epoch": 28 + }, + { + "hidden_norms": [ + 156.52346801757812, + 134.0899200439453, + 113.28357696533203, + 93.11508178710938, + 74.41522216796875 + ], + "bp_grad_per_sample_l2_med": [ + 7.232115603983402e-05, + 7.883219950599596e-05, + 8.385341061512008e-05, + 8.885351417120546e-05, + 8.985922613646835e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5849609375, + "loss_eval": 1.1935406923294067, + "epoch": 29 + }, + { + "hidden_norms": [ + 157.1343536376953, + 136.0911102294922, + 115.831298828125, + 94.6191177368164, + 74.93243408203125 + ], + "bp_grad_per_sample_l2_med": [ + 6.815487722633407e-05, + 7.527582783950493e-05, + 8.152059308486059e-05, + 8.597332634963095e-05, + 8.487412560498342e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1716928482055664, + "epoch": 30 + }, + { + "hidden_norms": [ + 158.87771606445312, + 136.84617614746094, + 115.38484191894531, + 95.1522445678711, + 75.46046447753906 + ], + "bp_grad_per_sample_l2_med": [ + 7.11698376107961e-05, + 7.946270488901064e-05, + 8.58406419865787e-05, + 8.943407010519877e-05, + 8.97061254363507e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5908203125, + "loss_eval": 1.1900701522827148, + "epoch": 31 + }, + { + "hidden_norms": [ + 158.57237243652344, + 135.3989715576172, + 115.39788818359375, + 94.26459503173828, + 74.65320587158203 + ], + "bp_grad_per_sample_l2_med": [ + 7.135280611691996e-05, + 7.875803567003459e-05, + 8.35385944810696e-05, + 9.056212002178654e-05, + 8.802927186479792e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58984375, + "loss_eval": 1.1936118602752686, + "epoch": 32 + }, + { + "hidden_norms": [ + 161.12164306640625, + 138.0847930908203, + 116.51541137695312, + 96.06510925292969, + 75.79708862304688 + ], + "bp_grad_per_sample_l2_med": [ + 7.089033169904724e-05, + 7.788193033775315e-05, + 8.262616029242054e-05, + 8.66727132233791e-05, + 8.98441721801646e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1777372360229492, + "epoch": 33 + }, + { + "hidden_norms": [ + 162.0608673095703, + 138.521728515625, + 117.39189147949219, + 96.19066619873047, + 75.76524353027344 + ], + "bp_grad_per_sample_l2_med": [ + 7.102260860847309e-05, + 7.727317279204726e-05, + 8.381292718695477e-05, + 8.586590411141515e-05, + 8.668057853356004e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1749277114868164, + "epoch": 34 + }, + { + "hidden_norms": [ + 161.66477966308594, + 138.45208740234375, + 118.22246551513672, + 96.99449920654297, + 76.40058135986328 + ], + "bp_grad_per_sample_l2_med": [ + 6.717143696732819e-05, + 7.219286635518074e-05, + 7.78083413024433e-05, + 8.173672540578991e-05, + 8.14773520687595e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.183088779449463, + "epoch": 35 + }, + { + "hidden_norms": [ + 163.6893310546875, + 140.37518310546875, + 119.34339904785156, + 96.78111267089844, + 75.42987823486328 + ], + "bp_grad_per_sample_l2_med": [ + 6.809990736655891e-05, + 7.472001743735746e-05, + 7.982164243003353e-05, + 8.6645879491698e-05, + 8.662666368763894e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.599609375, + "loss_eval": 1.1695549488067627, + "epoch": 36 + }, + { + "hidden_norms": [ + 164.063232421875, + 140.68441772460938, + 118.45069122314453, + 96.70316314697266, + 75.4270248413086 + ], + "bp_grad_per_sample_l2_med": [ + 7.114750769687817e-05, + 7.883143553044647e-05, + 8.33458179840818e-05, + 8.941504347603768e-05, + 8.57952400110662e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5927734375, + "loss_eval": 1.1776624917984009, + "epoch": 37 + }, + { + "hidden_norms": [ + 163.89480590820312, + 140.18966674804688, + 119.30622863769531, + 97.97473907470703, + 76.34546661376953 + ], + "bp_grad_per_sample_l2_med": [ + 6.944040069356561e-05, + 7.674084190512076e-05, + 8.196813723770902e-05, + 8.950124902185053e-05, + 8.920513209886849e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.591796875, + "loss_eval": 1.1852729320526123, + "epoch": 38 + }, + { + "hidden_norms": [ + 165.47622680664062, + 141.58221435546875, + 119.55635070800781, + 98.0240707397461, + 76.13150787353516 + ], + "bp_grad_per_sample_l2_med": [ + 7.238827674882486e-05, + 7.85816737334244e-05, + 8.403261745115742e-05, + 8.998374687507749e-05, + 8.897150837583467e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5869140625, + "loss_eval": 1.1676307916641235, + "epoch": 39 + }, + { + "hidden_norms": [ + 164.69053649902344, + 142.07537841796875, + 121.09794616699219, + 99.6556396484375, + 77.98886108398438 + ], + "bp_grad_per_sample_l2_med": [ + 7.123505201889202e-05, + 7.861913036322221e-05, + 8.443401020485908e-05, + 8.940586121752858e-05, + 8.976398385129869e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1959164142608643, + "epoch": 40 + }, + { + "hidden_norms": [ + 164.97906494140625, + 141.9008026123047, + 120.19933319091797, + 98.47044372558594, + 76.0770263671875 + ], + "bp_grad_per_sample_l2_med": [ + 7.325963088078424e-05, + 8.044692367548123e-05, + 8.460321987513453e-05, + 9.052005771081895e-05, + 8.883728878572583e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5888671875, + "loss_eval": 1.1650420427322388, + "epoch": 41 + }, + { + "hidden_norms": [ + 167.11508178710938, + 144.4076690673828, + 121.90902709960938, + 99.70268249511719, + 77.1493911743164 + ], + "bp_grad_per_sample_l2_med": [ + 6.938715523574501e-05, + 7.598697993671522e-05, + 8.122843428282067e-05, + 8.419268124271184e-05, + 8.758077456150204e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6103515625, + "loss_eval": 1.1334974765777588, + "epoch": 42 + }, + { + "hidden_norms": [ + 167.23953247070312, + 143.8128662109375, + 121.41165924072266, + 99.37804412841797, + 76.86026763916016 + ], + "bp_grad_per_sample_l2_med": [ + 7.253287185449153e-05, + 7.92228602222167e-05, + 8.514960791217163e-05, + 9.06435088836588e-05, + 8.896931103663519e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.59375, + "loss_eval": 1.1443839073181152, + "epoch": 43 + }, + { + "hidden_norms": [ + 167.02175903320312, + 143.56179809570312, + 121.07357025146484, + 98.59805297851562, + 76.59933471679688 + ], + "bp_grad_per_sample_l2_med": [ + 7.202434790087864e-05, + 7.884378283051774e-05, + 8.405950211454183e-05, + 8.979378617368639e-05, + 8.789195271674544e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6123046875, + "loss_eval": 1.1233543157577515, + "epoch": 44 + }, + { + "hidden_norms": [ + 168.8506622314453, + 144.7351531982422, + 122.07427978515625, + 100.25342559814453, + 77.3443832397461 + ], + "bp_grad_per_sample_l2_med": [ + 6.906851194798946e-05, + 7.469953561667353e-05, + 7.91402708273381e-05, + 8.30625431262888e-05, + 8.482224802719429e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1078553199768066, + "epoch": 45 + }, + { + "hidden_norms": [ + 167.80520629882812, + 145.0210418701172, + 123.11544036865234, + 101.08995056152344, + 77.6504898071289 + ], + "bp_grad_per_sample_l2_med": [ + 6.715168274240568e-05, + 7.365776400547475e-05, + 7.808832015143707e-05, + 8.405041444348171e-05, + 8.283500210382044e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6142578125, + "loss_eval": 1.1213364601135254, + "epoch": 46 + }, + { + "hidden_norms": [ + 168.5064697265625, + 144.57977294921875, + 122.67310333251953, + 100.03209686279297, + 76.30200958251953 + ], + "bp_grad_per_sample_l2_med": [ + 7.193082274170592e-05, + 7.761332381051034e-05, + 8.224599878303707e-05, + 8.772317232796922e-05, + 8.76585254445672e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025390625, + "loss_eval": 1.1593999862670898, + "epoch": 47 + }, + { + "hidden_norms": [ + 168.2687225341797, + 145.1931610107422, + 123.04153442382812, + 100.33060455322266, + 77.3511734008789 + ], + "bp_grad_per_sample_l2_med": [ + 7.396154978778213e-05, + 8.14273880678229e-05, + 8.724145300220698e-05, + 9.166308882413432e-05, + 9.03390027815476e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.1506351232528687, + "epoch": 48 + }, + { + "hidden_norms": [ + 169.19711303710938, + 145.7348175048828, + 122.21668243408203, + 100.78398895263672, + 77.85338592529297 + ], + "bp_grad_per_sample_l2_med": [ + 7.148115400923416e-05, + 7.858182652853429e-05, + 8.472947956761345e-05, + 8.831475861370564e-05, + 9.002227307064459e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1426208019256592, + "epoch": 49 + }, + { + "hidden_norms": [ + 169.87611389160156, + 144.65980529785156, + 122.2470932006836, + 99.39762115478516, + 76.66820526123047 + ], + "bp_grad_per_sample_l2_med": [ + 7.574502524221316e-05, + 8.358684863196686e-05, + 8.949989569373429e-05, + 9.581056656315923e-05, + 9.291989408666268e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.599609375, + "loss_eval": 1.146412968635559, + "epoch": 50 + }, + { + "hidden_norms": [ + 167.4952850341797, + 143.16302490234375, + 119.86161804199219, + 97.8775863647461, + 75.75617980957031 + ], + "bp_grad_per_sample_l2_med": [ + 7.487049151677638e-05, + 8.140889985952526e-05, + 8.958375110523775e-05, + 9.491044329479337e-05, + 9.230020805262029e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6064453125, + "loss_eval": 1.1555390357971191, + "epoch": 51 + }, + { + "hidden_norms": [ + 169.03530883789062, + 144.57913208007812, + 122.20657348632812, + 100.42291259765625, + 77.34142303466797 + ], + "bp_grad_per_sample_l2_med": [ + 7.283290324267e-05, + 8.043479465413839e-05, + 8.612027886556461e-05, + 9.16399949346669e-05, + 9.119778405874968e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.145568609237671, + "epoch": 52 + }, + { + "hidden_norms": [ + 168.97242736816406, + 144.64987182617188, + 121.88980865478516, + 99.5838394165039, + 76.98419952392578 + ], + "bp_grad_per_sample_l2_med": [ + 7.706385804340243e-05, + 8.52798912092112e-05, + 9.141799091594294e-05, + 9.48576707742177e-05, + 9.280487574869767e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6044921875, + "loss_eval": 1.173735499382019, + "epoch": 53 + }, + { + "hidden_norms": [ + 169.5861053466797, + 145.18853759765625, + 123.36368560791016, + 100.5948257446289, + 77.515380859375 + ], + "bp_grad_per_sample_l2_med": [ + 7.197257218649611e-05, + 7.774284313200042e-05, + 8.511826308676973e-05, + 9.136695007327944e-05, + 8.776389586273581e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.125669240951538, + "epoch": 54 + }, + { + "hidden_norms": [ + 168.54624938964844, + 144.20028686523438, + 120.96566009521484, + 98.61659240722656, + 75.90725708007812 + ], + "bp_grad_per_sample_l2_med": [ + 7.784854824421927e-05, + 8.512740896549076e-05, + 9.021186269819736e-05, + 9.572209819452837e-05, + 9.406798199051991e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.143272042274475, + "epoch": 55 + }, + { + "hidden_norms": [ + 167.1956024169922, + 144.33364868164062, + 121.39191436767578, + 99.15605926513672, + 76.89862060546875 + ], + "bp_grad_per_sample_l2_med": [ + 7.683308649575338e-05, + 8.338083716807887e-05, + 9.210927237290889e-05, + 9.760970715433359e-05, + 9.435461106477305e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.1492671966552734, + "epoch": 56 + }, + { + "hidden_norms": [ + 168.5964813232422, + 144.6849365234375, + 122.38106536865234, + 99.73613739013672, + 77.72384643554688 + ], + "bp_grad_per_sample_l2_med": [ + 7.762440509395674e-05, + 8.45814065542072e-05, + 9.048492211150005e-05, + 9.445888281334192e-05, + 9.163413778878748e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6103515625, + "loss_eval": 1.1285452842712402, + "epoch": 57 + }, + { + "hidden_norms": [ + 169.4349365234375, + 145.3781280517578, + 122.81243896484375, + 100.45063781738281, + 77.73384094238281 + ], + "bp_grad_per_sample_l2_med": [ + 7.32980333850719e-05, + 8.07973847258836e-05, + 8.676065772306174e-05, + 8.88932918314822e-05, + 8.98713551578112e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.1177959442138672, + "epoch": 58 + }, + { + "hidden_norms": [ + 167.85089111328125, + 143.60365295410156, + 120.23004913330078, + 98.14772033691406, + 76.00984191894531 + ], + "bp_grad_per_sample_l2_med": [ + 7.664797885809094e-05, + 8.470165630569682e-05, + 9.283467807108536e-05, + 9.794873039936647e-05, + 9.169583063339815e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6201171875, + "loss_eval": 1.1301027536392212, + "epoch": 59 + }, + { + "hidden_norms": [ + 167.4250946044922, + 144.43685913085938, + 120.5447769165039, + 98.6132583618164, + 76.67144775390625 + ], + "bp_grad_per_sample_l2_med": [ + 7.264616579050198e-05, + 8.033386984607205e-05, + 8.730305125936866e-05, + 9.157789463642985e-05, + 9.014589886646718e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.1262563467025757, + "epoch": 60 + }, + { + "hidden_norms": [ + 167.57273864746094, + 143.9201202392578, + 120.18034362792969, + 99.7088851928711, + 77.43472290039062 + ], + "bp_grad_per_sample_l2_med": [ + 7.527784327976406e-05, + 8.20689310785383e-05, + 8.86347406776622e-05, + 9.488592331763357e-05, + 9.351663175038993e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1255381107330322, + "epoch": 61 + }, + { + "hidden_norms": [ + 168.32432556152344, + 143.3669891357422, + 120.5047378540039, + 98.29914093017578, + 76.91972351074219 + ], + "bp_grad_per_sample_l2_med": [ + 8.1095946370624e-05, + 9.126035001827404e-05, + 9.773251076694578e-05, + 0.00010036173625849187, + 9.892736852634698e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.625, + "loss_eval": 1.121397614479065, + "epoch": 62 + }, + { + "hidden_norms": [ + 167.19789123535156, + 143.76556396484375, + 120.66227722167969, + 98.42743682861328, + 76.89801788330078 + ], + "bp_grad_per_sample_l2_med": [ + 7.633089262526482e-05, + 8.335815800819546e-05, + 9.061676246346906e-05, + 9.574641444487497e-05, + 9.495441918261349e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62109375, + "loss_eval": 1.1192781925201416, + "epoch": 63 + }, + { + "hidden_norms": [ + 166.93948364257812, + 142.26893615722656, + 119.55793762207031, + 97.94837951660156, + 76.42357635498047 + ], + "bp_grad_per_sample_l2_med": [ + 7.782453758409247e-05, + 8.425768464803696e-05, + 9.212247096002102e-05, + 9.447304182685912e-05, + 9.302303078584373e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.607421875, + "loss_eval": 1.1216533184051514, + "epoch": 64 + }, + { + "hidden_norms": [ + 166.6027069091797, + 143.06201171875, + 120.18063354492188, + 98.2688217163086, + 76.29009246826172 + ], + "bp_grad_per_sample_l2_med": [ + 8.051560871535912e-05, + 8.871743193594739e-05, + 9.67002852121368e-05, + 0.00010364756599301472, + 9.896839765133336e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.623046875, + "loss_eval": 1.1287095546722412, + "epoch": 65 + }, + { + "hidden_norms": [ + 167.1055908203125, + 142.63758850097656, + 119.64879608154297, + 97.64229583740234, + 76.44933319091797 + ], + "bp_grad_per_sample_l2_med": [ + 7.66752491472289e-05, + 8.481083932565525e-05, + 9.087422949960455e-05, + 9.747539297677577e-05, + 9.831935312831774e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62109375, + "loss_eval": 1.1142747402191162, + "epoch": 66 + }, + { + "hidden_norms": [ + 165.7790985107422, + 141.932861328125, + 119.308349609375, + 97.3916244506836, + 76.28073120117188 + ], + "bp_grad_per_sample_l2_med": [ + 8.054008503677323e-05, + 8.828196587273851e-05, + 9.400352428201586e-05, + 0.0001006148086162284, + 9.63730999501422e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6220703125, + "loss_eval": 1.1091513633728027, + "epoch": 67 + }, + { + "hidden_norms": [ + 166.0056915283203, + 142.36737060546875, + 119.14185333251953, + 97.59127044677734, + 76.91047668457031 + ], + "bp_grad_per_sample_l2_med": [ + 7.921652286313474e-05, + 8.842039096634835e-05, + 9.518962178844959e-05, + 9.989101090468466e-05, + 9.532425610814244e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.109208106994629, + "epoch": 68 + }, + { + "hidden_norms": [ + 165.06881713867188, + 141.9323272705078, + 119.31546783447266, + 97.39105987548828, + 76.88532257080078 + ], + "bp_grad_per_sample_l2_med": [ + 7.891654968261719e-05, + 8.609334327047691e-05, + 9.276948549086228e-05, + 9.923002653522417e-05, + 9.674452303443104e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62890625, + "loss_eval": 1.102659821510315, + "epoch": 69 + }, + { + "hidden_norms": [ + 165.70677185058594, + 141.7493896484375, + 119.19147491455078, + 97.61845397949219, + 76.11932373046875 + ], + "bp_grad_per_sample_l2_med": [ + 8.021068788366392e-05, + 8.757255272939801e-05, + 9.637014591135085e-05, + 0.00010106353875016794, + 9.785306610865518e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1182312965393066, + "epoch": 70 + }, + { + "hidden_norms": [ + 164.398193359375, + 141.26121520996094, + 118.28160095214844, + 96.55244445800781, + 75.79473876953125 + ], + "bp_grad_per_sample_l2_med": [ + 8.341020293300971e-05, + 9.248757123714313e-05, + 9.663405944593251e-05, + 0.00010157335054827854, + 9.801337728276849e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62890625, + "loss_eval": 1.1038966178894043, + "epoch": 71 + }, + { + "hidden_norms": [ + 164.95956420898438, + 141.71456909179688, + 118.70948028564453, + 96.87312316894531, + 76.1374740600586 + ], + "bp_grad_per_sample_l2_med": [ + 8.227327634813264e-05, + 9.05249617062509e-05, + 9.777413652045652e-05, + 0.00010368443327024579, + 9.96799353742972e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6259765625, + "loss_eval": 1.1255979537963867, + "epoch": 72 + }, + { + "hidden_norms": [ + 164.7284393310547, + 140.8751678466797, + 118.047607421875, + 96.35321044921875, + 75.17439270019531 + ], + "bp_grad_per_sample_l2_med": [ + 7.813700358383358e-05, + 8.510561019647866e-05, + 9.316992509411648e-05, + 9.944752673618495e-05, + 9.348603634862229e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6298828125, + "loss_eval": 1.1074620485305786, + "epoch": 73 + }, + { + "hidden_norms": [ + 164.93450927734375, + 140.53248596191406, + 117.69375610351562, + 96.16271209716797, + 75.15106201171875 + ], + "bp_grad_per_sample_l2_med": [ + 8.089678158285096e-05, + 9.048588981386274e-05, + 9.746959403855726e-05, + 0.00010185279097640887, + 9.633745503379032e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.118239164352417, + "epoch": 74 + }, + { + "hidden_norms": [ + 164.21043395996094, + 139.88815307617188, + 117.45735931396484, + 95.94420623779297, + 75.4442138671875 + ], + "bp_grad_per_sample_l2_med": [ + 8.050485485000536e-05, + 8.884233102435246e-05, + 9.638822666602209e-05, + 9.927270002663136e-05, + 9.542587213218212e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.1022429466247559, + "epoch": 75 + }, + { + "hidden_norms": [ + 163.64498901367188, + 139.56788635253906, + 117.33267974853516, + 95.80303192138672, + 75.07954406738281 + ], + "bp_grad_per_sample_l2_med": [ + 8.35943064885214e-05, + 9.346263686893508e-05, + 0.0001004879450192675, + 0.00010487801773706451, + 0.0001030422281473875 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.630859375, + "loss_eval": 1.101865530014038, + "epoch": 76 + }, + { + "hidden_norms": [ + 163.15895080566406, + 139.2528533935547, + 116.07748413085938, + 94.62651824951172, + 74.8349380493164 + ], + "bp_grad_per_sample_l2_med": [ + 8.33335579955019e-05, + 9.210313146468252e-05, + 9.823974687606096e-05, + 0.00010392737749498338, + 9.883133316179737e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.107062816619873, + "epoch": 77 + }, + { + "hidden_norms": [ + 162.9849090576172, + 138.823974609375, + 116.6355972290039, + 95.05895233154297, + 74.80722045898438 + ], + "bp_grad_per_sample_l2_med": [ + 8.333245204994455e-05, + 9.167871758108959e-05, + 9.739672532305121e-05, + 0.00010222326818620786, + 9.918824798660353e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6328125, + "loss_eval": 1.1088743209838867, + "epoch": 78 + }, + { + "hidden_norms": [ + 162.9673614501953, + 138.89553833007812, + 116.67662811279297, + 94.80388641357422, + 74.41240692138672 + ], + "bp_grad_per_sample_l2_med": [ + 8.250313112512231e-05, + 9.097345173358917e-05, + 9.694542677607387e-05, + 0.00010250341438222677, + 9.611865971237421e-05 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6318359375, + "loss_eval": 1.1069759130477905, + "epoch": 79 + }, + { + "hidden_norms": [ + 163.01101684570312, + 138.9472198486328, + 116.52082824707031, + 94.81626892089844, + 74.34078216552734 + ], + "bp_grad_per_sample_l2_med": [ + 8.468546730000526e-05, + 9.535141725791618e-05, + 9.998930181609467e-05, + 0.00010477996693225577, + 0.00010350123920943588 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6455078125, + "loss_eval": 1.11004638671875, + "epoch": 80 + }, + { + "hidden_norms": [ + 162.48593139648438, + 138.60171508789062, + 116.15435028076172, + 94.63046264648438, + 74.77122497558594 + ], + "bp_grad_per_sample_l2_med": [ + 8.888062438927591e-05, + 9.835455421125516e-05, + 0.00010451052366988733, + 0.00010972235031658784, + 0.00010192779154749587 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.63671875, + "loss_eval": 1.1166486740112305, + "epoch": 81 + }, + { + "hidden_norms": [ + 162.33985900878906, + 138.57908630371094, + 115.86516571044922, + 94.62572479248047, + 74.61656951904297 + ], + "bp_grad_per_sample_l2_med": [ + 8.704938227310777e-05, + 9.788614988792688e-05, + 0.00010670957271941006, + 0.00011224307672819123, + 0.00010563644173089415 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.1027870178222656, + "epoch": 82 + }, + { + "hidden_norms": [ + 162.28363037109375, + 137.98855590820312, + 115.68619537353516, + 94.57305145263672, + 74.67822265625 + ], + "bp_grad_per_sample_l2_med": [ + 8.545320451958105e-05, + 9.513215627521276e-05, + 0.00010359021689509973, + 0.00010905940871452913, + 0.00010360238957218826 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 1.1074315309524536, + "epoch": 83 + }, + { + "hidden_norms": [ + 161.65008544921875, + 138.2888946533203, + 115.37015533447266, + 94.0649185180664, + 74.40010070800781 + ], + "bp_grad_per_sample_l2_med": [ + 8.725856605451554e-05, + 9.554363350616768e-05, + 0.00010503961675567552, + 0.00011096282105427235, + 0.00010341637971578166 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.104964017868042, + "epoch": 84 + }, + { + "hidden_norms": [ + 162.56822204589844, + 138.35604858398438, + 115.56212615966797, + 93.74854278564453, + 74.29190826416016 + ], + "bp_grad_per_sample_l2_med": [ + 8.511068881489336e-05, + 9.339748066850007e-05, + 0.00010132823081221431, + 0.00010685007873689756, + 0.00010203333658864722 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.110845923423767, + "epoch": 85 + }, + { + "hidden_norms": [ + 161.8057861328125, + 137.9845733642578, + 115.51632690429688, + 94.12870788574219, + 74.2806167602539 + ], + "bp_grad_per_sample_l2_med": [ + 8.701891783857718e-05, + 9.453850361751392e-05, + 0.00010162424587178975, + 0.00010690372437238693, + 0.0001028447222779505 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.108534574508667, + "epoch": 86 + }, + { + "hidden_norms": [ + 161.5404815673828, + 137.67727661132812, + 115.56287384033203, + 94.2837142944336, + 74.19786834716797 + ], + "bp_grad_per_sample_l2_med": [ + 8.555947715649381e-05, + 9.61149125942029e-05, + 0.00010081662185257301, + 0.00010581265814835206, + 0.00010205370926996693 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.642578125, + "loss_eval": 1.1068053245544434, + "epoch": 87 + }, + { + "hidden_norms": [ + 161.6155242919922, + 137.77752685546875, + 115.26612854003906, + 93.79004669189453, + 74.01652526855469 + ], + "bp_grad_per_sample_l2_med": [ + 8.888345473678783e-05, + 9.766507719177753e-05, + 0.00010646588634699583, + 0.0001093660102924332, + 0.0001023485092446208 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.640625, + "loss_eval": 1.112060308456421, + "epoch": 88 + }, + { + "hidden_norms": [ + 161.4155731201172, + 137.4070281982422, + 114.93219757080078, + 93.83850860595703, + 74.04694366455078 + ], + "bp_grad_per_sample_l2_med": [ + 8.62668312038295e-05, + 9.635779133532196e-05, + 0.00010364993795519695, + 0.00010628051677485928, + 0.00010416742588859051 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.1054459810256958, + "epoch": 89 + }, + { + "hidden_norms": [ + 161.10385131835938, + 137.37892150878906, + 114.876953125, + 93.37522888183594, + 73.81317901611328 + ], + "bp_grad_per_sample_l2_med": [ + 8.967578469309956e-05, + 9.864033199846745e-05, + 0.00010763857426354662, + 0.00011277131852693856, + 0.0001057170593412593 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.634765625, + "loss_eval": 1.1104364395141602, + "epoch": 90 + }, + { + "hidden_norms": [ + 160.9930419921875, + 137.13717651367188, + 114.8873062133789, + 93.33486938476562, + 74.0313949584961 + ], + "bp_grad_per_sample_l2_med": [ + 8.793028973741457e-05, + 9.762586705619469e-05, + 0.00010612032929202542, + 0.00010882189963012934, + 0.00010218457464361563 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 1.107926607131958, + "epoch": 91 + }, + { + "hidden_norms": [ + 161.131103515625, + 136.96864318847656, + 114.8429183959961, + 93.4638442993164, + 74.06806945800781 + ], + "bp_grad_per_sample_l2_med": [ + 8.899801468942314e-05, + 9.761646651895717e-05, + 0.00010549664148129523, + 0.00011210257798666134, + 0.000105380589957349 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1014349460601807, + "epoch": 92 + }, + { + "hidden_norms": [ + 160.92770385742188, + 137.00291442871094, + 114.67124938964844, + 93.55059051513672, + 73.94056701660156 + ], + "bp_grad_per_sample_l2_med": [ + 8.758921467233449e-05, + 9.86124505288899e-05, + 0.0001072377126547508, + 0.00011291914415778592, + 0.00010492445289855823 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1031121015548706, + "epoch": 93 + }, + { + "hidden_norms": [ + 160.88087463378906, + 136.80621337890625, + 114.49836730957031, + 93.34219360351562, + 73.85013580322266 + ], + "bp_grad_per_sample_l2_med": [ + 8.935505320550874e-05, + 9.829271584749222e-05, + 0.00010722390288719907, + 0.00011369076673872769, + 0.0001048692429321818 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.64453125, + "loss_eval": 1.105837106704712, + "epoch": 94 + }, + { + "hidden_norms": [ + 160.87530517578125, + 136.97203063964844, + 114.57328033447266, + 93.34746551513672, + 73.79950714111328 + ], + "bp_grad_per_sample_l2_med": [ + 8.837936184136197e-05, + 9.732619946589693e-05, + 0.00010843550262507051, + 0.00011282044579274952, + 0.00010489222768228501 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6435546875, + "loss_eval": 1.1061646938323975, + "epoch": 95 + }, + { + "hidden_norms": [ + 160.83152770996094, + 136.82012939453125, + 114.41039276123047, + 93.26609802246094, + 73.75130462646484 + ], + "bp_grad_per_sample_l2_med": [ + 8.924134453991428e-05, + 9.699882502900437e-05, + 0.00010844215285032988, + 0.00011508698662510142, + 0.00010382343316450715 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1083133220672607, + "epoch": 96 + }, + { + "hidden_norms": [ + 160.8388214111328, + 136.79220581054688, + 114.45349884033203, + 93.23229217529297, + 73.71869659423828 + ], + "bp_grad_per_sample_l2_med": [ + 8.902873378247023e-05, + 9.731733007356524e-05, + 0.0001077003325917758, + 0.00011335347517160699, + 0.00010528459824854508 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1074192523956299, + "epoch": 97 + }, + { + "hidden_norms": [ + 160.82676696777344, + 136.7546844482422, + 114.41687774658203, + 93.24365234375, + 73.72588348388672 + ], + "bp_grad_per_sample_l2_med": [ + 8.967860048869625e-05, + 9.900779696181417e-05, + 0.00010877639579121023, + 0.00011359385825926438, + 0.0001041799841914326 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1075721979141235, + "epoch": 98 + }, + { + "hidden_norms": [ + 160.8055419921875, + 136.8428955078125, + 114.41191864013672, + 93.23294067382812, + 73.72472381591797 + ], + "bp_grad_per_sample_l2_med": [ + 8.870402962202206e-05, + 9.879077697405592e-05, + 0.00010879703768296167, + 0.00011367550177965313, + 0.00010426441440358758 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.107743263244629, + "epoch": 99 + }, + { + "hidden_norms": [ + 160.795166015625, + 136.82778930664062, + 114.41122436523438, + 93.22368621826172, + 73.72713470458984 + ], + "bp_grad_per_sample_l2_med": [ + 8.868239092407748e-05, + 9.911284723784775e-05, + 0.00010880655463552102, + 0.00011359110794728622, + 0.00010424658830743283 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.646484375, + "loss_eval": 1.1077194213867188, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005607507191598415, + 0.0005558764678426087, + 0.0005541853606700897, + 0.0005498801474459469, + 0.0005458085797727108 + ], + "gamma_dfa": 0.002593531389720738, + "gamma_dfa_per_layer": [ + 0.011040969751775265, + 0.0018278355710208416, + -0.019951725378632545, + 0.01745704561471939 + ], + "acc_eval": 0.091796875, + "loss_eval": 2.3707523345947266, + "epoch": 0 + }, + { + "hidden_norms": [ + 543.6214599609375, + 970.167724609375, + 1128.5582275390625, + 1385.4898681640625, + 1506.6824951171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006441785371862352, + 0.0006426527979783714, + 0.0006424304447136819, + 0.000642389350105077, + 0.0006423307931981981 + ], + "gamma_dfa": 0.013619338162243366, + "gamma_dfa_per_layer": [ + 0.044537801295518875, + 0.008280456066131592, + -0.026753954589366913, + 0.02841304987668991 + ], + "acc_eval": 0.224609375, + "loss_eval": 7.057413101196289, + "epoch": 1 + }, + { + "hidden_norms": [ + 877.8099365234375, + 2093.12060546875, + 2686.85400390625, + 3536.0849609375, + 3998.738037109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007192303892225027, + 0.000718857510946691, + 0.0007187117007561028, + 0.0007188154268078506, + 0.0007185889990068972 + ], + "gamma_dfa": -0.0027784015983343124, + "gamma_dfa_per_layer": [ + 0.04956255108118057, + -0.024007968604564667, + -0.02988382987678051, + -0.006784358993172646 + ], + "acc_eval": 0.2197265625, + "loss_eval": 11.82400131225586, + "epoch": 2 + }, + { + "hidden_norms": [ + 1082.57763671875, + 3122.52001953125, + 4171.595703125, + 5502.81494140625, + 6367.2392578125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007569500594399869, + 0.0007553253090009093, + 0.0007550596492365003, + 0.0007549565634690225, + 0.0007544843829236925 + ], + "gamma_dfa": -0.004858810920268297, + "gamma_dfa_per_layer": [ + 0.06696394830942154, + -0.024477044120430946, + -0.04227307811379433, + -0.019649069756269455 + ], + "acc_eval": 0.18359375, + "loss_eval": 24.264713287353516, + "epoch": 3 + }, + { + "hidden_norms": [ + 1244.07275390625, + 4114.89111328125, + 5548.310546875, + 7262.12744140625, + 8410.1474609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007311897934414446, + 0.0007286664913408458, + 0.0007287323824129999, + 0.0007287483895197511, + 0.0007287858170457184 + ], + "gamma_dfa": -0.003940413473173976, + "gamma_dfa_per_layer": [ + 0.06546925008296967, + -0.03793267905712128, + -0.03520221635699272, + -0.008096008561551571 + ], + "acc_eval": 0.197265625, + "loss_eval": 21.850379943847656, + "epoch": 4 + }, + { + "hidden_norms": [ + 1357.7320556640625, + 5130.4609375, + 7149.40380859375, + 9744.58984375, + 11396.052734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000750180275645107, + 0.0007480062777176499, + 0.0007475404418073595, + 0.0007476753671653569, + 0.0007474455051124096 + ], + "gamma_dfa": -6.745467544533312e-06, + "gamma_dfa_per_layer": [ + 0.08006488531827927, + -0.0292807687073946, + -0.04997118189930916, + -0.0008399165817536414 + ], + "acc_eval": 0.2314453125, + "loss_eval": 30.650737762451172, + "epoch": 5 + }, + { + "hidden_norms": [ + 1438.5594482421875, + 5736.68994140625, + 8271.92578125, + 11658.373046875, + 13768.2861328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000744938850402832, + 0.0007369474042207003, + 0.0007347911596298218, + 0.0007346841157414019, + 0.000734883826225996 + ], + "gamma_dfa": -0.0024929028004407883, + "gamma_dfa_per_layer": [ + 0.08933529257774353, + -0.03695790469646454, + -0.04257381707429886, + -0.019775182008743286 + ], + "acc_eval": 0.23046875, + "loss_eval": 42.61720275878906, + "epoch": 6 + }, + { + "hidden_norms": [ + 1512.00244140625, + 6517.73779296875, + 9229.724609375, + 13440.5166015625, + 16669.212890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007609400781802833, + 0.0007555288611911237, + 0.0007558621582575142, + 0.0007557112840004265, + 0.0007554451585747302 + ], + "gamma_dfa": -0.007545993197709322, + "gamma_dfa_per_layer": [ + 0.08795229345560074, + -0.03476891666650772, + -0.06410981714725494, + -0.01925753243267536 + ], + "acc_eval": 0.208984375, + "loss_eval": 50.873321533203125, + "epoch": 7 + }, + { + "hidden_norms": [ + 1582.1080322265625, + 7188.6318359375, + 9899.5947265625, + 15346.5009765625, + 19886.591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007456639432348311, + 0.0007417471497319639, + 0.0007396289147436619, + 0.0007396984728984535, + 0.0007395402644760907 + ], + "gamma_dfa": -0.009718619287014008, + "gamma_dfa_per_layer": [ + 0.09109380096197128, + -0.042414966970682144, + -0.04605134204030037, + -0.0415019690990448 + ], + "acc_eval": 0.189453125, + "loss_eval": 54.14390182495117, + "epoch": 8 + }, + { + "hidden_norms": [ + 1618.51708984375, + 7916.01416015625, + 10608.3408203125, + 17416.95703125, + 24058.658203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007598118390887976, + 0.0007534913602285087, + 0.0007532819290645421, + 0.0007532560266554356, + 0.0007529302965849638 + ], + "gamma_dfa": 0.0011779842898249626, + "gamma_dfa_per_layer": [ + 0.10601411014795303, + -0.0355507917702198, + -0.04322661831974983, + -0.022524762898683548 + ], + "acc_eval": 0.169921875, + "loss_eval": 79.9201889038086, + "epoch": 9 + }, + { + "hidden_norms": [ + 1708.6558837890625, + 8872.5908203125, + 11589.568359375, + 19666.24609375, + 28447.203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000754358887206763, + 0.0007440761546604335, + 0.0007443547365255654, + 0.0007444044458679855, + 0.0007447295938618481 + ], + "gamma_dfa": -0.006681790575385094, + "gamma_dfa_per_layer": [ + 0.12310357391834259, + -0.054726000875234604, + -0.061426255851984024, + -0.03367847949266434 + ], + "acc_eval": 0.189453125, + "loss_eval": 117.76714324951172, + "epoch": 10 + }, + { + "hidden_norms": [ + 1757.5994873046875, + 10265.8017578125, + 13090.66796875, + 22099.814453125, + 34584.30078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000756443478167057, + 0.0007464477675966918, + 0.000743720680475235, + 0.0007434834260493517, + 0.0007420994224958122 + ], + "gamma_dfa": -0.01398628018796444, + "gamma_dfa_per_layer": [ + 0.12564796209335327, + -0.05404478684067726, + -0.07238315045833588, + -0.05516514554619789 + ], + "acc_eval": 0.189453125, + "loss_eval": 103.90010070800781, + "epoch": 11 + }, + { + "hidden_norms": [ + 1799.9754638671875, + 11735.4208984375, + 14739.4091796875, + 24244.48828125, + 40467.53125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007648739847354591, + 0.0007477994076907635, + 0.0007476488244719803, + 0.0007475496386177838, + 0.0007478601182810962 + ], + "gamma_dfa": -0.005489904433488846, + "gamma_dfa_per_layer": [ + 0.1469549834728241, + -0.04884009808301926, + -0.05759190022945404, + -0.06248260289430618 + ], + "acc_eval": 0.2041015625, + "loss_eval": 124.61287689208984, + "epoch": 12 + }, + { + "hidden_norms": [ + 1851.51123046875, + 13681.8662109375, + 17609.712890625, + 27533.84375, + 52049.0703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007830688264220953, + 0.0007742528687231243, + 0.0007744400063529611, + 0.0007723497110418975, + 0.0007720965659245849 + ], + "gamma_dfa": -0.0014207642525434494, + "gamma_dfa_per_layer": [ + 0.18515333533287048, + -0.04434240236878395, + -0.09712066501379013, + -0.0493733249604702 + ], + "acc_eval": 0.142578125, + "loss_eval": 212.8883056640625, + "epoch": 13 + }, + { + "hidden_norms": [ + 1899.2525634765625, + 16269.4736328125, + 21580.724609375, + 31947.771484375, + 66851.5703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000794055697042495, + 0.0007606232538819313, + 0.0007601877441629767, + 0.0007598533411510289, + 0.000759296934120357 + ], + "gamma_dfa": 0.012796862982213497, + "gamma_dfa_per_layer": [ + 0.206809401512146, + -0.04797299578785896, + -0.0716182291507721, + -0.03603072464466095 + ], + "acc_eval": 0.1591796875, + "loss_eval": 268.9534912109375, + "epoch": 14 + }, + { + "hidden_norms": [ + 1988.337890625, + 20679.96484375, + 27719.126953125, + 37757.640625, + 86759.0234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007827074150554836, + 0.0007373052649199963, + 0.0007380677270703018, + 0.000736265501473099, + 0.0007371739484369755 + ], + "gamma_dfa": 0.003913283348083496, + "gamma_dfa_per_layer": [ + 0.18332748115062714, + -0.05311701446771622, + -0.06076449155807495, + -0.053792841732501984 + ], + "acc_eval": 0.2548828125, + "loss_eval": 367.0162048339844, + "epoch": 15 + }, + { + "hidden_norms": [ + 2074.877685546875, + 25397.2421875, + 35934.484375, + 45723.14453125, + 111497.4296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008315286249853671, + 0.0007900919299572706, + 0.0007844009087421, + 0.0007838390883989632, + 0.0007860813639126718 + ], + "gamma_dfa": -0.002616437152028084, + "gamma_dfa_per_layer": [ + 0.21044191718101501, + -0.05741831660270691, + -0.1141648143529892, + -0.049324534833431244 + ], + "acc_eval": 0.1220703125, + "loss_eval": 449.4093322753906, + "epoch": 16 + }, + { + "hidden_norms": [ + 2160.0703125, + 30060.396484375, + 43998.6953125, + 54128.03515625, + 137197.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007943993550725281, + 0.0007568124565295875, + 0.0007565468549728394, + 0.0007549119181931019, + 0.0007542246603406966 + ], + "gamma_dfa": 0.005578489974141121, + "gamma_dfa_per_layer": [ + 0.21836650371551514, + -0.057003527879714966, + -0.08258379250764847, + -0.05646522343158722 + ], + "acc_eval": 0.2099609375, + "loss_eval": 505.51385498046875, + "epoch": 17 + }, + { + "hidden_norms": [ + 2261.926025390625, + 35914.08203125, + 53701.83203125, + 65022.0234375, + 174995.234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008322449866682291, + 0.0007640637923032045, + 0.0007639409159310162, + 0.000764198659453541, + 0.0007642150158062577 + ], + "gamma_dfa": 0.017949961125850677, + "gamma_dfa_per_layer": [ + 0.23718158900737762, + -0.05374513193964958, + -0.062201935797929764, + -0.04943467676639557 + ], + "acc_eval": 0.2109375, + "loss_eval": 610.7471923828125, + "epoch": 18 + }, + { + "hidden_norms": [ + 2326.78271484375, + 42755.171875, + 66353.453125, + 77731.328125, + 221615.828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008451915346086025, + 0.0007553622708655894, + 0.0007553161703981459, + 0.0007546090637333691, + 0.0007550025475211442 + ], + "gamma_dfa": 0.029257358983159065, + "gamma_dfa_per_layer": [ + 0.26171058416366577, + -0.04214981198310852, + -0.06413372606039047, + -0.03839761018753052 + ], + "acc_eval": 0.19921875, + "loss_eval": 652.3941650390625, + "epoch": 19 + }, + { + "hidden_norms": [ + 2443.6630859375, + 48300.12109375, + 77390.1015625, + 91484.09375, + 270700.96875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009103405755013227, + 0.0007761572487652302, + 0.0007760545704513788, + 0.0007730794604867697, + 0.0007728201453574002 + ], + "gamma_dfa": 0.017114468850195408, + "gamma_dfa_per_layer": [ + 0.26115190982818604, + -0.050561077892780304, + -0.08694136142730713, + -0.05519159510731697 + ], + "acc_eval": 0.1669921875, + "loss_eval": 1354.747314453125, + "epoch": 20 + }, + { + "hidden_norms": [ + 2499.429931640625, + 57379.33203125, + 93242.0859375, + 111601.9921875, + 332709.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010016581509262323, + 0.0007549687870778143, + 0.0007551733287982643, + 0.0007543734973296523, + 0.0007547553977929056 + ], + "gamma_dfa": 0.047867871820926666, + "gamma_dfa_per_layer": [ + 0.3270750641822815, + -0.037589848041534424, + -0.06097441166639328, + -0.037039317190647125 + ], + "acc_eval": 0.2041015625, + "loss_eval": 1818.91650390625, + "epoch": 21 + }, + { + "hidden_norms": [ + 2615.140625, + 75715.7109375, + 109683.390625, + 132553.84375, + 406621.46875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008831259910948575, + 0.0007625823491252959, + 0.0007627239683642983, + 0.0007604075944982469, + 0.0007611791370436549 + ], + "gamma_dfa": 0.022762255743145943, + "gamma_dfa_per_layer": [ + 0.27839380502700806, + -0.05395745486021042, + -0.07682197540998459, + -0.05656535178422928 + ], + "acc_eval": 0.2119140625, + "loss_eval": 1167.954833984375, + "epoch": 22 + }, + { + "hidden_norms": [ + 2742.37353515625, + 97227.28125, + 131140.8125, + 155048.3125, + 481929.84375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001124670379795134, + 0.0007696108077652752, + 0.0007702686125412583, + 0.0007697975379414856, + 0.0007697619148530066 + ], + "gamma_dfa": 0.03202100656926632, + "gamma_dfa_per_layer": [ + 0.300557404756546, + -0.04680653661489487, + -0.052118271589279175, + -0.0735485702753067 + ], + "acc_eval": 0.240234375, + "loss_eval": 2470.89453125, + "epoch": 23 + }, + { + "hidden_norms": [ + 2858.224609375, + 126260.15625, + 160387.703125, + 186178.890625, + 564007.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001086456119082868, + 0.0007698858971707523, + 0.0007706494652666152, + 0.0007701858412474394, + 0.0007703170995227993 + ], + "gamma_dfa": 0.03411092050373554, + "gamma_dfa_per_layer": [ + 0.3229827582836151, + -0.03976103663444519, + -0.05624774843454361, + -0.09053029119968414 + ], + "acc_eval": 0.2080078125, + "loss_eval": 1589.14599609375, + "epoch": 24 + }, + { + "hidden_norms": [ + 3010.89697265625, + 156964.375, + 194623.5, + 223223.875, + 662826.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010667620226740837, + 0.0007900846539996564, + 0.0007894287118688226, + 0.0007884356309659779, + 0.0007912488654255867 + ], + "gamma_dfa": 0.03901553526520729, + "gamma_dfa_per_layer": [ + 0.34151530265808105, + -0.04678330570459366, + -0.06850147247314453, + -0.0701683834195137 + ], + "acc_eval": 0.19921875, + "loss_eval": 1886.69091796875, + "epoch": 25 + }, + { + "hidden_norms": [ + 3121.8056640625, + 191038.40625, + 232148.296875, + 265744.1875, + 761219.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011186219053342938, + 0.0007986227865330875, + 0.0007986134733073413, + 0.0007980577065609396, + 0.0007973008905537426 + ], + "gamma_dfa": 0.027425863780081272, + "gamma_dfa_per_layer": [ + 0.35862213373184204, + -0.061674464493989944, + -0.0841888040304184, + -0.10305541008710861 + ], + "acc_eval": 0.185546875, + "loss_eval": 1700.765869140625, + "epoch": 26 + }, + { + "hidden_norms": [ + 3283.62646484375, + 232390.3125, + 279218.25, + 315312.8125, + 875470.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.001439103507436812, + 0.0007854723371565342, + 0.0007857424207031727, + 0.0007855244330130517, + 0.0007853199495002627 + ], + "gamma_dfa": 0.03129031043499708, + "gamma_dfa_per_layer": [ + 0.33073610067367554, + -0.058702368289232254, + -0.06629009544849396, + -0.080582395195961 + ], + "acc_eval": 0.201171875, + "loss_eval": 3809.69873046875, + "epoch": 27 + }, + { + "hidden_norms": [ + 3407.8984375, + 272082.28125, + 324674.25, + 365055.125, + 983575.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.001244095852598548, + 0.0008176793926395476, + 0.0008168797940015793, + 0.000815192295704037, + 0.0008157575502991676 + ], + "gamma_dfa": 0.02919871360063553, + "gamma_dfa_per_layer": [ + 0.3321998715400696, + -0.048228584229946136, + -0.057734884321689606, + -0.10944154858589172 + ], + "acc_eval": 0.1650390625, + "loss_eval": 5145.80615234375, + "epoch": 28 + }, + { + "hidden_norms": [ + 3570.579833984375, + 325919.34375, + 383859.84375, + 429527.59375, + 1121656.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013903328217566013, + 0.0008181754965335131, + 0.0008133396040648222, + 0.0008111604838632047, + 0.0008120551356114447 + ], + "gamma_dfa": 0.04902177257463336, + "gamma_dfa_per_layer": [ + 0.33004581928253174, + -0.017712868750095367, + -0.016218842938542366, + -0.10002701729536057 + ], + "acc_eval": 0.1220703125, + "loss_eval": 4755.40869140625, + "epoch": 29 + }, + { + "hidden_norms": [ + 3675.836181640625, + 381066.84375, + 446664.84375, + 495540.4375, + 1244910.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013685236917808652, + 0.0007945130346342921, + 0.0007943777018226683, + 0.0007925048121251166, + 0.0007924467790871859 + ], + "gamma_dfa": 0.01623274479061365, + "gamma_dfa_per_layer": [ + 0.27984413504600525, + -0.06000320240855217, + -0.06209240108728409, + -0.09281755238771439 + ], + "acc_eval": 0.1962890625, + "loss_eval": 3555.3525390625, + "epoch": 30 + }, + { + "hidden_norms": [ + 3779.81103515625, + 443408.34375, + 515845.65625, + 568047.125, + 1396404.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001294015790335834, + 0.0007740295841358602, + 0.0007753889658488333, + 0.0007745815673843026, + 0.000773973239120096 + ], + "gamma_dfa": 0.048758171033114195, + "gamma_dfa_per_layer": [ + 0.3447470963001251, + -0.05413726717233658, + -0.0899808406829834, + -0.005596304312348366 + ], + "acc_eval": 0.1103515625, + "loss_eval": 8851.5302734375, + "epoch": 31 + }, + { + "hidden_norms": [ + 3920.750732421875, + 517289.40625, + 595296.5625, + 655510.1875, + 1569922.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.001448597526177764, + 0.0008134506642818451, + 0.0008149920613504946, + 0.0008116801618598402, + 0.0008117944234982133 + ], + "gamma_dfa": 0.016455436125397682, + "gamma_dfa_per_layer": [ + 0.28803595900535583, + -0.048596471548080444, + -0.07654894888401031, + -0.09706879407167435 + ], + "acc_eval": 0.1767578125, + "loss_eval": 4626.505859375, + "epoch": 32 + }, + { + "hidden_norms": [ + 4035.357666015625, + 605458.75, + 691596.8125, + 758344.75, + 1762235.125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013269236078485847, + 0.0007732360390946269, + 0.0007741436711512506, + 0.000773612700868398, + 0.0007734647369943559 + ], + "gamma_dfa": 0.029436825774610043, + "gamma_dfa_per_layer": [ + 0.2940990924835205, + -0.04052134230732918, + -0.05536778271198273, + -0.08046266436576843 + ], + "acc_eval": 0.2578125, + "loss_eval": 2423.88037109375, + "epoch": 33 + }, + { + "hidden_norms": [ + 4180.47998046875, + 680883.875, + 781089.375, + 856024.9375, + 1949442.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015648282133042812, + 0.0007914449088275433, + 0.0007915649330243468, + 0.0007914216257631779, + 0.0007914576563052833 + ], + "gamma_dfa": 0.019646714441478252, + "gamma_dfa_per_layer": [ + 0.2821764647960663, + -0.0451091043651104, + -0.08556324988603592, + -0.07291725277900696 + ], + "acc_eval": 0.2314453125, + "loss_eval": 3942.80810546875, + "epoch": 34 + }, + { + "hidden_norms": [ + 4309.49462890625, + 763385.4375, + 877493.9375, + 964321.4375, + 2131046.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.001357953529804945, + 0.0008006176794879138, + 0.000801383052021265, + 0.0008009205921553075, + 0.0008007651194930077 + ], + "gamma_dfa": 0.012816952541470528, + "gamma_dfa_per_layer": [ + 0.3179120421409607, + -0.07943161576986313, + -0.08064424991607666, + -0.1065683662891388 + ], + "acc_eval": 0.1904296875, + "loss_eval": 4230.3056640625, + "epoch": 35 + }, + { + "hidden_norms": [ + 4492.82568359375, + 851087.875, + 976163.875, + 1072469.125, + 2314147.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001730966498143971, + 0.000772459723521024, + 0.0007729437202215195, + 0.0007728235796093941, + 0.0007726353942416608 + ], + "gamma_dfa": 0.03693788964301348, + "gamma_dfa_per_layer": [ + 0.29988259077072144, + -0.0496492013335228, + -0.08479931950569153, + -0.0176825113594532 + ], + "acc_eval": 0.1484375, + "loss_eval": 8231.34765625, + "epoch": 36 + }, + { + "hidden_norms": [ + 4624.63720703125, + 951948.25, + 1092683.875, + 1196542.75, + 2542183.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002538386033847928, + 0.0007714434177614748, + 0.0007710265927016735, + 0.0007713963277637959, + 0.0007713483064435422 + ], + "gamma_dfa": 0.04740711580961943, + "gamma_dfa_per_layer": [ + 0.33979880809783936, + -0.04041346162557602, + -0.07300114631652832, + -0.03675573691725731 + ], + "acc_eval": 0.1923828125, + "loss_eval": 8949.130859375, + "epoch": 37 + }, + { + "hidden_norms": [ + 4807.11767578125, + 1054507.625, + 1214753.0, + 1323814.0, + 2764538.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0027727719862014055, + 0.000796200183685869, + 0.0007976335473358631, + 0.0007973454194143414, + 0.0007971985614858568 + ], + "gamma_dfa": 0.08554775826632977, + "gamma_dfa_per_layer": [ + 0.5049943923950195, + -0.037710923701524734, + -0.07092456519603729, + -0.05416787043213844 + ], + "acc_eval": 0.1162109375, + "loss_eval": 12713.4443359375, + "epoch": 38 + }, + { + "hidden_norms": [ + 4955.41943359375, + 1174053.875, + 1354818.125, + 1476400.375, + 3014463.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020058690570294857, + 0.0008079316467046738, + 0.0008077211095951498, + 0.0008079909021034837, + 0.000808066048193723 + ], + "gamma_dfa": -0.01097937673330307, + "gamma_dfa_per_layer": [ + 0.23371317982673645, + -0.07769355922937393, + -0.08009498566389084, + -0.11984214186668396 + ], + "acc_eval": 0.169921875, + "loss_eval": 5398.2822265625, + "epoch": 39 + }, + { + "hidden_norms": [ + 5098.02978515625, + 1282560.25, + 1488493.125, + 1621443.25, + 3242451.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017661951715126634, + 0.0007956374902278185, + 0.0007964695687405765, + 0.0007961427327245474, + 0.0007956251502037048 + ], + "gamma_dfa": 0.022673148661851883, + "gamma_dfa_per_layer": [ + 0.3096145689487457, + -0.05532063543796539, + -0.08393190801143646, + -0.07966943085193634 + ], + "acc_eval": 0.185546875, + "loss_eval": 4639.80908203125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5239.9326171875, + 1391390.625, + 1615340.375, + 1765558.375, + 3480115.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020867532584816217, + 0.0007667955360375345, + 0.0007673996733501554, + 0.0007673778454773128, + 0.0007672442006878555 + ], + "gamma_dfa": 0.0395392719656229, + "gamma_dfa_per_layer": [ + 0.33367329835891724, + -0.043648943305015564, + -0.055444151163101196, + -0.07642311602830887 + ], + "acc_eval": 0.234375, + "loss_eval": 9990.30859375, + "epoch": 41 + }, + { + "hidden_norms": [ + 5359.44677734375, + 1521280.0, + 1767789.625, + 1930907.75, + 3750866.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017118212999776006, + 0.0007934573804959655, + 0.0007942463853396475, + 0.000793949409853667, + 0.0007934118038974702 + ], + "gamma_dfa": 0.03361810464411974, + "gamma_dfa_per_layer": [ + 0.3103788495063782, + -0.03702692314982414, + -0.055835530161857605, + -0.08304397761821747 + ], + "acc_eval": 0.216796875, + "loss_eval": 9768.205078125, + "epoch": 42 + }, + { + "hidden_norms": [ + 5546.62451171875, + 1660698.625, + 1925789.375, + 2096456.25, + 4028953.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017267497023567557, + 0.000821329711470753, + 0.0008239842718467116, + 0.0008229895029217005, + 0.0008229521918110549 + ], + "gamma_dfa": 0.029660841450095177, + "gamma_dfa_per_layer": [ + 0.35288333892822266, + -0.043948374688625336, + -0.0895853042602539, + -0.10070629417896271 + ], + "acc_eval": 0.1884765625, + "loss_eval": 8935.0380859375, + "epoch": 43 + }, + { + "hidden_norms": [ + 5664.30810546875, + 1784317.875, + 2078188.375, + 2264432.75, + 4288914.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022900900803506374, + 0.0007636325899511576, + 0.0007642185082659125, + 0.0007641956908628345, + 0.0007639650139026344 + ], + "gamma_dfa": 0.06175872636958957, + "gamma_dfa_per_layer": [ + 0.4067830443382263, + -0.03052734024822712, + -0.06545087695121765, + -0.06376992166042328 + ], + "acc_eval": 0.2197265625, + "loss_eval": 8287.39453125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5794.2666015625, + 1915382.125, + 2237977.75, + 2434797.75, + 4568056.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001793600502423942, + 0.0008144167950376868, + 0.0008172079687938094, + 0.0008157116826623678, + 0.0008155000978149474 + ], + "gamma_dfa": 0.034024693071842194, + "gamma_dfa_per_layer": [ + 0.35199591517448425, + -0.03579515218734741, + -0.09812411665916443, + -0.08197787404060364 + ], + "acc_eval": 0.1806640625, + "loss_eval": 8560.4384765625, + "epoch": 45 + }, + { + "hidden_norms": [ + 5928.12158203125, + 2057562.625, + 2403872.5, + 2624509.5, + 4865204.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001855076989158988, + 0.0007629086030647159, + 0.0007635788642801344, + 0.0007633934146724641, + 0.0007630206528119743 + ], + "gamma_dfa": 0.023082666099071503, + "gamma_dfa_per_layer": [ + 0.27648454904556274, + -0.05024096742272377, + -0.0845799595117569, + -0.049332957714796066 + ], + "acc_eval": 0.197265625, + "loss_eval": 10714.77734375, + "epoch": 46 + }, + { + "hidden_norms": [ + 6079.8232421875, + 2190046.5, + 2564464.5, + 2797927.0, + 5132383.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015576905570924282, + 0.0007896191673353314, + 0.0007904896046966314, + 0.0007902018842287362, + 0.0007895485614426434 + ], + "gamma_dfa": 0.03866780921816826, + "gamma_dfa_per_layer": [ + 0.37201371788978577, + -0.049719154834747314, + -0.07755836844444275, + -0.09006495773792267 + ], + "acc_eval": 0.19140625, + "loss_eval": 7322.5205078125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6184.03369140625, + 2339567.0, + 2744136.25, + 2990721.25, + 5426845.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020522314589470625, + 0.0007883926737122238, + 0.0007893759175203741, + 0.0007890417473390698, + 0.0007883401704020798 + ], + "gamma_dfa": 0.021758251823484898, + "gamma_dfa_per_layer": [ + 0.2855323553085327, + -0.04375234618782997, + -0.07049872726202011, + -0.08424827456474304 + ], + "acc_eval": 0.2080078125, + "loss_eval": 13975.05859375, + "epoch": 48 + }, + { + "hidden_norms": [ + 6295.5458984375, + 2477445.75, + 2917469.0, + 3179694.0, + 5727252.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002105356426909566, + 0.0008074102224782109, + 0.0008063287241384387, + 0.000806407246273011, + 0.0008067074231803417 + ], + "gamma_dfa": 0.0267162024974823, + "gamma_dfa_per_layer": [ + 0.30986034870147705, + -0.05209521949291229, + -0.09783680737018585, + -0.05306351184844971 + ], + "acc_eval": 0.1435546875, + "loss_eval": 9590.544921875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6367.55029296875, + 2638468.75, + 3095811.75, + 3362978.75, + 6030941.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015475827967748046, + 0.0008064319263212383, + 0.0008070095209404826, + 0.0008065010770224035, + 0.0008065410074777901 + ], + "gamma_dfa": 0.00636688619852066, + "gamma_dfa_per_layer": [ + 0.29843205213546753, + -0.03980886936187744, + -0.06682014465332031, + -0.16633549332618713 + ], + "acc_eval": 0.11328125, + "loss_eval": 12254.064453125, + "epoch": 50 + }, + { + "hidden_norms": [ + 6482.18798828125, + 2769282.5, + 3257572.75, + 3548043.5, + 6284645.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0022430147510021925, + 0.0008079760009422898, + 0.000807179429102689, + 0.0008071344927884638, + 0.0008072732598520815 + ], + "gamma_dfa": 0.04464401211589575, + "gamma_dfa_per_layer": [ + 0.3536185026168823, + -0.02255946770310402, + -0.07369404286146164, + -0.07878894358873367 + ], + "acc_eval": 0.181640625, + "loss_eval": 10079.115234375, + "epoch": 51 + }, + { + "hidden_norms": [ + 6566.8623046875, + 2899506.0, + 3420720.5, + 3728966.75, + 6555012.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001695870072580874, + 0.000820032088086009, + 0.0008200806332752109, + 0.0008201819728128612, + 0.0008201953023672104 + ], + "gamma_dfa": 0.034856872633099556, + "gamma_dfa_per_layer": [ + 0.3895777463912964, + -0.057720690965652466, + -0.08937396109104156, + -0.10305560380220413 + ], + "acc_eval": 0.1181640625, + "loss_eval": 10401.4013671875, + "epoch": 52 + }, + { + "hidden_norms": [ + 6618.705078125, + 3056073.5, + 3608076.25, + 3938206.0, + 6870646.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014620226575061679, + 0.000811390345916152, + 0.0008111409260891378, + 0.000811099074780941, + 0.000811324454843998 + ], + "gamma_dfa": 0.002492595463991165, + "gamma_dfa_per_layer": [ + 0.2934489846229553, + -0.07660828530788422, + -0.0814061164855957, + -0.12546420097351074 + ], + "acc_eval": 0.16796875, + "loss_eval": 11906.7060546875, + "epoch": 53 + }, + { + "hidden_norms": [ + 6674.03759765625, + 3201735.0, + 3787927.75, + 4133561.75, + 7173546.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015491953818127513, + 0.0007825249340385199, + 0.0007832346600480378, + 0.0007830507238395512, + 0.0007823925698176026 + ], + "gamma_dfa": 0.054443607572466135, + "gamma_dfa_per_layer": [ + 0.38785266876220703, + -0.022086789831519127, + -0.062120988965034485, + -0.08587045967578888 + ], + "acc_eval": 0.2373046875, + "loss_eval": 9465.3525390625, + "epoch": 54 + }, + { + "hidden_norms": [ + 6740.52392578125, + 3338670.5, + 3953341.75, + 4315309.5, + 7447204.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015645271632820368, + 0.0007820724858902395, + 0.0007820809260010719, + 0.0007819690508767962, + 0.0007819557213224471 + ], + "gamma_dfa": 0.027317455038428307, + "gamma_dfa_per_layer": [ + 0.3320838212966919, + -0.06272841989994049, + -0.06253603100776672, + -0.09754955023527145 + ], + "acc_eval": 0.1923828125, + "loss_eval": 9605.2587890625, + "epoch": 55 + }, + { + "hidden_norms": [ + 6826.42578125, + 3488233.5, + 4125392.0, + 4514242.0, + 7747655.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018625661032274365, + 0.0008403572137467563, + 0.0008396300836466253, + 0.0008392629097215831, + 0.000840048654936254 + ], + "gamma_dfa": 0.018042685464024544, + "gamma_dfa_per_layer": [ + 0.34575170278549194, + -0.061284519731998444, + -0.08629278838634491, + -0.12600365281105042 + ], + "acc_eval": 0.1494140625, + "loss_eval": 13453.193359375, + "epoch": 56 + }, + { + "hidden_norms": [ + 6878.60009765625, + 3647417.5, + 4303500.5, + 4707215.0, + 8039602.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001495232223533094, + 0.0008112883078865707, + 0.0008119228295981884, + 0.0008115706732496619, + 0.0008112648501992226 + ], + "gamma_dfa": 0.025581182446330786, + "gamma_dfa_per_layer": [ + 0.301077663898468, + -0.015085713937878609, + -0.07233025878667831, + -0.11133696138858795 + ], + "acc_eval": 0.1513671875, + "loss_eval": 10446.5498046875, + "epoch": 57 + }, + { + "hidden_norms": [ + 6956.30126953125, + 3782040.0, + 4474453.5, + 4889139.0, + 8311892.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.001576881273649633, + 0.0008043631678447127, + 0.0008050674805417657, + 0.0008046348229981959, + 0.0008046681759878993 + ], + "gamma_dfa": 0.005857756361365318, + "gamma_dfa_per_layer": [ + 0.28321602940559387, + -0.03702875226736069, + -0.06707675755023956, + -0.15567949414253235 + ], + "acc_eval": 0.1484375, + "loss_eval": 6591.0849609375, + "epoch": 58 + }, + { + "hidden_norms": [ + 7021.955078125, + 3911149.5, + 4636672.0, + 5064123.0, + 8571758.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002099651610478759, + 0.0008183405152522027, + 0.0008207465871237218, + 0.0008196401176974177, + 0.000819449604023248 + ], + "gamma_dfa": 0.006074780598282814, + "gamma_dfa_per_layer": [ + 0.2577749490737915, + -0.05066239833831787, + -0.06501314789056778, + -0.1178002804517746 + ], + "acc_eval": 0.2109375, + "loss_eval": 7962.04443359375, + "epoch": 59 + }, + { + "hidden_norms": [ + 7101.7373046875, + 4061103.5, + 4820611.0, + 5257086.0, + 8861818.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018932655220851302, + 0.0008025900460779667, + 0.0008032865589484572, + 0.000802954426035285, + 0.0008029173477552831 + ], + "gamma_dfa": 0.020984639413654804, + "gamma_dfa_per_layer": [ + 0.3329803943634033, + -0.03559138998389244, + -0.06842450797557831, + -0.14502593874931335 + ], + "acc_eval": 0.1650390625, + "loss_eval": 8638.353515625, + "epoch": 60 + }, + { + "hidden_norms": [ + 7120.71240234375, + 4194965.0, + 4982087.0, + 5430094.5, + 9121286.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015255591133609414, + 0.0007772985845804214, + 0.0007780406740494072, + 0.0007778139552101493, + 0.000777201319579035 + ], + "gamma_dfa": 0.0210345396772027, + "gamma_dfa_per_layer": [ + 0.3191820979118347, + -0.05588069185614586, + -0.0712573379278183, + -0.10790590941905975 + ], + "acc_eval": 0.22265625, + "loss_eval": 8870.3212890625, + "epoch": 61 + }, + { + "hidden_norms": [ + 7166.24462890625, + 4326872.0, + 5144769.0, + 5605003.0, + 9390572.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019027154194191098, + 0.000822498113848269, + 0.0008225358324125409, + 0.0008226112113334239, + 0.0008225055644288659 + ], + "gamma_dfa": 0.01758619397878647, + "gamma_dfa_per_layer": [ + 0.29208946228027344, + -0.046764522790908813, + -0.10779638588428497, + -0.06718377768993378 + ], + "acc_eval": 0.154296875, + "loss_eval": 18607.9921875, + "epoch": 62 + }, + { + "hidden_norms": [ + 7173.86865234375, + 4454190.5, + 5300661.5, + 5764316.0, + 9633685.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017527258023619652, + 0.0008042250410653651, + 0.0008040837710723281, + 0.0008041510009206831, + 0.0008041784167289734 + ], + "gamma_dfa": 0.04197401413694024, + "gamma_dfa_per_layer": [ + 0.31714165210723877, + -0.025468191131949425, + -0.05378583073616028, + -0.0699915736913681 + ], + "acc_eval": 0.1826171875, + "loss_eval": 10768.23046875, + "epoch": 63 + }, + { + "hidden_norms": [ + 7200.1064453125, + 4569527.5, + 5448454.0, + 5924151.0, + 9865530.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016467028763145208, + 0.0007759482250548899, + 0.0007759520667605102, + 0.0007758319843560457, + 0.0007757880375720561 + ], + "gamma_dfa": 0.019114631228148937, + "gamma_dfa_per_layer": [ + 0.3342781364917755, + -0.05670151486992836, + -0.0891423374414444, + -0.111975759267807 + ], + "acc_eval": 0.1865234375, + "loss_eval": 9049.12109375, + "epoch": 64 + }, + { + "hidden_norms": [ + 7198.30419921875, + 4679779.5, + 5583911.5, + 6073903.5, + 10075961.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015529918018728495, + 0.0008276477456092834, + 0.0008274043793790042, + 0.0008273764979094267, + 0.00082727539120242 + ], + "gamma_dfa": 0.012379471212625504, + "gamma_dfa_per_layer": [ + 0.33610183000564575, + -0.0668979212641716, + -0.09369023889303207, + -0.12599578499794006 + ], + "acc_eval": 0.1533203125, + "loss_eval": 9929.3125, + "epoch": 65 + }, + { + "hidden_norms": [ + 7191.220703125, + 4787683.5, + 5730170.5, + 6223255.0, + 10287596.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.002624395303428173, + 0.0008026033756323159, + 0.0008024688577279449, + 0.0008025110582821071, + 0.000802531314548105 + ], + "gamma_dfa": 0.041071049869060516, + "gamma_dfa_per_layer": [ + 0.3911614418029785, + -0.03441564738750458, + -0.07384517788887024, + -0.11861641705036163 + ], + "acc_eval": 0.1669921875, + "loss_eval": 9811.68359375, + "epoch": 66 + }, + { + "hidden_norms": [ + 7184.458984375, + 4895536.0, + 5864442.5, + 6369317.5, + 10509902.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016685851151123643, + 0.0007737133419141173, + 0.0007737109554000199, + 0.0007736092084087431, + 0.0007735762046650052 + ], + "gamma_dfa": 0.03856207150965929, + "gamma_dfa_per_layer": [ + 0.3347627520561218, + -0.05478603392839432, + -0.09395486861467361, + -0.03177356347441673 + ], + "acc_eval": 0.15625, + "loss_eval": 7798.90283203125, + "epoch": 67 + }, + { + "hidden_norms": [ + 7166.86083984375, + 4995598.0, + 5984263.5, + 6498221.0, + 10708319.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013723000884056091, + 0.0008002148242667317, + 0.0007998319924809039, + 0.0007997409556992352, + 0.0008000954985618591 + ], + "gamma_dfa": 0.024815326556563377, + "gamma_dfa_per_layer": [ + 0.3238403797149658, + -0.05496574938297272, + -0.0969959944486618, + -0.07261732965707779 + ], + "acc_eval": 0.1552734375, + "loss_eval": 6333.236328125, + "epoch": 68 + }, + { + "hidden_norms": [ + 7156.17236328125, + 5093715.5, + 6108802.5, + 6629623.5, + 10896864.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001458030310459435, + 0.0007727351039648056, + 0.0007727306219749153, + 0.0007726310286670923, + 0.0007726071053184569 + ], + "gamma_dfa": 0.018785862252116203, + "gamma_dfa_per_layer": [ + 0.31862637400627136, + -0.06633786112070084, + -0.07025538384914398, + -0.10688968002796173 + ], + "acc_eval": 0.2060546875, + "loss_eval": 5966.35400390625, + "epoch": 69 + }, + { + "hidden_norms": [ + 7127.96875, + 5203388.5, + 6229672.5, + 6756540.5, + 11105730.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018821367993950844, + 0.000799131637904793, + 0.0007999413646757603, + 0.0007995158084668219, + 0.0007994744228199124 + ], + "gamma_dfa": 0.033654400147497654, + "gamma_dfa_per_layer": [ + 0.3480244278907776, + -0.0470522977411747, + -0.08066973835229874, + -0.08568479120731354 + ], + "acc_eval": 0.21484375, + "loss_eval": 8679.373046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 7127.84326171875, + 5291613.5, + 6343081.5, + 6873492.5, + 11283083.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013305873144418001, + 0.0008001387468539178, + 0.0007999925292097032, + 0.0008000367670319974, + 0.0008000454981811345 + ], + "gamma_dfa": 0.026681816205382347, + "gamma_dfa_per_layer": [ + 0.33079925179481506, + -0.04635504633188248, + -0.060725681483745575, + -0.11699125915765762 + ], + "acc_eval": 0.2001953125, + "loss_eval": 7321.45654296875, + "epoch": 71 + }, + { + "hidden_norms": [ + 7118.43115234375, + 5399320.5, + 6461637.5, + 6995765.0, + 11479911.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0027539313305169344, + 0.0007441912894137204, + 0.000744749209843576, + 0.0007447105017490685, + 0.0007443142239935696 + ], + "gamma_dfa": 0.0691906102001667, + "gamma_dfa_per_layer": [ + 0.4505346715450287, + -0.03461931645870209, + -0.07136575877666473, + -0.06778715550899506 + ], + "acc_eval": 0.16015625, + "loss_eval": 10899.68359375, + "epoch": 72 + }, + { + "hidden_norms": [ + 7104.958984375, + 5484605.5, + 6570873.0, + 7105816.5, + 11646348.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011745812371373177, + 0.000797195709310472, + 0.0007963370881043375, + 0.0007962601375766098, + 0.0007965530967339873 + ], + "gamma_dfa": 0.016523053869605064, + "gamma_dfa_per_layer": [ + 0.3157949447631836, + -0.05805324763059616, + -0.0915503203868866, + -0.10009916126728058 + ], + "acc_eval": 0.185546875, + "loss_eval": 4549.11328125, + "epoch": 73 + }, + { + "hidden_norms": [ + 7046.66552734375, + 5575192.0, + 6682143.0, + 7216392.5, + 11814821.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014973932411521673, + 0.0007987518329173326, + 0.000798598921392113, + 0.0007986334967426956, + 0.00079863186692819 + ], + "gamma_dfa": 0.006323261186480522, + "gamma_dfa_per_layer": [ + 0.3186365067958832, + -0.07689585536718369, + -0.08955803513526917, + -0.12688957154750824 + ], + "acc_eval": 0.1845703125, + "loss_eval": 5873.4677734375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6997.1630859375, + 5656117.0, + 6779526.0, + 7314913.5, + 11969090.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014266286743804812, + 0.0007692458457313478, + 0.0007703236187808216, + 0.0007699450361542404, + 0.0007692069630138576 + ], + "gamma_dfa": 0.04031236469745636, + "gamma_dfa_per_layer": [ + 0.3853839635848999, + -0.054634347558021545, + -0.08128909766674042, + -0.0882110595703125 + ], + "acc_eval": 0.1953125, + "loss_eval": 4200.4296875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6970.02099609375, + 5731178.0, + 6870747.5, + 7405309.0, + 12120166.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013568063732236624, + 0.0007682641153223813, + 0.000768258236348629, + 0.0007681549177505076, + 0.0007681125425733626 + ], + "gamma_dfa": 0.04615131672471762, + "gamma_dfa_per_layer": [ + 0.3717971444129944, + -0.05474664270877838, + -0.05301285162568092, + -0.07943238317966461 + ], + "acc_eval": 0.1943359375, + "loss_eval": 3897.47607421875, + "epoch": 76 + }, + { + "hidden_norms": [ + 6942.25, + 5793439.5, + 6946580.5, + 7481325.5, + 12242140.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011983924778178334, + 0.0007509839488193393, + 0.0007508245762437582, + 0.0007505225948989391, + 0.0007505776011385024 + ], + "gamma_dfa": 0.03128352388739586, + "gamma_dfa_per_layer": [ + 0.31842517852783203, + -0.03316807746887207, + -0.06335921585559845, + -0.09676378965377808 + ], + "acc_eval": 0.2685546875, + "loss_eval": 3095.559814453125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6881.80810546875, + 5850806.5, + 7011394.5, + 7546550.5, + 12350002.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011590005597099662, + 0.0007501945947296917, + 0.0007500603678636253, + 0.0007497719489037991, + 0.0007498189806938171 + ], + "gamma_dfa": 0.01806825865060091, + "gamma_dfa_per_layer": [ + 0.313739538192749, + -0.047393035143613815, + -0.07615944743156433, + -0.11791402101516724 + ], + "acc_eval": 0.205078125, + "loss_eval": 3942.599853515625, + "epoch": 78 + }, + { + "hidden_norms": [ + 6837.1533203125, + 5897771.5, + 7073526.0, + 7607611.5, + 12444407.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001163899782113731, + 0.0007416060543619096, + 0.0007419964531436563, + 0.0007419841131195426, + 0.0007417319575324655 + ], + "gamma_dfa": 0.03044590726494789, + "gamma_dfa_per_layer": [ + 0.30829477310180664, + -0.03881052881479263, + -0.07340054214000702, + -0.07430007308721542 + ], + "acc_eval": 0.2939453125, + "loss_eval": 2950.356689453125, + "epoch": 79 + }, + { + "hidden_norms": [ + 6806.5322265625, + 5963679.5, + 7147126.0, + 7679290.5, + 12557362.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012401024578139186, + 0.0007945983088575304, + 0.0007953918538987637, + 0.0007950742146931589, + 0.0007950655417516828 + ], + "gamma_dfa": -0.007623729296028614, + "gamma_dfa_per_layer": [ + 0.24250081181526184, + -0.04293825104832649, + -0.07043637335300446, + -0.15962110459804535 + ], + "acc_eval": 0.14453125, + "loss_eval": 3910.8994140625, + "epoch": 80 + }, + { + "hidden_norms": [ + 6782.47607421875, + 5997089.0, + 7185317.5, + 7719894.5, + 12633342.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012797614326700568, + 0.0007944905664771795, + 0.0007951240986585617, + 0.0007947491831146181, + 0.0007947032572701573 + ], + "gamma_dfa": 0.03983990382403135, + "gamma_dfa_per_layer": [ + 0.35600101947784424, + -0.023466136306524277, + -0.07362768054008484, + -0.09954758733510971 + ], + "acc_eval": 0.193359375, + "loss_eval": 3587.8212890625, + "epoch": 81 + }, + { + "hidden_norms": [ + 6723.70654296875, + 6042461.0, + 7238613.0, + 7771656.5, + 12718382.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012927292846143246, + 0.000765398726798594, + 0.0007653928478248417, + 0.0007653140346519649, + 0.0007652752683497965 + ], + "gamma_dfa": 0.03482971154153347, + "gamma_dfa_per_layer": [ + 0.34003761410713196, + -0.05069781839847565, + -0.05738937109708786, + -0.09263157844543457 + ], + "acc_eval": 0.23046875, + "loss_eval": 2805.9716796875, + "epoch": 82 + }, + { + "hidden_norms": [ + 6669.96435546875, + 6085424.0, + 7288909.5, + 7821635.0, + 12799732.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011438996298238635, + 0.000740286021027714, + 0.0007406995864585042, + 0.0007406825898215175, + 0.0007403898634947836 + ], + "gamma_dfa": 0.03725961223244667, + "gamma_dfa_per_layer": [ + 0.32540398836135864, + -0.04895278066396713, + -0.07243393361568451, + -0.05497882515192032 + ], + "acc_eval": 0.2373046875, + "loss_eval": 2089.305908203125, + "epoch": 83 + }, + { + "hidden_norms": [ + 6611.064453125, + 6121666.0, + 7328789.5, + 7859580.5, + 12864450.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010610584868118167, + 0.0007183317793533206, + 0.0007201047264970839, + 0.0007199530373327434, + 0.0007199217798188329 + ], + "gamma_dfa": 0.03143393341451883, + "gamma_dfa_per_layer": [ + 0.2940787076950073, + -0.035069357603788376, + -0.0604243278503418, + -0.07284928858280182 + ], + "acc_eval": 0.3076171875, + "loss_eval": 1459.638916015625, + "epoch": 84 + }, + { + "hidden_norms": [ + 6564.220703125, + 6147971.0, + 7358806.5, + 7888597.5, + 12918884.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001103258109651506, + 0.0007199789397418499, + 0.0007205012370832264, + 0.0007201395928859711, + 0.000719686911907047 + ], + "gamma_dfa": 0.02568601444363594, + "gamma_dfa_per_layer": [ + 0.3047623038291931, + -0.05378233641386032, + -0.07432089745998383, + -0.0739150121808052 + ], + "acc_eval": 0.2607421875, + "loss_eval": 1398.54931640625, + "epoch": 85 + }, + { + "hidden_norms": [ + 6523.052734375, + 6163991.5, + 7377848.0, + 7906464.0, + 12959929.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010483200894668698, + 0.0007394760614261031, + 0.0007398684392683208, + 0.0007398549350909889, + 0.0007395940483547747 + ], + "gamma_dfa": 0.028113607317209244, + "gamma_dfa_per_layer": [ + 0.2919086515903473, + -0.04769399017095566, + -0.06982402503490448, + -0.06193620711565018 + ], + "acc_eval": 0.294921875, + "loss_eval": 1247.0958251953125, + "epoch": 86 + }, + { + "hidden_norms": [ + 6480.38134765625, + 6177022.5, + 7396143.5, + 7924145.0, + 12992374.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011187344789505005, + 0.0007568535511381924, + 0.0007568564033135772, + 0.0007567762513644993, + 0.0007568445871584117 + ], + "gamma_dfa": 0.029856184497475624, + "gamma_dfa_per_layer": [ + 0.32282522320747375, + -0.05086465924978256, + -0.06785817444324493, + -0.08467765152454376 + ], + "acc_eval": 0.267578125, + "loss_eval": 1623.752197265625, + "epoch": 87 + }, + { + "hidden_norms": [ + 6430.5322265625, + 6198352.0, + 7419959.0, + 7946585.0, + 13023161.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010678176768124104, + 0.0007456489838659763, + 0.0007455460145138204, + 0.0007452794816344976, + 0.000745359982829541 + ], + "gamma_dfa": 0.019207272678613663, + "gamma_dfa_per_layer": [ + 0.28421786427497864, + -0.04965135455131531, + -0.07151313126087189, + -0.08622428774833679 + ], + "acc_eval": 0.291015625, + "loss_eval": 1205.84716796875, + "epoch": 88 + }, + { + "hidden_norms": [ + 6396.35009765625, + 6216262.0, + 7436144.0, + 7961794.0, + 13045224.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010295198298990726, + 0.0007388790836557746, + 0.0007392680854536593, + 0.000739254173822701, + 0.000738998525775969 + ], + "gamma_dfa": 0.02955447882413864, + "gamma_dfa_per_layer": [ + 0.2954120337963104, + -0.046598292887210846, + -0.069032222032547, + -0.061563603579998016 + ], + "acc_eval": 0.298828125, + "loss_eval": 1123.675048828125, + "epoch": 89 + }, + { + "hidden_norms": [ + 6366.1259765625, + 6230148.5, + 7451647.0, + 7975150.0, + 13064555.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010110137518495321, + 0.0007565211853943765, + 0.0007565242704004049, + 0.0007563806138932705, + 0.0007564250845462084 + ], + "gamma_dfa": 0.011881772428750992, + "gamma_dfa_per_layer": [ + 0.2693521976470947, + -0.04482053220272064, + -0.07126723229885101, + -0.1057373434305191 + ], + "acc_eval": 0.240234375, + "loss_eval": 1118.5343017578125, + "epoch": 90 + }, + { + "hidden_norms": [ + 6341.41796875, + 6233793.0, + 7457683.5, + 7981064.5, + 13074395.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010112811578437686, + 0.0007385196513496339, + 0.0007389356032945216, + 0.000738917791750282, + 0.0007386352517642081 + ], + "gamma_dfa": 0.0292903920635581, + "gamma_dfa_per_layer": [ + 0.28946253657341003, + -0.033900823444128036, + -0.06436440348625183, + -0.07403574138879776 + ], + "acc_eval": 0.306640625, + "loss_eval": 1028.103515625, + "epoch": 91 + }, + { + "hidden_norms": [ + 6319.90185546875, + 6241203.5, + 7463285.5, + 7986068.5, + 13084655.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010045261587947607, + 0.0007187838782556355, + 0.0007187584415078163, + 0.0007185733411461115, + 0.0007185345166362822 + ], + "gamma_dfa": 0.02470484748482704, + "gamma_dfa_per_layer": [ + 0.2734910249710083, + -0.0429413765668869, + -0.06623440980911255, + -0.06549584865570068 + ], + "acc_eval": 0.3271484375, + "loss_eval": 879.8018798828125, + "epoch": 92 + }, + { + "hidden_norms": [ + 6299.453125, + 6240490.0, + 7464953.0, + 7988364.0, + 13086769.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010041827335953712, + 0.0007186768343672156, + 0.0007186515722423792, + 0.0007184677524492145, + 0.0007184296264313161 + ], + "gamma_dfa": 0.022233721800148487, + "gamma_dfa_per_layer": [ + 0.2633175849914551, + -0.04053181782364845, + -0.06492872536182404, + -0.06892215460538864 + ], + "acc_eval": 0.322265625, + "loss_eval": 871.9059448242188, + "epoch": 93 + }, + { + "hidden_norms": [ + 6280.70068359375, + 6248322.5, + 7472246.5, + 7994814.0, + 13094255.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000998231815174222, + 0.0007185792201198637, + 0.0007185565191321075, + 0.0007183970883488655, + 0.0007183645502664149 + ], + "gamma_dfa": 0.02329079993069172, + "gamma_dfa_per_layer": [ + 0.27325427532196045, + -0.04209248721599579, + -0.0645713210105896, + -0.07342726737260818 + ], + "acc_eval": 0.326171875, + "loss_eval": 876.770263671875, + "epoch": 94 + }, + { + "hidden_norms": [ + 6259.79541015625, + 6251884.0, + 7473855.0, + 7995730.5, + 13095582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.001000022399239242, + 0.0007185632712207735, + 0.0007185383583419025, + 0.0007183536072261631, + 0.0007183143752627075 + ], + "gamma_dfa": 0.01565107237547636, + "gamma_dfa_per_layer": [ + 0.26019614934921265, + -0.042762644588947296, + -0.06100854650139809, + -0.09382066875696182 + ], + "acc_eval": 0.31640625, + "loss_eval": 847.3887939453125, + "epoch": 95 + }, + { + "hidden_norms": [ + 6250.6630859375, + 6252472.0, + 7474356.5, + 7996154.0, + 13096382.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009951539104804397, + 0.000718452560249716, + 0.0007184353889897466, + 0.0007182956906035542, + 0.0007182672270573676 + ], + "gamma_dfa": 0.01607441157102585, + "gamma_dfa_per_layer": [ + 0.2622864246368408, + -0.04606177657842636, + -0.06511188298463821, + -0.08681511878967285 + ], + "acc_eval": 0.3125, + "loss_eval": 820.6640625, + "epoch": 96 + }, + { + "hidden_norms": [ + 6245.84228515625, + 6252136.5, + 7473891.5, + 7995642.0, + 13095543.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009887836640700698, + 0.0007184472633525729, + 0.0007184235146269202, + 0.0007182589615695179, + 0.0007182253757491708 + ], + "gamma_dfa": 0.01632563304156065, + "gamma_dfa_per_layer": [ + 0.2587689757347107, + -0.041752640157938004, + -0.06282168626785278, + -0.08889211714267731 + ], + "acc_eval": 0.3271484375, + "loss_eval": 794.9835815429688, + "epoch": 97 + }, + { + "hidden_norms": [ + 6243.275390625, + 6252353.5, + 7474147.5, + 7995911.0, + 13095907.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010000880574807525, + 0.0007184495334513485, + 0.0007184281130321324, + 0.0007182535482570529, + 0.0007182166446000338 + ], + "gamma_dfa": 0.01966456975787878, + "gamma_dfa_per_layer": [ + 0.26670968532562256, + -0.04189712926745415, + -0.06575733423233032, + -0.08039694279432297 + ], + "acc_eval": 0.3173828125, + "loss_eval": 809.9351196289062, + "epoch": 98 + }, + { + "hidden_norms": [ + 6242.01708984375, + 6252447.5, + 7474218.0, + 7995986.5, + 13096086.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009963318007066846, + 0.000718410883564502, + 0.000718392024282366, + 0.0007182427798397839, + 0.0007182121044024825 + ], + "gamma_dfa": 0.017472295090556145, + "gamma_dfa_per_layer": [ + 0.26097655296325684, + -0.042458876967430115, + -0.06487732380628586, + -0.08375117182731628 + ], + "acc_eval": 0.326171875, + "loss_eval": 790.8746337890625, + "epoch": 99 + }, + { + "hidden_norms": [ + 6241.6884765625, + 6252462.0, + 7474227.5, + 7995996.0, + 13096118.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009859646670520306, + 0.0007156162173487246, + 0.0007178352097980678, + 0.0007174411439336836, + 0.0007168283336795866 + ], + "gamma_dfa": 0.01725842524319887, + "gamma_dfa_per_layer": [ + 0.25597745180130005, + -0.041728582233190536, + -0.06328003108501434, + -0.08193513751029968 + ], + "acc_eval": 0.3359375, + "loss_eval": 790.8336181640625, + "epoch": 100 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_synth_v1/run_a1.0_s42.log b/results/snapshot_synth_v1/run_a1.0_s42.log new file mode 100644 index 0000000..d1e834a --- /dev/null +++ b/results/snapshot_synth_v1/run_a1.0_s42.log @@ -0,0 +1,44 @@ +device=cuda:0, alpha=1.0, depth=4, d_hidden=128, epochs=80, seed=42 +train: torch.Size([12800, 128]), test eval buffer: torch.Size([2000, 128]) + +=== BP training === + [BP] Ep 0: ||h_L||=1.140e+01 ||g||=2.816e-04 acc=0.0845 + [BP] Ep 1: ||h_L||=1.393e+01 ||g||=3.616e-04 acc=0.7095 + [BP] Ep 5: ||h_L||=2.067e+01 ||g||=2.195e-04 acc=0.7855 + [BP] Ep 10: ||h_L||=2.332e+01 ||g||=1.576e-04 acc=0.7915 + [BP] Ep 15: ||h_L||=2.609e+01 ||g||=9.301e-05 acc=0.8000 + [BP] Ep 20: ||h_L||=2.880e+01 ||g||=4.764e-05 acc=0.7950 + [BP] Ep 25: ||h_L||=3.096e+01 ||g||=3.036e-05 acc=0.7995 + [BP] Ep 30: ||h_L||=3.235e+01 ||g||=1.972e-05 acc=0.7975 + [BP] Ep 35: ||h_L||=3.329e+01 ||g||=1.527e-05 acc=0.8000 + [BP] Ep 40: ||h_L||=3.398e+01 ||g||=1.181e-05 acc=0.7975 + [BP] Ep 45: ||h_L||=3.449e+01 ||g||=1.028e-05 acc=0.7980 + [BP] Ep 50: ||h_L||=3.489e+01 ||g||=9.180e-06 acc=0.7980 + [BP] Ep 55: ||h_L||=3.516e+01 ||g||=8.594e-06 acc=0.7975 + [BP] Ep 60: ||h_L||=3.538e+01 ||g||=8.124e-06 acc=0.7960 + [BP] Ep 65: ||h_L||=3.553e+01 ||g||=7.551e-06 acc=0.7960 + [BP] Ep 70: ||h_L||=3.561e+01 ||g||=7.443e-06 acc=0.7960 + [BP] Ep 75: ||h_L||=3.565e+01 ||g||=7.344e-06 acc=0.7960 + [BP] Ep 80: ||h_L||=3.565e+01 ||g||=7.323e-06 acc=0.7960 + +=== DFA training === + [DFA] Ep 0: ||h_L||=1.140e+01 ||g||=2.816e-04 acc=0.0845 + [DFA] Ep 1: ||h_L||=1.244e+01 ||g||=2.737e-04 acc=0.3775 γ_dfa=0.1151 + [DFA] Ep 5: ||h_L||=5.072e+01 ||g||=1.943e-04 acc=0.7350 γ_dfa=0.1674 + [DFA] Ep 10: ||h_L||=1.381e+02 ||g||=1.229e-04 acc=0.7175 γ_dfa=0.1132 + [DFA] Ep 15: ||h_L||=2.302e+02 ||g||=1.030e-04 acc=0.7110 γ_dfa=0.0913 + [DFA] Ep 20: ||h_L||=3.213e+02 ||g||=1.112e-04 acc=0.7070 γ_dfa=0.0795 + [DFA] Ep 25: ||h_L||=4.041e+02 ||g||=1.027e-04 acc=0.7035 γ_dfa=0.0709 + [DFA] Ep 30: ||h_L||=4.810e+02 ||g||=1.014e-04 acc=0.6845 γ_dfa=0.0650 + [DFA] Ep 35: ||h_L||=5.483e+02 ||g||=1.116e-04 acc=0.6955 γ_dfa=0.0630 + [DFA] Ep 40: ||h_L||=6.078e+02 ||g||=1.203e-04 acc=0.6880 γ_dfa=0.0578 + [DFA] Ep 45: ||h_L||=6.578e+02 ||g||=1.118e-04 acc=0.6845 γ_dfa=0.0563 + [DFA] Ep 50: ||h_L||=6.988e+02 ||g||=1.262e-04 acc=0.6945 γ_dfa=0.0562 + [DFA] Ep 55: ||h_L||=7.301e+02 ||g||=1.428e-04 acc=0.6720 γ_dfa=0.0559 + [DFA] Ep 60: ||h_L||=7.519e+02 ||g||=1.238e-04 acc=0.6910 γ_dfa=0.0542 + [DFA] Ep 65: ||h_L||=7.678e+02 ||g||=1.230e-04 acc=0.6895 γ_dfa=0.0530 + [DFA] Ep 70: ||h_L||=7.757e+02 ||g||=1.224e-04 acc=0.6950 γ_dfa=0.0530 + [DFA] Ep 75: ||h_L||=7.791e+02 ||g||=1.214e-04 acc=0.6915 γ_dfa=0.0526 + [DFA] Ep 80: ||h_L||=7.797e+02 ||g||=1.203e-04 acc=0.6930 γ_dfa=0.0526 + +Saved results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json diff --git a/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json b/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json new file mode 100644 index 0000000..6ff85e7 --- /dev/null +++ b/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json @@ -0,0 +1,2276 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 11.269571304321289, + 11.290447235107422, + 11.313605308532715, + 11.351215362548828, + 11.398087501525879 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028353024390526116, + 0.0002828188880812377, + 0.00028162598027847707, + 0.0002799496578518301, + 0.0002791006409097463 + ], + "bp_grad_F": [ + 0.012684082612395287, + 0.01264861598610878, + 0.012589854188263416, + 0.012511610053479671, + 0.012471316382288933 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.08450000733137131, + "loss_eval": 2.4790313243865967, + "epoch": 0 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.457883834838867, + 11.697802543640137, + 12.001762390136719, + 12.303658485412598 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004113642207812518, + 0.00037613665335811675, + 0.0003495849668979645, + 0.0003221812949050218, + 0.00025295966770499945 + ], + "bp_grad_F": [ + 0.018967075273394585, + 0.017186719924211502, + 0.015851320698857307, + 0.01445167325437069, + 0.011211601085960865 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5270000100135803, + "loss_eval": 1.4865981340408325, + "epoch": 1 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.734084129333496, + 12.481009483337402, + 13.659913063049316, + 15.730950355529785 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007782558677718043, + 0.0006171928835101426, + 0.0004891889402642846, + 0.00038687532651238143, + 0.000231728219659999 + ], + "bp_grad_F": [ + 0.04103676602244377, + 0.03172670304775238, + 0.024926593527197838, + 0.019472092390060425, + 0.011657902970910072 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6360000371932983, + "loss_eval": 0.965207040309906, + "epoch": 2 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.973358154296875, + 13.411399841308594, + 16.07562255859375, + 20.911983489990234 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008172825910151005, + 0.0005784342647530138, + 0.000417369301430881, + 0.0003010776126757264, + 0.000168764207046479 + ], + "bp_grad_F": [ + 0.05745441094040871, + 0.04039904102683067, + 0.028755735605955124, + 0.020857004448771477, + 0.011488317511975765 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.687000036239624, + "loss_eval": 0.8154960870742798, + "epoch": 3 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.203580856323242, + 14.659997940063477, + 19.929065704345703, + 27.998876571655273 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007437548483721912, + 0.00048129685455933213, + 0.00031908220262266695, + 0.00022696926316712052, + 0.00012886490731034428 + ], + "bp_grad_F": [ + 0.06721046566963196, + 0.043338593095541, + 0.028462719172239304, + 0.019943350926041603, + 0.01114331278949976 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.703000009059906, + "loss_eval": 0.7722610831260681, + "epoch": 4 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.476441383361816, + 16.378177642822266, + 25.748563766479492, + 36.580970764160156 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007116686902008951, + 0.00042677627061493695, + 0.0002665013598743826, + 0.00019125515245832503, + 0.0001178958555101417 + ], + "bp_grad_F": [ + 0.06977967172861099, + 0.04175141453742981, + 0.02600390836596489, + 0.018256530165672302, + 0.010964884422719479 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7070000171661377, + "loss_eval": 0.7697932720184326, + "epoch": 5 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.808075904846191, + 19.022871017456055, + 33.50295639038086, + 45.75634002685547 + ], + "bp_grad_per_sample_l2_med": [ + 0.000760514521971345, + 0.000416931085055694, + 0.0002524603623896837, + 0.00018262627418152988, + 0.0001200677506858483 + ], + "bp_grad_F": [ + 0.0695224478840828, + 0.03927718475461006, + 0.023749928921461105, + 0.01698874868452549, + 0.011118472553789616 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7035000324249268, + "loss_eval": 0.7977719902992249, + "epoch": 6 + }, + { + "hidden_norms": [ + 11.269571304321289, + 13.191008567810059, + 22.44864273071289, + 42.65863800048828, + 54.38147735595703 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007628297316841781, + 0.0003877072886098176, + 0.00022262487618718296, + 0.00016918807523325086, + 0.0001183631393359974 + ], + "bp_grad_F": [ + 0.06797165423631668, + 0.03639831766486168, + 0.02157149650156498, + 0.015874147415161133, + 0.011150078848004341 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.70250004529953, + "loss_eval": 0.8099735975265503, + "epoch": 7 + }, + { + "hidden_norms": [ + 11.269571304321289, + 13.587474822998047, + 26.61025619506836, + 51.025230407714844, + 61.79695129394531 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007774661062285304, + 0.00037008023355156183, + 0.00019806883938144892, + 0.0001550534798298031, + 0.00011658846779027954 + ], + "bp_grad_F": [ + 0.06822231411933899, + 0.03484996780753136, + 0.02039053477346897, + 0.015457017347216606, + 0.011438230983912945 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6920000314712524, + "loss_eval": 0.8282882571220398, + "epoch": 8 + }, + { + "hidden_norms": [ + 11.269571304321289, + 14.02984619140625, + 31.27604866027832, + 59.14579391479492, + 68.8819580078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000821497815195471, + 0.000388532382203266, + 0.0002036481600953266, + 0.0001647671015234664, + 0.00012798182433471084 + ], + "bp_grad_F": [ + 0.06896942853927612, + 0.03378934785723686, + 0.019570810720324516, + 0.015211639925837517, + 0.01168233621865511 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6785000562667847, + "loss_eval": 0.8751994967460632, + "epoch": 9 + }, + { + "hidden_norms": [ + 11.269571304321289, + 14.566975593566895, + 37.15107345581055, + 66.83728790283203, + 76.04595184326172 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008561373106203973, + 0.00037220801459625363, + 0.00018477423873264343, + 0.0001600280374987051, + 0.00012663347297348082 + ], + "bp_grad_F": [ + 0.06949204951524734, + 0.033161722123622894, + 0.019245225936174393, + 0.015247669070959091, + 0.012057062238454819 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6585000157356262, + "loss_eval": 0.9142682552337646, + "epoch": 10 + }, + { + "hidden_norms": [ + 11.269571304321289, + 15.22678279876709, + 44.73517990112305, + 74.21520233154297, + 82.72914123535156 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008647029753774405, + 0.0003551499976310879, + 0.00016902851348277181, + 0.00014951576304156333, + 0.0001220703707076609 + ], + "bp_grad_F": [ + 0.06799578666687012, + 0.03190648928284645, + 0.018390726298093796, + 0.015047998167574406, + 0.01216125674545765 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6635000109672546, + "loss_eval": 0.9312959313392639, + "epoch": 11 + }, + { + "hidden_norms": [ + 11.269571304321289, + 15.982205390930176, + 53.03363037109375, + 81.01543426513672, + 88.02293395996094 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008814894827082753, + 0.0003609499253798276, + 0.00016691464406903833, + 0.00015374798385892063, + 0.00012832213542424142 + ], + "bp_grad_F": [ + 0.06737235933542252, + 0.030633311718702316, + 0.017514588311314583, + 0.014722960069775581, + 0.012166885659098625 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6665000319480896, + "loss_eval": 0.9171096086502075, + "epoch": 12 + }, + { + "hidden_norms": [ + 11.269571304321289, + 17.348485946655273, + 65.39360046386719, + 94.1773452758789, + 97.79885864257812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008671359973959625, + 0.0003543675411492586, + 0.00017760474293027073, + 0.00016833240806590766, + 0.0001419015898136422 + ], + "bp_grad_F": [ + 0.06303472071886063, + 0.027784455567598343, + 0.016537917777895927, + 0.01453208364546299, + 0.012470746412873268 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6520000100135803, + "loss_eval": 0.9543019533157349, + "epoch": 13 + }, + { + "hidden_norms": [ + 11.269571304321289, + 19.79836082458496, + 82.84272003173828, + 118.11077880859375, + 117.29456329345703 + ], + "bp_grad_per_sample_l2_med": [ + 0.000835613114759326, + 0.00034002913162112236, + 0.00017855060286819935, + 0.00017689696687739342, + 0.0001562273973831907 + ], + "bp_grad_F": [ + 0.05830768123269081, + 0.025488071143627167, + 0.01599927246570587, + 0.014500983990728855, + 0.012853534892201424 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6320000290870667, + "loss_eval": 0.9986603260040283, + "epoch": 14 + }, + { + "hidden_norms": [ + 11.269571304321289, + 24.028667449951172, + 104.24053192138672, + 151.45233154296875, + 148.85594177246094 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008604780305176973, + 0.0003412840305827558, + 0.00020471647439990193, + 0.00020128543837927282, + 0.00018673941667657346 + ], + "bp_grad_F": [ + 0.05637207254767418, + 0.023704711347818375, + 0.016045723110437393, + 0.015071108937263489, + 0.013779145665466785 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6110000014305115, + "loss_eval": 1.08339262008667, + "epoch": 15 + }, + { + "hidden_norms": [ + 11.269571304321289, + 31.199304580688477, + 135.36643981933594, + 190.8426971435547, + 189.1505126953125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000760686700232327, + 0.0002976131218019873, + 0.00019266465096734464, + 0.0001927861594595015, + 0.0001783591287676245 + ], + "bp_grad_F": [ + 0.04442710801959038, + 0.020077738910913467, + 0.0149933947250247, + 0.014391067437827587, + 0.01344863511621952 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6480000019073486, + "loss_eval": 1.0371382236480713, + "epoch": 16 + }, + { + "hidden_norms": [ + 11.269571304321289, + 41.846805572509766, + 170.3418731689453, + 225.09695434570312, + 224.6548614501953 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007461759960278869, + 0.00026667246129363775, + 0.00018387376621831208, + 0.00018445710884407163, + 0.00017204758478328586 + ], + "bp_grad_F": [ + 0.039136338979005814, + 0.018771812319755554, + 0.015547079034149647, + 0.01513050775974989, + 0.01431551855057478 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6200000047683716, + "loss_eval": 1.1162669658660889, + "epoch": 17 + }, + { + "hidden_norms": [ + 11.269571304321289, + 57.18465042114258, + 206.83914184570312, + 262.21197509765625, + 260.03485107421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007871078560128808, + 0.00029353986610658467, + 0.00022458977764472365, + 0.00022484370856545866, + 0.00021257037587929517 + ], + "bp_grad_F": [ + 0.03888345882296562, + 0.01824026368558407, + 0.015890181064605713, + 0.015627194195985794, + 0.014916189946234226 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615000128746033, + "loss_eval": 1.2106062173843384, + "epoch": 18 + }, + { + "hidden_norms": [ + 11.269571304321289, + 75.66644287109375, + 241.24891662597656, + 298.0739440917969, + 293.95281982421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.000782749499194324, + 0.0002943766303360462, + 0.00024086510529741645, + 0.00024184907670132816, + 0.0002289286785526201 + ], + "bp_grad_F": [ + 0.03717740252614021, + 0.01794801466166973, + 0.016123440116643906, + 0.0158899687230587, + 0.015260584652423859 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5680000185966492, + "loss_eval": 1.1780248880386353, + "epoch": 19 + }, + { + "hidden_norms": [ + 11.269571304321289, + 97.68470764160156, + 276.2217712402344, + 334.56146240234375, + 329.1627502441406 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007400053436867893, + 0.00028874175040982664, + 0.00024344309349544346, + 0.0002433314366498962, + 0.00023140427947510034 + ], + "bp_grad_F": [ + 0.03569746017456055, + 0.0169936865568161, + 0.015504195354878902, + 0.015339999459683895, + 0.014785589650273323 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5745000243186951, + "loss_eval": 1.1848244667053223, + "epoch": 20 + }, + { + "hidden_norms": [ + 11.269571304321289, + 123.06426239013672, + 312.8515625, + 373.4215087890625, + 366.50213623046875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007171913748607039, + 0.00026914477348327637, + 0.00023370776034425944, + 0.00023370303097181022, + 0.0002235924475826323 + ], + "bp_grad_F": [ + 0.03427436947822571, + 0.016933348029851913, + 0.015780098736286163, + 0.015659287571907043, + 0.015169495716691017 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5715000033378601, + "loss_eval": 1.2063732147216797, + "epoch": 21 + }, + { + "hidden_norms": [ + 11.269571304321289, + 153.3316650390625, + 353.62042236328125, + 417.3258361816406, + 408.16680908203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007328973151743412, + 0.000268118514213711, + 0.00024018273688852787, + 0.00024114495317917317, + 0.0002314754092367366 + ], + "bp_grad_F": [ + 0.033994678407907486, + 0.016857070848345757, + 0.01595945656299591, + 0.01587284542620182, + 0.015459166839718819 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5450000166893005, + "loss_eval": 1.2801684141159058, + "epoch": 22 + }, + { + "hidden_norms": [ + 11.269571304321289, + 187.16934204101562, + 397.18280029296875, + 464.5965881347656, + 453.26629638671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007429302204400301, + 0.0002756037574727088, + 0.0002533047809265554, + 0.0002549285418353975, + 0.00024467214825563133 + ], + "bp_grad_F": [ + 0.03400976210832596, + 0.017134130001068115, + 0.016380103304982185, + 0.016292234882712364, + 0.015935255214571953 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5055000185966492, + "loss_eval": 1.4238585233688354, + "epoch": 23 + }, + { + "hidden_norms": [ + 11.269571304321289, + 221.9723663330078, + 441.26580810546875, + 512.8148193359375, + 498.7379455566406 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006891476223245263, + 0.00027131737442687154, + 0.0002505357551854104, + 0.000251909252256155, + 0.0002428782609058544 + ], + "bp_grad_F": [ + 0.032484397292137146, + 0.01684476062655449, + 0.01627412810921669, + 0.016195174306631088, + 0.015904447063803673 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5290000438690186, + "loss_eval": 1.3381338119506836, + "epoch": 24 + }, + { + "hidden_norms": [ + 11.269571304321289, + 256.86456298828125, + 485.2987060546875, + 561.24755859375, + 544.2046508789062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007065363461151719, + 0.0002826322161126882, + 0.00026495553902350366, + 0.0002664696949068457, + 0.0002584822941571474 + ], + "bp_grad_F": [ + 0.032581742852926254, + 0.017135880887508392, + 0.01663898676633835, + 0.01656418852508068, + 0.016318844631314278 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.468500018119812, + "loss_eval": 1.4673320055007935, + "epoch": 25 + }, + { + "hidden_norms": [ + 11.269571304321289, + 290.3281555175781, + 528.4644165039062, + 609.61181640625, + 589.482421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007876601885072887, + 0.000328866473864764, + 0.0003142827481497079, + 0.0003149702097289264, + 0.00030780391534790397 + ], + "bp_grad_F": [ + 0.0356873981654644, + 0.01825507916510105, + 0.01779749058187008, + 0.017760321497917175, + 0.0175130907446146 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35200002789497375, + "loss_eval": 1.82278311252594, + "epoch": 26 + }, + { + "hidden_norms": [ + 11.269571304321289, + 324.2997131347656, + 572.9197387695312, + 659.7073364257812, + 635.6883544921875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006818437832407653, + 0.000307896378217265, + 0.0002974055823870003, + 0.000297438440611586, + 0.0002942352439276874 + ], + "bp_grad_F": [ + 0.03148573637008667, + 0.017155593261122704, + 0.016821201890707016, + 0.01674988865852356, + 0.016609078273177147 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4540000259876251, + "loss_eval": 1.4913204908370972, + "epoch": 27 + }, + { + "hidden_norms": [ + 11.269571304321289, + 357.986572265625, + 616.8123168945312, + 709.2523193359375, + 681.3218994140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006822228315286338, + 0.00030397844966501, + 0.0002927799359895289, + 0.0002928805770352483, + 0.0002893624478019774 + ], + "bp_grad_F": [ + 0.03142063319683075, + 0.017380017787218094, + 0.017113016918301582, + 0.017052780836820602, + 0.01693262904882431 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.42250001430511475, + "loss_eval": 1.574558138847351, + "epoch": 28 + }, + { + "hidden_norms": [ + 11.269571304321289, + 391.00396728515625, + 660.1432495117188, + 758.46875, + 726.479248046875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006576834712177515, + 0.00029913688194938004, + 0.0002909695322159678, + 0.00029160548001527786, + 0.0002882194530684501 + ], + "bp_grad_F": [ + 0.03063797578215599, + 0.01751694455742836, + 0.017304742708802223, + 0.017256034538149834, + 0.017157413065433502 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.41700002551078796, + "loss_eval": 1.5943682193756104, + "epoch": 29 + }, + { + "hidden_norms": [ + 11.269571304321289, + 423.0135803222656, + 702.8653564453125, + 807.1064453125, + 771.0443115234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007106211851350963, + 0.00032867168192751706, + 0.0003195058961864561, + 0.0003205789253115654, + 0.00031724729342386127 + ], + "bp_grad_F": [ + 0.032083574682474136, + 0.018385307863354683, + 0.01818086951971054, + 0.018159352242946625, + 0.01808425784111023 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3240000009536743, + "loss_eval": 1.9495495557785034, + "epoch": 30 + }, + { + "hidden_norms": [ + 11.269571304321289, + 453.1861267089844, + 743.7100219726562, + 853.8812255859375, + 813.7102661132812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006489204824902117, + 0.0002889770839828998, + 0.00028184326947666705, + 0.00028282302082516253, + 0.00027834190404973924 + ], + "bp_grad_F": [ + 0.029847772791981697, + 0.017620669677853584, + 0.017466910183429718, + 0.01743420958518982, + 0.017375603318214417 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3970000147819519, + "loss_eval": 1.6998002529144287, + "epoch": 31 + }, + { + "hidden_norms": [ + 11.269571304321289, + 480.8240661621094, + 781.491943359375, + 897.1333618164062, + 853.1820678710938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006337798549793661, + 0.0003062748000957072, + 0.0003002039447892457, + 0.00030039221746847034, + 0.0002973877126350999 + ], + "bp_grad_F": [ + 0.029168229550123215, + 0.017783651128411293, + 0.017649564892053604, + 0.017613932490348816, + 0.01756826601922512 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3865000307559967, + "loss_eval": 1.7693381309509277, + "epoch": 32 + }, + { + "hidden_norms": [ + 11.269571304321289, + 505.9931945800781, + 816.3653564453125, + 937.6511840820312, + 890.0263061523438 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006363698630593717, + 0.000327500601997599, + 0.0003217202320229262, + 0.0003208804700989276, + 0.0003201036306563765 + ], + "bp_grad_F": [ + 0.029376372694969177, + 0.018225492909550667, + 0.01810493879020214, + 0.01805899664759636, + 0.018048716709017754 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3400000035762787, + "loss_eval": 1.777511477470398, + "epoch": 33 + }, + { + "hidden_norms": [ + 11.269571304321289, + 530.9385375976562, + 850.9844970703125, + 977.412841796875, + 926.3417358398438 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006240232032723725, + 0.00032233193633146584, + 0.00031883586780168116, + 0.0003202730731572956, + 0.0003188494883943349 + ], + "bp_grad_F": [ + 0.028516914695501328, + 0.018217962235212326, + 0.018127964809536934, + 0.018103662878274918, + 0.018076416105031967 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.36250001192092896, + "loss_eval": 1.7461223602294922, + "epoch": 34 + }, + { + "hidden_norms": [ + 11.269571304321289, + 555.9691162109375, + 885.6592407226562, + 1017.6103515625, + 962.8530883789062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005949487676844001, + 0.0003172095457557589, + 0.00031312211649492383, + 0.0003130651020910591, + 0.0003118007443845272 + ], + "bp_grad_F": [ + 0.027917204424738884, + 0.018052855506539345, + 0.017963001504540443, + 0.01793370023369789, + 0.017934400588274002 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3775000274181366, + "loss_eval": 1.7961357831954956, + "epoch": 35 + }, + { + "hidden_norms": [ + 11.269571304321289, + 580.1717529296875, + 919.149169921875, + 1056.32470703125, + 998.1345825195312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006010148790664971, + 0.0003237369528505951, + 0.00031987245893105865, + 0.00031991174910217524, + 0.0003188104019500315 + ], + "bp_grad_F": [ + 0.027771273627877235, + 0.017915818840265274, + 0.017828019335865974, + 0.017802555114030838, + 0.017808666452765465 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.37400001287460327, + "loss_eval": 1.8124159574508667, + "epoch": 36 + }, + { + "hidden_norms": [ + 11.269571304321289, + 602.5966186523438, + 950.484619140625, + 1092.6507568359375, + 1031.02294921875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005852986359968781, + 0.0003249783185310662, + 0.00032142180134542286, + 0.0003207105037290603, + 0.00032108003506436944 + ], + "bp_grad_F": [ + 0.02701820805668831, + 0.01796947605907917, + 0.017892232164740562, + 0.017859354615211487, + 0.01788966730237007 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34950003027915955, + "loss_eval": 1.7797815799713135, + "epoch": 37 + }, + { + "hidden_norms": [ + 11.269571304321289, + 624.4447021484375, + 981.1150512695312, + 1127.90234375, + 1063.09228515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005775236058980227, + 0.0003046133788302541, + 0.00030120721203275025, + 0.00030136521672829986, + 0.00029937425279058516 + ], + "bp_grad_F": [ + 0.026447290554642677, + 0.017799606546759605, + 0.017730647698044777, + 0.017701666802167892, + 0.017717311158776283 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3630000054836273, + "loss_eval": 1.7884948253631592, + "epoch": 38 + }, + { + "hidden_norms": [ + 11.269571304321289, + 644.9402465820312, + 1010.1371459960938, + 1161.7808837890625, + 1093.9410400390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000567529525142163, + 0.00032071411260403693, + 0.0003186226240359247, + 0.0003186469548381865, + 0.000316357531119138 + ], + "bp_grad_F": [ + 0.02652687579393387, + 0.018418341875076294, + 0.018360882997512817, + 0.018340308219194412, + 0.018352536484599113 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3375000059604645, + "loss_eval": 1.894034743309021, + "epoch": 39 + }, + { + "hidden_norms": [ + 11.269571304321289, + 664.6719970703125, + 1038.15478515625, + 1194.3914794921875, + 1123.5455322265625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005615526461042464, + 0.0003110080724582076, + 0.00030868081375956535, + 0.00030884178704582155, + 0.0003081669274251908 + ], + "bp_grad_F": [ + 0.025895435363054276, + 0.01783018186688423, + 0.017772147431969643, + 0.017754852771759033, + 0.01777641288936138 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3395000100135803, + "loss_eval": 1.9033000469207764, + "epoch": 40 + }, + { + "hidden_norms": [ + 11.269571304321289, + 683.78173828125, + 1065.281005859375, + 1225.9638671875, + 1152.131591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005448339506983757, + 0.0003069988451898098, + 0.0003048715298064053, + 0.0003052430984098464, + 0.00030476890970021486 + ], + "bp_grad_F": [ + 0.025077223777770996, + 0.017541181296110153, + 0.017490437254309654, + 0.01747160218656063, + 0.017498185858130455 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3840000033378601, + "loss_eval": 1.7054094076156616, + "epoch": 41 + }, + { + "hidden_norms": [ + 11.269571304321289, + 701.634033203125, + 1090.699462890625, + 1255.5677490234375, + 1178.950927734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005554261151701212, + 0.0003436058177612722, + 0.0003414751263335347, + 0.0003412873193155974, + 0.0003412757650949061 + ], + "bp_grad_F": [ + 0.025991667062044144, + 0.018797792494297028, + 0.01875895820558071, + 0.018737811595201492, + 0.01877579651772976 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.2985000014305115, + "loss_eval": 1.9454095363616943, + "epoch": 42 + }, + { + "hidden_norms": [ + 11.269571304321289, + 718.1909790039062, + 1114.3717041015625, + 1283.2196044921875, + 1204.0418701171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005466453148983419, + 0.00032576482044532895, + 0.00032447546254843473, + 0.0003244927211198956, + 0.0003245829720981419 + ], + "bp_grad_F": [ + 0.025174839422106743, + 0.01795799843966961, + 0.01791331358253956, + 0.017896415665745735, + 0.017930971458554268 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3190000057220459, + "loss_eval": 1.9117376804351807, + "epoch": 43 + }, + { + "hidden_norms": [ + 11.269571304321289, + 734.4074096679688, + 1137.696044921875, + 1310.3448486328125, + 1228.5693359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005316757597029209, + 0.00032565969740971923, + 0.00032383095822297037, + 0.00032448669662699103, + 0.0003247321583330631 + ], + "bp_grad_F": [ + 0.024759862571954727, + 0.01794862188398838, + 0.01790694147348404, + 0.017891528084874153, + 0.017931628972291946 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3320000171661377, + "loss_eval": 1.8898653984069824, + "epoch": 44 + }, + { + "hidden_norms": [ + 11.269571304321289, + 749.4878540039062, + 1159.565185546875, + 1335.8013916015625, + 1251.6041259765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005168311763554811, + 0.00031509375548921525, + 0.0003133788122795522, + 0.0003133984573651105, + 0.0003139932523481548 + ], + "bp_grad_F": [ + 0.0242743082344532, + 0.01778865046799183, + 0.0177480336278677, + 0.017732009291648865, + 0.01776931621134281 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3360000252723694, + "loss_eval": 1.809171199798584, + "epoch": 45 + }, + { + "hidden_norms": [ + 11.269571304321289, + 763.5787353515625, + 1180.0230712890625, + 1359.6865234375, + 1273.1715087890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005242779734544456, + 0.0003271555178798735, + 0.00032485066913068295, + 0.0003253788163419813, + 0.00032494115293957293 + ], + "bp_grad_F": [ + 0.024425320327281952, + 0.01821528747677803, + 0.018175508826971054, + 0.018160372972488403, + 0.01819770224392414 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3290000259876251, + "loss_eval": 1.8727153539657593, + "epoch": 46 + }, + { + "hidden_norms": [ + 11.269571304321289, + 777.29833984375, + 1199.8975830078125, + 1382.7962646484375, + 1294.0777587890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005091701750643551, + 0.0003165322996210307, + 0.00031451781978830695, + 0.00031486450461670756, + 0.00031427579233422875 + ], + "bp_grad_F": [ + 0.023803148418664932, + 0.017688797786831856, + 0.017653871327638626, + 0.01764090545475483, + 0.017672821879386902 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3570000231266022, + "loss_eval": 1.7817366123199463, + "epoch": 47 + }, + { + "hidden_norms": [ + 11.269571304321289, + 789.7103881835938, + 1218.070556640625, + 1403.869384765625, + 1313.1611328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000508163939230144, + 0.00031658579246141016, + 0.0003145384253002703, + 0.0003149410185869783, + 0.000314467353746295 + ], + "bp_grad_F": [ + 0.023785017430782318, + 0.017845386639237404, + 0.01781085878610611, + 0.017796490341424942, + 0.017827292904257774 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3255000114440918, + "loss_eval": 1.9139658212661743, + "epoch": 48 + }, + { + "hidden_norms": [ + 11.269571304321289, + 801.9373779296875, + 1235.8994140625, + 1424.5323486328125, + 1331.8375244140625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004862714558839798, + 0.0002926513261627406, + 0.0002908864407800138, + 0.0002910781477112323, + 0.0002900509862229228 + ], + "bp_grad_F": [ + 0.023361189290881157, + 0.01766069605946541, + 0.01763027161359787, + 0.017619280144572258, + 0.017652587965130806 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.36100003123283386, + "loss_eval": 1.8068753480911255, + "epoch": 49 + }, + { + "hidden_norms": [ + 11.269571304321289, + 813.853515625, + 1253.337890625, + 1444.873779296875, + 1350.2630615234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00048765321844257414, + 0.000307347479974851, + 0.00030599997262470424, + 0.000306078844005242, + 0.000305346620734781 + ], + "bp_grad_F": [ + 0.023688213899731636, + 0.01818004995584488, + 0.018153388053178787, + 0.018142297863960266, + 0.018173247575759888 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3360000252723694, + "loss_eval": 1.8813791275024414, + "epoch": 50 + }, + { + "hidden_norms": [ + 11.269571304321289, + 824.7192993164062, + 1269.39208984375, + 1463.5384521484375, + 1367.15625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004835445433855057, + 0.0003096247965004295, + 0.0003079361922573298, + 0.00030804326524958014, + 0.0003073872940149158 + ], + "bp_grad_F": [ + 0.02330639213323593, + 0.01797325722873211, + 0.0179448202252388, + 0.017932146787643433, + 0.0179706122726202 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34150001406669617, + "loss_eval": 1.8429521322250366, + "epoch": 51 + }, + { + "hidden_norms": [ + 11.269571304321289, + 834.9524536132812, + 1284.4827880859375, + 1481.0673828125, + 1383.0155029296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047791830729693174, + 0.0003027814091183245, + 0.0003019821015186608, + 0.0003020255535375327, + 0.0003012260131072253 + ], + "bp_grad_F": [ + 0.02303098328411579, + 0.01771283708512783, + 0.01768432930111885, + 0.017673376947641373, + 0.01770668476819992 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34850001335144043, + "loss_eval": 1.8080617189407349, + "epoch": 52 + }, + { + "hidden_norms": [ + 11.269571304321289, + 844.5447998046875, + 1298.628662109375, + 1497.57373046875, + 1397.9241943359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000483115843962878, + 0.0003182529762852937, + 0.00031743990257382393, + 0.0003175203746650368, + 0.0003175794845446944 + ], + "bp_grad_F": [ + 0.02306683361530304, + 0.01790531352162361, + 0.017880147323012352, + 0.017869742587208748, + 0.017903709784150124 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.33100003004074097, + "loss_eval": 1.8166543245315552, + "epoch": 53 + }, + { + "hidden_norms": [ + 11.269571304321289, + 853.7017822265625, + 1312.1446533203125, + 1513.2933349609375, + 1412.1080322265625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047640595585107803, + 0.00031948628020472825, + 0.00031817753915674984, + 0.00031873476109467447, + 0.0003185000387020409 + ], + "bp_grad_F": [ + 0.022898783907294273, + 0.017956143245100975, + 0.017929796129465103, + 0.017917128279805183, + 0.017962384968996048 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.33800002932548523, + "loss_eval": 1.8004838228225708, + "epoch": 54 + }, + { + "hidden_norms": [ + 11.269571304321289, + 862.0558471679688, + 1324.4920654296875, + 1527.697509765625, + 1425.1290283203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004698090488091111, + 0.00029860963695682585, + 0.0002971645735669881, + 0.0002974079397972673, + 0.00029624722083099186 + ], + "bp_grad_F": [ + 0.022676818072795868, + 0.01772218942642212, + 0.017698047682642937, + 0.017688868567347527, + 0.01772254891693592 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3530000150203705, + "loss_eval": 1.8075289726257324, + "epoch": 55 + }, + { + "hidden_norms": [ + 11.269571304321289, + 869.9756469726562, + 1336.185791015625, + 1541.3792724609375, + 1437.4677734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004706987820100039, + 0.0003098493325524032, + 0.0003085599164478481, + 0.0003086493816226721, + 0.0003082384937442839 + ], + "bp_grad_F": [ + 0.022675253450870514, + 0.01779225468635559, + 0.017767589539289474, + 0.017757505178451538, + 0.017791779711842537 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34150001406669617, + "loss_eval": 1.827038288116455, + "epoch": 56 + }, + { + "hidden_norms": [ + 11.269571304321289, + 877.3834838867188, + 1347.156982421875, + 1554.1087646484375, + 1448.9537353515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000473314750706777, + 0.00030716857872903347, + 0.0003054763947147876, + 0.0003060955787077546, + 0.0003047685313504189 + ], + "bp_grad_F": [ + 0.02272479608654976, + 0.01781822182238102, + 0.017794664949178696, + 0.01778644695878029, + 0.01781868003308773 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.32450002431869507, + "loss_eval": 1.8790045976638794, + "epoch": 57 + }, + { + "hidden_norms": [ + 11.269571304321289, + 884.1793212890625, + 1357.25146484375, + 1565.88232421875, + 1459.538818359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046717250370420516, + 0.00030950061045587063, + 0.000308411312289536, + 0.00030838610837236047, + 0.00030820758547633886 + ], + "bp_grad_F": [ + 0.02260792814195156, + 0.017898347228765488, + 0.017876161262392998, + 0.017865851521492004, + 0.01790330745279789 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3225000202655792, + "loss_eval": 1.8583427667617798, + "epoch": 58 + }, + { + "hidden_norms": [ + 11.269571304321289, + 890.4108276367188, + 1366.517333984375, + 1576.69921875, + 1469.300537109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004612848279066384, + 0.00030920191784389317, + 0.0003086488868575543, + 0.0003085103817284107, + 0.0003084034251514822 + ], + "bp_grad_F": [ + 0.022702287882566452, + 0.018074622377753258, + 0.01805359311401844, + 0.018043993040919304, + 0.018074078485369682 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.33250001072883606, + "loss_eval": 1.8819878101348877, + "epoch": 59 + }, + { + "hidden_norms": [ + 11.269571304321289, + 896.1082763671875, + 1374.973388671875, + 1586.524169921875, + 1478.1490478515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046731752809137106, + 0.0003127296222373843, + 0.00031115938327275217, + 0.0003112337435595691, + 0.00031117399339564145 + ], + "bp_grad_F": [ + 0.022609086707234383, + 0.018025977537035942, + 0.01800408773124218, + 0.017995676025748253, + 0.018028175458312035 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3150000274181366, + "loss_eval": 1.8731034994125366, + "epoch": 60 + }, + { + "hidden_norms": [ + 11.269571304321289, + 901.4246826171875, + 1382.871337890625, + 1595.7164306640625, + 1486.465576171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004559764638543129, + 0.00029873938183300197, + 0.00029821961652487516, + 0.0002982193836942315, + 0.0002976148098241538 + ], + "bp_grad_F": [ + 0.022443631663918495, + 0.017807144671678543, + 0.01778426393866539, + 0.017775312066078186, + 0.017809107899665833 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3190000057220459, + "loss_eval": 1.9132741689682007, + "epoch": 61 + }, + { + "hidden_norms": [ + 11.269571304321289, + 906.219970703125, + 1389.97998046875, + 1603.95458984375, + 1493.869384765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00045692393905483186, + 0.000307796144625172, + 0.0003068537334911525, + 0.0003067644138354808, + 0.0003064550110138953 + ], + "bp_grad_F": [ + 0.022245025262236595, + 0.017795003950595856, + 0.0177734587341547, + 0.017764581367373466, + 0.017800522968173027 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3270000219345093, + "loss_eval": 1.8190391063690186, + "epoch": 62 + }, + { + "hidden_norms": [ + 11.269571304321289, + 910.5570678710938, + 1396.3927001953125, + 1611.4957275390625, + 1500.6524658203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00045115925604477525, + 0.00029847086989320815, + 0.0002977230178657919, + 0.0002977572148665786, + 0.0002975583774968982 + ], + "bp_grad_F": [ + 0.02203645370900631, + 0.017681924626231194, + 0.01766141690313816, + 0.017652763053774834, + 0.0176865067332983 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35500001907348633, + "loss_eval": 1.7965762615203857, + "epoch": 63 + }, + { + "hidden_norms": [ + 11.269571304321289, + 914.5003662109375, + 1402.2757568359375, + 1618.2999267578125, + 1506.7991943359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004569143056869507, + 0.00029972344054840505, + 0.0002987241605296731, + 0.0002987434563692659, + 0.00029907189309597015 + ], + "bp_grad_F": [ + 0.022272884845733643, + 0.01781252957880497, + 0.017791228368878365, + 0.017782466486096382, + 0.017818717285990715 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.328000009059906, + "loss_eval": 1.8610442876815796, + "epoch": 64 + }, + { + "hidden_norms": [ + 11.269571304321289, + 918.0006103515625, + 1407.5118408203125, + 1624.3853759765625, + 1512.30029296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00045414711348712444, + 0.00030931030050851405, + 0.0003081976028624922, + 0.0003081892791669816, + 0.0003081847680732608 + ], + "bp_grad_F": [ + 0.022085461765527725, + 0.01779778115451336, + 0.017776912078261375, + 0.017768092453479767, + 0.01780613884329796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34300002455711365, + "loss_eval": 1.804802417755127, + "epoch": 65 + }, + { + "hidden_norms": [ + 11.269571304321289, + 921.121826171875, + 1412.175537109375, + 1629.830810546875, + 1517.2005615234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004531690792646259, + 0.00031135816243477166, + 0.00031044447678141296, + 0.00031072759884409606, + 0.0003106470685452223 + ], + "bp_grad_F": [ + 0.022044293582439423, + 0.017750630155205727, + 0.017730476334691048, + 0.017722314223647118, + 0.017757223919034004 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34150001406669617, + "loss_eval": 1.8111987113952637, + "epoch": 66 + }, + { + "hidden_norms": [ + 11.269571304321289, + 923.8903198242188, + 1416.300048828125, + 1634.646484375, + 1521.5411376953125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004468595434445888, + 0.0003022409218829125, + 0.00030127677018754184, + 0.00030117464484646916, + 0.00030144210904836655 + ], + "bp_grad_F": [ + 0.02193099819123745, + 0.017699316143989563, + 0.017679594457149506, + 0.017671333625912666, + 0.017706507816910744 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3525000214576721, + "loss_eval": 1.797281265258789, + "epoch": 67 + }, + { + "hidden_norms": [ + 11.269571304321289, + 926.2950439453125, + 1419.8856201171875, + 1638.8184814453125, + 1525.284423828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044905568938702345, + 0.00030229080584831536, + 0.00030173707637004554, + 0.0003015522670466453, + 0.0003012538072653115 + ], + "bp_grad_F": [ + 0.021881939843297005, + 0.017657367512583733, + 0.017637958750128746, + 0.017629873007535934, + 0.01766354590654373 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34800001978874207, + "loss_eval": 1.8036439418792725, + "epoch": 68 + }, + { + "hidden_norms": [ + 11.269571304321289, + 928.36181640625, + 1422.943359375, + 1642.3917236328125, + 1528.47705078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004465414967853576, + 0.00030299098580144346, + 0.00030190899269655347, + 0.00030191292171366513, + 0.000301982625387609 + ], + "bp_grad_F": [ + 0.02188783325254917, + 0.01768629439175129, + 0.01766696758568287, + 0.017658723518252373, + 0.017692700028419495 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.359000027179718, + "loss_eval": 1.7996938228607178, + "epoch": 69 + }, + { + "hidden_norms": [ + 11.269571304321289, + 930.1182861328125, + 1425.561279296875, + 1645.422607421875, + 1531.2088623046875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004439539334271103, + 0.00030093194800429046, + 0.00030001465347595513, + 0.0003001568838953972, + 0.0002998457639478147 + ], + "bp_grad_F": [ + 0.021926432847976685, + 0.01775786094367504, + 0.017738472670316696, + 0.01773017831146717, + 0.01776653714478016 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35200002789497375, + "loss_eval": 1.8030681610107422, + "epoch": 70 + }, + { + "hidden_norms": [ + 11.269571304321289, + 931.579345703125, + 1427.7337646484375, + 1647.9693603515625, + 1533.509033203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044511700980365276, + 0.00030080872238613665, + 0.00030003004940226674, + 0.0003000932920258492, + 0.00029993904172442853 + ], + "bp_grad_F": [ + 0.021828416734933853, + 0.017681054770946503, + 0.017661932855844498, + 0.017653752118349075, + 0.017688728868961334 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35200002789497375, + "loss_eval": 1.7960853576660156, + "epoch": 71 + }, + { + "hidden_norms": [ + 11.269571304321289, + 932.7696533203125, + 1429.520751953125, + 1650.0577392578125, + 1535.389892578125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004446738166734576, + 0.0003006414044648409, + 0.00030009649344719946, + 0.0003001675067935139, + 0.00029965140856802464 + ], + "bp_grad_F": [ + 0.021837500855326653, + 0.01768680103123188, + 0.017667656764388084, + 0.017659684643149376, + 0.017694275826215744 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35450002551078796, + "loss_eval": 1.8004000186920166, + "epoch": 72 + }, + { + "hidden_norms": [ + 11.269571304321289, + 933.7157592773438, + 1430.9381103515625, + 1651.7154541015625, + 1536.879638671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044473307207226753, + 0.00030047594918869436, + 0.0002997968113049865, + 0.00029963525594212115, + 0.00029955641366541386 + ], + "bp_grad_F": [ + 0.0217889491468668, + 0.01765742339193821, + 0.01763851009309292, + 0.01763063855469227, + 0.017664924263954163 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3555000126361847, + "loss_eval": 1.7942780256271362, + "epoch": 73 + }, + { + "hidden_norms": [ + 11.269571304321289, + 934.4593505859375, + 1432.0382080078125, + 1652.9989013671875, + 1538.0234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004453740257304162, + 0.0003002033627126366, + 0.00029949398594908416, + 0.00029964259010739625, + 0.0002993734087795019 + ], + "bp_grad_F": [ + 0.021799130365252495, + 0.017666727304458618, + 0.0176478810608387, + 0.017639974132180214, + 0.017674267292022705 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.34550002217292786, + "loss_eval": 1.800949215888977, + "epoch": 74 + }, + { + "hidden_norms": [ + 11.269571304321289, + 934.9984741210938, + 1432.84814453125, + 1653.939697265625, + 1538.8624267578125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044546957360580564, + 0.0003038236463908106, + 0.000302964064758271, + 0.00030298702768050134, + 0.00030283271917141974 + ], + "bp_grad_F": [ + 0.021853182464838028, + 0.017717286944389343, + 0.017698239535093307, + 0.017690137028694153, + 0.01772582344710827 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35600000619888306, + "loss_eval": 1.800832986831665, + "epoch": 75 + }, + { + "hidden_norms": [ + 11.269571304321289, + 935.3856201171875, + 1433.427490234375, + 1654.6126708984375, + 1539.4669189453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044487748527899384, + 0.00030164900817908347, + 0.00030081532895565033, + 0.00030082385637797415, + 0.000300481216982007 + ], + "bp_grad_F": [ + 0.02177177555859089, + 0.017657004296779633, + 0.017638202756643295, + 0.017630264163017273, + 0.01766461506485939 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3490000069141388, + "loss_eval": 1.794891119003296, + "epoch": 76 + }, + { + "hidden_norms": [ + 11.269571304321289, + 935.636474609375, + 1433.79345703125, + 1655.038330078125, + 1539.8505859375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004437313473317772, + 0.00030232034623622894, + 0.0003012971137650311, + 0.00030129036167636514, + 0.00030084658646956086 + ], + "bp_grad_F": [ + 0.021787401288747787, + 0.0176764614880085, + 0.017657602205872536, + 0.017649594694375992, + 0.017684470862150192 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35350000858306885, + "loss_eval": 1.7952260971069336, + "epoch": 77 + }, + { + "hidden_norms": [ + 11.269571304321289, + 935.7716064453125, + 1433.996826171875, + 1655.2738037109375, + 1540.06298828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044510490261018276, + 0.0003025131591130048, + 0.00030167156364768744, + 0.0003019055584445596, + 0.00030186952790245414 + ], + "bp_grad_F": [ + 0.02179691381752491, + 0.017687244340777397, + 0.017668338492512703, + 0.017660312354564667, + 0.01769554615020752 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35200002789497375, + "loss_eval": 1.7945536375045776, + "epoch": 78 + }, + { + "hidden_norms": [ + 11.269571304321289, + 935.8350830078125, + 1434.09326171875, + 1655.3861083984375, + 1540.164794921875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044426857493817806, + 0.0003006447514053434, + 0.0002995560353156179, + 0.0002996143593918532, + 0.0002996891853399575 + ], + "bp_grad_F": [ + 0.02177303098142147, + 0.017660290002822876, + 0.017641469836235046, + 0.017633574083447456, + 0.01766815222799778 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.35850000381469727, + "loss_eval": 1.7939436435699463, + "epoch": 79 + }, + { + "hidden_norms": [ + 11.269571304321289, + 935.8506469726562, + 1434.11669921875, + 1655.4130859375, + 1540.189208984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00044382456690073013, + 0.0003010118380188942, + 0.0003002960584126413, + 0.00030042475555092096, + 0.00029991925111971796 + ], + "bp_grad_F": [ + 0.021775126457214355, + 0.01766343042254448, + 0.017644599080085754, + 0.017636677250266075, + 0.017671329900622368 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3595000207424164, + "loss_eval": 1.7936068773269653, + "epoch": 80 + } + ], + "seed": 42, + "alpha": 1.0, + "depth": 4, + "d_hidden": 128 +} \ No newline at end of file diff --git a/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json b/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json new file mode 100644 index 0000000..438739c --- /dev/null +++ b/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json @@ -0,0 +1,2276 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 11.269571304321289, + 11.290447235107422, + 11.313605308532715, + 11.351215362548828, + 11.398087501525879 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028353024390526116, + 0.0002828188880812377, + 0.00028162598027847707, + 0.0002799496578518301, + 0.0002791006409097463 + ], + "bp_grad_F": [ + 0.012684082612395287, + 0.01264861598610878, + 0.012589854188263416, + 0.012511610053479671, + 0.012471316382288933 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.08450000733137131, + "loss_eval": 2.4790313243865967, + "epoch": 0 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.460872650146484, + 11.70040512084961, + 12.004783630371094, + 12.311223030090332 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004118149809073657, + 0.0003761148836929351, + 0.00034950554254464805, + 0.00032246875343844295, + 0.0002528287877794355 + ], + "bp_grad_F": [ + 0.018988799303770065, + 0.017196672037243843, + 0.015853216871619225, + 0.014456234872341156, + 0.011207858100533485 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5265000462532043, + "loss_eval": 1.4851115942001343, + "epoch": 1 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.751569747924805, + 12.541290283203125, + 13.77841567993164, + 15.976567268371582 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007904200465418398, + 0.0006201046635396779, + 0.0004867047828156501, + 0.0003823215956799686, + 0.00022867691586725414 + ], + "bp_grad_F": [ + 0.041881538927555084, + 0.03210915997624397, + 0.025059428066015244, + 0.01950555481016636, + 0.011618814431130886 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6350000500679016, + "loss_eval": 0.959205687046051, + "epoch": 2 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.018173217773438, + 13.625839233398438, + 16.65739631652832, + 22.032325744628906 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008111135102808475, + 0.0005643682088702917, + 0.0004009789554402232, + 0.00029031067970208824, + 0.00016489777772221714 + ], + "bp_grad_F": [ + 0.059235598891973495, + 0.040808264166116714, + 0.02855612151324749, + 0.020608671009540558, + 0.011410079896450043 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6855000257492065, + "loss_eval": 0.818859875202179, + "epoch": 3 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.308274269104004, + 15.27676010131836, + 21.78426170349121, + 30.742971420288086 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007430269033648074, + 0.000469190941657871, + 0.00030379975214600563, + 0.00021638885664287955, + 0.00012503107427619398 + ], + "bp_grad_F": [ + 0.06859903037548065, + 0.04267093911767006, + 0.027331173419952393, + 0.01921078749001026, + 0.01109629962593317 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6940000057220459, + "loss_eval": 0.7901937365531921, + "epoch": 4 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.659590721130371, + 17.736019134521484, + 29.108901977539062, + 40.405487060546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007397185545414686, + 0.0004240924317855388, + 0.00025522997020743787, + 0.00018211310089100152, + 0.00011715881555574015 + ], + "bp_grad_F": [ + 0.07044756412506104, + 0.040140341967344284, + 0.024354523047804832, + 0.017343631014227867, + 0.01095715630799532 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6975000500679016, + "loss_eval": 0.8005170822143555, + "epoch": 5 + }, + { + "hidden_norms": [ + 11.269571304321289, + 13.09460735321045, + 21.214082717895508, + 38.0382194519043, + 49.941673278808594 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007781236781738698, + 0.00040500680916011333, + 0.00022763953893445432, + 0.00017000116349663585, + 0.0001182492560474202 + ], + "bp_grad_F": [ + 0.0692453384399414, + 0.037047095596790314, + 0.021944386884570122, + 0.016124187037348747, + 0.011101995594799519 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6925000548362732, + "loss_eval": 0.8182728290557861, + "epoch": 6 + }, + { + "hidden_norms": [ + 11.269571304321289, + 13.613083839416504, + 25.80984878540039, + 47.72332763671875, + 58.812931060791016 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007534404867328703, + 0.00035873899469152093, + 0.00019843837071675807, + 0.00015793486090842634, + 0.00011804765381384641 + ], + "bp_grad_F": [ + 0.06768736243247986, + 0.034021928906440735, + 0.019909236580133438, + 0.015198245644569397, + 0.011175908148288727 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6945000290870667, + "loss_eval": 0.8370131254196167, + "epoch": 7 + }, + { + "hidden_norms": [ + 11.269571304321289, + 14.181544303894043, + 31.215173721313477, + 57.29954147338867, + 67.44005584716797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008308067917823792, + 0.0003639743954408914, + 0.00018776576325763017, + 0.00015568821982014924, + 0.00012153007264714688 + ], + "bp_grad_F": [ + 0.0664583221077919, + 0.03186826407909393, + 0.018696729093790054, + 0.014834162779152393, + 0.011486423201858997 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6775000095367432, + "loss_eval": 0.8666528463363647, + "epoch": 8 + }, + { + "hidden_norms": [ + 11.269571304321289, + 14.879924774169922, + 37.906219482421875, + 67.32949829101562, + 75.90506744384766 + ], + "bp_grad_per_sample_l2_med": [ + 0.000856662227306515, + 0.0003640915092546493, + 0.0001897388428915292, + 0.00016743727610446513, + 0.00013579493679571897 + ], + "bp_grad_F": [ + 0.06490001082420349, + 0.0302249975502491, + 0.018041465431451797, + 0.014820784330368042, + 0.011990511789917946 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6565000414848328, + "loss_eval": 0.9446665048599243, + "epoch": 9 + }, + { + "hidden_norms": [ + 11.269571304321289, + 15.732318878173828, + 45.59952163696289, + 76.33224487304688, + 84.44403076171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008764212252572179, + 0.00035432647564448416, + 0.00017862815002445132, + 0.00016163433610927314, + 0.0001364263880532235 + ], + "bp_grad_F": [ + 0.06546498835086823, + 0.02990337274968624, + 0.01799662783741951, + 0.015155031345784664, + 0.012622621841728687 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6390000581741333, + "loss_eval": 1.0291955471038818, + "epoch": 10 + }, + { + "hidden_norms": [ + 11.269571304321289, + 16.836196899414062, + 55.33602523803711, + 84.32881164550781, + 92.9534912109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000854950922075659, + 0.00036200409522280097, + 0.00018266236293129623, + 0.0001705951290205121, + 0.00014654053666163236 + ], + "bp_grad_F": [ + 0.06433594971895218, + 0.0289771668612957, + 0.017391620203852654, + 0.015173865482211113, + 0.012928354553878307 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6330000162124634, + "loss_eval": 1.076339840888977, + "epoch": 11 + }, + { + "hidden_norms": [ + 11.269571304321289, + 19.05539894104004, + 69.66182708740234, + 97.1963119506836, + 102.74567413330078 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008397337514907122, + 0.00034183592651970685, + 0.00018204437219537795, + 0.00017718512390274554, + 0.0001551504828967154 + ], + "bp_grad_F": [ + 0.062221452593803406, + 0.027522921562194824, + 0.01681770198047161, + 0.01498384214937687, + 0.013089192099869251 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.643500030040741, + "loss_eval": 1.0531169176101685, + "epoch": 12 + }, + { + "hidden_norms": [ + 11.269571304321289, + 23.65813636779785, + 86.25741577148438, + 120.24312591552734, + 124.2949447631836 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008297308231703937, + 0.0003140757908113301, + 0.00017996964743360877, + 0.00017669204680714756, + 0.00015717324276920408 + ], + "bp_grad_F": [ + 0.06484393030405045, + 0.028613954782485962, + 0.01715104468166828, + 0.01567785255610943, + 0.014462707564234734 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6255000233650208, + "loss_eval": 1.3249526023864746, + "epoch": 13 + }, + { + "hidden_norms": [ + 11.269571304321289, + 30.92644500732422, + 102.1397705078125, + 147.9296417236328, + 157.7542266845703 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008446995634585619, + 0.000312876160023734, + 0.00019047399109695107, + 0.00018901094153989106, + 0.00017103466961998492 + ], + "bp_grad_F": [ + 0.063303142786026, + 0.02876628190279007, + 0.01635562814772129, + 0.015436392277479172, + 0.014697290025651455 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6045000553131104, + "loss_eval": 1.394450306892395, + "epoch": 14 + }, + { + "hidden_norms": [ + 11.269571304321289, + 40.05237579345703, + 123.65401458740234, + 173.33119201660156, + 188.9973907470703 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008657039143145084, + 0.0003323613782413304, + 0.0002161249576602131, + 0.0002138354757335037, + 0.00019650986359920353 + ], + "bp_grad_F": [ + 0.054496586322784424, + 0.025836922228336334, + 0.0159344132989645, + 0.015238149091601372, + 0.014629158191382885 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5950000286102295, + "loss_eval": 1.1977143287658691, + "epoch": 15 + }, + { + "hidden_norms": [ + 11.269571304321289, + 50.589420318603516, + 147.02255249023438, + 197.975830078125, + 217.0601806640625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008191568194888532, + 0.00030697352485731244, + 0.00021884859597776085, + 0.00021713844034820795, + 0.00020184220920782536 + ], + "bp_grad_F": [ + 0.04439451918005943, + 0.021627753973007202, + 0.015079431235790253, + 0.0144795598462224, + 0.014037052169442177 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6115000247955322, + "loss_eval": 1.1207692623138428, + "epoch": 16 + }, + { + "hidden_norms": [ + 11.269571304321289, + 61.36143112182617, + 169.08056640625, + 221.02748107910156, + 240.8756561279297 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007864299113862216, + 0.0002859561063814908, + 0.0002155074180336669, + 0.00021533406106755137, + 0.00020066267461515963 + ], + "bp_grad_F": [ + 0.04005742073059082, + 0.01873522810637951, + 0.014609597623348236, + 0.014084910042583942, + 0.013653460890054703 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6175000071525574, + "loss_eval": 1.059693694114685, + "epoch": 17 + }, + { + "hidden_norms": [ + 11.269571304321289, + 72.36003875732422, + 188.58563232421875, + 241.86294555664062, + 258.58087158203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007837018347345293, + 0.0002863232512027025, + 0.00022506402456201613, + 0.00022481133055407554, + 0.00021070068760309368 + ], + "bp_grad_F": [ + 0.039807844907045364, + 0.01775156892836094, + 0.01470963191241026, + 0.014359688386321068, + 0.01395167876034975 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6025000214576721, + "loss_eval": 1.1027324199676514, + "epoch": 18 + }, + { + "hidden_norms": [ + 11.269571304321289, + 81.18446350097656, + 200.67935180664062, + 257.0839538574219, + 267.81317138671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00082020164700225, + 0.0003102799819316715, + 0.0002470446634106338, + 0.0002463961427565664, + 0.00023495900677517056 + ], + "bp_grad_F": [ + 0.041444260627031326, + 0.01803578995168209, + 0.014944672584533691, + 0.014712288975715637, + 0.014517528004944324 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5820000171661377, + "loss_eval": 1.146970272064209, + "epoch": 19 + }, + { + "hidden_norms": [ + 11.269571304321289, + 91.12315368652344, + 208.71234130859375, + 269.7666931152344, + 278.79949951171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008638632134534419, + 0.0003278621006757021, + 0.00026185397291556, + 0.00026034258189611137, + 0.0002510476915631443 + ], + "bp_grad_F": [ + 0.04429177567362785, + 0.018727537244558334, + 0.015489915385842323, + 0.01529665943235159, + 0.015330186113715172 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5394999980926514, + "loss_eval": 1.2919961214065552, + "epoch": 20 + }, + { + "hidden_norms": [ + 11.269571304321289, + 104.20027160644531, + 224.12327575683594, + 292.86212158203125, + 302.2417297363281 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008091026684269309, + 0.0002788364654406905, + 0.0002307023387402296, + 0.0002291825512656942, + 0.0002224020572612062 + ], + "bp_grad_F": [ + 0.043314289301633835, + 0.018204446882009506, + 0.01538326870650053, + 0.015148352831602097, + 0.015248478390276432 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5615000128746033, + "loss_eval": 1.3774936199188232, + "epoch": 21 + }, + { + "hidden_norms": [ + 11.269571304321289, + 119.46916198730469, + 246.84373474121094, + 322.8492736816406, + 331.5632019042969 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007946055266074836, + 0.0002993302186951041, + 0.0002581049920991063, + 0.00025690835900604725, + 0.00025083290529437363 + ], + "bp_grad_F": [ + 0.04004265367984772, + 0.017564039677381516, + 0.015413369052112103, + 0.01514766737818718, + 0.015221393667161465 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5430000424385071, + "loss_eval": 1.3054314851760864, + "epoch": 22 + }, + { + "hidden_norms": [ + 11.269571304321289, + 136.81655883789062, + 275.0496826171875, + 359.30596923828125, + 365.4009704589844 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007907089893706143, + 0.00031880626920610666, + 0.00028100365307182074, + 0.0002786303812172264, + 0.00027127860812470317 + ], + "bp_grad_F": [ + 0.03825194016098976, + 0.017261793836951256, + 0.01555734220892191, + 0.01527914684265852, + 0.015313600189983845 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5270000100135803, + "loss_eval": 1.3047609329223633, + "epoch": 23 + }, + { + "hidden_norms": [ + 11.269571304321289, + 154.3377227783203, + 303.1491394042969, + 395.8551330566406, + 398.4109191894531 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007455120794475079, + 0.0002850848250091076, + 0.00025729817571118474, + 0.00025698516401462257, + 0.0002516870736144483 + ], + "bp_grad_F": [ + 0.03626802936196327, + 0.01676987297832966, + 0.015425236895680428, + 0.015152523294091225, + 0.015204805880784988 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5555000305175781, + "loss_eval": 1.2945412397384644, + "epoch": 24 + }, + { + "hidden_norms": [ + 11.269571304321289, + 172.51333618164062, + 332.53106689453125, + 434.6177978515625, + 432.9015197753906 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007499566418118775, + 0.00028473397833295166, + 0.0002601774758659303, + 0.0002574811805970967, + 0.00025375629775226116 + ], + "bp_grad_F": [ + 0.035628896206617355, + 0.016559967771172523, + 0.015500359237194061, + 0.015283019281923771, + 0.01530501153320074 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5250000357627869, + "loss_eval": 1.348174810409546, + "epoch": 25 + }, + { + "hidden_norms": [ + 11.269571304321289, + 191.6818084716797, + 362.3817138671875, + 473.73529052734375, + 468.3863830566406 + ], + "bp_grad_per_sample_l2_med": [ + 0.00077909289393574, + 0.0003061260504182428, + 0.0002848915464710444, + 0.000283668254269287, + 0.00027828654856421053 + ], + "bp_grad_F": [ + 0.03710347041487694, + 0.01679745502769947, + 0.01587643474340439, + 0.01569107361137867, + 0.015713181346654892 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.48750001192092896, + "loss_eval": 1.513879418373108, + "epoch": 26 + }, + { + "hidden_norms": [ + 11.269571304321289, + 212.49392700195312, + 393.7915954589844, + 515.7852172851562, + 507.1173095703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007443951326422393, + 0.000309632858261466, + 0.00028767462936230004, + 0.0002863617264665663, + 0.00028263547574169934 + ], + "bp_grad_F": [ + 0.034536320716142654, + 0.01654498465359211, + 0.015813451260328293, + 0.015621310099959373, + 0.0156637541949749 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5090000033378601, + "loss_eval": 1.345898151397705, + "epoch": 27 + }, + { + "hidden_norms": [ + 11.269571304321289, + 231.91209411621094, + 422.3776550292969, + 553.1364135742188, + 540.5762329101562 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007372196414507926, + 0.0002908413589466363, + 0.00027582875918596983, + 0.0002760514325927943, + 0.00027193804271519184 + ], + "bp_grad_F": [ + 0.034806184470653534, + 0.01654907502233982, + 0.01595865748822689, + 0.01580234244465828, + 0.01584061235189438 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4970000088214874, + "loss_eval": 1.4695581197738647, + "epoch": 28 + }, + { + "hidden_norms": [ + 11.269571304321289, + 251.87222290039062, + 452.5732116699219, + 591.4275512695312, + 574.1845703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007362416945397854, + 0.0002964947489090264, + 0.0002815316547639668, + 0.0002831071906257421, + 0.0002781452494673431 + ], + "bp_grad_F": [ + 0.034162748605012894, + 0.016219308599829674, + 0.01574064791202545, + 0.015600688755512238, + 0.015627028420567513 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.48100003600120544, + "loss_eval": 1.4220975637435913, + "epoch": 29 + }, + { + "hidden_norms": [ + 11.269571304321289, + 272.3019104003906, + 483.1678161621094, + 631.2042846679688, + 609.8804931640625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007130270241759717, + 0.0003075756540056318, + 0.00029428518610075116, + 0.00029221284785307944, + 0.0002892380871344358 + ], + "bp_grad_F": [ + 0.033144623041152954, + 0.01614796556532383, + 0.015754450112581253, + 0.015617748722434044, + 0.015651794150471687 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.49550002813339233, + "loss_eval": 1.398095726966858, + "epoch": 30 + }, + { + "hidden_norms": [ + 11.269571304321289, + 293.1174621582031, + 513.9456176757812, + 671.4954223632812, + 646.9434204101562 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007292498485185206, + 0.0003146968665532768, + 0.0003013227542396635, + 0.000301573658362031, + 0.00029794115107506514 + ], + "bp_grad_F": [ + 0.033789947628974915, + 0.016436096280813217, + 0.016089752316474915, + 0.015960095450282097, + 0.0159769207239151 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4570000171661377, + "loss_eval": 1.5174756050109863, + "epoch": 31 + }, + { + "hidden_norms": [ + 11.269571304321289, + 312.291748046875, + 542.6367797851562, + 708.0426025390625, + 679.9037475585938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007159899105317891, + 0.0003197023761458695, + 0.00030903122387826443, + 0.0003080730966757983, + 0.00030512994271703064 + ], + "bp_grad_F": [ + 0.03305007144808769, + 0.016458848491311073, + 0.0161746796220541, + 0.01604822278022766, + 0.016068853437900543 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.45350003242492676, + "loss_eval": 1.4785963296890259, + "epoch": 32 + }, + { + "hidden_norms": [ + 11.269571304321289, + 330.2493896484375, + 569.4765625, + 741.90380859375, + 710.49609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007181349792517722, + 0.0003215835604351014, + 0.00031238331575877964, + 0.00031264303834177554, + 0.0003104021889157593 + ], + "bp_grad_F": [ + 0.0329170823097229, + 0.016988366842269897, + 0.01674317568540573, + 0.01661907136440277, + 0.01665792241692543 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4320000112056732, + "loss_eval": 1.545434594154358, + "epoch": 33 + }, + { + "hidden_norms": [ + 11.269571304321289, + 348.3463439941406, + 596.8388061523438, + 776.8276977539062, + 742.1928100585938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006930733215995133, + 0.0003099350433330983, + 0.0003020780859515071, + 0.0003008935309480876, + 0.00029881703085266054 + ], + "bp_grad_F": [ + 0.03210154175758362, + 0.0165875144302845, + 0.016380906105041504, + 0.016269827261567116, + 0.01630542054772377 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.46150001883506775, + "loss_eval": 1.4990708827972412, + "epoch": 34 + }, + { + "hidden_norms": [ + 11.269571304321289, + 367.8572998046875, + 624.6773071289062, + 813.023193359375, + 774.825439453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006842412985861301, + 0.00032654378446750343, + 0.00031924000359140337, + 0.0003176531463395804, + 0.00031533741275779903 + ], + "bp_grad_F": [ + 0.03194142132997513, + 0.016769496724009514, + 0.01658361405134201, + 0.016465021297335625, + 0.016491062939167023 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4345000088214874, + "loss_eval": 1.5226876735687256, + "epoch": 35 + }, + { + "hidden_norms": [ + 11.269571304321289, + 386.9555969238281, + 652.0831298828125, + 847.6653442382812, + 805.962158203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007009130204096437, + 0.00033408711897209287, + 0.00032650009961798787, + 0.00032573731732554734, + 0.00032366803498007357 + ], + "bp_grad_F": [ + 0.032547831535339355, + 0.01727951131761074, + 0.017110776156187057, + 0.017009133473038673, + 0.017040319740772247 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4025000333786011, + "loss_eval": 1.6661202907562256, + "epoch": 36 + }, + { + "hidden_norms": [ + 11.269571304321289, + 405.57061767578125, + 678.9530639648438, + 881.5497436523438, + 835.913330078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006714131450280547, + 0.00031647825380787253, + 0.0003093808190897107, + 0.00030856815283186734, + 0.00030731584411114454 + ], + "bp_grad_F": [ + 0.030830882489681244, + 0.016467954963445663, + 0.016322584822773933, + 0.016228536143898964, + 0.01625511236488819 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.44850000739097595, + "loss_eval": 1.5340722799301147, + "epoch": 37 + }, + { + "hidden_norms": [ + 11.269571304321289, + 423.3720703125, + 705.0136108398438, + 914.5001831054688, + 865.4478759765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006793327047489583, + 0.0003244458057451993, + 0.0003182501532137394, + 0.00031923994538374245, + 0.00031612347811460495 + ], + "bp_grad_F": [ + 0.03101767599582672, + 0.01673293113708496, + 0.01659614033997059, + 0.016509832814335823, + 0.01653491146862507 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.42000001668930054, + "loss_eval": 1.6198900938034058, + "epoch": 38 + }, + { + "hidden_norms": [ + 11.269571304321289, + 440.53741455078125, + 729.8703002929688, + 945.1349487304688, + 892.7785034179688 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006624915986321867, + 0.00031068388489075005, + 0.00030363586847670376, + 0.00030243129003793, + 0.00030108148348517716 + ], + "bp_grad_F": [ + 0.030339404940605164, + 0.01675509847700596, + 0.016639690846204758, + 0.01655009388923645, + 0.016594169661402702 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4280000329017639, + "loss_eval": 1.6058467626571655, + "epoch": 39 + }, + { + "hidden_norms": [ + 11.269571304321289, + 457.5261535644531, + 754.3056640625, + 975.5144653320312, + 919.8758544921875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006706257117912173, + 0.0003283233381807804, + 0.00032177154207602143, + 0.0003207549743819982, + 0.0003196784819010645 + ], + "bp_grad_F": [ + 0.03072393499314785, + 0.016925832256674767, + 0.01681169681251049, + 0.01673683524131775, + 0.016768047586083412 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.39000001549720764, + "loss_eval": 1.7052431106567383, + "epoch": 40 + }, + { + "hidden_norms": [ + 11.269571304321289, + 474.70233154296875, + 778.4963989257812, + 1005.5798950195312, + 947.08251953125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006340838735923171, + 0.00030884164152666926, + 0.000303937413264066, + 0.00030318956123664975, + 0.0003018545394297689 + ], + "bp_grad_F": [ + 0.02923908829689026, + 0.016514884307980537, + 0.016419367864727974, + 0.016349095851182938, + 0.0163878221064806 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4390000104904175, + "loss_eval": 1.564381718635559, + "epoch": 41 + }, + { + "hidden_norms": [ + 11.269571304321289, + 489.3309631347656, + 799.4293823242188, + 1031.868408203125, + 970.6136474609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006363792927004397, + 0.00032453436870127916, + 0.000319232844049111, + 0.0003183995431754738, + 0.00031706615118309855 + ], + "bp_grad_F": [ + 0.02950570173561573, + 0.016813522204756737, + 0.016721611842513084, + 0.016652515158057213, + 0.016693497076630592 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.42100003361701965, + "loss_eval": 1.605594515800476, + "epoch": 42 + }, + { + "hidden_norms": [ + 11.269571304321289, + 502.8161315917969, + 819.462890625, + 1056.7576904296875, + 992.5881958007812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006477028946392238, + 0.00033125586924143136, + 0.0003257581265643239, + 0.000326100125676021, + 0.00032460023066960275 + ], + "bp_grad_F": [ + 0.029688136652112007, + 0.01694806106388569, + 0.01685865968465805, + 0.016797136515378952, + 0.016836510971188545 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3830000162124634, + "loss_eval": 1.673546552658081, + "epoch": 43 + }, + { + "hidden_norms": [ + 11.269571304321289, + 517.00634765625, + 839.9920654296875, + 1082.26025390625, + 1015.0608520507812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006337560480460525, + 0.0003340205585118383, + 0.00032972541521303356, + 0.00032889688736759126, + 0.0003277511859778315 + ], + "bp_grad_F": [ + 0.029322637245059013, + 0.01695762574672699, + 0.016879092901945114, + 0.01681896671652794, + 0.016858574002981186 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.38350000977516174, + "loss_eval": 1.6975816488265991, + "epoch": 44 + }, + { + "hidden_norms": [ + 11.269571304321289, + 529.66064453125, + 858.3285522460938, + 1104.83544921875, + 1035.074951171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006231985753402114, + 0.00033350964076817036, + 0.00032944625127129257, + 0.00032876565819606185, + 0.00032806835952214897 + ], + "bp_grad_F": [ + 0.029069310054183006, + 0.016890447586774826, + 0.016818689182400703, + 0.016763897612690926, + 0.016804050654172897 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3930000066757202, + "loss_eval": 1.676193356513977, + "epoch": 45 + }, + { + "hidden_norms": [ + 11.269571304321289, + 541.9931030273438, + 875.95556640625, + 1126.6197509765625, + 1054.3516845703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006226357654668391, + 0.00032438969356007874, + 0.0003203299711458385, + 0.0003203903906978667, + 0.00031863307231105864 + ], + "bp_grad_F": [ + 0.028472919017076492, + 0.016746005043387413, + 0.016683315858244896, + 0.016633223742246628, + 0.016673142090439796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4165000319480896, + "loss_eval": 1.6569225788116455, + "epoch": 46 + }, + { + "hidden_norms": [ + 11.269571304321289, + 555.5247802734375, + 895.108642578125, + 1150.2750244140625, + 1075.3402099609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006058313883841038, + 0.00031499756732955575, + 0.00031102998764254153, + 0.0003108317614533007, + 0.00030999473528936505 + ], + "bp_grad_F": [ + 0.028057299554347992, + 0.016642672941088676, + 0.016584018245339394, + 0.016536688432097435, + 0.016577772796154022 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.41850000619888306, + "loss_eval": 1.622230887413025, + "epoch": 47 + }, + { + "hidden_norms": [ + 11.269571304321289, + 566.745361328125, + 911.0077514648438, + 1169.5748291015625, + 1092.4599609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000616180885117501, + 0.0003297157527413219, + 0.00032601068960502744, + 0.0003262106911279261, + 0.00032522634137421846 + ], + "bp_grad_F": [ + 0.02835526503622532, + 0.016961509361863136, + 0.016903148964047432, + 0.01685917004942894, + 0.01690032333135605 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.39250001311302185, + "loss_eval": 1.714435338973999, + "epoch": 48 + }, + { + "hidden_norms": [ + 11.269571304321289, + 578.6380004882812, + 927.9735107421875, + 1190.5294189453125, + 1111.001220703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006051660166122019, + 0.0003138712199870497, + 0.0003094248822890222, + 0.000309422001009807, + 0.0003081281029153615 + ], + "bp_grad_F": [ + 0.027995921671390533, + 0.016778133809566498, + 0.016729604452848434, + 0.01668645441532135, + 0.016727875918149948 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.40450000762939453, + "loss_eval": 1.6801645755767822, + "epoch": 49 + }, + { + "hidden_norms": [ + 11.269571304321289, + 591.34326171875, + 945.9314575195312, + 1212.5030517578125, + 1130.69580078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000600961095187813, + 0.00032534165075048804, + 0.0003221939841751009, + 0.00032207692856900394, + 0.00032122948323376477 + ], + "bp_grad_F": [ + 0.027977745980024338, + 0.017148323357105255, + 0.017105158418416977, + 0.017058631405234337, + 0.01710781268775463 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3930000066757202, + "loss_eval": 1.7086997032165527, + "epoch": 50 + }, + { + "hidden_norms": [ + 11.269571304321289, + 602.791015625, + 962.1253051757812, + 1232.407958984375, + 1148.6063232421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005954196094535291, + 0.00032203743467107415, + 0.0003193309239577502, + 0.00031976529862731695, + 0.00031836770358495414 + ], + "bp_grad_F": [ + 0.027640262618660927, + 0.016875414177775383, + 0.01683391071856022, + 0.016794128343462944, + 0.016835639253258705 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.38750001788139343, + "loss_eval": 1.7161617279052734, + "epoch": 51 + }, + { + "hidden_norms": [ + 11.269571304321289, + 613.0055541992188, + 976.7833251953125, + 1250.490966796875, + 1164.8575439453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005885999999009073, + 0.00031236460199579597, + 0.00030869650072418153, + 0.00030896696262061596, + 0.0003076815919484943 + ], + "bp_grad_F": [ + 0.027101732790470123, + 0.01670675352215767, + 0.016670193523168564, + 0.01663014106452465, + 0.016672657802700996 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.41100001335144043, + "loss_eval": 1.6481956243515015, + "epoch": 52 + }, + { + "hidden_norms": [ + 11.269571304321289, + 622.8380126953125, + 990.931640625, + 1267.7691650390625, + 1180.291015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000587237358558923, + 0.0003190709976479411, + 0.0003160224005114287, + 0.00031612091697752476, + 0.00031501890043728054 + ], + "bp_grad_F": [ + 0.027042290195822716, + 0.016803324222564697, + 0.016769535839557648, + 0.016731148585677147, + 0.016775181517004967 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.40450000762939453, + "loss_eval": 1.6591061353683472, + "epoch": 53 + }, + { + "hidden_norms": [ + 11.269571304321289, + 632.4323120117188, + 1004.666259765625, + 1284.4637451171875, + 1195.189697265625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005885775317437947, + 0.0003397047985345125, + 0.0003383393050171435, + 0.00033765248372219503, + 0.00033701834036037326 + ], + "bp_grad_F": [ + 0.027301670983433723, + 0.017337650060653687, + 0.017313728109002113, + 0.017269184812903404, + 0.0173148512840271 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3565000295639038, + "loss_eval": 1.7250425815582275, + "epoch": 54 + }, + { + "hidden_norms": [ + 11.269571304321289, + 639.983154296875, + 1015.8214721679688, + 1297.94091796875, + 1207.160400390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005771536380052567, + 0.00031455705175176263, + 0.0003114652936346829, + 0.0003115544968750328, + 0.00031060961191542447 + ], + "bp_grad_F": [ + 0.026900731027126312, + 0.01682351529598236, + 0.01679442636668682, + 0.016759345307946205, + 0.016801798716187477 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.398000031709671, + "loss_eval": 1.6931191682815552, + "epoch": 55 + }, + { + "hidden_norms": [ + 11.269571304321289, + 648.44189453125, + 1027.905517578125, + 1312.5484619140625, + 1220.3349609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005807234556414187, + 0.0003243165265303105, + 0.00032131426269188523, + 0.0003215263714082539, + 0.0003202861698810011 + ], + "bp_grad_F": [ + 0.02689860761165619, + 0.016972798854112625, + 0.016945669427514076, + 0.016909556463360786, + 0.01695423573255539 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3850000202655792, + "loss_eval": 1.713501214981079, + "epoch": 56 + }, + { + "hidden_norms": [ + 11.269571304321289, + 656.1256103515625, + 1038.9337158203125, + 1326.0384521484375, + 1232.491455078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005809550639241934, + 0.0003213974996469915, + 0.0003191177383996546, + 0.0003187706752214581, + 0.0003176441532559693 + ], + "bp_grad_F": [ + 0.026944397017359734, + 0.016979368403553963, + 0.01695428043603897, + 0.01692255586385727, + 0.016963332891464233 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3800000250339508, + "loss_eval": 1.7483241558074951, + "epoch": 57 + }, + { + "hidden_norms": [ + 11.269571304321289, + 663.1458740234375, + 1049.1085205078125, + 1338.4049072265625, + 1243.709228515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005775660974904895, + 0.00032701215241104364, + 0.000323877960909158, + 0.00032368660322390497, + 0.00032316104625351727 + ], + "bp_grad_F": [ + 0.026842813938856125, + 0.017009008675813675, + 0.016984863206744194, + 0.016950154677033424, + 0.016992947086691856 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.36650002002716064, + "loss_eval": 1.7447302341461182, + "epoch": 58 + }, + { + "hidden_norms": [ + 11.269571304321289, + 669.32080078125, + 1058.1265869140625, + 1349.383544921875, + 1253.68603515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005691531114280224, + 0.0003169954870827496, + 0.0003141614724881947, + 0.00031412398675456643, + 0.00031352281803265214 + ], + "bp_grad_F": [ + 0.026560034602880478, + 0.01695145107805729, + 0.016930771991610527, + 0.016894754022359848, + 0.016942735761404037 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3830000162124634, + "loss_eval": 1.7227482795715332, + "epoch": 59 + }, + { + "hidden_norms": [ + 11.269571304321289, + 675.035888671875, + 1066.407958984375, + 1359.420654296875, + 1262.8460693359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.000574529985897243, + 0.000330567971104756, + 0.0003291864413768053, + 0.0003286501159891486, + 0.00032822080538608134 + ], + "bp_grad_F": [ + 0.02670128643512726, + 0.017140112817287445, + 0.017120162025094032, + 0.01708981581032276, + 0.017130881547927856 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.37800002098083496, + "loss_eval": 1.7512460947036743, + "epoch": 60 + }, + { + "hidden_norms": [ + 11.269571304321289, + 680.7155151367188, + 1074.5833740234375, + 1369.3917236328125, + 1271.9488525390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005727651296183467, + 0.00031855711131356657, + 0.0003159786283504218, + 0.00031576541368849576, + 0.0003150397096760571 + ], + "bp_grad_F": [ + 0.02646380476653576, + 0.016906103119254112, + 0.016886914148926735, + 0.016857335343956947, + 0.016896924003958702 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.39100003242492676, + "loss_eval": 1.7765766382217407, + "epoch": 61 + }, + { + "hidden_norms": [ + 11.269571304321289, + 685.6483154296875, + 1081.7335205078125, + 1378.0848388671875, + 1279.824462890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005669392994605005, + 0.00032193740480579436, + 0.0003195095050614327, + 0.00031930883415043354, + 0.00031847937498241663 + ], + "bp_grad_F": [ + 0.02628612145781517, + 0.01694479025900364, + 0.016926957294344902, + 0.016897274181246758, + 0.016937877982854843 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.38200002908706665, + "loss_eval": 1.6996668577194214, + "epoch": 62 + }, + { + "hidden_norms": [ + 11.269571304321289, + 690.3829345703125, + 1088.4320068359375, + 1386.209228515625, + 1287.180908203125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005609798245131969, + 0.0003164574736729264, + 0.00031414616387337446, + 0.0003141844645142555, + 0.0003133733116555959 + ], + "bp_grad_F": [ + 0.025919275358319283, + 0.01681407354772091, + 0.016797930002212524, + 0.01676807552576065, + 0.016810856759548187 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4035000205039978, + "loss_eval": 1.6783148050308228, + "epoch": 63 + }, + { + "hidden_norms": [ + 11.269571304321289, + 694.658935546875, + 1094.5535888671875, + 1393.6761474609375, + 1293.9659423828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005624280893243849, + 0.00031574408058077097, + 0.0003139691543765366, + 0.00031461575417779386, + 0.00031346286414191127 + ], + "bp_grad_F": [ + 0.02617610991001129, + 0.016873449087142944, + 0.016857409849762917, + 0.01682792603969574, + 0.016867902129888535 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3830000162124634, + "loss_eval": 1.7127265930175781, + "epoch": 64 + }, + { + "hidden_norms": [ + 11.269571304321289, + 698.4141235351562, + 1099.921875, + 1400.2060546875, + 1299.92919921875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005497613456100225, + 0.00031591873266734183, + 0.00031333384686149657, + 0.00031392619712278247, + 0.00031339324777945876 + ], + "bp_grad_F": [ + 0.025806115940213203, + 0.016780776903033257, + 0.016766363754868507, + 0.016736920922994614, + 0.01677793264389038 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4165000319480896, + "loss_eval": 1.6823266744613647, + "epoch": 65 + }, + { + "hidden_norms": [ + 11.269571304321289, + 701.8402099609375, + 1104.8636474609375, + 1406.2545166015625, + 1305.4110107421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005536439130082726, + 0.0003222717496100813, + 0.0003193898010067642, + 0.0003197654150426388, + 0.00031906200456433 + ], + "bp_grad_F": [ + 0.02591872774064541, + 0.016899071633815765, + 0.01688431203365326, + 0.01685412786900997, + 0.016896730288863182 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3895000219345093, + "loss_eval": 1.6973413228988647, + "epoch": 66 + }, + { + "hidden_norms": [ + 11.269571304321289, + 704.84814453125, + 1109.2054443359375, + 1411.5528564453125, + 1310.220458984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005509129259735346, + 0.0003127358213532716, + 0.00031018650042824447, + 0.00031017058063298464, + 0.0003093581763096154 + ], + "bp_grad_F": [ + 0.02567744068801403, + 0.01674523949623108, + 0.01673281565308571, + 0.016704324632883072, + 0.01674455776810646 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.40400001406669617, + "loss_eval": 1.6765486001968384, + "epoch": 67 + }, + { + "hidden_norms": [ + 11.269571304321289, + 707.4666137695312, + 1112.9517822265625, + 1416.120361328125, + 1314.365478515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005525590386241674, + 0.0003146192757412791, + 0.000312337331706658, + 0.0003126179799437523, + 0.00031193779432214797 + ], + "bp_grad_F": [ + 0.025625307112932205, + 0.016738714650273323, + 0.01672603376209736, + 0.016697421669960022, + 0.016738519072532654 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.406000018119812, + "loss_eval": 1.681616187095642, + "epoch": 68 + }, + { + "hidden_norms": [ + 11.269571304321289, + 709.6942749023438, + 1116.1553955078125, + 1420.0328369140625, + 1317.9129638671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005520040867850184, + 0.0003149699477944523, + 0.0003132218262180686, + 0.00031297295936383307, + 0.0003122398047707975 + ], + "bp_grad_F": [ + 0.02563839592039585, + 0.01678294688463211, + 0.016770213842391968, + 0.01674121432006359, + 0.01678287237882614 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3985000252723694, + "loss_eval": 1.6824655532836914, + "epoch": 69 + }, + { + "hidden_norms": [ + 11.269571304321289, + 711.4514770507812, + 1118.6820068359375, + 1423.118408203125, + 1320.7220458984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005478749517351389, + 0.0003126654773950577, + 0.00031092006247490644, + 0.0003107163356617093, + 0.00030992255778983235 + ], + "bp_grad_F": [ + 0.025653105229139328, + 0.016804352402687073, + 0.01679334044456482, + 0.016765642911195755, + 0.016805216670036316 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3970000147819519, + "loss_eval": 1.6816198825836182, + "epoch": 70 + }, + { + "hidden_norms": [ + 11.269571304321289, + 712.941162109375, + 1120.8258056640625, + 1425.7293701171875, + 1323.110595703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005502297426573932, + 0.00031594440224580467, + 0.00031323955045081675, + 0.0003133862919639796, + 0.00031268122256733477 + ], + "bp_grad_F": [ + 0.025557825341820717, + 0.01675795204937458, + 0.01674625650048256, + 0.01671820878982544, + 0.016758527606725693 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4025000333786011, + "loss_eval": 1.6777657270431519, + "epoch": 71 + }, + { + "hidden_norms": [ + 11.269571304321289, + 714.2026977539062, + 1122.637451171875, + 1427.94921875, + 1325.1287841796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005491463234648108, + 0.0003148230316583067, + 0.00031261687399819493, + 0.0003126751398667693, + 0.00031198892975226045 + ], + "bp_grad_F": [ + 0.025629354640841484, + 0.016796274110674858, + 0.016784505918622017, + 0.016756094992160797, + 0.01679658703505993 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.3985000252723694, + "loss_eval": 1.6832109689712524, + "epoch": 72 + }, + { + "hidden_norms": [ + 11.269571304321289, + 715.1837158203125, + 1124.0401611328125, + 1429.676025390625, + 1326.6959228515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005472805933095515, + 0.00031123129883781075, + 0.0003085967618972063, + 0.00030910191708244383, + 0.00030826785950921476 + ], + "bp_grad_F": [ + 0.025491509586572647, + 0.01673061214387417, + 0.016719412058591843, + 0.01669108308851719, + 0.016732096672058105 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.41350001096725464, + "loss_eval": 1.6768076419830322, + "epoch": 73 + }, + { + "hidden_norms": [ + 11.269571304321289, + 715.9666137695312, + 1125.15869140625, + 1431.054931640625, + 1327.940185546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005469402531161904, + 0.0003141815832350403, + 0.0003117373853456229, + 0.0003121092449873686, + 0.00031146654509939253 + ], + "bp_grad_F": [ + 0.02553613670170307, + 0.016766469925642014, + 0.016755321994423866, + 0.01672743633389473, + 0.01676766574382782 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.40050002932548523, + "loss_eval": 1.6803343296051025, + "epoch": 74 + }, + { + "hidden_norms": [ + 11.269571304321289, + 716.54345703125, + 1125.9932861328125, + 1432.0760498046875, + 1328.8612060546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.000544340000487864, + 0.0003152569697704166, + 0.00031408306676894426, + 0.00031385221518576145, + 0.0003130683908239007 + ], + "bp_grad_F": [ + 0.025559071451425552, + 0.016799958422780037, + 0.01678895764052868, + 0.016760708764195442, + 0.01680118963122368 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.40050002932548523, + "loss_eval": 1.6816425323486328, + "epoch": 75 + }, + { + "hidden_norms": [ + 11.269571304321289, + 716.944580078125, + 1126.5697021484375, + 1432.786376953125, + 1329.5032958984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005474911304190755, + 0.00031179687357507646, + 0.0003097430744674057, + 0.00030947139021009207, + 0.00030854580109007657 + ], + "bp_grad_F": [ + 0.025479920208454132, + 0.01673789508640766, + 0.016726836562156677, + 0.016698846593499184, + 0.01673932373523712 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4010000228881836, + "loss_eval": 1.6769893169403076, + "epoch": 76 + }, + { + "hidden_norms": [ + 11.269571304321289, + 717.2020263671875, + 1126.9422607421875, + 1433.2410888671875, + 1329.9195556640625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000546319643035531, + 0.00031345203751698136, + 0.000311522395350039, + 0.000311847630655393, + 0.0003111722180619836 + ], + "bp_grad_F": [ + 0.025481175631284714, + 0.01675844006240368, + 0.016747308894991875, + 0.016719479113817215, + 0.0167598407715559 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4075000286102295, + "loss_eval": 1.6769570112228394, + "epoch": 77 + }, + { + "hidden_norms": [ + 11.269571304321289, + 717.3436889648438, + 1127.1475830078125, + 1433.49072265625, + 1330.1451416015625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005438647349365056, + 0.00031364860478788614, + 0.0003113296115770936, + 0.0003115428553428501, + 0.00031094413134269416 + ], + "bp_grad_F": [ + 0.025495020672678947, + 0.016764776781201363, + 0.016753805801272392, + 0.016725784167647362, + 0.016766248270869255 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.40800002217292786, + "loss_eval": 1.6758222579956055, + "epoch": 78 + }, + { + "hidden_norms": [ + 11.269571304321289, + 717.4073486328125, + 1127.239501953125, + 1433.60302734375, + 1330.2476806640625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005444776033982635, + 0.0003124381182715297, + 0.0003098779125139117, + 0.0003102763439528644, + 0.0003094278508797288 + ], + "bp_grad_F": [ + 0.025471549481153488, + 0.016743116080760956, + 0.016732197254896164, + 0.016704153269529343, + 0.016744764521718025 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.41450002789497375, + "loss_eval": 1.675687551498413, + "epoch": 79 + }, + { + "hidden_norms": [ + 11.269571304321289, + 717.4231567382812, + 1127.262451171875, + 1433.6309814453125, + 1330.273193359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005445098504424095, + 0.0003131923731416464, + 0.00031077052699401975, + 0.0003107219818048179, + 0.00031013842090032995 + ], + "bp_grad_F": [ + 0.02547312155365944, + 0.016745658591389656, + 0.016734709963202477, + 0.016706665977835655, + 0.016747286543250084 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4140000343322754, + "loss_eval": 1.6754448413848877, + "epoch": 80 + } + ], + "seed": 42, + "alpha": 1.0, + "depth": 4, + "d_hidden": 128 +} \ No newline at end of file diff --git a/results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json b/results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json new file mode 100644 index 0000000..9972e9a --- /dev/null +++ b/results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json @@ -0,0 +1,4960 @@ +{ + "config": { + "output_dir": "results/snapshot_synth_v1", + "epochs": 80, + "alpha": 1.0, + "depth": 4, + "seed": 42, + "d_hidden": 128, + "lr": 0.001, + "wd": 0.01 + }, + "depth": 4, + "d_hidden": 128, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 11.269571304321289, + 11.290447235107422, + 11.313605308532715, + 11.351215362548828, + 11.398087501525879 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028353024390526116, + 0.0002828188880812377, + 0.00028162598027847707, + 0.0002799496578518301, + 0.0002791006409097463 + ], + "bp_grad_F": [ + 0.012684082612395287, + 0.01264861598610878, + 0.012589854188263416, + 0.012511610053479671, + 0.012471316382288933 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.08450000733137131, + "loss_eval": 2.4790313243865967, + "epoch": 0 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.301911354064941, + 11.659679412841797, + 12.48208999633789, + 13.934065818786621 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006583131616935134, + 0.0004948809510096908, + 0.00036159728188067675, + 0.00026353230350650847, + 0.00020344744552858174 + ], + "bp_grad_F": [ + 0.03319504112005234, + 0.0246991366147995, + 0.017943235114216805, + 0.012967471033334732, + 0.009912492707371712 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7095000147819519, + "loss_eval": 0.8666461110115051, + "epoch": 1 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.28874397277832, + 12.022683143615723, + 13.943255424499512, + 17.510770797729492 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007016682648099959, + 0.00048243277706205845, + 0.00031948124524205923, + 0.00020489063172135502, + 0.00014097581151872873 + ], + "bp_grad_F": [ + 0.05366413667798042, + 0.03651106730103493, + 0.023700030520558357, + 0.015033061616122723, + 0.010093427263200283 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7725000381469727, + "loss_eval": 0.6004051566123962, + "epoch": 2 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.268131256103516, + 12.138687133789062, + 14.603575706481934, + 19.109115600585938 + ], + "bp_grad_per_sample_l2_med": [ + 0.000659371551591903, + 0.0004339825245551765, + 0.00027271744329482317, + 0.0001733575772959739, + 0.0001116431230911985 + ], + "bp_grad_F": [ + 0.06363420188426971, + 0.04213711991906166, + 0.0264370646327734, + 0.016141116619110107, + 0.010473517701029778 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7745000123977661, + "loss_eval": 0.5640328526496887, + "epoch": 3 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.245299339294434, + 12.213927268981934, + 14.944411277770996, + 19.937482833862305 + ], + "bp_grad_per_sample_l2_med": [ + 0.000589758506976068, + 0.00038736555143259466, + 0.000245077651925385, + 0.00015142903430387378, + 9.591270645614713e-05 + ], + "bp_grad_F": [ + 0.06846851110458374, + 0.04497711360454559, + 0.027850953862071037, + 0.01671868935227394, + 0.01068752072751522 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7835000157356262, + "loss_eval": 0.5508342981338501, + "epoch": 4 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.22258186340332, + 12.241990089416504, + 15.219721794128418, + 20.66508674621582 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005271711852401495, + 0.00034995534224435687, + 0.00021946353081148118, + 0.00013214732462074608, + 8.23614391265437e-05 + ], + "bp_grad_F": [ + 0.07378005236387253, + 0.04831067472696304, + 0.02961091324687004, + 0.01746201328933239, + 0.010955682955682278 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7855000495910645, + "loss_eval": 0.5423576831817627, + "epoch": 5 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.190115928649902, + 12.27110481262207, + 15.450979232788086, + 21.203943252563477 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005092737264931202, + 0.00033784759580157697, + 0.00020663061877712607, + 0.0001207139139296487, + 7.417408050969243e-05 + ], + "bp_grad_F": [ + 0.07774882018566132, + 0.051034994423389435, + 0.031082650646567345, + 0.018063966184854507, + 0.01114849466830492 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7845000624656677, + "loss_eval": 0.5346181392669678, + "epoch": 6 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.167141914367676, + 12.275080680847168, + 15.592608451843262, + 21.725374221801758 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005083799478597939, + 0.00033595148124732077, + 0.0002061770501313731, + 0.00011957385140703991, + 7.27532897144556e-05 + ], + "bp_grad_F": [ + 0.08175421506166458, + 0.053990282118320465, + 0.03277580440044403, + 0.01879614032804966, + 0.011419840157032013 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7905000448226929, + "loss_eval": 0.5348329544067383, + "epoch": 7 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.135689735412598, + 12.291831016540527, + 15.776432991027832, + 22.2913761138916 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004477855109144002, + 0.0003000828146468848, + 0.00018366402946412563, + 0.00010473958536749706, + 6.266004493227229e-05 + ], + "bp_grad_F": [ + 0.08535438776016235, + 0.05686107277870178, + 0.03441749885678291, + 0.019436663016676903, + 0.011580240912735462 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796500027179718, + "loss_eval": 0.5225732326507568, + "epoch": 8 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.113900184631348, + 12.296534538269043, + 15.874000549316406, + 22.73569107055664 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041620698175393045, + 0.00028262173873372376, + 0.0001732171222101897, + 9.77468880591914e-05, + 5.725537994294427e-05 + ], + "bp_grad_F": [ + 0.09095799922943115, + 0.061118144541978836, + 0.036917947232723236, + 0.020527740940451622, + 0.011972126550972462 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7945000529289246, + "loss_eval": 0.5336357355117798, + "epoch": 9 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.088306427001953, + 12.3102388381958, + 16.0321102142334, + 23.320507049560547 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003761165135074407, + 0.0002580824075266719, + 0.00015763533883728087, + 8.57545601320453e-05, + 5.005364437238313e-05 + ], + "bp_grad_F": [ + 0.09630071371793747, + 0.06542361527681351, + 0.039454828947782516, + 0.02160210721194744, + 0.012356426566839218 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7915000319480896, + "loss_eval": 0.5405644774436951, + "epoch": 10 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.062504768371582, + 12.296314239501953, + 16.1483211517334, + 23.885089874267578 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003359524707775563, + 0.00023470049200113863, + 0.00014604303578380495, + 7.898044714238495e-05, + 4.356990029918961e-05 + ], + "bp_grad_F": [ + 0.09961758553981781, + 0.06847036629915237, + 0.04127706214785576, + 0.02224603295326233, + 0.01243517268449068 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8020000457763672, + "loss_eval": 0.5290275812149048, + "epoch": 11 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.040243148803711, + 12.293885231018066, + 16.26875114440918, + 24.44219207763672 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028416418354026973, + 0.0001959044166142121, + 0.00011818648636108264, + 6.387147004716098e-05, + 3.619954804889858e-05 + ], + "bp_grad_F": [ + 0.10626755654811859, + 0.07399805635213852, + 0.044546131044626236, + 0.023592140525579453, + 0.012874037958681583 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8005000352859497, + "loss_eval": 0.5458852648735046, + "epoch": 12 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.011943817138672, + 12.278276443481445, + 16.34218978881836, + 24.94852066040039 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002902932756114751, + 0.00020653512910939753, + 0.0001265774480998516, + 6.573591963388026e-05, + 3.462762470007874e-05 + ], + "bp_grad_F": [ + 0.1133178174495697, + 0.07985687255859375, + 0.048010025173425674, + 0.025017691776156425, + 0.013337739743292332 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 0.5682750940322876, + "epoch": 13 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.992447853088379, + 12.299921035766602, + 16.492944717407227, + 25.524486541748047 + ], + "bp_grad_per_sample_l2_med": [ + 0.00023213925305753946, + 0.00016858529124874622, + 0.00010339246364310384, + 5.375607725000009e-05, + 2.8085371013730764e-05 + ], + "bp_grad_F": [ + 0.11885266751050949, + 0.08489131927490234, + 0.051101066172122955, + 0.02628019079566002, + 0.013745996169745922 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.5884183645248413, + "epoch": 14 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.968864440917969, + 12.2804536819458, + 16.559459686279297, + 26.08506965637207 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020740363106597215, + 0.00015108383377082646, + 9.300659439759329e-05, + 4.728052954305895e-05, + 2.4296168703585863e-05 + ], + "bp_grad_F": [ + 0.12586721777915955, + 0.09100162982940674, + 0.0545843243598938, + 0.027565589174628258, + 0.014059619046747684 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.5945348143577576, + "epoch": 15 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.95374870300293, + 12.280479431152344, + 16.662782669067383, + 26.677371978759766 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001737641723593697, + 0.00012793064524885267, + 7.821117469575256e-05, + 3.888122591888532e-05, + 2.000005952140782e-05 + ], + "bp_grad_F": [ + 0.1330755203962326, + 0.09730331599712372, + 0.05829176306724548, + 0.028968123719096184, + 0.014443416148424149 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7985000610351562, + "loss_eval": 0.6085594296455383, + "epoch": 16 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.9340181350708, + 12.276576042175293, + 16.712459564208984, + 27.161230087280273 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001674877858022228, + 0.00012590538244694471, + 7.574073242722079e-05, + 3.732396726263687e-05, + 1.86969518836122e-05 + ], + "bp_grad_F": [ + 0.13938488066196442, + 0.10323134809732437, + 0.061863236129283905, + 0.0303154569119215, + 0.01477954164147377 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7935000658035278, + "loss_eval": 0.6137893199920654, + "epoch": 17 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.915549278259277, + 12.273784637451172, + 16.833044052124023, + 27.70804214477539 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013765814946964383, + 0.00010384680354036391, + 6.252297316677868e-05, + 3.0995015549706295e-05, + 1.5171532140811905e-05 + ], + "bp_grad_F": [ + 0.1456620693206787, + 0.10904198884963989, + 0.06525038182735443, + 0.03156846761703491, + 0.015115385875105858 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8065000176429749, + "loss_eval": 0.646562933921814, + "epoch": 18 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.900074005126953, + 12.271150588989258, + 16.89704704284668, + 28.26544761657715 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012433489609975368, + 9.527598012937233e-05, + 5.774956298409961e-05, + 2.7581723770708777e-05, + 1.282800621993374e-05 + ], + "bp_grad_F": [ + 0.15205088257789612, + 0.11483236402273178, + 0.06858030706644058, + 0.03275969997048378, + 0.015405165031552315 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8020000457763672, + "loss_eval": 0.6640118360519409, + "epoch": 19 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.890129089355469, + 12.265545845031738, + 16.95741844177246, + 28.79555320739746 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010217817907687277, + 7.912378350738436e-05, + 4.763850665767677e-05, + 2.3046186470310204e-05, + 1.088724638975691e-05 + ], + "bp_grad_F": [ + 0.1597365438938141, + 0.12170909345149994, + 0.07251270860433578, + 0.034210700541734695, + 0.015816442668437958 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7950000166893005, + "loss_eval": 0.6770148277282715, + "epoch": 20 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.874495506286621, + 12.249778747558594, + 17.042072296142578, + 29.30438995361328 + ], + "bp_grad_per_sample_l2_med": [ + 9.667076665209606e-05, + 7.482587534468621e-05, + 4.6152406866895035e-05, + 2.1790863684145734e-05, + 1.0080756510433275e-05 + ], + "bp_grad_F": [ + 0.16798135638237, + 0.1287383735179901, + 0.07646958529949188, + 0.03567665442824364, + 0.016245704144239426 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.7074151635169983, + "epoch": 21 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.860309600830078, + 12.262276649475098, + 17.10471534729004, + 29.77037811279297 + ], + "bp_grad_per_sample_l2_med": [ + 8.177604468073696e-05, + 6.404842861229554e-05, + 3.929789818357676e-05, + 1.8207463654107414e-05, + 8.330911441589706e-06 + ], + "bp_grad_F": [ + 0.17336878180503845, + 0.13393178582191467, + 0.07944471389055252, + 0.03667045012116432, + 0.016434919089078903 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8005000352859497, + "loss_eval": 0.7185518741607666, + "epoch": 22 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.851460456848145, + 12.24251651763916, + 17.171558380126953, + 30.212722778320312 + ], + "bp_grad_per_sample_l2_med": [ + 7.376902067335322e-05, + 5.6489287089789286e-05, + 3.395874227862805e-05, + 1.6138041246449575e-05, + 6.9637526394217275e-06 + ], + "bp_grad_F": [ + 0.17967616021633148, + 0.13954690098762512, + 0.08263248950242996, + 0.037825122475624084, + 0.016747957095503807 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.7408589124679565, + "epoch": 23 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.842126846313477, + 12.243563652038574, + 17.238094329833984, + 30.57369613647461 + ], + "bp_grad_per_sample_l2_med": [ + 6.96977149345912e-05, + 5.455461359815672e-05, + 3.149309486616403e-05, + 1.4526599443343002e-05, + 6.351157480821712e-06 + ], + "bp_grad_F": [ + 0.1842736005783081, + 0.14376932382583618, + 0.08495213091373444, + 0.038578059524297714, + 0.01690361276268959 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.7459465265274048, + "epoch": 24 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.834511756896973, + 12.231362342834473, + 17.27652931213379, + 30.958032608032227 + ], + "bp_grad_per_sample_l2_med": [ + 6.340271647786722e-05, + 5.11680482304655e-05, + 3.0357710784301162e-05, + 1.3866035260434728e-05, + 5.900054475205252e-06 + ], + "bp_grad_F": [ + 0.1903817504644394, + 0.14911234378814697, + 0.08797255158424377, + 0.03965744748711586, + 0.01718064583837986 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.799500048160553, + "loss_eval": 0.7703561186790466, + "epoch": 25 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.825489044189453, + 12.22317886352539, + 17.32727813720703, + 31.295225143432617 + ], + "bp_grad_per_sample_l2_med": [ + 5.839894583914429e-05, + 4.5580356527352706e-05, + 2.747728103713598e-05, + 1.2357729247014504e-05, + 5.190840511204442e-06 + ], + "bp_grad_F": [ + 0.19528549909591675, + 0.15347032248973846, + 0.09032707661390305, + 0.04043765366077423, + 0.017367515712976456 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796500027179718, + "loss_eval": 0.7836824655532837, + "epoch": 26 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.819538116455078, + 12.222261428833008, + 17.363719940185547, + 31.59310531616211 + ], + "bp_grad_per_sample_l2_med": [ + 5.029122257838026e-05, + 3.970409306930378e-05, + 2.4377433874178678e-05, + 1.1113867913081776e-05, + 4.727653049485525e-06 + ], + "bp_grad_F": [ + 0.19932542741298676, + 0.15725064277648926, + 0.09246863424777985, + 0.0411805622279644, + 0.017557309940457344 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.797913134098053, + "epoch": 27 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.811884880065918, + 12.215055465698242, + 17.399166107177734, + 31.893146514892578 + ], + "bp_grad_per_sample_l2_med": [ + 4.582677502185106e-05, + 3.702253525261767e-05, + 2.1835987354279496e-05, + 9.762208719621412e-06, + 4.239610916556558e-06 + ], + "bp_grad_F": [ + 0.20321832597255707, + 0.16079877316951752, + 0.0944279357790947, + 0.04182669520378113, + 0.01770154759287834 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8015000224113464, + "loss_eval": 0.8103511929512024, + "epoch": 28 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.8074951171875, + 12.208087921142578, + 17.4328670501709, + 32.0993537902832 + ], + "bp_grad_per_sample_l2_med": [ + 4.3260886741336435e-05, + 3.466813359409571e-05, + 2.0653966203099117e-05, + 9.232544471160509e-06, + 3.864107839035569e-06 + ], + "bp_grad_F": [ + 0.20730803906917572, + 0.16447876393795013, + 0.09640119969844818, + 0.042481184005737305, + 0.017861463129520416 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8030000329017639, + "loss_eval": 0.8259979486465454, + "epoch": 29 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.802508354187012, + 12.201593399047852, + 17.472795486450195, + 32.34526824951172 + ], + "bp_grad_per_sample_l2_med": [ + 4.115825140615925e-05, + 3.3230924600502476e-05, + 1.9723833247553557e-05, + 8.868120858096518e-06, + 3.842445494228741e-06 + ], + "bp_grad_F": [ + 0.21079479157924652, + 0.16765208542346954, + 0.09817153960466385, + 0.04308956116437912, + 0.018017521128058434 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.835996687412262, + "epoch": 30 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.79713249206543, + 12.19255542755127, + 17.48019790649414, + 32.53469467163086 + ], + "bp_grad_per_sample_l2_med": [ + 3.9538805140182376e-05, + 3.1396168196806684e-05, + 1.915965367516037e-05, + 8.288401659228839e-06, + 3.5655145893542795e-06 + ], + "bp_grad_F": [ + 0.2140273153781891, + 0.1706041693687439, + 0.09975717961788177, + 0.043599311262369156, + 0.018129423260688782 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 0.8454185724258423, + "epoch": 31 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.793066024780273, + 12.186600685119629, + 17.523115158081055, + 32.76158905029297 + ], + "bp_grad_per_sample_l2_med": [ + 3.902446405845694e-05, + 3.034434666915331e-05, + 1.7979460608330555e-05, + 8.018372682272457e-06, + 3.2052466849563643e-06 + ], + "bp_grad_F": [ + 0.217476025223732, + 0.17371903359889984, + 0.10147368907928467, + 0.04418298602104187, + 0.018276885151863098 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8025000095367432, + "loss_eval": 0.8576318621635437, + "epoch": 32 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.788265228271484, + 12.18388557434082, + 17.53253173828125, + 32.96540832519531 + ], + "bp_grad_per_sample_l2_med": [ + 3.487027424853295e-05, + 2.7703388695954345e-05, + 1.6244883227045648e-05, + 6.949686849111458e-06, + 3.01652812595421e-06 + ], + "bp_grad_F": [ + 0.2205507904291153, + 0.17653042078018188, + 0.10301276296377182, + 0.04468648508191109, + 0.018391530960798264 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 0.8676812648773193, + "epoch": 33 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.782870292663574, + 12.177481651306152, + 17.572200775146484, + 33.13017654418945 + ], + "bp_grad_per_sample_l2_med": [ + 3.207056215615012e-05, + 2.538906664995011e-05, + 1.4797540643485263e-05, + 6.3980214690673165e-06, + 2.7153869268659037e-06 + ], + "bp_grad_F": [ + 0.22312353551387787, + 0.17893576622009277, + 0.10432329773902893, + 0.045110564678907394, + 0.018488196656107903 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8015000224113464, + "loss_eval": 0.8748663663864136, + "epoch": 34 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.778507232666016, + 12.176526069641113, + 17.577714920043945, + 33.292396545410156 + ], + "bp_grad_per_sample_l2_med": [ + 3.117206506431103e-05, + 2.5556160835549235e-05, + 1.5269728464772925e-05, + 6.6313673414697405e-06, + 2.837193505911273e-06 + ], + "bp_grad_F": [ + 0.22575876116752625, + 0.18135619163513184, + 0.10563197731971741, + 0.045539867132902145, + 0.01859084889292717 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.8849357962608337, + "epoch": 35 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.775252342224121, + 12.169761657714844, + 17.6116943359375, + 33.44955062866211 + ], + "bp_grad_per_sample_l2_med": [ + 3.0056495234020986e-05, + 2.4113667677738704e-05, + 1.408176376571646e-05, + 6.1218188420752995e-06, + 2.6174138838541694e-06 + ], + "bp_grad_F": [ + 0.2284391075372696, + 0.18377536535263062, + 0.1069609671831131, + 0.04599269852042198, + 0.018708044663071632 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8015000224113464, + "loss_eval": 0.8959856629371643, + "epoch": 36 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.772398948669434, + 12.164031028747559, + 17.635194778442383, + 33.5887451171875 + ], + "bp_grad_per_sample_l2_med": [ + 2.7790018066298217e-05, + 2.2673413695883937e-05, + 1.327950394625077e-05, + 5.801120551041095e-06, + 2.3991885882423958e-06 + ], + "bp_grad_F": [ + 0.23064540326595306, + 0.1858666092157364, + 0.10809148848056793, + 0.04634574428200722, + 0.018780354410409927 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8005000352859497, + "loss_eval": 0.9018086194992065, + "epoch": 37 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.76898193359375, + 12.161084175109863, + 17.64798927307129, + 33.7384033203125 + ], + "bp_grad_per_sample_l2_med": [ + 2.7914453312405385e-05, + 2.2498874386656098e-05, + 1.335815068159718e-05, + 5.8119312598137185e-06, + 2.478651822457323e-06 + ], + "bp_grad_F": [ + 0.2330632209777832, + 0.1880374252796173, + 0.10926036536693573, + 0.04673014581203461, + 0.01887366734445095 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.9126823544502258, + "epoch": 38 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.765782356262207, + 12.157867431640625, + 17.654565811157227, + 33.87545394897461 + ], + "bp_grad_per_sample_l2_med": [ + 2.617536301841028e-05, + 2.155852780560963e-05, + 1.26063732750481e-05, + 5.598193638434168e-06, + 2.3114046143746236e-06 + ], + "bp_grad_F": [ + 0.23493894934654236, + 0.18982405960559845, + 0.11023002117872238, + 0.0470343716442585, + 0.018937399610877037 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8010000586509705, + "loss_eval": 0.918436586856842, + "epoch": 39 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.76235294342041, + 12.158239364624023, + 17.692272186279297, + 33.97838592529297 + ], + "bp_grad_per_sample_l2_med": [ + 2.5225266654160805e-05, + 2.0318799215601757e-05, + 1.18104180728551e-05, + 5.113367024023319e-06, + 2.0679383396782214e-06 + ], + "bp_grad_F": [ + 0.23714447021484375, + 0.1918695867061615, + 0.11135337501764297, + 0.047415897250175476, + 0.019037041813135147 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.926592230796814, + "epoch": 40 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.761220932006836, + 12.152015686035156, + 17.702022552490234, + 34.099910736083984 + ], + "bp_grad_per_sample_l2_med": [ + 2.4690283680683933e-05, + 2.0103743736399338e-05, + 1.1646708117041271e-05, + 5.211788447923027e-06, + 2.065433818643214e-06 + ], + "bp_grad_F": [ + 0.23883607983589172, + 0.1934758871793747, + 0.11221782118082047, + 0.04768490791320801, + 0.019090749323368073 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.799500048160553, + "loss_eval": 0.9292308688163757, + "epoch": 41 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.758316993713379, + 12.149521827697754, + 17.706113815307617, + 34.19028091430664 + ], + "bp_grad_per_sample_l2_med": [ + 2.3211940060718916e-05, + 1.8614891814650036e-05, + 1.1040006938856095e-05, + 4.901159627479501e-06, + 2.003940153372241e-06 + ], + "bp_grad_F": [ + 0.24076926708221436, + 0.19526584446430206, + 0.1131957471370697, + 0.048007190227508545, + 0.019170215353369713 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 0.939300000667572, + "epoch": 42 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.7562894821167, + 12.145485877990723, + 17.72273063659668, + 34.302001953125 + ], + "bp_grad_per_sample_l2_med": [ + 2.3761875127092935e-05, + 1.9169772713212296e-05, + 1.1290117072348949e-05, + 4.916772468277486e-06, + 1.9402432371862233e-06 + ], + "bp_grad_F": [ + 0.2422482967376709, + 0.19667460024356842, + 0.11394675076007843, + 0.04823824390769005, + 0.019216476008296013 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.800000011920929, + "loss_eval": 0.9442830681800842, + "epoch": 43 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.753690719604492, + 12.144105911254883, + 17.737106323242188, + 34.404640197753906 + ], + "bp_grad_per_sample_l2_med": [ + 2.1792104234918952e-05, + 1.8292348613613285e-05, + 1.0393917364126537e-05, + 4.534665094979573e-06, + 1.8929350744656404e-06 + ], + "bp_grad_F": [ + 0.2442140281200409, + 0.1984620988368988, + 0.11491919308900833, + 0.04856158792972565, + 0.019297350198030472 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.799500048160553, + "loss_eval": 0.9510068297386169, + "epoch": 44 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.751104354858398, + 12.139998435974121, + 17.73967170715332, + 34.49326705932617 + ], + "bp_grad_per_sample_l2_med": [ + 2.228700031992048e-05, + 1.800662539608311e-05, + 1.02799631349626e-05, + 4.365918812254677e-06, + 1.763435875545838e-06 + ], + "bp_grad_F": [ + 0.24558202922344208, + 0.19977517426013947, + 0.11561965942382812, + 0.04877489432692528, + 0.019342035055160522 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7980000376701355, + "loss_eval": 0.9541275501251221, + "epoch": 45 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.748708724975586, + 12.140083312988281, + 17.75340461730957, + 34.58064651489258 + ], + "bp_grad_per_sample_l2_med": [ + 2.0954081264790148e-05, + 1.69687900779536e-05, + 1.0029441000369843e-05, + 4.277889729564777e-06, + 1.7006685766318697e-06 + ], + "bp_grad_F": [ + 0.24700944125652313, + 0.20111818611621857, + 0.11635513603687286, + 0.04901802912354469, + 0.019400382414460182 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 0.9603452086448669, + "epoch": 46 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.747987747192383, + 12.13515567779541, + 17.773204803466797, + 34.66823196411133 + ], + "bp_grad_per_sample_l2_med": [ + 2.019237945205532e-05, + 1.6703623259672895e-05, + 9.940931704477407e-06, + 4.2076449062733445e-06, + 1.6902752122405218e-06 + ], + "bp_grad_F": [ + 0.2484009861946106, + 0.20242078602313995, + 0.11704456806182861, + 0.04923176020383835, + 0.019446346908807755 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7980000376701355, + "loss_eval": 0.9656705260276794, + "epoch": 47 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.746366500854492, + 12.134767532348633, + 17.78083038330078, + 34.744384765625 + ], + "bp_grad_per_sample_l2_med": [ + 1.9601726307882927e-05, + 1.625595541554503e-05, + 9.70309520198498e-06, + 4.2589249460434075e-06, + 1.6490113239342463e-06 + ], + "bp_grad_F": [ + 0.2497195154428482, + 0.20365330576896667, + 0.1177029013633728, + 0.0494362898170948, + 0.019490210339426994 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7985000610351562, + "loss_eval": 0.9694753885269165, + "epoch": 48 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.745685577392578, + 12.132808685302734, + 17.785594940185547, + 34.818721771240234 + ], + "bp_grad_per_sample_l2_med": [ + 1.9891656847903505e-05, + 1.645386146265082e-05, + 9.532630429021083e-06, + 4.012633780803299e-06, + 1.5627846323695849e-06 + ], + "bp_grad_F": [ + 0.25097453594207764, + 0.2048366218805313, + 0.11835213750600815, + 0.04964917525649071, + 0.019541876390576363 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7970000505447388, + "loss_eval": 0.9751549363136292, + "epoch": 49 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.744300842285156, + 12.130931854248047, + 17.797060012817383, + 34.88679885864258 + ], + "bp_grad_per_sample_l2_med": [ + 1.86829984158976e-05, + 1.5538031220785342e-05, + 9.179881089949049e-06, + 3.900266619893955e-06, + 1.5405096291942755e-06 + ], + "bp_grad_F": [ + 0.2520725131034851, + 0.20589254796504974, + 0.11892128735780716, + 0.04982898011803627, + 0.0195804163813591 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7980000376701355, + "loss_eval": 0.9781593084335327, + "epoch": 50 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.742894172668457, + 12.128829002380371, + 17.800174713134766, + 34.937950134277344 + ], + "bp_grad_per_sample_l2_med": [ + 1.839629840105772e-05, + 1.504779083916219e-05, + 8.953754331741948e-06, + 3.7526185678871116e-06, + 1.5395226000691764e-06 + ], + "bp_grad_F": [ + 0.25313958525657654, + 0.2068854719400406, + 0.11944505572319031, + 0.0499873124063015, + 0.019611038267612457 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 0.9819083213806152, + "epoch": 51 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.741170883178711, + 12.12833309173584, + 17.80767822265625, + 35.008392333984375 + ], + "bp_grad_per_sample_l2_med": [ + 1.8736680431175046e-05, + 1.5372819689218886e-05, + 9.080923518922646e-06, + 3.7873542169108987e-06, + 1.4909855963196605e-06 + ], + "bp_grad_F": [ + 0.2542133629322052, + 0.20790545642375946, + 0.11999284476041794, + 0.05016028508543968, + 0.019651155918836594 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.9845340847969055, + "epoch": 52 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.739892959594727, + 12.124402046203613, + 17.814624786376953, + 35.0652961730957 + ], + "bp_grad_per_sample_l2_med": [ + 1.820523539208807e-05, + 1.4827967788733076e-05, + 8.919139872887172e-06, + 3.8056493849580875e-06, + 1.4648703654529527e-06 + ], + "bp_grad_F": [ + 0.25528770685195923, + 0.2089182734489441, + 0.12054150551557541, + 0.05034028738737106, + 0.019695136696100235 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.9892162680625916, + "epoch": 53 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.738609313964844, + 12.125777244567871, + 17.821733474731445, + 35.119747161865234 + ], + "bp_grad_per_sample_l2_med": [ + 1.807287299016025e-05, + 1.485222401242936e-05, + 8.809645805740729e-06, + 3.601295475164079e-06, + 1.3953541611044784e-06 + ], + "bp_grad_F": [ + 0.25628989934921265, + 0.2098524272441864, + 0.12104840576648712, + 0.05050570145249367, + 0.019734907895326614 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7970000505447388, + "loss_eval": 0.9929525852203369, + "epoch": 54 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.738442420959473, + 12.123546600341797, + 17.828126907348633, + 35.1645393371582 + ], + "bp_grad_per_sample_l2_med": [ + 1.7838316125562415e-05, + 1.4615891814173665e-05, + 8.594040991738439e-06, + 3.6455955978453858e-06, + 1.4180122889229096e-06 + ], + "bp_grad_F": [ + 0.25709325075149536, + 0.21062038838863373, + 0.12145251780748367, + 0.05062393099069595, + 0.019757961854338646 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.9955189228057861, + "epoch": 55 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.736928939819336, + 12.120393753051758, + 17.832061767578125, + 35.21808624267578 + ], + "bp_grad_per_sample_l2_med": [ + 1.690394310571719e-05, + 1.4294129869085737e-05, + 8.27510575618362e-06, + 3.6071653539693216e-06, + 1.3830640455125831e-06 + ], + "bp_grad_F": [ + 0.25789716839790344, + 0.21137811243534088, + 0.12185957282781601, + 0.050752829760313034, + 0.019786853343248367 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7975000143051147, + "loss_eval": 0.9983878135681152, + "epoch": 56 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.7359619140625, + 12.122570991516113, + 17.835556030273438, + 35.264137268066406 + ], + "bp_grad_per_sample_l2_med": [ + 1.6666754163452424e-05, + 1.4025285963725764e-05, + 8.179616088455077e-06, + 3.4237471027154243e-06, + 1.3576167248174897e-06 + ], + "bp_grad_F": [ + 0.25863000750541687, + 0.21208500862121582, + 0.12223963439464569, + 0.050873447209596634, + 0.0198147501796484 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0010322332382202, + "epoch": 57 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.73526668548584, + 12.120652198791504, + 17.842275619506836, + 35.31349182128906 + ], + "bp_grad_per_sample_l2_med": [ + 1.6808457075967453e-05, + 1.3759586181549821e-05, + 8.023761438380461e-06, + 3.3788217024266487e-06, + 1.3503363334166352e-06 + ], + "bp_grad_F": [ + 0.2594156563282013, + 0.2128157913684845, + 0.12262928485870361, + 0.050996698439121246, + 0.01984303817152977 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7990000247955322, + "loss_eval": 1.0038610696792603, + "epoch": 58 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.735087394714355, + 12.11837387084961, + 17.846410751342773, + 35.347412109375 + ], + "bp_grad_per_sample_l2_med": [ + 1.662989416217897e-05, + 1.3822269465890713e-05, + 7.92401988292113e-06, + 3.472342541499529e-06, + 1.327858285549155e-06 + ], + "bp_grad_F": [ + 0.26001590490341187, + 0.21339008212089539, + 0.12293757498264313, + 0.05109258368611336, + 0.01986365020275116 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796500027179718, + "loss_eval": 1.0062025785446167, + "epoch": 59 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.734339714050293, + 12.117914199829102, + 17.84966468811035, + 35.381446838378906 + ], + "bp_grad_per_sample_l2_med": [ + 1.6489182598888874e-05, + 1.3682294593309052e-05, + 8.124485248117708e-06, + 3.407540134503506e-06, + 1.3195593737691524e-06 + ], + "bp_grad_F": [ + 0.2605873942375183, + 0.21394510567188263, + 0.1232379749417305, + 0.05118485540151596, + 0.019882848486304283 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0082966089248657, + "epoch": 60 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.733570098876953, + 12.118681907653809, + 17.854442596435547, + 35.417537689208984 + ], + "bp_grad_per_sample_l2_med": [ + 1.6188618246815167e-05, + 1.3713249245483894e-05, + 7.876165909692645e-06, + 3.343990783832851e-06, + 1.2941204659000505e-06 + ], + "bp_grad_F": [ + 0.2612352669239044, + 0.21454451978206635, + 0.12355507910251617, + 0.05128618702292442, + 0.019906867295503616 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0103161334991455, + "epoch": 61 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.73337459564209, + 12.116337776184082, + 17.85533332824707, + 35.44430160522461 + ], + "bp_grad_per_sample_l2_med": [ + 1.6262945791822858e-05, + 1.3456610759021714e-05, + 7.976923370733857e-06, + 3.304621941424557e-06, + 1.2957953003933653e-06 + ], + "bp_grad_F": [ + 0.2618514895439148, + 0.21511761844158173, + 0.12386228144168854, + 0.05138511210680008, + 0.019930575042963028 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0126534700393677, + "epoch": 62 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.732640266418457, + 12.11673641204834, + 17.85984992980957, + 35.47673797607422 + ], + "bp_grad_per_sample_l2_med": [ + 1.5915471522021107e-05, + 1.3434865650197025e-05, + 7.765964255668223e-06, + 3.272770300100092e-06, + 1.2807531675207429e-06 + ], + "bp_grad_F": [ + 0.26224803924560547, + 0.2155023217201233, + 0.124069944024086, + 0.051448848098516464, + 0.019943425431847572 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0140384435653687, + "epoch": 63 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.732240676879883, + 12.115690231323242, + 17.86297035217285, + 35.500823974609375 + ], + "bp_grad_per_sample_l2_med": [ + 1.557435462018475e-05, + 1.2797115232388023e-05, + 7.646640369785018e-06, + 3.2042576094681863e-06, + 1.2790382015737123e-06 + ], + "bp_grad_F": [ + 0.26270976662635803, + 0.2159367799758911, + 0.12429951131343842, + 0.051519569009542465, + 0.01995890960097313 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796500027179718, + "loss_eval": 1.0154695510864258, + "epoch": 64 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.731745719909668, + 12.114669799804688, + 17.86736297607422, + 35.528076171875 + ], + "bp_grad_per_sample_l2_med": [ + 1.58700677275192e-05, + 1.3018690879107453e-05, + 7.55094788473798e-06, + 3.2220066259469604e-06, + 1.2598871990121552e-06 + ], + "bp_grad_F": [ + 0.26308032870292664, + 0.2162918895483017, + 0.12448756396770477, + 0.051577214151620865, + 0.019970662891864777 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0169501304626465, + "epoch": 65 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.731338500976562, + 12.113511085510254, + 17.86815643310547, + 35.54944610595703 + ], + "bp_grad_per_sample_l2_med": [ + 1.5586350855301134e-05, + 1.2824431905755773e-05, + 7.649568942724727e-06, + 3.1966815186024178e-06, + 1.2639170563488733e-06 + ], + "bp_grad_F": [ + 0.26345473527908325, + 0.21664129197597504, + 0.12467629462480545, + 0.051637567579746246, + 0.01998509280383587 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796500027179718, + "loss_eval": 1.018563985824585, + "epoch": 66 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.731039047241211, + 12.113682746887207, + 17.872100830078125, + 35.56554412841797 + ], + "bp_grad_per_sample_l2_med": [ + 1.5501789675909095e-05, + 1.2836935638915747e-05, + 7.47852936910931e-06, + 3.1328777367889415e-06, + 1.2308250916248653e-06 + ], + "bp_grad_F": [ + 0.2637687623500824, + 0.2169436365365982, + 0.124836765229702, + 0.0516866035759449, + 0.019995568320155144 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0192590951919556, + "epoch": 67 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.730656623840332, + 12.114008903503418, + 17.87257194519043, + 35.58961486816406 + ], + "bp_grad_per_sample_l2_med": [ + 1.5237865227391012e-05, + 1.2954994417668786e-05, + 7.515009656344773e-06, + 3.2117325190483825e-06, + 1.2425814475136576e-06 + ], + "bp_grad_F": [ + 0.2640174925327301, + 0.21717986464500427, + 0.1249629333615303, + 0.051725782454013824, + 0.020004095509648323 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0201796293258667, + "epoch": 68 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.730304718017578, + 12.112882614135742, + 17.87510108947754, + 35.60005569458008 + ], + "bp_grad_per_sample_l2_med": [ + 1.5281846572179347e-05, + 1.280397191294469e-05, + 7.457324500137474e-06, + 3.1238730571203632e-06, + 1.2271989362488966e-06 + ], + "bp_grad_F": [ + 0.26432526111602783, + 0.2174660563468933, + 0.12511758506298065, + 0.05177601799368858, + 0.02001647651195526 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0214923620224, + "epoch": 69 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.730023384094238, + 12.112593650817871, + 17.87718963623047, + 35.61077880859375 + ], + "bp_grad_per_sample_l2_med": [ + 1.5160739167185966e-05, + 1.2885939213447273e-05, + 7.442678906954825e-06, + 3.1402662443724694e-06, + 1.2329509218034218e-06 + ], + "bp_grad_F": [ + 0.2645094394683838, + 0.21764276921749115, + 0.12521088123321533, + 0.051804810762405396, + 0.020022746175527573 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0221376419067383, + "epoch": 70 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.729791641235352, + 12.11282730102539, + 17.878896713256836, + 35.62131118774414 + ], + "bp_grad_per_sample_l2_med": [ + 1.4924515198799782e-05, + 1.2676942787948065e-05, + 7.327739240281517e-06, + 3.135102815576829e-06, + 1.2368633406367735e-06 + ], + "bp_grad_F": [ + 0.26469096541404724, + 0.2178148329257965, + 0.12530171871185303, + 0.051832377910614014, + 0.02002853713929653 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0227359533309937, + "epoch": 71 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.72957706451416, + 12.112420082092285, + 17.879562377929688, + 35.631195068359375 + ], + "bp_grad_per_sample_l2_med": [ + 1.5078092474141158e-05, + 1.2648180018004496e-05, + 7.402486517094076e-06, + 3.110948682660819e-06, + 1.2303731864449219e-06 + ], + "bp_grad_F": [ + 0.26483553647994995, + 0.2179516702890396, + 0.12537437677383423, + 0.051855091005563736, + 0.020033741369843483 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0231714248657227, + "epoch": 72 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.72945499420166, + 12.112156867980957, + 17.8814754486084, + 35.639610290527344 + ], + "bp_grad_per_sample_l2_med": [ + 1.4999122868175618e-05, + 1.2563705240609124e-05, + 7.3636233537399676e-06, + 3.091453436354641e-06, + 1.2325838270044187e-06 + ], + "bp_grad_F": [ + 0.2649652361869812, + 0.21807390451431274, + 0.12544025480747223, + 0.05187588557600975, + 0.020038409158587456 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0237369537353516, + "epoch": 73 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.729272842407227, + 12.112222671508789, + 17.881935119628906, + 35.644290924072266 + ], + "bp_grad_per_sample_l2_med": [ + 1.4974531950429082e-05, + 1.2648583833652083e-05, + 7.3520282057870645e-06, + 3.080302576563554e-06, + 1.2291716302570421e-06 + ], + "bp_grad_F": [ + 0.2650584876537323, + 0.21816210448741913, + 0.12548699975013733, + 0.051890380680561066, + 0.020041609182953835 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0240200757980347, + "epoch": 74 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.72924518585205, + 12.112285614013672, + 17.88214683532715, + 35.64848709106445 + ], + "bp_grad_per_sample_l2_med": [ + 1.4959082363930065e-05, + 1.2588670870172791e-05, + 7.344425739574945e-06, + 3.080124088228331e-06, + 1.2237677537996206e-06 + ], + "bp_grad_F": [ + 0.26513636112213135, + 0.21823462843894958, + 0.12552553415298462, + 0.051902592182159424, + 0.020044438540935516 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0243031978607178, + "epoch": 75 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.72916030883789, + 12.112074851989746, + 17.882980346679688, + 35.650428771972656 + ], + "bp_grad_per_sample_l2_med": [ + 1.4942641428206116e-05, + 1.2567295925691724e-05, + 7.336187991313636e-06, + 3.0725423130206764e-06, + 1.2260832136234967e-06 + ], + "bp_grad_F": [ + 0.26517778635025024, + 0.21827547252178192, + 0.12554767727851868, + 0.0519094243645668, + 0.02004585973918438 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0244944095611572, + "epoch": 76 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.729132652282715, + 12.112125396728516, + 17.883481979370117, + 35.65312576293945 + ], + "bp_grad_per_sample_l2_med": [ + 1.4903710507496726e-05, + 1.2576123481267132e-05, + 7.317236850212794e-06, + 3.078314875892829e-06, + 1.2210558679726091e-06 + ], + "bp_grad_F": [ + 0.26521575450897217, + 0.2183104306459427, + 0.1255662441253662, + 0.051915280520915985, + 0.02004723809659481 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0246349573135376, + "epoch": 77 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.729104995727539, + 12.11208724975586, + 17.88361167907715, + 35.65410614013672 + ], + "bp_grad_per_sample_l2_med": [ + 1.4916706277290359e-05, + 1.2563130439957604e-05, + 7.323697445826838e-06, + 3.0812991553830216e-06, + 1.2211262401251588e-06 + ], + "bp_grad_F": [ + 0.26523175835609436, + 0.2183263599872589, + 0.12557478249073029, + 0.05191792547702789, + 0.02004779316484928 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0246796607971191, + "epoch": 78 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.729097366333008, + 12.112085342407227, + 17.88372230529785, + 35.65440368652344 + ], + "bp_grad_per_sample_l2_med": [ + 1.4912001461198088e-05, + 1.2556130059238058e-05, + 7.32138505554758e-06, + 3.077205747104017e-06, + 1.2217307130413246e-06 + ], + "bp_grad_F": [ + 0.2652417719364166, + 0.21833550930023193, + 0.1255796104669571, + 0.05191945284605026, + 0.02004816010594368 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.0247222185134888, + "epoch": 79 + }, + { + "hidden_norms": [ + 11.269571304321289, + 10.729093551635742, + 12.112082481384277, + 17.88372230529785, + 35.65460205078125 + ], + "bp_grad_per_sample_l2_med": [ + 1.4914756320649758e-05, + 1.2556190995383076e-05, + 7.322747933358187e-06, + 3.0772835089010186e-06, + 1.2216489722050028e-06 + ], + "bp_grad_F": [ + 0.2652438282966614, + 0.21833744645118713, + 0.12558062374591827, + 0.051919758319854736, + 0.020048221573233604 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796000063419342, + "loss_eval": 1.024727463722229, + "epoch": 80 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 11.269571304321289, + 11.290447235107422, + 11.313605308532715, + 11.351215362548828, + 11.398087501525879 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028353024390526116, + 0.0002828188880812377, + 0.00028162598027847707, + 0.0002799496578518301, + 0.0002791006409097463 + ], + "bp_grad_F": [ + 0.012684082612395287, + 0.01264861598610878, + 0.012589854188263416, + 0.012511610053479671, + 0.012471316382288933 + ], + "gamma_dfa": -0.0034942624624818563, + "gamma_dfa_per_layer": [ + -0.029981477186083794, + 0.023911481723189354, + 0.0022033676505088806, + -0.010110422037541866 + ], + "acc_eval": 0.08450000733137131, + "loss_eval": 2.4790313243865967, + "epoch": 0 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.505881309509277, + 11.757291793823242, + 12.0764741897583, + 12.435522079467773 + ], + "bp_grad_per_sample_l2_med": [ + 0.00031470530666410923, + 0.0002926285960711539, + 0.00027369827148504555, + 0.0002595284313429147, + 0.0002512428327463567 + ], + "bp_grad_F": [ + 0.014148155227303505, + 0.013173527084290981, + 0.01228535920381546, + 0.0115915322676301, + 0.01116928644478321 + ], + "gamma_dfa": 0.11511426232755184, + "gamma_dfa_per_layer": [ + 0.12020161747932434, + 0.12450753152370453, + 0.12499555945396423, + 0.09075234085321426 + ], + "acc_eval": 0.3775000274181366, + "loss_eval": 1.8237801790237427, + "epoch": 1 + }, + { + "hidden_norms": [ + 11.269571304321289, + 11.90947437286377, + 13.027632713317871, + 14.888558387756348, + 17.22944450378418 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006904517649672925, + 0.000503765360917896, + 0.0003708408330567181, + 0.00028136910987086594, + 0.00023244605108629912 + ], + "bp_grad_F": [ + 0.03382011875510216, + 0.024346396327018738, + 0.017825284972786903, + 0.013448701240122318, + 0.011137359775602818 + ], + "gamma_dfa": 0.219235859811306, + "gamma_dfa_per_layer": [ + 0.2247210592031479, + 0.20836304128170013, + 0.23224417865276337, + 0.2116151601076126 + ], + "acc_eval": 0.6325000524520874, + "loss_eval": 1.0442804098129272, + "epoch": 2 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.249103546142578, + 14.663236618041992, + 19.286497116088867, + 24.994598388671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.000785678334068507, + 0.0004984966944903135, + 0.00031956040766090155, + 0.00021816199296154082, + 0.00017694469715934247 + ], + "bp_grad_F": [ + 0.049792274832725525, + 0.03142387419939041, + 0.020070550963282585, + 0.01388809084892273, + 0.011133435182273388 + ], + "gamma_dfa": 0.20651238784193993, + "gamma_dfa_per_layer": [ + 0.19393788278102875, + 0.1939619481563568, + 0.23087021708488464, + 0.2072795033454895 + ], + "acc_eval": 0.690500020980835, + "loss_eval": 0.8105630278587341, + "epoch": 3 + }, + { + "hidden_norms": [ + 11.269571304321289, + 12.623353004455566, + 17.037206649780273, + 26.137210845947266, + 36.338985443115234 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007407923694700003, + 0.0004117340431548655, + 0.00024256351753138006, + 0.00016813547699712217, + 0.00014022440882399678 + ], + "bp_grad_F": [ + 0.06029670313000679, + 0.0337882824242115, + 0.0196156557649374, + 0.01336250826716423, + 0.011071481741964817 + ], + "gamma_dfa": 0.18698954582214355, + "gamma_dfa_per_layer": [ + 0.15680347383022308, + 0.17669467628002167, + 0.2232135385274887, + 0.19124649465084076 + ], + "acc_eval": 0.7130000591278076, + "loss_eval": 0.7352707386016846, + "epoch": 4 + }, + { + "hidden_norms": [ + 11.269571304321289, + 13.056242942810059, + 20.31708526611328, + 35.354278564453125, + 50.72277069091797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007306670304387808, + 0.000362707331078127, + 0.00019432755652815104, + 0.00014284192002378404, + 0.0001259525743080303 + ], + "bp_grad_F": [ + 0.06756022572517395, + 0.03394190967082977, + 0.018268020823597908, + 0.012735997326672077, + 0.011040973477065563 + ], + "gamma_dfa": 0.16737862676382065, + "gamma_dfa_per_layer": [ + 0.12552234530448914, + 0.16295458376407623, + 0.2097114473581314, + 0.17132613062858582 + ], + "acc_eval": 0.7350000143051147, + "loss_eval": 0.716023862361908, + "epoch": 5 + }, + { + "hidden_norms": [ + 11.269571304321289, + 13.544439315795898, + 24.727155685424805, + 46.518768310546875, + 67.0296859741211 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007029862026683986, + 0.0003191934374626726, + 0.00016633918858133256, + 0.00012432104267645627, + 0.00011442468530731276 + ], + "bp_grad_F": [ + 0.07251796871423721, + 0.03311065956950188, + 0.016890449449419975, + 0.012321571819484234, + 0.011077084578573704 + ], + "gamma_dfa": 0.15210051462054253, + "gamma_dfa_per_layer": [ + 0.10109913349151611, + 0.15017138421535492, + 0.20331066846847534, + 0.15382087230682373 + ], + "acc_eval": 0.7305000424385071, + "loss_eval": 0.7123240828514099, + "epoch": 6 + }, + { + "hidden_norms": [ + 11.269571304321289, + 14.096785545349121, + 29.970369338989258, + 58.48172378540039, + 84.44245910644531 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007362618925981224, + 0.0003065088822040707, + 0.00015729048755019903, + 0.00012451721704564989, + 0.00011588833149289712 + ], + "bp_grad_F": [ + 0.07530932128429413, + 0.03182085230946541, + 0.01569041982293129, + 0.012093811295926571, + 0.011190102435648441 + ], + "gamma_dfa": 0.14102506078779697, + "gamma_dfa_per_layer": [ + 0.08732745796442032, + 0.14003422856330872, + 0.19598272442817688, + 0.14075583219528198 + ], + "acc_eval": 0.7235000133514404, + "loss_eval": 0.727388858795166, + "epoch": 7 + }, + { + "hidden_norms": [ + 11.269571304321289, + 14.721030235290527, + 35.83012008666992, + 70.75320434570312, + 101.73139953613281 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007345590856857598, + 0.00026920062373392284, + 0.000134471949422732, + 0.00011552426440175623, + 0.000110697525087744 + ], + "bp_grad_F": [ + 0.0819108858704567, + 0.03190097585320473, + 0.015249059535562992, + 0.012194199487566948, + 0.011436647735536098 + ], + "gamma_dfa": 0.1306514535099268, + "gamma_dfa_per_layer": [ + 0.07609214633703232, + 0.13159415125846863, + 0.18644346296787262, + 0.12847605347633362 + ], + "acc_eval": 0.7155000567436218, + "loss_eval": 0.7610863447189331, + "epoch": 8 + }, + { + "hidden_norms": [ + 11.269571304321289, + 15.34220027923584, + 42.35697937011719, + 83.51715850830078, + 120.42235565185547 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006878858548589051, + 0.0002570476208347827, + 0.00012823278666473925, + 0.00011104762234026566, + 0.00010812593973241746 + ], + "bp_grad_F": [ + 0.08083735406398773, + 0.029663894325494766, + 0.014093351550400257, + 0.01174441073089838, + 0.011170739307999611 + ], + "gamma_dfa": 0.12087789550423622, + "gamma_dfa_per_layer": [ + 0.06335650384426117, + 0.12819789350032806, + 0.17300739884376526, + 0.1189497858285904 + ], + "acc_eval": 0.7225000262260437, + "loss_eval": 0.737341046333313, + "epoch": 9 + }, + { + "hidden_norms": [ + 11.269571304321289, + 16.00116729736328, + 49.21657943725586, + 96.05623626708984, + 138.10394287109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007566744461655617, + 0.0002493424981366843, + 0.0001229145418619737, + 0.00010773885151138529, + 0.00010482135257916525 + ], + "bp_grad_F": [ + 0.08636438101530075, + 0.029551593586802483, + 0.013877596706151962, + 0.011869709938764572, + 0.011369508691132069 + ], + "gamma_dfa": 0.11321612633764744, + "gamma_dfa_per_layer": [ + 0.05804715305566788, + 0.11809944361448288, + 0.16106289625167847, + 0.11565501242876053 + ], + "acc_eval": 0.7175000309944153, + "loss_eval": 0.7598624229431152, + "epoch": 10 + }, + { + "hidden_norms": [ + 11.269571304321289, + 16.664016723632812, + 56.4381103515625, + 109.18519592285156, + 157.13400268554688 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007165206479839981, + 0.00021803597337566316, + 0.00010753094829851761, + 0.00010056991595774889, + 9.790556214284152e-05 + ], + "bp_grad_F": [ + 0.09135312587022781, + 0.029706060886383057, + 0.013932082802057266, + 0.012196206487715244, + 0.011740063317120075 + ], + "gamma_dfa": 0.1071977848187089, + "gamma_dfa_per_layer": [ + 0.04954911395907402, + 0.1143685057759285, + 0.1548140048980713, + 0.11005951464176178 + ], + "acc_eval": 0.7000000476837158, + "loss_eval": 0.825758159160614, + "epoch": 11 + }, + { + "hidden_norms": [ + 11.269571304321289, + 17.334924697875977, + 63.52719497680664, + 121.75878143310547, + 175.05706787109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007098973728716373, + 0.0002017641963902861, + 0.00010367313370807096, + 9.554869029670954e-05, + 9.339704411104321e-05 + ], + "bp_grad_F": [ + 0.0928206816315651, + 0.02807745151221752, + 0.013300982303917408, + 0.011954967863857746, + 0.011584528721868992 + ], + "gamma_dfa": 0.10307322815060616, + "gamma_dfa_per_layer": [ + 0.046224936842918396, + 0.11165355145931244, + 0.14536075294017792, + 0.10905367136001587 + ], + "acc_eval": 0.7085000276565552, + "loss_eval": 0.8147838711738586, + "epoch": 12 + }, + { + "hidden_norms": [ + 11.269571304321289, + 18.066408157348633, + 71.18386840820312, + 135.29449462890625, + 194.25502014160156 + ], + "bp_grad_per_sample_l2_med": [ + 0.000749382539652288, + 0.00023277483705896884, + 0.00012272220919840038, + 0.00011419993097661063, + 0.00011211293895030394 + ], + "bp_grad_F": [ + 0.08808046579360962, + 0.026459064334630966, + 0.01287052407860756, + 0.011758155189454556, + 0.01143786869943142 + ], + "gamma_dfa": 0.09524188842624426, + "gamma_dfa_per_layer": [ + 0.042861852794885635, + 0.09963438659906387, + 0.1363406628370285, + 0.10213065147399902 + ], + "acc_eval": 0.7090000510215759, + "loss_eval": 0.7797307372093201, + "epoch": 13 + }, + { + "hidden_norms": [ + 11.269571304321289, + 18.722259521484375, + 78.48313903808594, + 148.08277893066406, + 213.12060546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007828621892258525, + 0.00022329931380227208, + 0.0001217587196151726, + 0.00011403425014577806, + 0.00011114090739283711 + ], + "bp_grad_F": [ + 0.09129610657691956, + 0.02616111747920513, + 0.012879838235676289, + 0.011936144903302193, + 0.011643719859421253 + ], + "gamma_dfa": 0.0928388200700283, + "gamma_dfa_per_layer": [ + 0.04325374215841293, + 0.09723485261201859, + 0.13119162619113922, + 0.09967505931854248 + ], + "acc_eval": 0.7015000581741333, + "loss_eval": 0.810487687587738, + "epoch": 14 + }, + { + "hidden_norms": [ + 11.269571304321289, + 19.439603805541992, + 86.18466186523438, + 160.40892028808594, + 230.23739624023438 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007217489182949066, + 0.00018824212020263076, + 0.00010298609413439408, + 9.960142779164016e-05, + 9.748922457220033e-05 + ], + "bp_grad_F": [ + 0.09306738525629044, + 0.02548908442258835, + 0.012566950172185898, + 0.011724555864930153, + 0.011449399404227734 + ], + "gamma_dfa": 0.09134612884372473, + "gamma_dfa_per_layer": [ + 0.040905896574258804, + 0.09668857604265213, + 0.12694117426872253, + 0.10084886848926544 + ], + "acc_eval": 0.7110000252723694, + "loss_eval": 0.7941330075263977, + "epoch": 15 + }, + { + "hidden_norms": [ + 11.269571304321289, + 20.229736328125, + 94.05648040771484, + 173.3369903564453, + 248.50965881347656 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007364301127381623, + 0.00019103182421531528, + 0.00010473190195625648, + 0.00010049886623164639, + 9.873881208477542e-05 + ], + "bp_grad_F": [ + 0.09542964398860931, + 0.025049429386854172, + 0.012468041852116585, + 0.011731654405593872, + 0.011484012007713318 + ], + "gamma_dfa": 0.08733212016522884, + "gamma_dfa_per_layer": [ + 0.034523673355579376, + 0.09200998395681381, + 0.12135256081819534, + 0.10144226253032684 + ], + "acc_eval": 0.7200000286102295, + "loss_eval": 0.806917130947113, + "epoch": 16 + }, + { + "hidden_norms": [ + 11.269571304321289, + 20.94115447998047, + 101.5516128540039, + 185.91993713378906, + 265.6839294433594 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008022052352316678, + 0.00020157739345449954, + 0.00011702251504175365, + 0.00011363227531546727, + 0.00011240412277402356 + ], + "bp_grad_F": [ + 0.09439960867166519, + 0.024019507691264153, + 0.01232285425066948, + 0.011713731102645397, + 0.011482013389468193 + ], + "gamma_dfa": 0.08548407163470984, + "gamma_dfa_per_layer": [ + 0.038230378180742264, + 0.08889900892972946, + 0.11632363498210907, + 0.09848326444625854 + ], + "acc_eval": 0.7120000123977661, + "loss_eval": 0.8131889700889587, + "epoch": 17 + }, + { + "hidden_norms": [ + 11.269571304321289, + 21.71381950378418, + 109.32372283935547, + 199.24642944335938, + 285.1650085449219 + ], + "bp_grad_per_sample_l2_med": [ + 0.00076432921923697, + 0.00018322077812626958, + 0.00010481786011951044, + 0.00010164766717934981, + 0.00010087565897265449 + ], + "bp_grad_F": [ + 0.09489408135414124, + 0.023419344797730446, + 0.01224115677177906, + 0.011706860736012459, + 0.011501944623887539 + ], + "gamma_dfa": 0.08550543524324894, + "gamma_dfa_per_layer": [ + 0.04093854874372482, + 0.09244771301746368, + 0.11161119490861893, + 0.09702428430318832 + ], + "acc_eval": 0.7150000333786011, + "loss_eval": 0.8401313424110413, + "epoch": 18 + }, + { + "hidden_norms": [ + 11.269571304321289, + 22.474592208862305, + 117.0955810546875, + 212.0178680419922, + 303.7491455078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008428111323155463, + 0.00020001262600999326, + 0.00012667309783864766, + 0.00012337132648099214, + 0.00012319188681431115 + ], + "bp_grad_F": [ + 0.09607862681150436, + 0.023683469742536545, + 0.01269453763961792, + 0.012188468128442764, + 0.011980941519141197 + ], + "gamma_dfa": 0.07937186863273382, + "gamma_dfa_per_layer": [ + 0.036147553473711014, + 0.08243555575609207, + 0.1066455990076065, + 0.0922587662935257 + ], + "acc_eval": 0.6840000152587891, + "loss_eval": 0.881807267665863, + "epoch": 19 + }, + { + "hidden_norms": [ + 11.269571304321289, + 23.23648452758789, + 124.45619201660156, + 224.60977172851562, + 321.2709655761719 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007923559751361609, + 0.00018490788352210075, + 0.00011116286623291671, + 0.00010867219680221751, + 0.00010773272515507415 + ], + "bp_grad_F": [ + 0.09617631882429123, + 0.02261228673160076, + 0.012236458249390125, + 0.011800081469118595, + 0.011619490571320057 + ], + "gamma_dfa": 0.07946366257965565, + "gamma_dfa_per_layer": [ + 0.036630548536777496, + 0.08521611988544464, + 0.10408685356378555, + 0.0919211283326149 + ], + "acc_eval": 0.7070000171661377, + "loss_eval": 0.8307667374610901, + "epoch": 20 + }, + { + "hidden_norms": [ + 11.269571304321289, + 23.941816329956055, + 131.71353149414062, + 236.79910278320312, + 338.2337951660156 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007988678989931941, + 0.00017439998919144273, + 0.0001077677879948169, + 0.00010501289216335863, + 0.00010426317021483555 + ], + "bp_grad_F": [ + 0.09615935385227203, + 0.02214771881699562, + 0.012244326062500477, + 0.01184793096035719, + 0.011676526628434658 + ], + "gamma_dfa": 0.0779404304921627, + "gamma_dfa_per_layer": [ + 0.032858967781066895, + 0.0826181098818779, + 0.10167358815670013, + 0.09461105614900589 + ], + "acc_eval": 0.6955000162124634, + "loss_eval": 0.8431603312492371, + "epoch": 21 + }, + { + "hidden_norms": [ + 11.269571304321289, + 24.736867904663086, + 139.1349639892578, + 248.7137908935547, + 355.0362243652344 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008002957911230624, + 0.00016955590399447829, + 0.00010642779670888558, + 0.00010389652743469924, + 0.00010333865793654695 + ], + "bp_grad_F": [ + 0.10074009746313095, + 0.022332124412059784, + 0.012284242548048496, + 0.011890492402017117, + 0.011716442182660103 + ], + "gamma_dfa": 0.07599243335425854, + "gamma_dfa_per_layer": [ + 0.03026191145181656, + 0.07909790426492691, + 0.10020720213651657, + 0.09440271556377411 + ], + "acc_eval": 0.6995000243186951, + "loss_eval": 0.8646643161773682, + "epoch": 22 + }, + { + "hidden_norms": [ + 11.269571304321289, + 25.527332305908203, + 146.32603454589844, + 260.3341064453125, + 371.9651184082031 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008058008388616145, + 0.00016914791194722056, + 0.00010861256305361167, + 0.00010723753075581044, + 0.00010632628982421011 + ], + "bp_grad_F": [ + 0.10164787620306015, + 0.02202906273305416, + 0.01239779032766819, + 0.012042474001646042, + 0.011877987533807755 + ], + "gamma_dfa": 0.07324381358921528, + "gamma_dfa_per_layer": [ + 0.03170452266931534, + 0.07619009912014008, + 0.09431108087301254, + 0.09076955169439316 + ], + "acc_eval": 0.6910000443458557, + "loss_eval": 0.9011825919151306, + "epoch": 23 + }, + { + "hidden_norms": [ + 11.269571304321289, + 26.24439239501953, + 153.2904510498047, + 271.96038818359375, + 388.2030029296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007652259082533419, + 0.00016368107753805816, + 0.00010516044130781665, + 0.0001030244748108089, + 0.00010207654122496024 + ], + "bp_grad_F": [ + 0.09788329899311066, + 0.021043717861175537, + 0.012156899087131023, + 0.011852008290588856, + 0.011708464473485947 + ], + "gamma_dfa": 0.07162218820303679, + "gamma_dfa_per_layer": [ + 0.032286133617162704, + 0.0729740634560585, + 0.09137451648712158, + 0.08985403925180435 + ], + "acc_eval": 0.7015000581741333, + "loss_eval": 0.8572027683258057, + "epoch": 24 + }, + { + "hidden_norms": [ + 11.269571304321289, + 26.939895629882812, + 160.01840209960938, + 282.9203796386719, + 404.1251220703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007471513818018138, + 0.00015666495892219245, + 0.0001027472535497509, + 0.00010242985445074737, + 0.00010123744141310453 + ], + "bp_grad_F": [ + 0.09715361893177032, + 0.02044457010924816, + 0.011886605061590672, + 0.011604394763708115, + 0.01146735716611147 + ], + "gamma_dfa": 0.07091694697737694, + "gamma_dfa_per_layer": [ + 0.0328441858291626, + 0.07304085046052933, + 0.08939228951931, + 0.08839046210050583 + ], + "acc_eval": 0.7035000324249268, + "loss_eval": 0.8259502649307251, + "epoch": 25 + }, + { + "hidden_norms": [ + 11.269571304321289, + 27.655963897705078, + 166.2253875732422, + 293.953857421875, + 419.2309265136719 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008196054841391742, + 0.000168012484209612, + 0.00011266919318586588, + 0.0001119820517487824, + 0.00011136133980471641 + ], + "bp_grad_F": [ + 0.09666500240564346, + 0.020363574847579002, + 0.012169744819402695, + 0.011900369077920914, + 0.011767606250941753 + ], + "gamma_dfa": 0.07011445891112089, + "gamma_dfa_per_layer": [ + 0.03361910209059715, + 0.07148489356040955, + 0.08753866702318192, + 0.08781517297029495 + ], + "acc_eval": 0.6930000185966492, + "loss_eval": 0.8744071125984192, + "epoch": 26 + }, + { + "hidden_norms": [ + 11.269571304321289, + 28.399173736572266, + 173.29478454589844, + 305.1183776855469, + 435.8616027832031 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008379096980206668, + 0.00016787118511274457, + 0.00011563840962480754, + 0.00011382131197024137, + 0.00011414202890591696 + ], + "bp_grad_F": [ + 0.09941841661930084, + 0.01996329240500927, + 0.012196086347103119, + 0.011958655901253223, + 0.011834335513412952 + ], + "gamma_dfa": 0.06707034399732947, + "gamma_dfa_per_layer": [ + 0.027506088837981224, + 0.07163777202367783, + 0.08489245176315308, + 0.08424506336450577 + ], + "acc_eval": 0.6860000491142273, + "loss_eval": 0.8969190716743469, + "epoch": 27 + }, + { + "hidden_norms": [ + 11.269571304321289, + 29.067270278930664, + 179.52621459960938, + 315.666015625, + 450.67449951171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007646313752047718, + 0.00014840309449937195, + 9.849335037870333e-05, + 9.682594100013375e-05, + 9.619411139283329e-05 + ], + "bp_grad_F": [ + 0.10344142466783524, + 0.020078541710972786, + 0.012122261337935925, + 0.011881489306688309, + 0.011760085821151733 + ], + "gamma_dfa": 0.06692653149366379, + "gamma_dfa_per_layer": [ + 0.027295783162117004, + 0.06953233480453491, + 0.08493673801422119, + 0.08594126999378204 + ], + "acc_eval": 0.6980000138282776, + "loss_eval": 0.9112558960914612, + "epoch": 28 + }, + { + "hidden_norms": [ + 11.269571304321289, + 29.80398941040039, + 186.03025817871094, + 326.7105407714844, + 466.4792785644531 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008647075155749917, + 0.00016527411935385317, + 0.00011362476652720943, + 0.00011306258238619193, + 0.00011151444778079167 + ], + "bp_grad_F": [ + 0.0982326790690422, + 0.0193523820489645, + 0.012001772411167622, + 0.011787012219429016, + 0.011672897264361382 + ], + "gamma_dfa": 0.06665132055059075, + "gamma_dfa_per_layer": [ + 0.028357060626149178, + 0.06870155036449432, + 0.0840969979763031, + 0.08544967323541641 + ], + "acc_eval": 0.6960000395774841, + "loss_eval": 0.8792264461517334, + "epoch": 29 + }, + { + "hidden_norms": [ + 11.269571304321289, + 30.495162963867188, + 192.21092224121094, + 336.62432861328125, + 480.96929931640625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007892370922490954, + 0.00014862553507555276, + 0.00010144516272703186, + 0.00010014566942118108, + 9.811606287257746e-05 + ], + "bp_grad_F": [ + 0.10485321283340454, + 0.01980445720255375, + 0.012311456725001335, + 0.01209663413465023, + 0.011984387412667274 + ], + "gamma_dfa": 0.0650303359143436, + "gamma_dfa_per_layer": [ + 0.02565421722829342, + 0.06553934514522552, + 0.08334222435951233, + 0.08558555692434311 + ], + "acc_eval": 0.6845000386238098, + "loss_eval": 0.9355857968330383, + "epoch": 30 + }, + { + "hidden_norms": [ + 11.269571304321289, + 31.204212188720703, + 198.0793914794922, + 346.7908020019531, + 494.94366455078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008273097337223589, + 0.00016349409997928888, + 0.00011394457396818325, + 0.00011259203165536746, + 0.00011180129513377324 + ], + "bp_grad_F": [ + 0.10106314718723297, + 0.019085418432950974, + 0.01192714087665081, + 0.011723030358552933, + 0.011616164818406105 + ], + "gamma_dfa": 0.06359042041003704, + "gamma_dfa_per_layer": [ + 0.025547169148921967, + 0.06356105208396912, + 0.08179818838834763, + 0.08345527201890945 + ], + "acc_eval": 0.7055000066757202, + "loss_eval": 0.8810407519340515, + "epoch": 31 + }, + { + "hidden_norms": [ + 11.269571304321289, + 31.86461067199707, + 203.8866424560547, + 357.24273681640625, + 509.47283935546875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007937258342280984, + 0.0001423554786015302, + 0.0001006650782073848, + 9.906977356877178e-05, + 9.873251110548154e-05 + ], + "bp_grad_F": [ + 0.10255990922451019, + 0.018815871328115463, + 0.012050059624016285, + 0.011867615394294262, + 0.011764303781092167 + ], + "gamma_dfa": 0.06225612107664347, + "gamma_dfa_per_layer": [ + 0.026912778615951538, + 0.060097675770521164, + 0.07986276596784592, + 0.08215126395225525 + ], + "acc_eval": 0.6975000500679016, + "loss_eval": 0.8993597626686096, + "epoch": 32 + }, + { + "hidden_norms": [ + 11.269571304321289, + 32.55842590332031, + 209.36538696289062, + 366.7745056152344, + 523.1634521484375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009271818562410772, + 0.00017398923228029162, + 0.00012348532618489116, + 0.00012206545943627134, + 0.00011946412996621802 + ], + "bp_grad_F": [ + 0.10045517235994339, + 0.018744034692645073, + 0.0122413644567132, + 0.012060520239174366, + 0.011960742995142937 + ], + "gamma_dfa": 0.06293319165706635, + "gamma_dfa_per_layer": [ + 0.02326873689889908, + 0.06609776616096497, + 0.07875392585992813, + 0.0836123377084732 + ], + "acc_eval": 0.6760000586509705, + "loss_eval": 0.9358338713645935, + "epoch": 33 + }, + { + "hidden_norms": [ + 11.269571304321289, + 33.2861213684082, + 214.81686401367188, + 376.10357666015625, + 536.3932495117188 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008684046333655715, + 0.0001622825366212055, + 0.00011986666504526511, + 0.00011786946561187506, + 0.00011659466690616682 + ], + "bp_grad_F": [ + 0.10286933183670044, + 0.018639566376805305, + 0.012188107706606388, + 0.01201487798243761, + 0.011918813921511173 + ], + "gamma_dfa": 0.06226353673264384, + "gamma_dfa_per_layer": [ + 0.023258207365870476, + 0.06267606467008591, + 0.0803714394569397, + 0.08274843543767929 + ], + "acc_eval": 0.6810000538825989, + "loss_eval": 0.9304502010345459, + "epoch": 34 + }, + { + "hidden_norms": [ + 11.269571304321289, + 33.87834167480469, + 220.428466796875, + 384.2508850097656, + 548.2610473632812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007953296881169081, + 0.00014800684584770352, + 0.00011162432201672345, + 0.00011058645759476349, + 0.00010956013284157962 + ], + "bp_grad_F": [ + 0.10028568655252457, + 0.018069755285978317, + 0.011859637685120106, + 0.011696909554302692, + 0.01160619780421257 + ], + "gamma_dfa": 0.06300693331286311, + "gamma_dfa_per_layer": [ + 0.027522550895810127, + 0.06186108663678169, + 0.07987839728593826, + 0.08276569843292236 + ], + "acc_eval": 0.6955000162124634, + "loss_eval": 0.8840450048446655, + "epoch": 35 + }, + { + "hidden_norms": [ + 11.269571304321289, + 34.509605407714844, + 225.59780883789062, + 393.6628112792969, + 561.568115234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008583659655414522, + 0.00015650303976144642, + 0.00011532937787706032, + 0.00011489073949633166, + 0.00011400022049201652 + ], + "bp_grad_F": [ + 0.09966019541025162, + 0.018014561384916306, + 0.012010997161269188, + 0.011846955865621567, + 0.011755259707570076 + ], + "gamma_dfa": 0.06271304981783032, + "gamma_dfa_per_layer": [ + 0.029912440106272697, + 0.06141362711787224, + 0.0793088749051094, + 0.08021725714206696 + ], + "acc_eval": 0.687000036239624, + "loss_eval": 0.9074093103408813, + "epoch": 36 + }, + { + "hidden_norms": [ + 11.269571304321289, + 35.15583801269531, + 230.31370544433594, + 402.0650634765625, + 574.2296752929688 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008762985817156732, + 0.00015229854034259915, + 0.00011411930609028786, + 0.0001132417019107379, + 0.00011245955829508603 + ], + "bp_grad_F": [ + 0.09909173101186752, + 0.017660830169916153, + 0.011859647929668427, + 0.011700768023729324, + 0.011612875387072563 + ], + "gamma_dfa": 0.059298016130924225, + "gamma_dfa_per_layer": [ + 0.026200097054243088, + 0.0549272783100605, + 0.0762626901268959, + 0.0798019990324974 + ], + "acc_eval": 0.7035000324249268, + "loss_eval": 0.8701910376548767, + "epoch": 37 + }, + { + "hidden_norms": [ + 11.269571304321289, + 35.66206741333008, + 234.8238983154297, + 409.3634033203125, + 584.876953125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009031461668200791, + 0.00016782402235548943, + 0.00012555152352433652, + 0.0001250550412805751, + 0.000123959660413675 + ], + "bp_grad_F": [ + 0.09997168928384781, + 0.01780031807720661, + 0.012050634250044823, + 0.011898917146027088, + 0.011813494376838207 + ], + "gamma_dfa": 0.06037319032475352, + "gamma_dfa_per_layer": [ + 0.028592003509402275, + 0.05390740931034088, + 0.07796172052621841, + 0.08103162795305252 + ], + "acc_eval": 0.6850000619888306, + "loss_eval": 0.9033781886100769, + "epoch": 38 + }, + { + "hidden_norms": [ + 11.269571304321289, + 36.278228759765625, + 239.4936981201172, + 417.3722229003906, + 596.1981201171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009072510292753577, + 0.00015473780513275415, + 0.00011584340245462954, + 0.00011548803740879521, + 0.00011424912372604012 + ], + "bp_grad_F": [ + 0.10279728472232819, + 0.017760641872882843, + 0.012076830491423607, + 0.01192280650138855, + 0.011838974431157112 + ], + "gamma_dfa": 0.05956542398780584, + "gamma_dfa_per_layer": [ + 0.025189489126205444, + 0.05668117478489876, + 0.07571582496166229, + 0.08067520707845688 + ], + "acc_eval": 0.6835000514984131, + "loss_eval": 0.9166074395179749, + "epoch": 39 + }, + { + "hidden_norms": [ + 11.269571304321289, + 36.87733459472656, + 244.1138153076172, + 425.2259826660156, + 607.8081665039062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008976306999102235, + 0.00015640830679330975, + 0.00012026254989905283, + 0.00011915730283362791, + 0.00011880237434525043 + ], + "bp_grad_F": [ + 0.10276701301336288, + 0.017705289646983147, + 0.012149399146437645, + 0.01199993398040533, + 0.01191749982535839 + ], + "gamma_dfa": 0.05778269004076719, + "gamma_dfa_per_layer": [ + 0.02565983682870865, + 0.051832567900419235, + 0.07554878294467926, + 0.07808957248926163 + ], + "acc_eval": 0.6880000233650208, + "loss_eval": 0.9326384663581848, + "epoch": 40 + }, + { + "hidden_norms": [ + 11.269571304321289, + 37.373634338378906, + 248.1051483154297, + 432.9554748535156, + 618.172607421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009300907258875668, + 0.00016527887783013284, + 0.00012494091060943902, + 0.00012375703954603523, + 0.00012343957496341318 + ], + "bp_grad_F": [ + 0.10167930275201797, + 0.017580606043338776, + 0.01197358313947916, + 0.01181697752326727, + 0.011733012273907661 + ], + "gamma_dfa": 0.059646998066455126, + "gamma_dfa_per_layer": [ + 0.025086766108870506, + 0.05520859733223915, + 0.0782475471496582, + 0.08004508167505264 + ], + "acc_eval": 0.6935000419616699, + "loss_eval": 0.9074762463569641, + "epoch": 41 + }, + { + "hidden_norms": [ + 11.269571304321289, + 37.94633483886719, + 252.25924682617188, + 439.8863525390625, + 628.1370239257812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008688273373991251, + 0.00015619541227351874, + 0.00011818459461210296, + 0.00011805404938058928, + 0.00011655993148451671 + ], + "bp_grad_F": [ + 0.10280012339353561, + 0.017362425103783607, + 0.012144921347498894, + 0.012009261175990105, + 0.011929930187761784 + ], + "gamma_dfa": 0.057152220979332924, + "gamma_dfa_per_layer": [ + 0.026838082820177078, + 0.05145636573433876, + 0.07389623671770096, + 0.0764181986451149 + ], + "acc_eval": 0.6780000329017639, + "loss_eval": 0.9220576286315918, + "epoch": 42 + }, + { + "hidden_norms": [ + 11.269571304321289, + 38.43475341796875, + 256.3348388671875, + 446.7797546386719, + 638.6549072265625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009689890430308878, + 0.0001675912644714117, + 0.00013143723481334746, + 0.00012922017776872963, + 0.00012865127064287663 + ], + "bp_grad_F": [ + 0.10019267350435257, + 0.017157867550849915, + 0.012005961500108242, + 0.01186591386795044, + 0.011786815710365772 + ], + "gamma_dfa": 0.05704171909019351, + "gamma_dfa_per_layer": [ + 0.02657354436814785, + 0.04850248247385025, + 0.07429356873035431, + 0.07879728078842163 + ], + "acc_eval": 0.6815000176429749, + "loss_eval": 0.9045827388763428, + "epoch": 43 + }, + { + "hidden_norms": [ + 11.269571304321289, + 38.949981689453125, + 259.91455078125, + 453.5318603515625, + 649.1691284179688 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008703607600182295, + 0.0001509855646872893, + 0.00011334709415677935, + 0.00011273188283666968, + 0.00011187820200575516 + ], + "bp_grad_F": [ + 0.10038246959447861, + 0.017015060409903526, + 0.011884159408509731, + 0.011748326942324638, + 0.01167102251201868 + ], + "gamma_dfa": 0.056442280765622854, + "gamma_dfa_per_layer": [ + 0.024923482909798622, + 0.04813612625002861, + 0.07466092705726624, + 0.07804858684539795 + ], + "acc_eval": 0.6880000233650208, + "loss_eval": 0.8986373543739319, + "epoch": 44 + }, + { + "hidden_norms": [ + 11.269571304321289, + 39.40317916870117, + 263.8382873535156, + 459.8589782714844, + 657.81396484375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008396115736104548, + 0.00014526791346725076, + 0.0001117709616664797, + 0.0001101615052903071, + 0.00010919143096543849 + ], + "bp_grad_F": [ + 0.10223646461963654, + 0.01701364293694496, + 0.011921641416847706, + 0.011793220415711403, + 0.01171908900141716 + ], + "gamma_dfa": 0.05634786421433091, + "gamma_dfa_per_layer": [ + 0.023860810324549675, + 0.05130583420395851, + 0.0730678141117096, + 0.07715699821710587 + ], + "acc_eval": 0.6845000386238098, + "loss_eval": 0.9070615172386169, + "epoch": 45 + }, + { + "hidden_norms": [ + 11.269571304321289, + 39.78729248046875, + 267.06787109375, + 465.8781433105469, + 665.705078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008805220131762326, + 0.0001506610424257815, + 0.0001190964540001005, + 0.00011831042502308264, + 0.0001174084609374404 + ], + "bp_grad_F": [ + 0.09873763471841812, + 0.01661210134625435, + 0.011734068393707275, + 0.011604530736804008, + 0.011532736010849476 + ], + "gamma_dfa": 0.057100610341876745, + "gamma_dfa_per_layer": [ + 0.025687912479043007, + 0.05223910138010979, + 0.07347920536994934, + 0.07699622213840485 + ], + "acc_eval": 0.7010000348091125, + "loss_eval": 0.8647292256355286, + "epoch": 46 + }, + { + "hidden_norms": [ + 11.269571304321289, + 40.20953369140625, + 270.48760986328125, + 471.71197509765625, + 674.6234741210938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008946783491410315, + 0.0001546104613225907, + 0.00012653943849727511, + 0.0001261695142602548, + 0.00012597300519701093 + ], + "bp_grad_F": [ + 0.10005417466163635, + 0.016553794965147972, + 0.011853700503706932, + 0.011732862330973148, + 0.01166335679590702 + ], + "gamma_dfa": 0.056281615514308214, + "gamma_dfa_per_layer": [ + 0.02603459171950817, + 0.051092494279146194, + 0.07222969830036163, + 0.07576967775821686 + ], + "acc_eval": 0.6895000338554382, + "loss_eval": 0.8898184299468994, + "epoch": 47 + }, + { + "hidden_norms": [ + 11.269571304321289, + 40.61681365966797, + 273.5674743652344, + 477.6903381347656, + 683.2316284179688 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009305709972977638, + 0.0001684492890490219, + 0.00013056330499239266, + 0.00013055883755441755, + 0.00012972661352250725 + ], + "bp_grad_F": [ + 0.10108529776334763, + 0.01676928997039795, + 0.012042575515806675, + 0.011920345947146416, + 0.011849730275571346 + ], + "gamma_dfa": 0.05756285693496466, + "gamma_dfa_per_layer": [ + 0.028283007442951202, + 0.04865947738289833, + 0.0757322907447815, + 0.0775766521692276 + ], + "acc_eval": 0.6825000047683716, + "loss_eval": 0.9249827861785889, + "epoch": 48 + }, + { + "hidden_norms": [ + 11.269571304321289, + 40.986331939697266, + 276.55340576171875, + 482.9735412597656, + 690.4827880859375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009371762280352414, + 0.00015377832460217178, + 0.00011931644257856533, + 0.00011877353972522542, + 0.00011843052197946236 + ], + "bp_grad_F": [ + 0.10423478484153748, + 0.01686144433915615, + 0.012089447118341923, + 0.011962956748902798, + 0.011895008385181427 + ], + "gamma_dfa": 0.05634950753301382, + "gamma_dfa_per_layer": [ + 0.024047940969467163, + 0.05029236152768135, + 0.07294473052024841, + 0.07811299711465836 + ], + "acc_eval": 0.6770000457763672, + "loss_eval": 0.9276119470596313, + "epoch": 49 + }, + { + "hidden_norms": [ + 11.269571304321289, + 41.36444091796875, + 279.21368408203125, + 487.9245910644531, + 698.8203735351562 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009180991910398006, + 0.00016040228365454823, + 0.00012619509652722627, + 0.0001242315920535475, + 0.00012414241791702807 + ], + "bp_grad_F": [ + 0.09876055270433426, + 0.016378939151763916, + 0.011831536889076233, + 0.011710439808666706, + 0.011641835793852806 + ], + "gamma_dfa": 0.056217589881271124, + "gamma_dfa_per_layer": [ + 0.026943759992718697, + 0.04981214925646782, + 0.0719020888209343, + 0.07621236145496368 + ], + "acc_eval": 0.6945000290870667, + "loss_eval": 0.8922800421714783, + "epoch": 50 + }, + { + "hidden_norms": [ + 11.269571304321289, + 41.725521087646484, + 282.2077331542969, + 492.55194091796875, + 705.709228515625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009282235405407846, + 0.00015841209096834064, + 0.00012215816241223365, + 0.0001216854143422097, + 0.0001213739305967465 + ], + "bp_grad_F": [ + 0.10062722116708755, + 0.016464965417981148, + 0.011968642473220825, + 0.011850792914628983, + 0.011783461086452007 + ], + "gamma_dfa": 0.05594501877203584, + "gamma_dfa_per_layer": [ + 0.027507653459906578, + 0.047868166118860245, + 0.07275017350912094, + 0.07565408200025558 + ], + "acc_eval": 0.674500048160553, + "loss_eval": 0.9168669581413269, + "epoch": 51 + }, + { + "hidden_norms": [ + 11.269571304321289, + 42.07438659667969, + 284.91143798828125, + 497.33489990234375, + 712.7407836914062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008946438319981098, + 0.0001599262177478522, + 0.0001243542501470074, + 0.00012355486978776753, + 0.0001230162160936743 + ], + "bp_grad_F": [ + 0.09976927936077118, + 0.016204386949539185, + 0.011793862096965313, + 0.011675998568534851, + 0.01161060482263565 + ], + "gamma_dfa": 0.057106493040919304, + "gamma_dfa_per_layer": [ + 0.025031987577676773, + 0.05149566009640694, + 0.07346570491790771, + 0.07843261957168579 + ], + "acc_eval": 0.6895000338554382, + "loss_eval": 0.8812824487686157, + "epoch": 52 + }, + { + "hidden_norms": [ + 11.269571304321289, + 42.312625885009766, + 287.158447265625, + 501.61053466796875, + 718.7759399414062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008852323517203331, + 0.0001484409294789657, + 0.00011503385030664504, + 0.00011482135596452281, + 0.00011442313552834094 + ], + "bp_grad_F": [ + 0.10061701387166977, + 0.016211561858654022, + 0.011752818711102009, + 0.011636910028755665, + 0.011571302078664303 + ], + "gamma_dfa": 0.055246823001652956, + "gamma_dfa_per_layer": [ + 0.024583658203482628, + 0.04850705340504646, + 0.07144256681203842, + 0.07645401358604431 + ], + "acc_eval": 0.6955000162124634, + "loss_eval": 0.888053834438324, + "epoch": 53 + }, + { + "hidden_norms": [ + 11.269571304321289, + 42.61886978149414, + 289.2788391113281, + 505.75390625, + 724.4559326171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009071374079212546, + 0.00015266452101059258, + 0.00011854806507471949, + 0.00011884445120813325, + 0.00011772327707149088 + ], + "bp_grad_F": [ + 0.10303837805986404, + 0.016465138643980026, + 0.011987767182290554, + 0.011867417953908443, + 0.011802136898040771 + ], + "gamma_dfa": 0.05469688028097153, + "gamma_dfa_per_layer": [ + 0.02719976380467415, + 0.04610869660973549, + 0.07147730141878128, + 0.07400175929069519 + ], + "acc_eval": 0.6820000410079956, + "loss_eval": 0.9107973575592041, + "epoch": 54 + }, + { + "hidden_norms": [ + 11.269571304321289, + 42.90008544921875, + 291.5098876953125, + 509.49200439453125, + 730.070068359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009346315637230873, + 0.00017380902136210352, + 0.00014277170703280717, + 0.0001402509369654581, + 0.00014013791223987937 + ], + "bp_grad_F": [ + 0.10035568475723267, + 0.016459215432405472, + 0.012036965228617191, + 0.011920913122594357, + 0.01185610517859459 + ], + "gamma_dfa": 0.055851065553724766, + "gamma_dfa_per_layer": [ + 0.026028182357549667, + 0.04594290256500244, + 0.07459361851215363, + 0.07683955878019333 + ], + "acc_eval": 0.6720000505447388, + "loss_eval": 0.9282984733581543, + "epoch": 55 + }, + { + "hidden_norms": [ + 11.269571304321289, + 43.15349197387695, + 293.65966796875, + 513.3607177734375, + 735.3644409179688 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009396777604706585, + 0.00015277721104212105, + 0.00012291918392293155, + 0.00012154672003816813, + 0.00012096676073269919 + ], + "bp_grad_F": [ + 0.10190626233816147, + 0.016208121553063393, + 0.011865625157952309, + 0.011748027056455612, + 0.011683868244290352 + ], + "gamma_dfa": 0.05457223346456885, + "gamma_dfa_per_layer": [ + 0.02600257657468319, + 0.046096257865428925, + 0.0713086724281311, + 0.0748814269900322 + ], + "acc_eval": 0.6920000314712524, + "loss_eval": 0.8892928957939148, + "epoch": 56 + }, + { + "hidden_norms": [ + 11.269571304321289, + 43.37159729003906, + 295.3875732421875, + 516.53369140625, + 740.1768798828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008509810431860387, + 0.000149228420923464, + 0.00012114718265365809, + 0.00012038950808346272, + 0.00011932845518458635 + ], + "bp_grad_F": [ + 0.09941542148590088, + 0.015937170013785362, + 0.01166422851383686, + 0.011551388539373875, + 0.011488799005746841 + ], + "gamma_dfa": 0.053473991341888905, + "gamma_dfa_per_layer": [ + 0.0227724090218544, + 0.045084040611982346, + 0.07109282910823822, + 0.07494668662548065 + ], + "acc_eval": 0.6945000290870667, + "loss_eval": 0.8690445423126221, + "epoch": 57 + }, + { + "hidden_norms": [ + 11.269571304321289, + 43.58628463745117, + 297.0165710449219, + 519.4993286132812, + 744.6467895507812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009939862648025155, + 0.0001676510728430003, + 0.00013252485950943083, + 0.0001307348720729351, + 0.0001300926087424159 + ], + "bp_grad_F": [ + 0.10170887410640717, + 0.016186155378818512, + 0.011895725503563881, + 0.011782051995396614, + 0.0117182033136487 + ], + "gamma_dfa": 0.05389358149841428, + "gamma_dfa_per_layer": [ + 0.024122020229697227, + 0.04528462514281273, + 0.0715978741645813, + 0.07456980645656586 + ], + "acc_eval": 0.6840000152587891, + "loss_eval": 0.9150904417037964, + "epoch": 58 + }, + { + "hidden_norms": [ + 11.269571304321289, + 43.756309509277344, + 298.4603576660156, + 522.1862182617188, + 748.0980224609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009121120092459023, + 0.00015141229960136116, + 0.00012266664998605847, + 0.00012074616097379476, + 0.00012072239769622684 + ], + "bp_grad_F": [ + 0.09929168969392776, + 0.015882758423686028, + 0.011736094020307064, + 0.011626454070210457, + 0.011565400287508965 + ], + "gamma_dfa": 0.05446606734767556, + "gamma_dfa_per_layer": [ + 0.023944402113556862, + 0.04696139693260193, + 0.07070320099592209, + 0.07625526934862137 + ], + "acc_eval": 0.6895000338554382, + "loss_eval": 0.8752753138542175, + "epoch": 59 + }, + { + "hidden_norms": [ + 11.269571304321289, + 43.956050872802734, + 299.8046569824219, + 524.5073852539062, + 751.9002075195312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009328208980150521, + 0.00015578871534671634, + 0.00012375388178043067, + 0.00012286445416975766, + 0.0001222269784193486 + ], + "bp_grad_F": [ + 0.09782548248767853, + 0.015724968165159225, + 0.011678245849907398, + 0.01156895887106657, + 0.01150886993855238 + ], + "gamma_dfa": 0.05415696511045098, + "gamma_dfa_per_layer": [ + 0.025110432878136635, + 0.04582852125167847, + 0.07056943327188492, + 0.07511947304010391 + ], + "acc_eval": 0.6910000443458557, + "loss_eval": 0.8689600825309753, + "epoch": 60 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.10476303100586, + 301.22088623046875, + 527.0880737304688, + 755.537109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009187725954689085, + 0.0001580083044245839, + 0.00012691691517829895, + 0.00012647418770939112, + 0.00012595193402376026 + ], + "bp_grad_F": [ + 0.09907824546098709, + 0.01592797227203846, + 0.011772784404456615, + 0.011660448275506496, + 0.011597777716815472 + ], + "gamma_dfa": 0.053306530229747295, + "gamma_dfa_per_layer": [ + 0.025752168148756027, + 0.04250373691320419, + 0.07085125893354416, + 0.0741189569234848 + ], + "acc_eval": 0.6785000562667847, + "loss_eval": 0.8745812773704529, + "epoch": 61 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.272037506103516, + 302.41107177734375, + 529.3627319335938, + 758.9468383789062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009381037671118975, + 0.00015578897728119045, + 0.00012793939094990492, + 0.00012725923443213105, + 0.00012640930071938783 + ], + "bp_grad_F": [ + 0.09839630872011185, + 0.015703976154327393, + 0.011679527349770069, + 0.01157388836145401, + 0.011512565426528454 + ], + "gamma_dfa": 0.053105687256902456, + "gamma_dfa_per_layer": [ + 0.022858327254652977, + 0.04474852979183197, + 0.06992355734109879, + 0.07489233464002609 + ], + "acc_eval": 0.6865000128746033, + "loss_eval": 0.8636536002159119, + "epoch": 62 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.36368942260742, + 303.7563781738281, + 531.5054931640625, + 762.388427734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009112239349633455, + 0.0001562510442454368, + 0.00013036206655669957, + 0.00012987821537535638, + 0.0001294936373597011 + ], + "bp_grad_F": [ + 0.09861280024051666, + 0.015790371224284172, + 0.011699686758220196, + 0.01159034576267004, + 0.011528948321938515 + ], + "gamma_dfa": 0.05348377674818039, + "gamma_dfa_per_layer": [ + 0.0251171812415123, + 0.04412227123975754, + 0.07024820148944855, + 0.07444745302200317 + ], + "acc_eval": 0.6885000467300415, + "loss_eval": 0.8699802160263062, + "epoch": 63 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.498130798339844, + 304.7552185058594, + 533.51318359375, + 765.1610717773438 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008680672035552561, + 0.00014313006249722093, + 0.00011654605623334646, + 0.00011439070658525452, + 0.00011445816198829561 + ], + "bp_grad_F": [ + 0.0990181565284729, + 0.015660114586353302, + 0.011611604131758213, + 0.011503342539072037, + 0.011442977003753185 + ], + "gamma_dfa": 0.05415269639343023, + "gamma_dfa_per_layer": [ + 0.024549636989831924, + 0.0454377755522728, + 0.07077726721763611, + 0.0758461058139801 + ], + "acc_eval": 0.6960000395774841, + "loss_eval": 0.8598873615264893, + "epoch": 64 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.600582122802734, + 305.7388610839844, + 534.99951171875, + 767.8171997070312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008962214924395084, + 0.00015309070295188576, + 0.00012299958325456828, + 0.000121716657304205, + 0.0001212474235217087 + ], + "bp_grad_F": [ + 0.10033439099788666, + 0.015828289091587067, + 0.011728483252227306, + 0.01162028405815363, + 0.011559616774320602 + ], + "gamma_dfa": 0.05304920673370361, + "gamma_dfa_per_layer": [ + 0.02494572103023529, + 0.043708547949790955, + 0.06946250051259995, + 0.07408005744218826 + ], + "acc_eval": 0.6895000338554382, + "loss_eval": 0.8800998330116272, + "epoch": 65 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.70732879638672, + 306.55181884765625, + 536.31005859375, + 769.971923828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009149253601208329, + 0.00015781939146108925, + 0.00012933975085616112, + 0.00012773934577126056, + 0.00012716377386823297 + ], + "bp_grad_F": [ + 0.09770160913467407, + 0.015633704140782356, + 0.011657179333269596, + 0.011551215313374996, + 0.011491267941892147 + ], + "gamma_dfa": 0.05268599092960358, + "gamma_dfa_per_layer": [ + 0.024415917694568634, + 0.04385191947221756, + 0.06913819909095764, + 0.07333792746067047 + ], + "acc_eval": 0.6930000185966492, + "loss_eval": 0.8666836023330688, + "epoch": 66 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.78550338745117, + 307.4527893066406, + 537.914306640625, + 771.5177612304688 + ], + "bp_grad_per_sample_l2_med": [ + 0.000909268157556653, + 0.0001503752137068659, + 0.00012163108476670459, + 0.00012035916006425396, + 0.00012008652265649289 + ], + "bp_grad_F": [ + 0.09915008395910263, + 0.015667738392949104, + 0.011642162688076496, + 0.01153358444571495, + 0.011473594233393669 + ], + "gamma_dfa": 0.05392309743911028, + "gamma_dfa_per_layer": [ + 0.023599978536367416, + 0.04531348496675491, + 0.07121817022562027, + 0.07556075602769852 + ], + "acc_eval": 0.6955000162124634, + "loss_eval": 0.8635799884796143, + "epoch": 67 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.858604431152344, + 308.1347961425781, + 538.9302368164062, + 773.1725463867188 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009114991407841444, + 0.00015059093129821122, + 0.00012239563511684537, + 0.00012128813978051767, + 0.00012036858242936432 + ], + "bp_grad_F": [ + 0.0976131409406662, + 0.015529998578131199, + 0.01157119870185852, + 0.011464742012321949, + 0.01140571665018797 + ], + "gamma_dfa": 0.05296219326555729, + "gamma_dfa_per_layer": [ + 0.02382323145866394, + 0.04349217563867569, + 0.0696524977684021, + 0.07488086819648743 + ], + "acc_eval": 0.6940000057220459, + "loss_eval": 0.8525131344795227, + "epoch": 68 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.92080307006836, + 308.6539001464844, + 539.7476806640625, + 774.7044067382812 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009130545658990741, + 0.0001561250537633896, + 0.00012542278273031116, + 0.0001241281715920195, + 0.0001238062686752528 + ], + "bp_grad_F": [ + 0.0973346009850502, + 0.015503575094044209, + 0.01158667542040348, + 0.011482889764010906, + 0.01142406091094017 + ], + "gamma_dfa": 0.05284834885969758, + "gamma_dfa_per_layer": [ + 0.023774540051817894, + 0.04253865405917168, + 0.0699956938624382, + 0.07508450746536255 + ], + "acc_eval": 0.6875000596046448, + "loss_eval": 0.8490641713142395, + "epoch": 69 + }, + { + "hidden_norms": [ + 11.269571304321289, + 44.97352600097656, + 309.19366455078125, + 540.6045532226562, + 775.7159423828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008941096602939069, + 0.0001490603171987459, + 0.00012243444507475942, + 0.00012086174683645368, + 0.00011930170876439661 + ], + "bp_grad_F": [ + 0.0978497788310051, + 0.015526177361607552, + 0.011586111970245838, + 0.011480187065899372, + 0.011420912109315395 + ], + "gamma_dfa": 0.052993528079241514, + "gamma_dfa_per_layer": [ + 0.02384653501212597, + 0.04263130575418472, + 0.0702076405286789, + 0.07528863102197647 + ], + "acc_eval": 0.6950000524520874, + "loss_eval": 0.8494359850883484, + "epoch": 70 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.018131256103516, + 309.6293640136719, + 541.2432861328125, + 776.7703857421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009062750032171607, + 0.00015435971727129072, + 0.00012295282795093954, + 0.00012264182441867888, + 0.00012187549873488024 + ], + "bp_grad_F": [ + 0.0975913405418396, + 0.015510785393416882, + 0.011592722497880459, + 0.011488175950944424, + 0.011429551988840103 + ], + "gamma_dfa": 0.05261069582775235, + "gamma_dfa_per_layer": [ + 0.023613562807440758, + 0.04278940334916115, + 0.06959826499223709, + 0.07444155216217041 + ], + "acc_eval": 0.6895000338554382, + "loss_eval": 0.8503831624984741, + "epoch": 71 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.05687713623047, + 309.88616943359375, + 541.6970825195312, + 777.6474609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009167437092401087, + 0.00015087658539414406, + 0.00012154471187386662, + 0.00012103841436328366, + 0.00012099531886633486 + ], + "bp_grad_F": [ + 0.09737422317266464, + 0.015458790585398674, + 0.011581062339246273, + 0.011477372609078884, + 0.01141849160194397 + ], + "gamma_dfa": 0.05269155744463205, + "gamma_dfa_per_layer": [ + 0.02412768080830574, + 0.04288121312856674, + 0.06955435872077942, + 0.07420297712087631 + ], + "acc_eval": 0.6875000596046448, + "loss_eval": 0.8513321280479431, + "epoch": 72 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.083457946777344, + 310.21551513671875, + 542.2005615234375, + 778.2576904296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009331087348982692, + 0.00015250151045620441, + 0.00012407499889377505, + 0.00012352959311101586, + 0.0001235192030435428 + ], + "bp_grad_F": [ + 0.09731114655733109, + 0.015489363111555576, + 0.011589608155190945, + 0.011484977789223194, + 0.01142611913383007 + ], + "gamma_dfa": 0.05234858160838485, + "gamma_dfa_per_layer": [ + 0.023583704605698586, + 0.04196107015013695, + 0.06969348341226578, + 0.07415606826543808 + ], + "acc_eval": 0.6885000467300415, + "loss_eval": 0.8485224843025208, + "epoch": 73 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.10480499267578, + 310.4107360839844, + 542.5189819335938, + 778.7670288085938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009211195865646005, + 0.00015081235324032605, + 0.00012383687135297805, + 0.00012388851610012352, + 0.0001234857481904328 + ], + "bp_grad_F": [ + 0.097723089158535, + 0.015484371222555637, + 0.011575440876185894, + 0.011470203287899494, + 0.011411197483539581 + ], + "gamma_dfa": 0.052400246262550354, + "gamma_dfa_per_layer": [ + 0.023820150643587112, + 0.04187368229031563, + 0.06974346935749054, + 0.07416368275880814 + ], + "acc_eval": 0.690500020980835, + "loss_eval": 0.8478801250457764, + "epoch": 74 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.121337890625, + 310.5526123046875, + 542.789794921875, + 779.1331787109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009062032913789153, + 0.00014932811609469354, + 0.00012137479643570259, + 0.00012096992577426136, + 0.00012082025205017999 + ], + "bp_grad_F": [ + 0.09714466333389282, + 0.015453615225851536, + 0.011561346240341663, + 0.011457313783466816, + 0.0113987410441041 + ], + "gamma_dfa": 0.05261371610686183, + "gamma_dfa_per_layer": [ + 0.023706024512648582, + 0.04261678457260132, + 0.06977313756942749, + 0.07435891777276993 + ], + "acc_eval": 0.6915000081062317, + "loss_eval": 0.846295177936554, + "epoch": 75 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.13352584838867, + 310.6623840332031, + 542.9544067382812, + 779.3726196289062 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009290048037655652, + 0.0001487880654167384, + 0.00012229036656208336, + 0.0001213839859701693, + 0.00012132866686442867 + ], + "bp_grad_F": [ + 0.09700886905193329, + 0.015427183359861374, + 0.011550018563866615, + 0.011446088552474976, + 0.011387485079467297 + ], + "gamma_dfa": 0.05256890505552292, + "gamma_dfa_per_layer": [ + 0.023696668446063995, + 0.04250160604715347, + 0.06959902495145798, + 0.07447832077741623 + ], + "acc_eval": 0.6925000548362732, + "loss_eval": 0.8456347584724426, + "epoch": 76 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.14185333251953, + 310.71917724609375, + 543.0736694335938, + 779.531982421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009128348319791257, + 0.00014947194722481072, + 0.0001214019866893068, + 0.000121481396490708, + 0.00012067624629708007 + ], + "bp_grad_F": [ + 0.09731098264455795, + 0.015439406037330627, + 0.011552426032721996, + 0.01144845224916935, + 0.011389924213290215 + ], + "gamma_dfa": 0.0525772743858397, + "gamma_dfa_per_layer": [ + 0.023648327216506004, + 0.0424870140850544, + 0.06964967399835587, + 0.07452408224344254 + ], + "acc_eval": 0.6945000290870667, + "loss_eval": 0.8456541895866394, + "epoch": 77 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.14662170410156, + 310.7527160644531, + 543.1363525390625, + 779.6199951171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009132170234806836, + 0.00014713683049194515, + 0.00012075807899236679, + 0.00011999421985819936, + 0.00011943812569370493 + ], + "bp_grad_F": [ + 0.09724143892526627, + 0.01543473545461893, + 0.011546480469405651, + 0.0114423343911767, + 0.011383815668523312 + ], + "gamma_dfa": 0.0526476064696908, + "gamma_dfa_per_layer": [ + 0.023711953312158585, + 0.0426546186208725, + 0.06969036906957626, + 0.07453348487615585 + ], + "acc_eval": 0.6925000548362732, + "loss_eval": 0.8444594740867615, + "epoch": 78 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.14855194091797, + 310.77044677734375, + 543.1617431640625, + 779.6598510742188 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009067560313269496, + 0.00014785665553063154, + 0.00012018840061500669, + 0.00011918631935259327, + 0.00011903052654815838 + ], + "bp_grad_F": [ + 0.09721538424491882, + 0.015435173176229, + 0.01154935173690319, + 0.011445209383964539, + 0.011386674828827381 + ], + "gamma_dfa": 0.05261166812852025, + "gamma_dfa_per_layer": [ + 0.023721175268292427, + 0.042552798986434937, + 0.06965683400630951, + 0.07451586425304413 + ], + "acc_eval": 0.6930000185966492, + "loss_eval": 0.8448338508605957, + "epoch": 79 + }, + { + "hidden_norms": [ + 11.269571304321289, + 45.149070739746094, + 310.77496337890625, + 543.169189453125, + 779.66943359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009094586130231619, + 0.00014742475468665361, + 0.00012030002835672349, + 0.00011929625179618597, + 0.00011879605881404132 + ], + "bp_grad_F": [ + 0.09719900041818619, + 0.015434404835104942, + 0.011549265123903751, + 0.011445139534771442, + 0.011386608704924583 + ], + "gamma_dfa": 0.05260759778320789, + "gamma_dfa_per_layer": [ + 0.023730866611003876, + 0.04254307597875595, + 0.06965382397174835, + 0.0745026245713234 + ], + "acc_eval": 0.6930000185966492, + "loss_eval": 0.844819962978363, + "epoch": 80 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_time/time_sweep_L4_d256_s42.json b/results/snapshot_time/time_sweep_L4_d256_s42.json new file mode 100644 index 0000000..69dbce5 --- /dev/null +++ b/results/snapshot_time/time_sweep_L4_d256_s42.json @@ -0,0 +1,128 @@ +[ + { + "snapshot_epoch": 5, + "method": "dfa", + "snapshot_acc": 0.4923, + "best_eta": 0.01, + "dl_same_1": -0.011249661445617676, + "dl_held_1": 6.842613220214844e-05, + "pur_1": -0.006082505907119671, + "dl_same_5": -0.004767775535583496, + "dl_held_5": 0.0032531023025512695, + "pur_5": -0.6823102886429895, + "update_cos": 0.09974875922004382, + "update_var": 42.993629455566406 + }, + { + "snapshot_epoch": 5, + "method": "vec_eT_M4", + "snapshot_acc": 0.4923, + "best_eta": 0.01, + "dl_same_1": -0.011568784713745117, + "dl_held_1": -0.0002554655075073242, + "pur_1": 0.02208231147924448, + "dl_same_5": -0.007385373115539551, + "dl_held_5": -0.005142092704772949, + "pur_5": 0.6962536115145255, + "update_cos": 0.09175282468398412, + "update_var": 0.8272696733474731 + }, + { + "snapshot_epoch": 5, + "method": "oracle_bp", + "snapshot_acc": 0.4923, + "best_eta": 0.01, + "dl_same_1": -0.011359930038452148, + "dl_held_1": -0.0002244710922241211, + "pur_1": 0.019759900936409867, + "dl_same_5": -0.008551597595214844, + "dl_held_5": -0.008973956108093262, + "pur_5": 1.0493894277795957, + "update_cos": 0.09107316409548123, + "update_var": 0.8150736093521118 + }, + { + "snapshot_epoch": 20, + "method": "dfa", + "snapshot_acc": 0.5666, + "best_eta": 0.01, + "dl_same_1": -0.0050983428955078125, + "dl_held_1": 0.0006439685821533203, + "pur_1": -0.12630939017350448, + "dl_same_5": -0.001807570457458496, + "dl_held_5": 0.0009417533874511719, + "pur_5": -0.5210050778625267, + "update_cos": 0.0594960767775774, + "update_var": 63.26374053955078 + }, + { + "snapshot_epoch": 20, + "method": "vec_eT_M4", + "snapshot_acc": 0.5666, + "best_eta": 0.01, + "dl_same_1": -0.005342721939086914, + "dl_held_1": 4.982948303222656e-05, + "pur_1": -0.009326609842513336, + "dl_same_5": -0.00039839744567871094, + "dl_held_5": 0.0015401840209960938, + "pur_5": -3.8659485241083402, + "update_cos": 0.051668012514710426, + "update_var": 0.4448654055595398 + }, + { + "snapshot_epoch": 20, + "method": "oracle_bp", + "snapshot_acc": 0.5666, + "best_eta": 0.01, + "dl_same_1": -0.004968762397766113, + "dl_held_1": 6.651878356933594e-05, + "pur_1": -0.01338739473351643, + "dl_same_5": -0.0005745887756347656, + "dl_held_5": 0.0003821849822998047, + "pur_5": -0.6651452270581655, + "update_cos": 0.051125471790631614, + "update_var": 0.4208375811576843 + }, + { + "snapshot_epoch": 100, + "method": "dfa", + "snapshot_acc": 0.6161, + "best_eta": 0.01, + "dl_same_1": -0.003733694553375244, + "dl_held_1": 0.0010018348693847656, + "pur_1": -0.2683226639979932, + "dl_same_5": 9.971857070922852e-05, + "dl_held_5": 8.255243301391602e-05, + "pur_5": NaN, + "update_cos": -0.029832556028850377, + "update_var": 55.150901794433594 + }, + { + "snapshot_epoch": 100, + "method": "vec_eT_M4", + "snapshot_acc": 0.6161, + "best_eta": 0.01, + "dl_same_1": -0.004258632659912109, + "dl_held_1": -0.00026106834411621094, + "pur_1": 0.061303325481070155, + "dl_same_5": -0.0005500912666320801, + "dl_held_5": 0.0005577206611633301, + "pur_5": -1.0138693231108566, + "update_cos": -0.0078733639481167, + "update_var": 0.38437512516975403 + }, + { + "snapshot_epoch": 100, + "method": "oracle_bp", + "snapshot_acc": 0.6161, + "best_eta": 0.01, + "dl_same_1": -0.002860128879547119, + "dl_held_1": -0.0001398921012878418, + "pur_1": 0.048911118040625354, + "dl_same_5": 6.985664367675781e-05, + "dl_held_5": -0.0006976127624511719, + "pur_5": NaN, + "update_cos": -0.015690920564035576, + "update_var": 0.26965656876564026 + } +] \ No newline at end of file diff --git a/results/snapshot_vit_v1/run_s123.log b/results/snapshot_vit_v1/run_s123.log new file mode 100644 index 0000000..e23f876 --- /dev/null +++ b/results/snapshot_vit_v1/run_s123.log @@ -0,0 +1,36 @@ +ViT-MINI: depth=4, d_model=128, n_heads=4, epochs=60, seed=123 + +=== BP training (ViT-Mini) === + n_params=809354 + [BP-vit] Ep 0: ||h_L_cls||=7.591e+00 ||g_2||=9.667e-04 acc=0.1250 + [BP-vit] Ep 1: ||h_L_cls||=3.242e+01 ||g_2||=1.457e-04 acc=0.4697 + [BP-vit] Ep 5: ||h_L_cls||=3.030e+01 ||g_2||=1.731e-04 acc=0.5957 + [BP-vit] Ep 10: ||h_L_cls||=2.876e+01 ||g_2||=1.742e-04 acc=0.6768 + [BP-vit] Ep 15: ||h_L_cls||=2.787e+01 ||g_2||=1.661e-04 acc=0.7129 + [BP-vit] Ep 20: ||h_L_cls||=2.435e+01 ||g_2||=1.685e-04 acc=0.7461 + [BP-vit] Ep 25: ||h_L_cls||=2.108e+01 ||g_2||=1.419e-04 acc=0.7627 + [BP-vit] Ep 30: ||h_L_cls||=1.855e+01 ||g_2||=1.543e-04 acc=0.7783 + [BP-vit] Ep 35: ||h_L_cls||=1.614e+01 ||g_2||=1.360e-04 acc=0.7939 + [BP-vit] Ep 40: ||h_L_cls||=1.470e+01 ||g_2||=1.014e-04 acc=0.7822 + [BP-vit] Ep 45: ||h_L_cls||=1.305e+01 ||g_2||=9.261e-05 acc=0.7822 + [BP-vit] Ep 50: ||h_L_cls||=1.282e+01 ||g_2||=4.534e-05 acc=0.7822 + [BP-vit] Ep 55: ||h_L_cls||=1.249e+01 ||g_2||=4.168e-05 acc=0.7910 + [BP-vit] Ep 60: ||h_L_cls||=1.250e+01 ||g_2||=3.572e-05 acc=0.7871 + +=== DFA training (ViT-Mini, block-level DFA) === + [DFA-vit] Ep 0: ||h_L_cls||=7.591e+00 ||g_2||=9.667e-04 acc=0.1250 + [DFA-vit] Ep 1: ||h_L_cls||=1.532e+04 ||g_2||=4.354e-07 acc=0.2158 γ=0.0090 + [DFA-vit] Ep 5: ||h_L_cls||=7.063e+05 ||g_2||=1.320e-08 acc=0.2197 γ=0.0009 + [DFA-vit] Ep 10: ||h_L_cls||=4.235e+06 ||g_2||=2.736e-09 acc=0.2373 γ=0.0020 + [DFA-vit] Ep 15: ||h_L_cls||=7.955e+06 ||g_2||=1.467e-09 acc=0.2266 γ=0.0020 + [DFA-vit] Ep 20: ||h_L_cls||=1.460e+07 ||g_2||=9.774e-10 acc=0.2139 γ=0.0018 + [DFA-vit] Ep 25: ||h_L_cls||=2.068e+07 ||g_2||=7.712e-10 acc=0.2080 γ=0.0013 + [DFA-vit] Ep 30: ||h_L_cls||=3.012e+07 ||g_2||=5.962e-10 acc=0.2139 γ=0.0010 + [DFA-vit] Ep 35: ||h_L_cls||=4.466e+07 ||g_2||=4.717e-10 acc=0.1396 γ=0.0040 + [DFA-vit] Ep 40: ||h_L_cls||=4.770e+07 ||g_2||=4.407e-10 acc=0.1963 γ=0.0032 + [DFA-vit] Ep 45: ||h_L_cls||=4.536e+07 ||g_2||=3.493e-10 acc=0.2031 γ=0.0021 + [DFA-vit] Ep 50: ||h_L_cls||=4.727e+07 ||g_2||=3.342e-10 acc=0.1904 γ=0.0017 + [DFA-vit] Ep 55: ||h_L_cls||=4.865e+07 ||g_2||=3.534e-10 acc=0.1982 γ=0.0019 + [DFA-vit] Ep 60: ||h_L_cls||=5.080e+07 ||g_2||=3.359e-10 acc=0.2021 γ=0.0017 + +Saved results/snapshot_vit_v1/snapshot_vit_s123.json diff --git a/results/snapshot_vit_v1/run_s42.log b/results/snapshot_vit_v1/run_s42.log new file mode 100644 index 0000000..2bd76dd --- /dev/null +++ b/results/snapshot_vit_v1/run_s42.log @@ -0,0 +1,36 @@ +ViT-MINI: depth=4, d_model=128, n_heads=4, epochs=60, seed=42 + +=== BP training (ViT-Mini) === + n_params=809354 + [BP-vit] Ep 0: ||h_L_cls||=7.124e+00 ||g_2||=9.976e-04 acc=0.1377 + [BP-vit] Ep 1: ||h_L_cls||=3.181e+01 ||g_2||=1.631e-04 acc=0.4502 + [BP-vit] Ep 5: ||h_L_cls||=3.236e+01 ||g_2||=1.881e-04 acc=0.6035 + [BP-vit] Ep 10: ||h_L_cls||=3.166e+01 ||g_2||=1.970e-04 acc=0.6846 + [BP-vit] Ep 15: ||h_L_cls||=2.804e+01 ||g_2||=1.690e-04 acc=0.7334 + [BP-vit] Ep 20: ||h_L_cls||=2.521e+01 ||g_2||=1.525e-04 acc=0.7637 + [BP-vit] Ep 25: ||h_L_cls||=2.196e+01 ||g_2||=1.524e-04 acc=0.7568 + [BP-vit] Ep 30: ||h_L_cls||=1.903e+01 ||g_2||=1.451e-04 acc=0.7822 + [BP-vit] Ep 35: ||h_L_cls||=1.669e+01 ||g_2||=1.225e-04 acc=0.7852 + [BP-vit] Ep 40: ||h_L_cls||=1.509e+01 ||g_2||=9.628e-05 acc=0.7998 + [BP-vit] Ep 45: ||h_L_cls||=1.395e+01 ||g_2||=5.592e-05 acc=0.8066 + [BP-vit] Ep 50: ||h_L_cls||=1.327e+01 ||g_2||=4.421e-05 acc=0.7998 + [BP-vit] Ep 55: ||h_L_cls||=1.307e+01 ||g_2||=3.098e-05 acc=0.7959 + [BP-vit] Ep 60: ||h_L_cls||=1.297e+01 ||g_2||=3.051e-05 acc=0.7988 + +=== DFA training (ViT-Mini, block-level DFA) === + [DFA-vit] Ep 0: ||h_L_cls||=7.124e+00 ||g_2||=9.976e-04 acc=0.1377 + [DFA-vit] Ep 1: ||h_L_cls||=1.008e+04 ||g_2||=6.152e-07 acc=0.2402 γ=0.0062 + [DFA-vit] Ep 5: ||h_L_cls||=3.966e+05 ||g_2||=1.957e-08 acc=0.2266 γ=0.0066 + [DFA-vit] Ep 10: ||h_L_cls||=1.798e+06 ||g_2||=4.677e-09 acc=0.2266 γ=0.0045 + [DFA-vit] Ep 15: ||h_L_cls||=7.772e+06 ||g_2||=1.681e-09 acc=0.2334 γ=0.0003 + [DFA-vit] Ep 20: ||h_L_cls||=1.204e+07 ||g_2||=1.003e-09 acc=0.2402 γ=-0.0002 + [DFA-vit] Ep 25: ||h_L_cls||=1.835e+07 ||g_2||=6.058e-10 acc=0.2451 γ=-0.0014 + [DFA-vit] Ep 30: ||h_L_cls||=2.502e+07 ||g_2||=4.425e-10 acc=0.2266 γ=-0.0011 + [DFA-vit] Ep 35: ||h_L_cls||=3.150e+07 ||g_2||=3.412e-10 acc=0.2344 γ=-0.0003 + [DFA-vit] Ep 40: ||h_L_cls||=3.778e+07 ||g_2||=3.106e-10 acc=0.2549 γ=-0.0003 + [DFA-vit] Ep 45: ||h_L_cls||=4.166e+07 ||g_2||=2.891e-10 acc=0.2344 γ=-0.0004 + [DFA-vit] Ep 50: ||h_L_cls||=4.633e+07 ||g_2||=2.688e-10 acc=0.2549 γ=0.0004 + [DFA-vit] Ep 55: ||h_L_cls||=4.796e+07 ||g_2||=2.616e-10 acc=0.2510 γ=0.0005 + [DFA-vit] Ep 60: ||h_L_cls||=4.761e+07 ||g_2||=2.622e-10 acc=0.2559 γ=0.0007 + +Saved results/snapshot_vit_v1/snapshot_vit_s42.json diff --git a/results/snapshot_vit_v1/run_s456.log b/results/snapshot_vit_v1/run_s456.log new file mode 100644 index 0000000..ba19529 --- /dev/null +++ b/results/snapshot_vit_v1/run_s456.log @@ -0,0 +1,36 @@ +ViT-MINI: depth=4, d_model=128, n_heads=4, epochs=60, seed=456 + +=== BP training (ViT-Mini) === + n_params=809354 + [BP-vit] Ep 0: ||h_L_cls||=6.653e+00 ||g_2||=1.039e-03 acc=0.0791 + [BP-vit] Ep 1: ||h_L_cls||=2.995e+01 ||g_2||=1.710e-04 acc=0.4590 + [BP-vit] Ep 5: ||h_L_cls||=3.062e+01 ||g_2||=1.845e-04 acc=0.6113 + [BP-vit] Ep 10: ||h_L_cls||=3.123e+01 ||g_2||=1.730e-04 acc=0.6709 + [BP-vit] Ep 15: ||h_L_cls||=2.697e+01 ||g_2||=1.889e-04 acc=0.7012 + [BP-vit] Ep 20: ||h_L_cls||=2.387e+01 ||g_2||=1.801e-04 acc=0.7295 + [BP-vit] Ep 25: ||h_L_cls||=2.080e+01 ||g_2||=1.754e-04 acc=0.7578 + [BP-vit] Ep 30: ||h_L_cls||=1.773e+01 ||g_2||=1.553e-04 acc=0.7666 + [BP-vit] Ep 35: ||h_L_cls||=1.553e+01 ||g_2||=1.576e-04 acc=0.7705 + [BP-vit] Ep 40: ||h_L_cls||=1.420e+01 ||g_2||=1.193e-04 acc=0.7812 + [BP-vit] Ep 45: ||h_L_cls||=1.271e+01 ||g_2||=9.615e-05 acc=0.7773 + [BP-vit] Ep 50: ||h_L_cls||=1.230e+01 ||g_2||=7.114e-05 acc=0.8008 + [BP-vit] Ep 55: ||h_L_cls||=1.201e+01 ||g_2||=6.104e-05 acc=0.7920 + [BP-vit] Ep 60: ||h_L_cls||=1.197e+01 ||g_2||=5.866e-05 acc=0.7910 + +=== DFA training (ViT-Mini, block-level DFA) === + [DFA-vit] Ep 0: ||h_L_cls||=6.653e+00 ||g_2||=1.039e-03 acc=0.0791 + [DFA-vit] Ep 1: ||h_L_cls||=6.750e+03 ||g_2||=9.114e-07 acc=0.2334 γ=0.0073 + [DFA-vit] Ep 5: ||h_L_cls||=2.891e+05 ||g_2||=3.080e-08 acc=0.1963 γ=0.0068 + [DFA-vit] Ep 10: ||h_L_cls||=1.709e+06 ||g_2||=4.513e-09 acc=0.1973 γ=0.0061 + [DFA-vit] Ep 15: ||h_L_cls||=5.106e+06 ||g_2||=1.561e-09 acc=0.2363 γ=0.0023 + [DFA-vit] Ep 20: ||h_L_cls||=1.160e+07 ||g_2||=6.526e-10 acc=0.2559 γ=0.0012 + [DFA-vit] Ep 25: ||h_L_cls||=2.239e+07 ||g_2||=4.283e-10 acc=0.2568 γ=0.0006 + [DFA-vit] Ep 30: ||h_L_cls||=3.290e+07 ||g_2||=3.264e-10 acc=0.2656 γ=0.0005 + [DFA-vit] Ep 35: ||h_L_cls||=4.443e+07 ||g_2||=3.018e-10 acc=0.2354 γ=0.0008 + [DFA-vit] Ep 40: ||h_L_cls||=5.315e+07 ||g_2||=2.841e-10 acc=0.2559 γ=0.0004 + [DFA-vit] Ep 45: ||h_L_cls||=5.912e+07 ||g_2||=3.038e-10 acc=0.2441 γ=0.0004 + [DFA-vit] Ep 50: ||h_L_cls||=6.210e+07 ||g_2||=3.006e-10 acc=0.2578 γ=0.0002 + [DFA-vit] Ep 55: ||h_L_cls||=6.344e+07 ||g_2||=3.079e-10 acc=0.2529 γ=0.0001 + [DFA-vit] Ep 60: ||h_L_cls||=6.367e+07 ||g_2||=3.069e-10 acc=0.2529 γ=0.0000 + +Saved results/snapshot_vit_v1/snapshot_vit_s456.json diff --git a/results/snapshot_vit_v1/snapshot_fa_canonical_s42.json b/results/snapshot_vit_v1/snapshot_fa_canonical_s42.json new file mode 100644 index 0000000..87675ca --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_fa_canonical_s42.json @@ -0,0 +1,1104 @@ +{ + "fa_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "bp_grad_per_sample_l2_med": [ + 0.006941193714737892, + 0.001723448047414422, + 0.0008084969012998044, + 0.00040042176260612905, + 0.00019880379841197282 + ], + "acc_eval": 0.123046875, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.5545730590820312, + 1099.6082763671875, + 1397.880126953125, + 1557.6058349609375, + 1625.5528564453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.003943991847336292, + 4.105754669581074e-06, + 2.034018280028249e-06, + 1.0202892326560686e-06, + 5.029408498558041e-07 + ], + "acc_eval": 0.25, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.5561315417289734, + 1825.42822265625, + 3141.504638671875, + 5072.111328125, + 5524.6123046875 + ], + "bp_grad_per_sample_l2_med": [ + 0.006327113136649132, + 1.8617935211295844e-06, + 9.007959533846588e-07, + 4.491473930556822e-07, + 2.2173806257796969e-07 + ], + "acc_eval": 0.236328125, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.538809597492218, + 4488.783203125, + 6229.931640625, + 13038.5927734375, + 14604.98828125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00814820732921362, + 7.318813572965155e-07, + 3.619582003011601e-07, + 1.8043300542558427e-07, + 9.003725409684193e-08 + ], + "acc_eval": 0.24609375, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.5289841294288635, + 11559.1318359375, + 21324.697265625, + 33157.46484375, + 34513.00390625 + ], + "bp_grad_per_sample_l2_med": [ + 0.004759137984365225, + 2.922441524333408e-07, + 1.4508636070331704e-07, + 7.107593802402334e-08, + 3.5740285397878324e-08 + ], + "acc_eval": 0.1953125, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.5187227725982666, + 13567.609375, + 31900.357421875, + 41906.99609375, + 44904.33984375 + ], + "bp_grad_per_sample_l2_med": [ + 0.008981491439044476, + 2.3057019404859602e-07, + 1.1323756154979492e-07, + 5.645526357511699e-08, + 2.834152468267348e-08 + ], + "acc_eval": 0.2373046875, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.5072101950645447, + 19264.873046875, + 40929.52734375, + 53545.33203125, + 56968.43359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.011568969115614891, + 1.827240510010597e-07, + 9.02516177347934e-08, + 4.502405914763585e-08, + 2.257244524628277e-08 + ], + "acc_eval": 0.2333984375, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 0.49512261152267456, + 17510.943359375, + 48323.71875, + 50008.49609375, + 51787.2734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.010693231597542763, + 1.6911585021262e-07, + 8.260560235839876e-08, + 4.064630942934855e-08, + 2.0301804681821523e-08 + ], + "acc_eval": 0.2158203125, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 0.48422321677207947, + 41544.78515625, + 71321.0625, + 150438.3125, + 155715.5625 + ], + "bp_grad_per_sample_l2_med": [ + 0.03921247273683548, + 1.1485686712831011e-07, + 5.667784108709384e-08, + 2.8099817583893127e-08, + 1.4131681602691515e-08 + ], + "acc_eval": 0.2109375, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 0.47471165657043457, + 61683.44921875, + 81806.375, + 149131.84375, + 154680.453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0444764718413353, + 8.208751012261928e-08, + 4.092110117426273e-08, + 2.041711866240803e-08, + 1.0249735282741312e-08 + ], + "acc_eval": 0.24609375, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 0.4715467393398285, + 100863.953125, + 117647.9453125, + 198225.390625, + 210929.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.018913062289357185, + 4.7114983914298136e-08, + 2.3594729725573416e-08, + 1.1833483526402233e-08, + 5.916069856226613e-09 + ], + "acc_eval": 0.2021484375, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 0.4661370813846588, + 155109.703125, + 179093.8125, + 259543.703125, + 261068.453125 + ], + "bp_grad_per_sample_l2_med": [ + 0.014048838056623936, + 2.8752721092928368e-08, + 1.4348634280736405e-08, + 7.019417935794081e-09, + 3.5147973420635026e-09 + ], + "acc_eval": 0.205078125, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 0.45670604705810547, + 139276.359375, + 179938.421875, + 286296.46875, + 287724.21875 + ], + "bp_grad_per_sample_l2_med": [ + 0.01842617429792881, + 3.2641882086181795e-08, + 1.6271862079975108e-08, + 8.13431366708528e-09, + 4.065131786745724e-09 + ], + "acc_eval": 0.19140625, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 0.4475501775741577, + 243322.703125, + 291619.53125, + 393543.1875, + 453741.9375 + ], + "bp_grad_per_sample_l2_med": [ + 0.017274944111704826, + 2.0982721338214105e-08, + 1.0508765413419496e-08, + 5.2403605899087324e-09, + 2.6231921079755693e-09 + ], + "acc_eval": 0.216796875, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 0.44052183628082275, + 378946.46875, + 454064.40625, + 486236.65625, + 545435.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.011560702696442604, + 1.302930296986915e-08, + 6.4620948592164495e-09, + 3.2205806910212686e-09, + 1.6108331335473736e-09 + ], + "acc_eval": 0.177734375, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 0.43271052837371826, + 603185.0, + 706685.875, + 754365.6875, + 781386.0625 + ], + "bp_grad_per_sample_l2_med": [ + 0.027027767151594162, + 8.183165256525626e-09, + 4.085152216504184e-09, + 2.0333199568511873e-09, + 1.0129016514426326e-09 + ], + "acc_eval": 0.1923828125, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 0.42688167095184326, + 897163.875, + 1069202.125, + 1126727.125, + 1146658.875 + ], + "bp_grad_per_sample_l2_med": [ + 0.013954665511846542, + 5.21436360756411e-09, + 2.6102418004825267e-09, + 1.3076516536258964e-09, + 6.521915230095487e-10 + ], + "acc_eval": 0.17578125, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 0.419918030500412, + 1210681.5, + 1492631.25, + 1582945.75, + 1604470.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.016081038862466812, + 3.6842373596357447e-09, + 1.8416679292698745e-09, + 9.214698448722913e-10, + 4.6121051422431947e-10 + ], + "acc_eval": 0.205078125, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 0.41367214918136597, + 1474524.0, + 1896333.625, + 2048261.125, + 2075013.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.015561909414827824, + 2.9148632396669427e-09, + 1.4711201146155872e-09, + 7.326692585962746e-10, + 3.6670635972235743e-10 + ], + "acc_eval": 0.1748046875, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 0.4075075685977936, + 1721647.75, + 2392353.5, + 2664490.25, + 2676219.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.013573882170021534, + 2.4936914755357975e-09, + 1.2590603004625223e-09, + 6.301172361666829e-10, + 3.1474217676574767e-10 + ], + "acc_eval": 0.171875, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 0.40185868740081787, + 2061658.75, + 3070974.0, + 3363148.5, + 3355996.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.01332809403538704, + 1.9996668765287495e-09, + 9.928408095660757e-10, + 4.968849776076922e-10, + 2.4808827214783946e-10 + ], + "acc_eval": 0.1728515625, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 0.3959394693374634, + 2567158.5, + 4022831.25, + 4366507.5, + 4360674.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.012877865694463253, + 1.5711227874248834e-09, + 7.865745832447146e-10, + 3.9232733728411517e-10, + 1.9626268665806634e-10 + ], + "acc_eval": 0.1689453125, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 0.3908536732196808, + 2855278.0, + 4821230.0, + 5318397.5, + 5261785.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.01991885155439377, + 1.3769393403251229e-09, + 6.908043581610457e-10, + 3.4423255912408024e-10, + 1.725469211955044e-10 + ], + "acc_eval": 0.1748046875, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 0.38593825697898865, + 3174507.75, + 5821231.0, + 6397560.5, + 6354021.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.011731060221791267, + 1.1907397290400468e-09, + 6.002150998440925e-10, + 2.995812764527983e-10, + 1.4982258489393274e-10 + ], + "acc_eval": 0.1953125, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 0.38131335377693176, + 4292486.5, + 7334872.5, + 8481275.0, + 7987194.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.015600440092384815, + 9.097935183000061e-10, + 4.627094263298659e-10, + 2.3154314576778745e-10, + 1.1568761226765645e-10 + ], + "acc_eval": 0.1650390625, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 0.3768307864665985, + 4066144.5, + 8089341.0, + 8840942.0, + 8750187.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.01041770912706852, + 9.491230024138986e-10, + 4.764759142794617e-10, + 2.383013231188613e-10, + 1.1919720765973807e-10 + ], + "acc_eval": 0.158203125, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 0.3725484013557434, + 4660335.5, + 9398058.0, + 10277586.0, + 10159446.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.012610528618097305, + 8.221311964540234e-10, + 4.1212994128514424e-10, + 2.0628378172293793e-10, + 1.0312824205715998e-10 + ], + "acc_eval": 0.162109375, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 0.3689132332801819, + 5871612.5, + 11057573.0, + 12074060.0, + 11979049.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.022938355803489685, + 6.959858245281225e-10, + 3.601695330868182e-10, + 1.795542742266676e-10, + 9.003973955312716e-11 + ], + "acc_eval": 0.1748046875, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 0.3653584122657776, + 6549866.5, + 12457973.0, + 13667217.0, + 13488831.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.01968899369239807, + 5.967032423725982e-10, + 3.0872890355304605e-10, + 1.5443717138463597e-10, + 7.714055783036855e-11 + ], + "acc_eval": 0.1669921875, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 0.36252257227897644, + 7083078.0, + 13728239.0, + 15048567.0, + 14800666.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.024753496050834656, + 5.776352174358124e-10, + 2.965032941393275e-10, + 1.4841036732882174e-10, + 7.41542729998379e-11 + ], + "acc_eval": 0.1728515625, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 0.3597593307495117, + 7156219.5, + 14613827.0, + 16177184.0, + 15867089.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.012417457066476345, + 5.718481799199537e-10, + 2.867320547661478e-10, + 1.4365150735606846e-10, + 7.184561279238721e-11 + ], + "acc_eval": 0.1650390625, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 0.35805046558380127, + 8087894.5, + 16279937.0, + 18019618.0, + 17642490.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.017159853130578995, + 5.130134095310268e-10, + 2.612176586147541e-10, + 1.3114326291585598e-10, + 6.563268678538847e-11 + ], + "acc_eval": 0.1796875, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 0.35514453053474426, + 8415584.0, + 17452890.0, + 19574252.0, + 19044988.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.017893649637699127, + 5.072835485009364e-10, + 2.5544158455126365e-10, + 1.2795793591369176e-10, + 6.410054431693624e-11 + ], + "acc_eval": 0.1962890625, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 0.35366830229759216, + 9040861.0, + 18928378.0, + 21235278.0, + 20689608.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.01662450097501278, + 4.760899452449507e-10, + 2.391463138629035e-10, + 1.19767168405005e-10, + 5.980976131025884e-11 + ], + "acc_eval": 0.177734375, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 0.35274940729141235, + 10105909.0, + 20575994.0, + 22869280.0, + 22381648.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04045082628726959, + 4.454907553963494e-10, + 2.224223166757966e-10, + 1.1117023274165305e-10, + 5.573364339483966e-11 + ], + "acc_eval": 0.173828125, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 0.35230201482772827, + 10649243.0, + 21849520.0, + 24383386.0, + 23809486.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03625870868563652, + 4.062269409743635e-10, + 2.0919388443729758e-10, + 1.0517077486671411e-10, + 5.271013833740845e-11 + ], + "acc_eval": 0.158203125, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 0.35188645124435425, + 11225758.0, + 23225336.0, + 25744754.0, + 25098318.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04868545010685921, + 4.2478476292018286e-10, + 2.1696269780768773e-10, + 1.0849423442982342e-10, + 5.422649829167625e-11 + ], + "acc_eval": 0.181640625, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 0.35190674662590027, + 11552205.0, + 24186280.0, + 27053836.0, + 26295722.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04053955897688866, + 4.0922154553868495e-10, + 2.0564389080490741e-10, + 1.0180161574835367e-10, + 5.100607436414606e-11 + ], + "acc_eval": 0.1708984375, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 0.3533709645271301, + 12511109.0, + 25674238.0, + 28429464.0, + 27729346.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04322395101189613, + 3.725502961682281e-10, + 1.895077428315517e-10, + 9.475340650988429e-11, + 4.7370347228126164e-11 + ], + "acc_eval": 0.1943359375, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 0.35590660572052, + 12274717.0, + 26252202.0, + 29145476.0, + 28407090.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0458325557410717, + 3.9338646229403196e-10, + 1.9832839537325953e-10, + 9.937214245914205e-11, + 4.97785458686284e-11 + ], + "acc_eval": 0.162109375, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 0.35598739981651306, + 13010948.0, + 27253844.0, + 30244608.0, + 29436354.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.050111040472984314, + 3.8191338980198e-10, + 1.9492148173316792e-10, + 9.78909453497323e-11, + 4.898272759623623e-11 + ], + "acc_eval": 0.17578125, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 0.359886109828949, + 12949905.0, + 27785034.0, + 30987020.0, + 30162430.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04287939891219139, + 3.569295692340546e-10, + 1.7953295794459478e-10, + 8.970056641910418e-11, + 4.4947719157750754e-11 + ], + "acc_eval": 0.1669921875, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 0.3610597252845764, + 13297263.0, + 28490094.0, + 31717372.0, + 30903264.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.059325557202100754, + 3.555903349550249e-10, + 1.8439673399317513e-10, + 9.228186964582719e-11, + 4.604394990281868e-11 + ], + "acc_eval": 0.1630859375, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 0.36371150612831116, + 13593509.0, + 29189264.0, + 32363910.0, + 31583456.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.08067209273576736, + 3.748426291583229e-10, + 1.9037708909319662e-10, + 9.613144308362465e-11, + 4.7860448243453035e-11 + ], + "acc_eval": 0.1669921875, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 0.3678953945636749, + 13002685.0, + 29272840.0, + 32833962.0, + 31996856.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.046668969094753265, + 3.5862279812448605e-10, + 1.8444731852973462e-10, + 9.241421516925641e-11, + 4.614601409325125e-11 + ], + "acc_eval": 0.162109375, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 0.3722097873687744, + 13026701.0, + 29583132.0, + 33140148.0, + 32223962.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.05778568983078003, + 3.8914271804912914e-10, + 1.9742661672150774e-10, + 9.861946675959743e-11, + 4.930081343168524e-11 + ], + "acc_eval": 0.1640625, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 0.3784724175930023, + 13060913.0, + 29952154.0, + 33663012.0, + 32716300.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.058499205857515335, + 3.8859623852083303e-10, + 1.9628629277512744e-10, + 9.875016082627752e-11, + 4.9333759299940994e-11 + ], + "acc_eval": 0.16015625, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 0.3851682245731354, + 13061307.0, + 30283974.0, + 33786364.0, + 32963536.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.05969119817018509, + 4.036749268188089e-10, + 2.051936537350585e-10, + 1.0281481221952049e-10, + 5.1408790419094075e-11 + ], + "acc_eval": 0.1591796875, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 0.38858678936958313, + 13053480.0, + 30258368.0, + 34267304.0, + 33358036.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.05216536298394203, + 3.8322026107984186e-10, + 1.942517396935628e-10, + 9.742346512853217e-11, + 4.861935506972337e-11 + ], + "acc_eval": 0.1630859375, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 0.3970814645290375, + 12785361.0, + 30453750.0, + 34537440.0, + 33524112.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0512184239923954, + 3.618580712849706e-10, + 1.8165123572000397e-10, + 9.080205337630431e-11, + 4.5350091737450526e-11 + ], + "acc_eval": 0.1611328125, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 0.41041070222854614, + 12378014.0, + 30515276.0, + 34276956.0, + 33306668.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04064331203699112, + 4.035453082806839e-10, + 2.059644121921167e-10, + 1.030020096992601e-10, + 5.144335651907639e-11 + ], + "acc_eval": 0.1591796875, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 0.4208085834980011, + 12229696.0, + 30525590.0, + 34345932.0, + 33357842.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04530888423323631, + 4.160819744303268e-10, + 2.0900184360961305e-10, + 1.0429850733073565e-10, + 5.2114305926220794e-11 + ], + "acc_eval": 0.166015625, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 0.4249289929866791, + 12130639.0, + 30354396.0, + 34678540.0, + 33531180.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.04047567769885063, + 4.068767545106766e-10, + 2.0768058106579446e-10, + 1.0380588749692166e-10, + 5.188600937788834e-11 + ], + "acc_eval": 0.162109375, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 0.4318743348121643, + 11880541.0, + 30505546.0, + 34958524.0, + 33653512.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03571970760822296, + 4.0090192277020265e-10, + 2.011875527285767e-10, + 1.0030835884133893e-10, + 5.012859571884576e-11 + ], + "acc_eval": 0.1630859375, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 0.43913060426712036, + 11708532.0, + 30355660.0, + 34920048.0, + 33497518.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0396106131374836, + 4.1890893531792983e-10, + 2.084224598464246e-10, + 1.0319496646093995e-10, + 5.16515094584058e-11 + ], + "acc_eval": 0.1611328125, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 0.44122788310050964, + 11552111.0, + 30335972.0, + 35070540.0, + 33779876.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03454306349158287, + 3.9193837064743775e-10, + 1.9659923689019365e-10, + 9.868480338459662e-11, + 4.934370273490529e-11 + ], + "acc_eval": 0.1552734375, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 0.4431604743003845, + 11393902.0, + 30399024.0, + 35148924.0, + 33730668.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03607407212257385, + 4.01606164990298e-10, + 2.01549305023363e-10, + 1.0008825018781309e-10, + 5.001985631247763e-11 + ], + "acc_eval": 0.1611328125, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 0.44458895921707153, + 11456393.0, + 30366940.0, + 35126152.0, + 33815292.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03673577681183815, + 3.9196515477790683e-10, + 1.9733305267610746e-10, + 9.858801275353102e-11, + 4.931045849421167e-11 + ], + "acc_eval": 0.16015625, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 0.44609925150871277, + 11285367.0, + 30391162.0, + 35039688.0, + 33859112.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03655927628278732, + 3.98514693467078e-10, + 1.9965135100719067e-10, + 9.972099535016099e-11, + 4.983467111197015e-11 + ], + "acc_eval": 0.1630859375, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 0.4466340243816376, + 11309850.0, + 30354550.0, + 35045136.0, + 33748968.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03679952770471573, + 4.077362614207658e-10, + 2.0270646272635418e-10, + 1.015226652745227e-10, + 5.069205818997169e-11 + ], + "acc_eval": 0.1630859375, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 0.4467651844024658, + 11222298.0, + 30325882.0, + 35035856.0, + 33763052.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.03729122504591942, + 4.0734565720512705e-10, + 2.0311738402334356e-10, + 1.015596079456671e-10, + 5.085605200849663e-11 + ], + "acc_eval": 0.1630859375, + "epoch": 60 + } + ], + "arch": "vit", + "seed": 42 +} \ No newline at end of file diff --git a/results/snapshot_vit_v1/snapshot_fa_vit_s42.json b/results/snapshot_vit_v1/snapshot_fa_vit_s42.json new file mode 100644 index 0000000..450351d --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_fa_vit_s42.json @@ -0,0 +1,1104 @@ +{ + "fa_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "bp_grad_per_sample_l2_med": [ + 0.006941193714737892, + 0.001723448047414422, + 0.0008084969012998044, + 0.00040042176260612905, + 0.00019880379841197282 + ], + "acc_eval": 0.123046875, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.6919748783111572, + 3842.78515625, + 9341.6923828125, + 9920.3046875, + 9136.099609375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017624060856178403, + 1.1595898286032025e-06, + 5.700691758647736e-07, + 2.8373631266731536e-07, + 1.4022531047430675e-07 + ], + "acc_eval": 0.1962890625, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 2.213810443878174, + 13173.2275390625, + 20675.927734375, + 21090.544921875, + 20256.06640625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00036340864608064294, + 4.792477170667553e-07, + 2.2975714841777517e-07, + 1.1404723920804827e-07, + 5.58470958367252e-08 + ], + "acc_eval": 0.130859375, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 2.4401588439941406, + 27950.775390625, + 42258.1171875, + 42646.40625, + 40386.3671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006889981450513005, + 2.183849545644989e-07, + 1.0780762949025302e-07, + 5.330540986392407e-08, + 2.567051815560717e-08 + ], + "acc_eval": 0.1259765625, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 2.4965271949768066, + 35298.37890625, + 71921.4921875, + 73662.3828125, + 71502.1171875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00035679180291481316, + 1.280830304040137e-07, + 5.992792750930676e-08, + 3.021023786686783e-08, + 1.4932888703356184e-08 + ], + "acc_eval": 0.1474609375, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 2.542451858520508, + 596.9271240234375, + 15138.552734375, + 20439.001953125, + 63235.2109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007700499845668674, + 4.321308608723484e-07, + 1.9291219643946533e-07, + 9.676254819623864e-08, + 4.7916582701645893e-08 + ], + "acc_eval": 0.12890625, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 2.6066854000091553, + 172636.59375, + 290436.34375, + 356619.71875, + 363143.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.000482373550767079, + 2.2872455929245916e-08, + 1.1479056816199318e-08, + 5.759448917785903e-09, + 2.8778499583381745e-09 + ], + "acc_eval": 0.1201171875, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 2.549955129623413, + 247359.046875, + 456810.46875, + 542983.1875, + 536014.5625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003394677478354424, + 1.5884587867276423e-08, + 8.104618309801026e-09, + 4.073737347454198e-09, + 2.0375214848655787e-09 + ], + "acc_eval": 0.125, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 2.4600400924682617, + 507.6882629394531, + 55412.9140625, + 58117.875, + 71533.109375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005215128185227513, + 1.720908642255381e-07, + 7.895193476770146e-08, + 3.936664327852668e-08, + 1.950460415400812e-08 + ], + "acc_eval": 0.166015625, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 2.377673387527466, + 492.4173583984375, + 72010.8515625, + 80733.3828125, + 88499.03125 + ], + "bp_grad_per_sample_l2_med": [ + 0.000300612737191841, + 1.303562839893857e-07, + 5.4381189329433255e-08, + 2.712311264474465e-08, + 1.3531170850455965e-08 + ], + "acc_eval": 0.1953125, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 2.2829232215881348, + 70101.53125, + 273366.84375, + 380567.40625, + 436148.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003461186133790761, + 2.5325679331444917e-08, + 1.3804578813392254e-08, + 7.191788053972914e-09, + 3.5467115910847724e-09 + ], + "acc_eval": 0.1982421875, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 2.2401251792907715, + 95090.734375, + 434796.5, + 535611.6875, + 555035.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003575912269297987, + 2.0430407587923582e-08, + 1.013873163202561e-08, + 5.240056832889195e-09, + 2.62253840865867e-09 + ], + "acc_eval": 0.19140625, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 2.213266134262085, + 371645.75, + 623563.875, + 694904.125, + 745774.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003485995694063604, + 1.2734847842921226e-08, + 6.490221693411513e-09, + 3.23543081215405e-09, + 1.6088937959679583e-09 + ], + "acc_eval": 0.185546875, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 2.3490853309631348, + 1521.5958251953125, + 117621.15625, + 153339.328125, + 234005.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001710709184408188, + 8.239747018023991e-08, + 2.854269354202188e-08, + 1.4295378214512766e-08, + 7.217904940404196e-09 + ], + "acc_eval": 0.181640625, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 2.568831205368042, + 461180.78125, + 1827924.375, + 2293298.0, + 2130660.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002101986901834607, + 7.077860963988769e-09, + 3.564110562237488e-09, + 1.7704799848416997e-09, + 8.853479060988434e-10 + ], + "acc_eval": 0.201171875, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 2.6825993061065674, + 2726.72314453125, + 97672.5703125, + 471438.28125, + 779993.8125 + ], + "bp_grad_per_sample_l2_med": [ + 9.469804354012012e-05, + 6.38537613895096e-08, + 7.950252012278725e-09, + 3.422149452703138e-09, + 1.7092232074134017e-09 + ], + "acc_eval": 0.201171875, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 2.7971737384796143, + 313802.15625, + 3608552.75, + 4391356.0, + 4212764.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015007780166342854, + 3.938802173308886e-09, + 1.8008210478370756e-09, + 9.022776970013524e-10, + 4.517709262241709e-10 + ], + "acc_eval": 0.203125, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 2.8100268840789795, + 2875.376708984375, + 96749.3671875, + 983606.125, + 1150911.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.001228083623573184, + 6.225434390216833e-08, + 7.879610741667875e-09, + 3.8225227427801656e-09, + 1.923271097936663e-09 + ], + "acc_eval": 0.1787109375, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 2.8279852867126465, + 2183.419677734375, + 65646.7734375, + 320722.65625, + 442094.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.00120502186473459, + 8.017538988269735e-08, + 2.5245032730936146e-08, + 1.1776578823230466e-08, + 5.894425836316941e-09 + ], + "acc_eval": 0.1044921875, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 2.8702030181884766, + 2139.65234375, + 95514.8359375, + 324949.6875, + 462647.84375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014194594696164131, + 5.5903008444602165e-08, + 2.0797312316744865e-08, + 9.60299928465247e-09, + 4.690376087523873e-09 + ], + "acc_eval": 0.1103515625, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 2.7991764545440674, + 15302.53125, + 190705.796875, + 494117.90625, + 543885.625 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047307764180004597, + 2.4012980048837562e-08, + 1.1153974632804875e-08, + 5.289668258967595e-09, + 2.6598685476386663e-09 + ], + "acc_eval": 0.0888671875, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 2.8112618923187256, + 534165.625, + 9562196.0, + 11356111.0, + 11261478.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002835187187884003, + 1.1553467071934165e-09, + 5.117212764638168e-10, + 2.5636526235217616e-10, + 1.2813658467614175e-10 + ], + "acc_eval": 0.107421875, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 2.7986021041870117, + 1302347.875, + 12959677.0, + 15286166.0, + 15075608.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000172777334228158, + 7.537985791117308e-10, + 3.5877870119271904e-10, + 1.7971832355634376e-10, + 8.955045038838705e-11 + ], + "acc_eval": 0.126953125, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 2.756831169128418, + 422432.40625, + 12218335.0, + 15267431.0, + 14942667.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015324499690905213, + 1.1144170031229805e-09, + 3.578760898736988e-10, + 1.796912063589673e-10, + 8.906290982491072e-11 + ], + "acc_eval": 0.166015625, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 2.713092088699341, + 441085.75, + 13975295.0, + 17594034.0, + 17150196.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001009844709187746, + 9.29383403569517e-10, + 2.9464700124215426e-10, + 1.481769429378943e-10, + 7.335923535300992e-11 + ], + "acc_eval": 0.1826171875, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 2.677187204360962, + 329657.125, + 11149057.0, + 16110063.0, + 15466966.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021013693185523152, + 1.6009201742051005e-09, + 3.1313171500180204e-10, + 1.5797228802849617e-10, + 7.763964471330098e-11 + ], + "acc_eval": 0.1796875, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 2.6366331577301025, + 5142.62060546875, + 367599.71875, + 988076.75, + 1002302.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00011194300896022469, + 9.242073772952608e-09, + 4.35089919648135e-09, + 2.032314094790877e-09, + 1.016630779560046e-09 + ], + "acc_eval": 0.181640625, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 2.599846601486206, + 5072.9931640625, + 354873.9375, + 1104508.0, + 1055959.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014896050561219454, + 1.0939302796941774e-08, + 4.676385056967547e-09, + 2.02762540091328e-09, + 1.0192051647095468e-09 + ], + "acc_eval": 0.1806640625, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 2.598066568374634, + 116168.1875, + 10078028.0, + 18893916.0, + 17647230.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001877687027445063, + 2.095827511539028e-09, + 2.405041166220201e-10, + 1.2486357781060775e-10, + 6.205166935835393e-11 + ], + "acc_eval": 0.1962890625, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 2.6015524864196777, + 740986.875, + 24883748.0, + 31021810.0, + 30329238.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018684851238504052, + 3.8257660928131543e-10, + 1.594476078947693e-10, + 8.13158151924398e-11, + 4.050663623966777e-11 + ], + "acc_eval": 0.1845703125, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 2.589724063873291, + 2141793.5, + 28624410.0, + 34863924.0, + 34267120.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002886186121031642, + 3.2890931644935506e-10, + 1.5246036377813965e-10, + 7.833261816969639e-11, + 3.898681030789497e-11 + ], + "acc_eval": 0.1748046875, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 2.5866215229034424, + 2836275.25, + 30209988.0, + 36742252.0, + 36121420.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004315464466344565, + 3.6725425478500995e-10, + 1.698625962109901e-10, + 8.663138262310355e-11, + 4.2701918390175564e-11 + ], + "acc_eval": 0.1787109375, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 2.581477642059326, + 3276328.25, + 31851982.0, + 38643076.0, + 37988372.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006185675738379359, + 3.898423250880967e-10, + 1.803390908827751e-10, + 9.224612046443426e-11, + 4.599535682880962e-11 + ], + "acc_eval": 0.181640625, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 2.6230173110961914, + 3459700.75, + 33572172.0, + 40661440.0, + 39924348.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009694760083220899, + 3.8904643395731853e-10, + 1.8190765560532896e-10, + 9.24886070508002e-11, + 4.616174456573141e-11 + ], + "acc_eval": 0.189453125, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 2.9775710105895996, + 10399.8671875, + 571599.6875, + 1836598.625, + 1908883.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016216874064411968, + 7.749568453618849e-08, + 8.983486843305855e-09, + 2.0125863198217075e-09, + 1.0150218443527592e-09 + ], + "acc_eval": 0.0986328125, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 3.015839099884033, + 12101.009765625, + 561385.0625, + 1955154.125, + 1975725.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012338445230852813, + 6.92784638545163e-08, + 9.938768030792744e-09, + 1.8663843803778946e-09, + 9.43250033635934e-10 + ], + "acc_eval": 0.103515625, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 3.002318859100342, + 13969.6484375, + 549761.875, + 2067254.5, + 2046448.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.00011628194624790922, + 5.204710973316651e-08, + 8.372143867063642e-09, + 1.751683464945586e-09, + 8.823823893777671e-10 + ], + "acc_eval": 0.1025390625, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 3.033550262451172, + 16014.7802734375, + 542334.375, + 2185907.75, + 2132718.0 + ], + "bp_grad_per_sample_l2_med": [ + 7.604974234709516e-05, + 4.623546701054693e-08, + 9.098562792075882e-09, + 1.7713268629648837e-09, + 8.977130705467573e-10 + ], + "acc_eval": 0.1025390625, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 2.9693667888641357, + 17655.8203125, + 542724.0, + 2311982.5, + 2234848.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001330485101789236, + 3.560405303915104e-08, + 7.560966963637838e-09, + 1.5777356088264582e-09, + 7.958586012435376e-10 + ], + "acc_eval": 0.0966796875, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 2.9733641147613525, + 18918.01171875, + 540951.6875, + 2434576.5, + 2336018.25 + ], + "bp_grad_per_sample_l2_med": [ + 9.626700193621218e-05, + 3.403155446335404e-08, + 8.177446275681177e-09, + 1.5839350941959651e-09, + 8.022257858009141e-10 + ], + "acc_eval": 0.1201171875, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 3.0027060508728027, + 20108.37890625, + 544636.5, + 2550452.75, + 2438166.75 + ], + "bp_grad_per_sample_l2_med": [ + 7.119941437849775e-05, + 3.794270853063608e-08, + 9.455917826528548e-09, + 1.7259683682269156e-09, + 8.75004957379133e-10 + ], + "acc_eval": 0.1083984375, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 2.9846291542053223, + 21615.2578125, + 547112.625, + 2664214.25, + 2538743.25 + ], + "bp_grad_per_sample_l2_med": [ + 9.802342538023368e-05, + 3.710788476496418e-08, + 9.733276407075664e-09, + 1.7067438573548088e-09, + 8.65347682399431e-10 + ], + "acc_eval": 0.1083984375, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 3.009104013442993, + 22886.44921875, + 554807.0625, + 2772577.5, + 2636159.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001160762258223258, + 3.776746737571557e-08, + 9.48633260833276e-09, + 1.7762409321164796e-09, + 8.999931910835812e-10 + ], + "acc_eval": 0.107421875, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 3.0807487964630127, + 24102.28515625, + 560303.4375, + 2871532.75, + 2723516.0 + ], + "bp_grad_per_sample_l2_med": [ + 6.469501386163756e-05, + 4.052726865211298e-08, + 6.607923985768593e-09, + 1.986373288076493e-09, + 1.005414418386863e-09 + ], + "acc_eval": 0.111328125, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 3.0981693267822266, + 25397.25390625, + 569329.25, + 2967934.75, + 2808716.5 + ], + "bp_grad_per_sample_l2_med": [ + 8.018066000659019e-05, + 3.965687156437525e-08, + 8.188467681691236e-09, + 1.9840931120285177e-09, + 1.0038238018594825e-09 + ], + "acc_eval": 0.1064453125, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 3.1128475666046143, + 26593.50390625, + 578056.75, + 3059475.5, + 2888212.0 + ], + "bp_grad_per_sample_l2_med": [ + 8.603822061559185e-05, + 3.689373073711977e-08, + 6.842784561200688e-09, + 1.961748541390307e-09, + 9.92456117288043e-10 + ], + "acc_eval": 0.1064453125, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 3.126692771911621, + 27752.5, + 586243.125, + 3147350.0, + 2962444.5 + ], + "bp_grad_per_sample_l2_med": [ + 7.914086017990485e-05, + 3.278608318169063e-08, + 4.82215689601162e-09, + 1.8859560579898016e-09, + 9.505569664725044e-10 + ], + "acc_eval": 0.107421875, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 3.1628687381744385, + 28661.537109375, + 592898.875, + 3223267.75, + 3025087.0 + ], + "bp_grad_per_sample_l2_med": [ + 7.642550917807966e-05, + 3.200472065145732e-08, + 5.030188265919833e-09, + 1.7837261667708049e-09, + 9.011961177307626e-10 + ], + "acc_eval": 0.111328125, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 3.1804893016815186, + 29497.119140625, + 601081.125, + 3294916.75, + 3083660.25 + ], + "bp_grad_per_sample_l2_med": [ + 8.01319838501513e-05, + 3.0802997486034656e-08, + 4.8026316257221424e-09, + 1.7661813123126535e-09, + 8.969202602848725e-10 + ], + "acc_eval": 0.111328125, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 3.201361894607544, + 30248.82421875, + 612577.625, + 3357942.0, + 3135999.25 + ], + "bp_grad_per_sample_l2_med": [ + 8.080735278781503e-05, + 3.106945101194469e-08, + 4.879642911959081e-09, + 1.7795440676593444e-09, + 9.0354357329403e-10 + ], + "acc_eval": 0.1103515625, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 3.2230916023254395, + 31060.8359375, + 621329.6875, + 3412872.75, + 3180218.0 + ], + "bp_grad_per_sample_l2_med": [ + 7.493209704989567e-05, + 3.203697929166083e-08, + 5.23388132833702e-09, + 1.7845065425348139e-09, + 9.061755235073576e-10 + ], + "acc_eval": 0.111328125, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 3.2431774139404297, + 31627.490234375, + 631077.4375, + 3459407.75, + 3218656.25 + ], + "bp_grad_per_sample_l2_med": [ + 6.88562577124685e-05, + 3.010745786014013e-08, + 4.799196151594742e-09, + 1.7849065558905863e-09, + 9.058673811068729e-10 + ], + "acc_eval": 0.111328125, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 3.250222682952881, + 32081.44921875, + 639738.5, + 3499162.5, + 3250836.0 + ], + "bp_grad_per_sample_l2_med": [ + 6.744447455275804e-05, + 2.8871626867044142e-08, + 4.598368352759508e-09, + 1.781051417459878e-09, + 9.045134086171913e-10 + ], + "acc_eval": 0.11328125, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 3.258018970489502, + 32488.755859375, + 647751.75, + 3532386.25, + 3277588.75 + ], + "bp_grad_per_sample_l2_med": [ + 7.57749512558803e-05, + 3.006854853992991e-08, + 4.75430272928179e-09, + 1.7687115105857742e-09, + 8.985628907609566e-10 + ], + "acc_eval": 0.1162109375, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 3.268540143966675, + 32846.26171875, + 653093.8125, + 3557156.75, + 3297180.25 + ], + "bp_grad_per_sample_l2_med": [ + 6.825588206993416e-05, + 3.074128329672021e-08, + 4.992171565021408e-09, + 1.775832703110325e-09, + 9.020287849992314e-10 + ], + "acc_eval": 0.1162109375, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 3.277456760406494, + 33144.296875, + 656811.625, + 3575374.5, + 3311610.25 + ], + "bp_grad_per_sample_l2_med": [ + 6.744571874151006e-05, + 3.093562384037796e-08, + 5.061019603402883e-09, + 1.7779399064110635e-09, + 9.031043690654883e-10 + ], + "acc_eval": 0.1181640625, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 3.2813076972961426, + 33291.59765625, + 660069.8125, + 3588556.5, + 3322374.0 + ], + "bp_grad_per_sample_l2_med": [ + 6.797127571189776e-05, + 3.067998122219251e-08, + 4.995078572989087e-09, + 1.7760940496103217e-09, + 9.021596802938348e-10 + ], + "acc_eval": 0.1162109375, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 3.283642292022705, + 33408.87109375, + 662075.8125, + 3597291.5, + 3329052.75 + ], + "bp_grad_per_sample_l2_med": [ + 6.738945376127958e-05, + 3.091497902119045e-08, + 5.170774475260487e-09, + 1.7745169778038417e-09, + 9.013288448933565e-10 + ], + "acc_eval": 0.1162109375, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 3.285024404525757, + 33476.29296875, + 663102.5, + 3601966.75, + 3333036.25 + ], + "bp_grad_per_sample_l2_med": [ + 6.544289499288425e-05, + 3.0026765074353534e-08, + 4.907802608755674e-09, + 1.7734476109865227e-09, + 9.008140344768378e-10 + ], + "acc_eval": 0.1181640625, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 3.285569667816162, + 33510.2890625, + 663440.8125, + 3604244.75, + 3334545.25 + ], + "bp_grad_per_sample_l2_med": [ + 6.654243770753965e-05, + 3.0157259800489555e-08, + 4.895804206483945e-09, + 1.773489466394551e-09, + 9.008297996437875e-10 + ], + "acc_eval": 0.1171875, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 3.2856643199920654, + 33519.1015625, + 663484.0, + 3604572.0, + 3334760.75 + ], + "bp_grad_per_sample_l2_med": [ + 6.647893314948305e-05, + 3.0106672710417115e-08, + 4.919553653337516e-09, + 1.7735447555011774e-09, + 9.008529477938509e-10 + ], + "acc_eval": 0.1171875, + "epoch": 60 + } + ], + "arch": "vit", + "seed": 42 +} \ No newline at end of file diff --git a/results/snapshot_vit_v1/snapshot_vit_s123.json b/results/snapshot_vit_v1/snapshot_vit_s123.json new file mode 100644 index 0000000..93853cf --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_vit_s123.json @@ -0,0 +1,4594 @@ +{ + "config": { + "output_dir": "results/snapshot_vit_v1", + "epochs": 60, + "lr": 0.001, + "wd": 0.05, + "seed": 123, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.3210873007774353, + 3.3568029403686523, + 4.891699314117432, + 6.200707912445068, + 7.5911865234375 + ], + "hidden_norms_avg": [ + 5.7549052238464355, + 6.750590801239014, + 7.9020819664001465, + 8.925304412841797, + 10.076716423034668 + ], + "bp_grad_per_sample_l2_med": [ + 0.004074312746524811, + 0.0011155740357935429, + 0.0009667170234024525, + 0.0008621186716482043, + 0.0008127145702019334 + ], + "bp_grad_F": [ + 0.20160320401191711, + 0.039521340280771255, + 0.033098917454481125, + 0.029271923005580902, + 0.027136052027344704 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.125, + "loss_eval": 2.422111988067627, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.4782717227935791, + 11.874238014221191, + 20.313709259033203, + 26.86528778076172, + 32.42327880859375 + ], + "hidden_norms_avg": [ + 3.8830745220184326, + 11.266603469848633, + 17.881502151489258, + 23.234352111816406, + 28.51181411743164 + ], + "bp_grad_per_sample_l2_med": [ + 0.002827065996825695, + 0.00024586476502008736, + 0.00014567613834515214, + 0.00013882767234463245, + 0.0001400413311785087 + ], + "bp_grad_F": [ + 0.12621107697486877, + 0.009982436895370483, + 0.00507162231951952, + 0.004677945747971535, + 0.004658848978579044 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4697265625, + "loss_eval": 1.4472862482070923, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.6104467511177063, + 13.787332534790039, + 22.073436737060547, + 28.480369567871094, + 33.141117095947266 + ], + "hidden_norms_avg": [ + 3.951775074005127, + 12.005932807922363, + 18.336896896362305, + 23.67597198486328, + 27.899608612060547 + ], + "bp_grad_per_sample_l2_med": [ + 0.002604336943477392, + 0.00026667251950129867, + 0.00014805165119469166, + 0.00013079405471216887, + 0.00012911780504509807 + ], + "bp_grad_F": [ + 0.12487494200468063, + 0.010650832206010818, + 0.005604646634310484, + 0.004644650500267744, + 0.00448915408924222 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5146484375, + "loss_eval": 1.291869878768921, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.7104504108428955, + 13.74225902557373, + 21.90972328186035, + 28.958967208862305, + 33.262393951416016 + ], + "hidden_norms_avg": [ + 3.9180142879486084, + 13.097892761230469, + 19.570770263671875, + 24.899248123168945, + 28.65104866027832 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020766372326761484, + 0.00025831969105638564, + 0.00014769421250093728, + 0.00012920337030664086, + 0.00012324318231549114 + ], + "bp_grad_F": [ + 0.09676238149404526, + 0.010603155009448528, + 0.005832126829773188, + 0.00465927692130208, + 0.004435759503394365 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.529296875, + "loss_eval": 1.2694497108459473, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.801612377166748, + 12.882991790771484, + 20.474157333374023, + 27.37413215637207, + 32.06389617919922 + ], + "hidden_norms_avg": [ + 3.8871910572052, + 13.333250999450684, + 19.042104721069336, + 24.029348373413086, + 27.96086311340332 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020045258570462465, + 0.000285606540273875, + 0.00016217664233408868, + 0.00013080642384011298, + 0.00011968115722993389 + ], + "bp_grad_F": [ + 0.09496191889047623, + 0.011928788386285305, + 0.006509022321552038, + 0.005044482182711363, + 0.004537967965006828 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58203125, + "loss_eval": 1.119094967842102, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.8653663396835327, + 12.994612693786621, + 20.49618148803711, + 26.709278106689453, + 30.303852081298828 + ], + "hidden_norms_avg": [ + 4.018242835998535, + 13.520885467529297, + 19.090721130371094, + 23.6751651763916, + 26.93212890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018953323597088456, + 0.000296358106425032, + 0.00017310198745690286, + 0.0001364975469186902, + 0.00012098452862119302 + ], + "bp_grad_F": [ + 0.09499228745698929, + 0.012825642712414265, + 0.007407570723444223, + 0.005570532754063606, + 0.004951393231749535 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.0847156047821045, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.9313029646873474, + 13.966381072998047, + 21.648372650146484, + 28.33364486694336, + 32.91484069824219 + ], + "hidden_norms_avg": [ + 4.053382396697998, + 15.042261123657227, + 20.74883270263672, + 25.032489776611328, + 28.55679702758789 + ], + "bp_grad_per_sample_l2_med": [ + 0.001841629622504115, + 0.0002753600711002946, + 0.0001624371943762526, + 0.0001305017649428919, + 0.00011278261081315577 + ], + "bp_grad_F": [ + 0.09068351984024048, + 0.0128449946641922, + 0.007257991470396519, + 0.005361978895962238, + 0.004660472739487886 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6103515625, + "loss_eval": 1.095273494720459, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 0.9818395972251892, + 13.022477149963379, + 20.385391235351562, + 27.03214454650879, + 31.324769973754883 + ], + "hidden_norms_avg": [ + 4.1024041175842285, + 14.697205543518066, + 19.634239196777344, + 23.90021324157715, + 27.306678771972656 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015902157174423337, + 0.00027956697158515453, + 0.0001692597143119201, + 0.0001353132538497448, + 0.00011523282591952011 + ], + "bp_grad_F": [ + 0.07967441529035568, + 0.012528380379080772, + 0.007520876359194517, + 0.00570708978921175, + 0.004875381011515856 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62890625, + "loss_eval": 1.0069011449813843, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 1.0194361209869385, + 13.912450790405273, + 20.85824203491211, + 27.968477249145508, + 32.243431091308594 + ], + "hidden_norms_avg": [ + 4.178755283355713, + 14.875143051147461, + 20.261545181274414, + 24.636741638183594, + 27.893512725830078 + ], + "bp_grad_per_sample_l2_med": [ + 0.001506888889707625, + 0.00028421770548447967, + 0.0001727779454085976, + 0.00013076694449409842, + 0.00010860477777896449 + ], + "bp_grad_F": [ + 0.07398127764463425, + 0.013124965131282806, + 0.007798053789883852, + 0.005717460531741381, + 0.004830002784729004 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 0.9834396839141846, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 1.077261209487915, + 12.524529457092285, + 19.766538619995117, + 25.7626895904541, + 30.03727149963379 + ], + "hidden_norms_avg": [ + 4.1816864013671875, + 14.304539680480957, + 19.208524703979492, + 23.25862693786621, + 26.313356399536133 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014360174536705017, + 0.0003003668098244816, + 0.0001815372525015846, + 0.0001390709658153355, + 0.00011320491466904059 + ], + "bp_grad_F": [ + 0.0756259635090828, + 0.014865156263113022, + 0.008982912637293339, + 0.006551471073180437, + 0.005398898851126432 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6494140625, + "loss_eval": 0.971701979637146, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 1.1200045347213745, + 12.160452842712402, + 19.172168731689453, + 25.067665100097656, + 28.764787673950195 + ], + "hidden_norms_avg": [ + 4.289422035217285, + 15.51036262512207, + 20.407268524169922, + 24.061931610107422, + 26.493688583374023 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012870824430137873, + 0.00027074789977632463, + 0.0001742457679938525, + 0.0001348328951280564, + 0.000104573555290699 + ], + "bp_grad_F": [ + 0.07437644153833389, + 0.015084434300661087, + 0.009522279724478722, + 0.0069595095701515675, + 0.0055610560812056065 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6767578125, + "loss_eval": 0.8734689354896545, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 1.1509246826171875, + 12.219743728637695, + 19.352998733520508, + 25.70184326171875, + 29.580278396606445 + ], + "hidden_norms_avg": [ + 4.315939426422119, + 15.6610689163208, + 20.42215347290039, + 24.016841888427734, + 26.62118911743164 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013146374840289354, + 0.0002733681467361748, + 0.0001865291123976931, + 0.00013389455853030086, + 0.00010298956476617604 + ], + "bp_grad_F": [ + 0.07836466282606125, + 0.015104672871530056, + 0.009902945719659328, + 0.0069915857166051865, + 0.005596037954092026 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6767578125, + "loss_eval": 0.917751669883728, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 1.2017452716827393, + 12.72107219696045, + 18.952699661254883, + 25.067615509033203, + 29.466550827026367 + ], + "hidden_norms_avg": [ + 4.358119487762451, + 15.672205924987793, + 20.140914916992188, + 24.013885498046875, + 26.668514251708984 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011630960507318377, + 0.00025659528910182416, + 0.0001693729282123968, + 0.0001237613905686885, + 9.384296572534367e-05 + ], + "bp_grad_F": [ + 0.07334695011377335, + 0.015075902454555035, + 0.009827414527535439, + 0.007068648934364319, + 0.005549146793782711 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6982421875, + "loss_eval": 0.8279671669006348, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 1.234994649887085, + 12.283885955810547, + 18.62163543701172, + 24.3900203704834, + 28.36040496826172 + ], + "hidden_norms_avg": [ + 4.369320869445801, + 15.747625350952148, + 19.76953887939453, + 23.351999282836914, + 25.69841194152832 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011812442680820823, + 0.0002851892786566168, + 0.0001940266229212284, + 0.00013827465591020882, + 0.00010182376718148589 + ], + "bp_grad_F": [ + 0.07158326357603073, + 0.01604902744293213, + 0.010893523693084717, + 0.007844515144824982, + 0.005985426716506481 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.689453125, + "loss_eval": 0.8679210543632507, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 1.2675292491912842, + 11.706314086914062, + 18.347841262817383, + 24.01951789855957, + 28.1114501953125 + ], + "hidden_norms_avg": [ + 4.390969753265381, + 15.140497207641602, + 19.62596893310547, + 23.22857666015625, + 25.681791305541992 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010449079563841224, + 0.0002611770760267973, + 0.00017687672516331077, + 0.00012088462244719267, + 8.996625547297299e-05 + ], + "bp_grad_F": [ + 0.06979352980852127, + 0.016320781782269478, + 0.01088168565183878, + 0.007916715927422047, + 0.006064872723072767 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6884765625, + "loss_eval": 0.8092349767684937, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 1.2957582473754883, + 11.933137893676758, + 18.238237380981445, + 23.88395118713379, + 27.868513107299805 + ], + "hidden_norms_avg": [ + 4.4383697509765625, + 15.46267318725586, + 19.841346740722656, + 23.529712677001953, + 25.852684020996094 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009947444777935743, + 0.00024384066637139767, + 0.00016608397709205747, + 0.0001234996016137302, + 9.023427992360666e-05 + ], + "bp_grad_F": [ + 0.07019422203302383, + 0.016806265339255333, + 0.011433122679591179, + 0.008135766722261906, + 0.006158903241157532 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.712890625, + "loss_eval": 0.7795700430870056, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 1.3391923904418945, + 11.329567909240723, + 17.184999465942383, + 22.353059768676758, + 26.889299392700195 + ], + "hidden_norms_avg": [ + 4.53090238571167, + 15.341407775878906, + 19.109649658203125, + 22.223899841308594, + 24.45347023010254 + ], + "bp_grad_per_sample_l2_med": [ + 0.001086357282474637, + 0.00030167572549544275, + 0.0002114812668878585, + 0.00015480270667467266, + 0.00010993685282301158 + ], + "bp_grad_F": [ + 0.06569939106702805, + 0.017201317474246025, + 0.012068319134414196, + 0.008909368887543678, + 0.006427914369851351 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7314453125, + "loss_eval": 0.7724976539611816, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 1.3643215894699097, + 10.724340438842773, + 16.144981384277344, + 21.656490325927734, + 25.777481079101562 + ], + "hidden_norms_avg": [ + 4.520992279052734, + 15.036820411682129, + 18.98927879333496, + 22.688859939575195, + 24.71843910217285 + ], + "bp_grad_per_sample_l2_med": [ + 0.000967099389526993, + 0.0002715744194574654, + 0.00019328886992298067, + 0.00013628297892864794, + 9.314809722127393e-05 + ], + "bp_grad_F": [ + 0.06768078356981277, + 0.01841692440211773, + 0.012980606406927109, + 0.009295133873820305, + 0.006698420271277428 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.73828125, + "loss_eval": 0.7337102890014648, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 1.3963993787765503, + 11.463358879089355, + 16.49429702758789, + 21.585325241088867, + 25.636695861816406 + ], + "hidden_norms_avg": [ + 4.539251327514648, + 14.975208282470703, + 18.360631942749023, + 21.586400985717773, + 23.561830520629883 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008780099451541901, + 0.00024953793035820127, + 0.00017615300021134317, + 0.00012566034274641424, + 8.528940088581294e-05 + ], + "bp_grad_F": [ + 0.07198558002710342, + 0.019673649221658707, + 0.013869633898139, + 0.009656366892158985, + 0.006824122741818428 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7451171875, + "loss_eval": 0.7211208343505859, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 1.421103835105896, + 9.9105806350708, + 15.361790657043457, + 20.334768295288086, + 24.506919860839844 + ], + "hidden_norms_avg": [ + 4.622361660003662, + 14.7937650680542, + 18.042116165161133, + 21.208105087280273, + 23.21940040588379 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007793674594722688, + 0.0002331113355467096, + 0.00016331924416590482, + 0.00011330798588460311, + 7.215427467599511e-05 + ], + "bp_grad_F": [ + 0.07613872736692429, + 0.022306306287646294, + 0.015858706086874008, + 0.011275039985775948, + 0.007263499312102795 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7392578125, + "loss_eval": 0.7346716523170471, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 1.4554439783096313, + 10.118419647216797, + 15.106456756591797, + 20.052860260009766, + 24.34604263305664 + ], + "hidden_norms_avg": [ + 4.584441661834717, + 14.634279251098633, + 17.785133361816406, + 21.110010147094727, + 22.89650535583496 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007524031680077314, + 0.0002260785986436531, + 0.00016854463319759816, + 0.00011997718684142455, + 7.738151180092245e-05 + ], + "bp_grad_F": [ + 0.07370379567146301, + 0.021284889429807663, + 0.015382407233119011, + 0.010745048522949219, + 0.007394883316010237 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.74609375, + "loss_eval": 0.7024286389350891, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 1.4652466773986816, + 10.145299911499023, + 15.15330982208252, + 20.131061553955078, + 23.987186431884766 + ], + "hidden_norms_avg": [ + 4.602361679077148, + 14.532269477844238, + 17.825733184814453, + 21.43619728088379, + 23.12371253967285 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008222013129852712, + 0.0002455596113577485, + 0.00017989490879699588, + 0.00012026322656311095, + 8.26524556032382e-05 + ], + "bp_grad_F": [ + 0.0741497054696083, + 0.020758304744958878, + 0.01482379250228405, + 0.010753357782959938, + 0.007582026533782482 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7412109375, + "loss_eval": 0.7016957402229309, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 1.480756402015686, + 10.028592109680176, + 14.573174476623535, + 19.24639320373535, + 23.3629150390625 + ], + "hidden_norms_avg": [ + 4.621757984161377, + 14.29589557647705, + 17.4040470123291, + 20.71320343017578, + 22.405963897705078 + ], + "bp_grad_per_sample_l2_med": [ + 0.000667835003696382, + 0.00020642780873458833, + 0.0001538341457489878, + 0.00010652844503056258, + 6.964046770008281e-05 + ], + "bp_grad_F": [ + 0.07375485450029373, + 0.021967202425003052, + 0.016106218099594116, + 0.011507184244692326, + 0.007651185616850853 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7607421875, + "loss_eval": 0.6544591188430786, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 1.5069013833999634, + 9.897040367126465, + 14.096169471740723, + 18.488874435424805, + 22.214311599731445 + ], + "hidden_norms_avg": [ + 4.621402263641357, + 13.978808403015137, + 16.55535888671875, + 19.729736328125, + 21.272388458251953 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007426440715789795, + 0.0002414636837784201, + 0.00018161055049858987, + 0.00012697202328126878, + 8.096778037725016e-05 + ], + "bp_grad_F": [ + 0.07682260870933533, + 0.02333010919392109, + 0.017287475988268852, + 0.012499523349106312, + 0.008510846644639969 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7568359375, + "loss_eval": 0.6971542835235596, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 1.5169755220413208, + 9.5064058303833, + 13.812594413757324, + 17.95937156677246, + 21.51923370361328 + ], + "hidden_norms_avg": [ + 4.612667083740234, + 13.86723804473877, + 16.418981552124023, + 19.12198257446289, + 20.565521240234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007257908000610769, + 0.00024720808141864836, + 0.0001871327986009419, + 0.00013439780741464347, + 8.671147952554747e-05 + ], + "bp_grad_F": [ + 0.07474599778652191, + 0.024257108569145203, + 0.01782340556383133, + 0.01281843613833189, + 0.008487668819725513 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.763671875, + "loss_eval": 0.6618016958236694, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 1.5133440494537354, + 9.023777961730957, + 13.088467597961426, + 17.324251174926758, + 21.083759307861328 + ], + "hidden_norms_avg": [ + 4.670994281768799, + 13.658943176269531, + 16.629199981689453, + 19.75893783569336, + 21.12710952758789 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005614451365545392, + 0.0001914121676236391, + 0.00014186649059411138, + 0.00010088241106132045, + 6.150588887976483e-05 + ], + "bp_grad_F": [ + 0.08172759413719177, + 0.027048049494624138, + 0.019993988797068596, + 0.014050732366740704, + 0.009047404862940311 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7626953125, + "loss_eval": 0.6708824634552002, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 1.5329865217208862, + 8.596381187438965, + 12.645307540893555, + 16.668807983398438, + 20.51462745666504 + ], + "hidden_norms_avg": [ + 4.642580986022949, + 13.140735626220703, + 15.32632064819336, + 17.985010147094727, + 19.472858428955078 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005455430946312845, + 0.00019156686903443187, + 0.00014253854169510305, + 0.00010098751954501495, + 6.338314415188506e-05 + ], + "bp_grad_F": [ + 0.08767001330852509, + 0.029545463621616364, + 0.021587952971458435, + 0.014973495155572891, + 0.009515349753201008 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.767578125, + "loss_eval": 0.6813780069351196, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 1.554770588874817, + 8.98424243927002, + 12.76674747467041, + 16.438858032226562, + 19.893146514892578 + ], + "hidden_norms_avg": [ + 4.635522365570068, + 13.039203643798828, + 15.419903755187988, + 18.176319122314453, + 19.39232635498047 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005697832675650716, + 0.0001985357521334663, + 0.0001536469644634053, + 0.00010455933079356328, + 6.821998249506578e-05 + ], + "bp_grad_F": [ + 0.07977671921253204, + 0.02706393413245678, + 0.020037846639752388, + 0.014591805636882782, + 0.009512925520539284 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.628034770488739, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 1.5515426397323608, + 8.19682788848877, + 11.861184120178223, + 15.59919548034668, + 18.893400192260742 + ], + "hidden_norms_avg": [ + 4.5841450691223145, + 12.511472702026367, + 14.583609580993652, + 16.949586868286133, + 18.082292556762695 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005373116582632065, + 0.0001997901708818972, + 0.0001489907590439543, + 0.00010373342229286209, + 6.318451050901785e-05 + ], + "bp_grad_F": [ + 0.09340352565050125, + 0.03397079557180405, + 0.025108041241765022, + 0.017669958993792534, + 0.010975479148328304 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.767578125, + "loss_eval": 0.7042175531387329, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 1.5542187690734863, + 8.489326477050781, + 11.786734580993652, + 15.331045150756836, + 18.48196792602539 + ], + "hidden_norms_avg": [ + 4.615735054016113, + 12.620647430419922, + 14.822388648986816, + 17.454334259033203, + 18.677461624145508 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005812083836644888, + 0.00021461205324158072, + 0.00015997944865375757, + 0.00011693408305291086, + 7.380295573966578e-05 + ], + "bp_grad_F": [ + 0.09380948543548584, + 0.03345760330557823, + 0.025129586458206177, + 0.01789030432701111, + 0.011130682192742825 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7666015625, + "loss_eval": 0.6850110292434692, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 1.5533884763717651, + 8.01724910736084, + 11.423017501831055, + 15.046612739562988, + 18.549089431762695 + ], + "hidden_norms_avg": [ + 4.590519428253174, + 12.431540489196777, + 14.243208885192871, + 16.609176635742188, + 18.00058937072754 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004959268844686449, + 0.00020078590023331344, + 0.00015426705067511648, + 0.00010096926416736096, + 5.95865749346558e-05 + ], + "bp_grad_F": [ + 0.09663982689380646, + 0.036162860691547394, + 0.02716146595776081, + 0.01926880143582821, + 0.011334826238453388 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.6707749366760254, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 1.5530469417572021, + 7.959159851074219, + 11.2805757522583, + 14.567391395568848, + 17.63263511657715 + ], + "hidden_norms_avg": [ + 4.583434581756592, + 11.983453750610352, + 13.4386625289917, + 15.498583793640137, + 16.631824493408203 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005142099689692259, + 0.00020230942755006254, + 0.00015552931290585548, + 0.00011007695866283029, + 6.233472959138453e-05 + ], + "bp_grad_F": [ + 0.09787525236606598, + 0.037690743803977966, + 0.028980012983083725, + 0.02064511366188526, + 0.012224731035530567 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.6748013496398926, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 1.5515272617340088, + 7.847743988037109, + 10.868992805480957, + 14.282126426696777, + 17.300424575805664 + ], + "hidden_norms_avg": [ + 4.579150199890137, + 11.951078414916992, + 13.621748924255371, + 15.971713066101074, + 17.04889488220215 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004585929855238646, + 0.00017806614050641656, + 0.0001380510366288945, + 9.63187703746371e-05, + 5.829996371176094e-05 + ], + "bp_grad_F": [ + 0.10181005299091339, + 0.038575656712055206, + 0.02964734099805355, + 0.020979750901460648, + 0.01240287534892559 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78125, + "loss_eval": 0.648021936416626, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 1.5606788396835327, + 7.502675533294678, + 10.430459022521973, + 13.642136573791504, + 16.445953369140625 + ], + "hidden_norms_avg": [ + 4.601283550262451, + 11.615697860717773, + 13.472222328186035, + 15.831238746643066, + 16.856765747070312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004074577009305358, + 0.00017814920283854008, + 0.00013730341743212193, + 9.565176151227206e-05, + 5.229458474786952e-05 + ], + "bp_grad_F": [ + 0.11506060510873795, + 0.04695325344800949, + 0.03571247681975365, + 0.025198202580213547, + 0.013851121068000793 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.755859375, + "loss_eval": 0.7299192547798157, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 1.5404834747314453, + 7.528626441955566, + 10.384718894958496, + 13.326257705688477, + 16.41958999633789 + ], + "hidden_norms_avg": [ + 4.533090591430664, + 11.6575345993042, + 13.231060028076172, + 15.337231636047363, + 16.463298797607422 + ], + "bp_grad_per_sample_l2_med": [ + 0.00042279696208424866, + 0.00016955600585788488, + 0.00012915951083414257, + 8.976108074421063e-05, + 4.930083014187403e-05 + ], + "bp_grad_F": [ + 0.11639728397130966, + 0.047109171748161316, + 0.03660130873322487, + 0.02588750049471855, + 0.013930009678006172 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.7065586447715759, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 1.539638638496399, + 7.26485013961792, + 9.96584701538086, + 13.003418922424316, + 16.14008140563965 + ], + "hidden_norms_avg": [ + 4.537028789520264, + 11.146146774291992, + 12.836923599243164, + 14.992585182189941, + 16.076574325561523 + ], + "bp_grad_per_sample_l2_med": [ + 0.00039646061486564577, + 0.00017108044994529337, + 0.00013601842510979623, + 9.225023677572608e-05, + 4.893271398032084e-05 + ], + "bp_grad_F": [ + 0.11648086458444595, + 0.04862738400697708, + 0.0374443456530571, + 0.026762915775179863, + 0.014388044364750385 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7939453125, + "loss_eval": 0.6772804260253906, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 1.5278778076171875, + 7.107171058654785, + 9.836174011230469, + 12.691095352172852, + 15.726043701171875 + ], + "hidden_norms_avg": [ + 4.5205254554748535, + 10.983088493347168, + 12.684239387512207, + 14.876561164855957, + 15.817031860351562 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003774319775402546, + 0.00015706375415902585, + 0.0001264828024432063, + 8.857168722897768e-05, + 4.440043630893342e-05 + ], + "bp_grad_F": [ + 0.12492093443870544, + 0.053397826850414276, + 0.040937285870313644, + 0.029012493789196014, + 0.015446576289832592 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7724609375, + "loss_eval": 0.707297146320343, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 1.51571524143219, + 7.153889179229736, + 9.856640815734863, + 12.511648178100586, + 15.47674560546875 + ], + "hidden_norms_avg": [ + 4.51829719543457, + 10.948126792907715, + 12.496319770812988, + 14.353506088256836, + 15.267280578613281 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003654273459687829, + 0.00015038737910799682, + 0.00011584001913433895, + 8.340556814800948e-05, + 4.3377422116464004e-05 + ], + "bp_grad_F": [ + 0.13914552330970764, + 0.0589178130030632, + 0.04522731155157089, + 0.0323280394077301, + 0.016300896182656288 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7626953125, + "loss_eval": 0.729290246963501, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 1.5081822872161865, + 6.952159404754639, + 9.558011054992676, + 12.107258796691895, + 15.05250358581543 + ], + "hidden_norms_avg": [ + 4.481203556060791, + 10.740157127380371, + 12.00869083404541, + 13.831336975097656, + 14.76778507232666 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003083393967244774, + 0.00012594371219165623, + 0.00010108885180670768, + 7.270355854416266e-05, + 3.639453643700108e-05 + ], + "bp_grad_F": [ + 0.14465992152690887, + 0.061646901071071625, + 0.047660429030656815, + 0.03381076827645302, + 0.01706051267683506 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7685546875, + "loss_eval": 0.7395438551902771, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 1.5159180164337158, + 6.878056526184082, + 9.382442474365234, + 11.969950675964355, + 15.129233360290527 + ], + "hidden_norms_avg": [ + 4.494526386260986, + 10.639691352844238, + 12.291059494018555, + 14.28632640838623, + 15.170000076293945 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028951463173143566, + 0.00012502263416536152, + 0.00010040518827736378, + 7.046512473607436e-05, + 3.719307642313652e-05 + ], + "bp_grad_F": [ + 0.1406005620956421, + 0.06109313294291496, + 0.047722309827804565, + 0.033977217972278595, + 0.01711316779255867 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7802734375, + "loss_eval": 0.7057114839553833, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 1.5058479309082031, + 6.699619770050049, + 9.136896133422852, + 11.609856605529785, + 14.701480865478516 + ], + "hidden_norms_avg": [ + 4.482093811035156, + 10.446189880371094, + 12.056195259094238, + 13.87569522857666, + 14.783234596252441 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002856751380022615, + 0.00013275284436531365, + 0.00010139105870621279, + 6.966136425035074e-05, + 3.293903864687309e-05 + ], + "bp_grad_F": [ + 0.1529398262500763, + 0.06890096515417099, + 0.052683208137750626, + 0.03734185919165611, + 0.01789216138422489 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.7478293180465698, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 1.490049123764038, + 6.627772331237793, + 9.019189834594727, + 11.385313987731934, + 14.173355102539062 + ], + "hidden_norms_avg": [ + 4.458098411560059, + 10.279450416564941, + 11.593936920166016, + 13.30923080444336, + 14.155406951904297 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021343027765396982, + 9.837630932452157e-05, + 8.006956340977922e-05, + 5.6768003560137004e-05, + 2.7385456633055583e-05 + ], + "bp_grad_F": [ + 0.15772707760334015, + 0.07120667397975922, + 0.05564703419804573, + 0.03953033685684204, + 0.018776116892695427 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7724609375, + "loss_eval": 0.7677009105682373, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 1.4904595613479614, + 6.347933769226074, + 8.674281120300293, + 11.007567405700684, + 14.106690406799316 + ], + "hidden_norms_avg": [ + 4.430132865905762, + 10.265702247619629, + 11.588266372680664, + 13.410375595092773, + 14.36179256439209 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002224426862085238, + 0.00010000570182455704, + 7.794459816068411e-05, + 5.595289985649288e-05, + 2.7256841349299066e-05 + ], + "bp_grad_F": [ + 0.16928334534168243, + 0.07747916132211685, + 0.06056727096438408, + 0.04274875670671463, + 0.019731448963284492 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.771484375, + "loss_eval": 0.7774850726127625, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 1.4839239120483398, + 6.341518878936768, + 8.600671768188477, + 10.991724014282227, + 14.061833381652832 + ], + "hidden_norms_avg": [ + 4.403061866760254, + 10.020040512084961, + 11.371668815612793, + 13.18271255493164, + 14.007345199584961 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002152575325453654, + 0.00010309015488019213, + 7.964189717313275e-05, + 5.283725113258697e-05, + 2.479495196894277e-05 + ], + "bp_grad_F": [ + 0.17190901935100555, + 0.080362468957901, + 0.06201368197798729, + 0.042563296854496, + 0.019763268530368805 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.7503129243850708, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 1.479953408241272, + 6.386821269989014, + 8.521474838256836, + 10.847907066345215, + 13.541037559509277 + ], + "hidden_norms_avg": [ + 4.399942874908447, + 9.979388236999512, + 11.251038551330566, + 12.998858451843262, + 13.76570987701416 + ], + "bp_grad_per_sample_l2_med": [ + 0.000195752116269432, + 9.365259029436857e-05, + 7.282401929842308e-05, + 5.209222945268266e-05, + 2.3047552531352267e-05 + ], + "bp_grad_F": [ + 0.16316288709640503, + 0.07674747705459595, + 0.06052006781101227, + 0.04277755320072174, + 0.020131859928369522 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7978515625, + "loss_eval": 0.732360303401947, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 1.4770045280456543, + 6.249807834625244, + 8.36440658569336, + 10.429434776306152, + 13.045490264892578 + ], + "hidden_norms_avg": [ + 4.391754627227783, + 9.821492195129395, + 10.789708137512207, + 12.3140869140625, + 13.067754745483398 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002329840644961223, + 0.00011798225023085251, + 9.261347440769896e-05, + 6.294570630416274e-05, + 2.9543562050093897e-05 + ], + "bp_grad_F": [ + 0.1812749058008194, + 0.08621949702501297, + 0.067754827439785, + 0.04831995815038681, + 0.021977350115776062 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.7784227132797241, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 1.467228651046753, + 6.0983357429504395, + 8.231528282165527, + 10.333056449890137, + 13.266757011413574 + ], + "hidden_norms_avg": [ + 4.390368461608887, + 9.647501945495605, + 10.692501068115234, + 12.274677276611328, + 13.044783592224121 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001511751615907997, + 7.784536137478426e-05, + 6.136627780506387e-05, + 4.35807196481619e-05, + 2.014869824051857e-05 + ], + "bp_grad_F": [ + 0.18805110454559326, + 0.09124159067869186, + 0.07224944978952408, + 0.050726212561130524, + 0.02254536561667919 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.814141571521759, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 1.4649879932403564, + 6.082813739776611, + 8.131811141967773, + 10.158056259155273, + 13.049956321716309 + ], + "hidden_norms_avg": [ + 4.377193927764893, + 9.599099159240723, + 10.660999298095703, + 12.21728801727295, + 12.965741157531738 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001712174853309989, + 8.400671504205093e-05, + 6.461612792918459e-05, + 4.6120971092022955e-05, + 2.0111323465243913e-05 + ], + "bp_grad_F": [ + 0.19550266861915588, + 0.09418290108442307, + 0.07462290674448013, + 0.053083814680576324, + 0.02292729914188385 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.7999259233474731, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 1.4617111682891846, + 6.058816432952881, + 8.100686073303223, + 10.085453987121582, + 12.920005798339844 + ], + "hidden_norms_avg": [ + 4.367196559906006, + 9.56169605255127, + 10.609153747558594, + 12.135587692260742, + 12.871316909790039 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015642307698726654, + 7.727487536612898e-05, + 5.90925665164832e-05, + 4.136386633035727e-05, + 1.6983105524559505e-05 + ], + "bp_grad_F": [ + 0.202835351228714, + 0.09727983921766281, + 0.07683655619621277, + 0.05471916124224663, + 0.02326873689889908 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.783203125, + "loss_eval": 0.8152254223823547, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 1.4593255519866943, + 6.017489433288574, + 7.96034049987793, + 9.983046531677246, + 12.839889526367188 + ], + "hidden_norms_avg": [ + 4.349035739898682, + 9.508291244506836, + 10.475739479064941, + 12.025425910949707, + 12.764323234558105 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013039771874900907, + 6.479993317043409e-05, + 5.060105831944384e-05, + 3.637294139480218e-05, + 1.4738084246346261e-05 + ], + "bp_grad_F": [ + 0.2170599102973938, + 0.10417382419109344, + 0.08229079097509384, + 0.05735529586672783, + 0.024290865287184715 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7841796875, + "loss_eval": 0.8357614278793335, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 1.4566220045089722, + 5.9422221183776855, + 7.888944149017334, + 9.933752059936523, + 12.817610740661621 + ], + "hidden_norms_avg": [ + 4.346043109893799, + 9.43443489074707, + 10.415618896484375, + 11.964469909667969, + 12.66396713256836 + ], + "bp_grad_per_sample_l2_med": [ + 0.00011193535465281457, + 5.694849824067205e-05, + 4.533635365078226e-05, + 3.3492226066300645e-05, + 1.4018894034961704e-05 + ], + "bp_grad_F": [ + 0.21774698793888092, + 0.1065358892083168, + 0.08431421220302582, + 0.05883141607046127, + 0.024615641683340073 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.8349668979644775, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 1.4569600820541382, + 5.859008312225342, + 7.792572498321533, + 9.738831520080566, + 12.622002601623535 + ], + "hidden_norms_avg": [ + 4.331563472747803, + 9.398598670959473, + 10.273933410644531, + 11.764141082763672, + 12.436033248901367 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012003595475107431, + 5.908689126954414e-05, + 4.746428385260515e-05, + 3.251975431339815e-05, + 1.3768915778200608e-05 + ], + "bp_grad_F": [ + 0.2144007831811905, + 0.10626016557216644, + 0.08404342085123062, + 0.05926896259188652, + 0.024889416992664337 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7861328125, + "loss_eval": 0.840790331363678, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 1.4559087753295898, + 5.8081440925598145, + 7.735576629638672, + 9.665096282958984, + 12.462581634521484 + ], + "hidden_norms_avg": [ + 4.331978797912598, + 9.35647964477539, + 10.206826210021973, + 11.663065910339355, + 12.307528495788574 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010101464431500062, + 5.143512680660933e-05, + 4.1592236811993644e-05, + 3.0060553399380296e-05, + 1.2701412742899265e-05 + ], + "bp_grad_F": [ + 0.22189198434352875, + 0.11008423566818237, + 0.08644267171621323, + 0.0603644996881485, + 0.025003522634506226 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8574135303497314, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 1.4537159204483032, + 5.80010461807251, + 7.719310760498047, + 9.681657791137695, + 12.724189758300781 + ], + "hidden_norms_avg": [ + 4.318180084228516, + 9.302933692932129, + 10.182857513427734, + 11.675416946411133, + 12.381869316101074 + ], + "bp_grad_per_sample_l2_med": [ + 9.399914415553212e-05, + 4.920759965898469e-05, + 3.82029902539216e-05, + 2.4410484911641106e-05, + 9.912354471453e-06 + ], + "bp_grad_F": [ + 0.2312120646238327, + 0.11490234732627869, + 0.09031722694635391, + 0.06280362606048584, + 0.02546737529337406 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8825892210006714, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 1.4533940553665161, + 5.765341758728027, + 7.664762496948242, + 9.541180610656738, + 12.46136474609375 + ], + "hidden_norms_avg": [ + 4.321633815765381, + 9.284127235412598, + 10.135884284973145, + 11.603636741638184, + 12.27259635925293 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010168847802560776, + 5.239037636783905e-05, + 4.169415478827432e-05, + 2.8813867174903862e-05, + 1.1632122550508939e-05 + ], + "bp_grad_F": [ + 0.23138603568077087, + 0.11581514030694962, + 0.09145721793174744, + 0.06368965655565262, + 0.025816213339567184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8627672791481018, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 1.4520151615142822, + 5.752710342407227, + 7.6372294425964355, + 9.493330001831055, + 12.49281120300293 + ], + "hidden_norms_avg": [ + 4.314420223236084, + 9.275971412658691, + 10.131872177124023, + 11.594268798828125, + 12.271230697631836 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010349372314522043, + 5.0890805141534656e-05, + 4.167861698078923e-05, + 2.9301188988029025e-05, + 1.1288396308373194e-05 + ], + "bp_grad_F": [ + 0.23472057282924652, + 0.11708012968301773, + 0.09245092421770096, + 0.06478185206651688, + 0.025885937735438347 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.8611111640930176, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 1.4508332014083862, + 5.741517066955566, + 7.59091329574585, + 9.493820190429688, + 12.553393363952637 + ], + "hidden_norms_avg": [ + 4.315334320068359, + 9.272273063659668, + 10.107754707336426, + 11.5936279296875, + 12.266173362731934 + ], + "bp_grad_per_sample_l2_med": [ + 9.209421114064753e-05, + 4.9557409511180595e-05, + 3.8665639294777066e-05, + 2.703870450204704e-05, + 1.0333649697713554e-05 + ], + "bp_grad_F": [ + 0.23745231330394745, + 0.11897031217813492, + 0.09419847279787064, + 0.06559450179338455, + 0.02597379870712757 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.8737660646438599, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 1.4514665603637695, + 5.724127292633057, + 7.567911624908447, + 9.464110374450684, + 12.53247356414795 + ], + "hidden_norms_avg": [ + 4.312892436981201, + 9.258728981018066, + 10.092171669006348, + 11.559837341308594, + 12.241935729980469 + ], + "bp_grad_per_sample_l2_med": [ + 8.842872193781659e-05, + 4.636628364096396e-05, + 3.5660887078847736e-05, + 2.4343042241525836e-05, + 9.563225830788724e-06 + ], + "bp_grad_F": [ + 0.23917540907859802, + 0.12006859481334686, + 0.09492167085409164, + 0.06607519090175629, + 0.02614584006369114 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7939453125, + "loss_eval": 0.8743407130241394, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 1.4513946771621704, + 5.7332282066345215, + 7.562880992889404, + 9.466405868530273, + 12.53167724609375 + ], + "hidden_norms_avg": [ + 4.3138651847839355, + 9.26041316986084, + 10.077324867248535, + 11.538521766662598, + 12.218836784362793 + ], + "bp_grad_per_sample_l2_med": [ + 9.282731480197981e-05, + 4.6137181925587356e-05, + 3.7237725337035954e-05, + 2.553310514485929e-05, + 9.964967830455862e-06 + ], + "bp_grad_F": [ + 0.24150457978248596, + 0.12129233777523041, + 0.09592130035161972, + 0.06674522906541824, + 0.026258554309606552 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8750766515731812, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 1.4510550498962402, + 5.730595111846924, + 7.558650493621826, + 9.460441589355469, + 12.49626636505127 + ], + "hidden_norms_avg": [ + 4.311552047729492, + 9.2510347366333, + 10.070302963256836, + 11.530484199523926, + 12.212501525878906 + ], + "bp_grad_per_sample_l2_med": [ + 8.91910312930122e-05, + 4.6800774725852534e-05, + 3.584511432563886e-05, + 2.5313198420917615e-05, + 9.680608854978345e-06 + ], + "bp_grad_F": [ + 0.24175073206424713, + 0.12143565714359283, + 0.09590216726064682, + 0.06680992990732193, + 0.026268428191542625 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.787109375, + "loss_eval": 0.8746636509895325, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 1.450972557067871, + 5.727794647216797, + 7.5582756996154785, + 9.462045669555664, + 12.50033187866211 + ], + "hidden_norms_avg": [ + 4.311238765716553, + 9.248146057128906, + 10.065601348876953, + 11.523144721984863, + 12.206249237060547 + ], + "bp_grad_per_sample_l2_med": [ + 8.883981354301795e-05, + 4.730010550701991e-05, + 3.57187855115626e-05, + 2.4922017473727465e-05, + 9.98118775896728e-06 + ], + "bp_grad_F": [ + 0.24178682267665863, + 0.12154776602983475, + 0.09598654508590698, + 0.06685590744018555, + 0.026261666789650917 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.787109375, + "loss_eval": 0.8750864863395691, + "epoch": 60 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.3210873007774353, + 3.3568029403686523, + 4.891699314117432, + 6.200707912445068, + 7.5911865234375 + ], + "hidden_norms_avg": [ + 5.7549052238464355, + 6.750590801239014, + 7.9020819664001465, + 8.925304412841797, + 10.076716423034668 + ], + "bp_grad_per_sample_l2_med": [ + 0.004074312746524811, + 0.0011155740357935429, + 0.0009667170234024525, + 0.0008621186716482043, + 0.0008127145702019334 + ], + "bp_grad_F": [ + 0.20160320401191711, + 0.039521340280771255, + 0.033098917454481125, + 0.029271923005580902, + 0.027136052027344704 + ], + "gamma_dfa": 0.0011031709145754576, + "gamma_dfa_per_layer": [ + -0.004096934571862221, + -0.003170878393575549, + 0.003171987598761916, + 0.008508509024977684 + ], + "acc_eval": 0.125, + "loss_eval": 2.422111988067627, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.7445409297943115, + 3393.872314453125, + 8096.7275390625, + 11786.4453125, + 15317.9609375 + ], + "hidden_norms_avg": [ + 46.059967041015625, + 2908.78857421875, + 9192.9140625, + 12480.814453125, + 15843.904296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007700070273131132, + 5.177932962396881e-07, + 4.354141651674581e-07, + 4.0796010125632165e-07, + 4.096184795798763e-07 + ], + "bp_grad_F": [ + 0.14847944676876068, + 7.175570499384776e-05, + 1.7355905583826825e-05, + 1.4375820683198981e-05, + 1.4468741937889718e-05 + ], + "gamma_dfa": 0.00903075491078198, + "gamma_dfa_per_layer": [ + 0.014700280502438545, + 0.007455145940184593, + 0.009132559411227703, + 0.004835033789277077 + ], + "acc_eval": 0.2158203125, + "loss_eval": 2.072723388671875, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 3.5329439640045166, + 17943.025390625, + 46227.09765625, + 60098.9921875, + 105510.8828125 + ], + "hidden_norms_avg": [ + 95.54289245605469, + 14775.4267578125, + 44856.01953125, + 59234.35546875, + 87862.078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00029628784977830946, + 1.0676165373979529e-07, + 7.34040170868866e-08, + 6.658416396021494e-08, + 6.750254044618487e-08 + ], + "bp_grad_F": [ + 0.12055971473455429, + 8.933278149925172e-05, + 3.910079612978734e-06, + 3.3086737403209554e-06, + 3.354543650857522e-06 + ], + "gamma_dfa": 0.007886230800068006, + "gamma_dfa_per_layer": [ + 0.016902755945920944, + 0.003473796183243394, + 0.009775697253644466, + 0.0013926738174632192 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.0924925804138184, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 5.165565013885498, + 33863.33203125, + 93132.8515625, + 145828.34375, + 276496.0 + ], + "hidden_norms_avg": [ + 142.7160186767578, + 36882.9296875, + 93356.96875, + 138199.0625, + 216913.359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00022745825117453933, + 4.267175768291054e-08, + 3.181965624321492e-08, + 2.8314032007870082e-08, + 2.8843814448009653e-08 + ], + "bp_grad_F": [ + 0.06954267621040344, + 0.00012680335203185678, + 2.0300262804084923e-06, + 1.8529049157223199e-06, + 1.8672349142434541e-06 + ], + "gamma_dfa": 0.00556139531545341, + "gamma_dfa_per_layer": [ + 0.01000538095831871, + 0.0014471756294369698, + 0.011906315572559834, + -0.001113290898501873 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.0521552562713623, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 6.674264907836914, + 43835.6796875, + 150229.609375, + 253133.515625, + 481876.5 + ], + "hidden_norms_avg": [ + 186.87832641601562, + 74412.015625, + 150159.890625, + 253252.734375, + 439077.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003350951592437923, + 2.7693221937852286e-08, + 1.989219278186738e-08, + 1.704596108709211e-08, + 1.7547710839949104e-08 + ], + "bp_grad_F": [ + 0.058595605194568634, + 0.0002476655936334282, + 1.0984595064655878e-06, + 1.0368654557169066e-06, + 1.0405622106191004e-06 + ], + "gamma_dfa": 0.002481349220033735, + "gamma_dfa_per_layer": [ + 3.730843309313059e-05, + 0.0014904557028785348, + 0.011494583450257778, + -0.0030969507060945034 + ], + "acc_eval": 0.232421875, + "loss_eval": 2.058844566345215, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 8.061405181884766, + 102865.78125, + 229004.390625, + 413580.59375, + 706253.625 + ], + "hidden_norms_avg": [ + 228.99224853515625, + 131342.546875, + 229257.390625, + 410435.25, + 727001.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00029934433405287564, + 1.670629679040303e-08, + 1.3200744497510186e-08, + 1.1068386207568892e-08, + 1.1248447506773118e-08 + ], + "bp_grad_F": [ + 0.49810686707496643, + 0.0004038630868308246, + 1.391591922583757e-06, + 6.11680206930032e-07, + 5.242948759587307e-07 + ], + "gamma_dfa": 0.0009187236428260803, + "gamma_dfa_per_layer": [ + -0.003027769736945629, + 0.002294017933309078, + 0.00904145184904337, + -0.004632805474102497 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.091141700744629, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 9.400635719299316, + 164205.859375, + 302756.3125, + 584338.25, + 1250749.125 + ], + "hidden_norms_avg": [ + 270.8563232421875, + 190832.34375, + 307117.59375, + 620500.3125, + 1149191.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00034470504033379257, + 1.3897826889319731e-08, + 8.662226491651381e-09, + 6.850678690994982e-09, + 7.0105756755367565e-09 + ], + "bp_grad_F": [ + 0.08854538202285767, + 0.0002125167811755091, + 3.9876397295302013e-07, + 2.9177280680414697e-07, + 2.903063318626664e-07 + ], + "gamma_dfa": 0.0008902656263671815, + "gamma_dfa_per_layer": [ + -0.004116768017411232, + 0.004187953192740679, + 0.007109872996807098, + -0.003619995666667819 + ], + "acc_eval": 0.208984375, + "loss_eval": 2.09378981590271, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 10.676177978515625, + 216327.671875, + 429372.28125, + 910110.1875, + 1955787.375 + ], + "hidden_norms_avg": [ + 311.3556823730469, + 279124.65625, + 434169.5, + 917506.125, + 1714750.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002802011731546372, + 8.183582700382885e-09, + 5.617039278149605e-09, + 4.765932093420133e-09, + 4.884364024348997e-09 + ], + "bp_grad_F": [ + 0.2021757811307907, + 0.00017153903900180012, + 2.627296851187566e-07, + 1.9583571031489555e-07, + 1.9719628596703842e-07 + ], + "gamma_dfa": 0.00245969754178077, + "gamma_dfa_per_layer": [ + 0.0030665153171867132, + 0.0039703575894236565, + 0.005591260269284248, + -0.0027893430087715387 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0816030502319336, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 11.970849990844727, + 282019.0, + 553729.25, + 1250316.5, + 2676136.75 + ], + "hidden_norms_avg": [ + 350.0874938964844, + 367917.96875, + 563719.125, + 1231394.75, + 2379567.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015754146443214267, + 7.837374305097455e-09, + 4.1749870227647534e-09, + 3.572480755664742e-09, + 3.6429026462059255e-09 + ], + "bp_grad_F": [ + 0.06816119700670242, + 0.0002165154874091968, + 1.8739321205885062e-07, + 1.4396131575722393e-07, + 1.449055417879208e-07 + ], + "gamma_dfa": 0.0018902571755461395, + "gamma_dfa_per_layer": [ + 0.0010774387046694756, + 0.004019944928586483, + 0.004736708011478186, + -0.0022730629425495863 + ], + "acc_eval": 0.2236328125, + "loss_eval": 2.069587469100952, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 13.234355926513672, + 498576.65625, + 747356.3125, + 1569417.0, + 3492356.0 + ], + "hidden_norms_avg": [ + 390.34356689453125, + 517596.5, + 755798.625, + 1559863.25, + 3087860.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012954612611792982, + 6.955718223622398e-09, + 3.3238092278509157e-09, + 2.7362234700234467e-09, + 2.7891511322764018e-09 + ], + "bp_grad_F": [ + 0.03943011909723282, + 0.00019621588580776006, + 1.9796995331944345e-07, + 1.1484767270530938e-07, + 1.1313876058238748e-07 + ], + "gamma_dfa": 0.002013051969697699, + "gamma_dfa_per_layer": [ + 0.0007974229520186782, + 0.0045172227546572685, + 0.004162413999438286, + -0.0014248518273234367 + ], + "acc_eval": 0.21484375, + "loss_eval": 2.0846829414367676, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 14.412362098693848, + 653898.875, + 962527.9375, + 1974772.75, + 4235229.0 + ], + "hidden_norms_avg": [ + 426.1747741699219, + 660897.75, + 954217.625, + 1992937.5, + 3912584.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001297950657317415, + 8.463428180505161e-09, + 2.735849546908753e-09, + 2.2942541200166033e-09, + 2.329255233135541e-09 + ], + "bp_grad_F": [ + 0.07335253059864044, + 0.0002778704511001706, + 2.1924184068211616e-07, + 1.5885484572208952e-07, + 9.551467172741468e-08 + ], + "gamma_dfa": 0.001994484744500369, + "gamma_dfa_per_layer": [ + 0.0028600264340639114, + 0.0031631651800125837, + 0.0033731083385646343, + -0.0014183609746396542 + ], + "acc_eval": 0.2373046875, + "loss_eval": 2.0768301486968994, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 15.627301216125488, + 805321.625, + 1191654.25, + 2375967.75, + 5068243.5 + ], + "hidden_norms_avg": [ + 464.92144775390625, + 870169.75, + 1209570.75, + 2342305.5, + 4797491.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014358766202349216, + 6.655038742309216e-09, + 2.213497385383789e-09, + 1.8578552030135143e-09, + 1.8845198734851465e-09 + ], + "bp_grad_F": [ + 0.22341646254062653, + 0.0010545816039666533, + 3.022053363110899e-07, + 8.581165644727662e-08, + 7.942276880612553e-08 + ], + "gamma_dfa": 0.0012935771082993597, + "gamma_dfa_per_layer": [ + -0.00014482985716313124, + 0.0035164642613381147, + 0.002910400740802288, + -0.0011077267117798328 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.076242446899414, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 16.751590728759766, + 758638.375, + 1437438.0, + 2779040.25, + 5662257.0 + ], + "hidden_norms_avg": [ + 501.60235595703125, + 1119163.625, + 1513203.375, + 2677392.25, + 5339190.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020390149438753724, + 5.5311413227343564e-09, + 1.8890189412701375e-09, + 1.6241474831701908e-09, + 1.6578916017806478e-09 + ], + "bp_grad_F": [ + 1.734735369682312, + 0.000374374445527792, + 1.2862761877840967e-07, + 1.1062630989044919e-07, + 6.887377423936414e-08 + ], + "gamma_dfa": 0.0020944410644005984, + "gamma_dfa_per_layer": [ + 0.0036250988487154245, + 0.0027163547929376364, + 0.0028407545760273933, + -0.0008044439600780606 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.083003520965576, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 17.76032066345215, + 1093088.5, + 1739864.0, + 3080344.5, + 6632118.5 + ], + "hidden_norms_avg": [ + 539.1420288085938, + 1433551.75, + 1843404.125, + 3096921.75, + 6237853.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014031230239197612, + 4.252878937904825e-09, + 1.704668295410272e-09, + 1.518661418842271e-09, + 1.5263605934734414e-09 + ], + "bp_grad_F": [ + 0.05247655138373375, + 0.00048432740732096136, + 1.395327586806161e-07, + 8.375257465331742e-08, + 5.970760241780226e-08 + ], + "gamma_dfa": 0.0018704376125242561, + "gamma_dfa_per_layer": [ + 0.0021162822376936674, + 0.003257386852055788, + 0.002796958899125457, + -0.0006888775387778878 + ], + "acc_eval": 0.2177734375, + "loss_eval": 2.1021971702575684, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 18.760025024414062, + 2223954.75, + 2460609.0, + 3718541.25, + 7618764.0 + ], + "hidden_norms_avg": [ + 577.8324584960938, + 1908819.625, + 2348359.5, + 3542983.0, + 6779725.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010403544729342684, + 2.662567277766925e-09, + 1.6195218499603925e-09, + 1.422262307926303e-09, + 1.433551610752204e-09 + ], + "bp_grad_F": [ + 0.08673901855945587, + 0.0001567020226502791, + 8.41187173250546e-08, + 5.8843131256480774e-08, + 5.371895994699116e-08 + ], + "gamma_dfa": 0.003976444830186665, + "gamma_dfa_per_layer": [ + 0.010876781307160854, + 0.0029237696435302496, + 0.0026041539385914803, + -0.000498925568535924 + ], + "acc_eval": 0.2177734375, + "loss_eval": 2.138009548187256, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 19.738407135009766, + 2339586.0, + 2696652.5, + 4235438.5, + 7955372.0 + ], + "hidden_norms_avg": [ + 619.4888916015625, + 2243613.75, + 2801893.5, + 4018190.75, + 7143025.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014718857710249722, + 2.6654392026870255e-09, + 1.4668186665289795e-09, + 1.3113429231381701e-09, + 1.3212382299343517e-09 + ], + "bp_grad_F": [ + 0.1564428061246872, + 0.00024187436792999506, + 2.621962664761668e-07, + 5.580703898999673e-08, + 5.442945649747344e-08 + ], + "gamma_dfa": 0.0019682426573126577, + "gamma_dfa_per_layer": [ + 0.003052386222407222, + 0.0027148486115038395, + 0.0025699653197079897, + -0.00046422952436842024 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.145447254180908, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 20.727081298828125, + 2753822.5, + 3114285.75, + 4713040.0, + 8652256.0 + ], + "hidden_norms_avg": [ + 660.8045654296875, + 2684893.0, + 3331407.5, + 4614215.5, + 7864381.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013858993770554662, + 2.7730009399817845e-09, + 1.344458322449782e-09, + 1.2393497339502346e-09, + 1.2431760065823028e-09 + ], + "bp_grad_F": [ + 0.1324291080236435, + 0.00022225745487958193, + 9.285694346772289e-08, + 4.7669061586930184e-08, + 4.746264181676452e-08 + ], + "gamma_dfa": 0.001855946145951748, + "gamma_dfa_per_layer": [ + 0.004218719433993101, + 0.001718730665743351, + 0.0019668969325721264, + -0.0004805624485015869 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.101409673690796, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 21.603151321411133, + 3877476.75, + 4156743.75, + 5474745.5, + 10299149.0 + ], + "hidden_norms_avg": [ + 698.7645263671875, + 3523264.5, + 4085091.75, + 5354783.0, + 9094561.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000199332891497761, + 1.9098649328697093e-09, + 1.2144363292776461e-09, + 1.1166952917918138e-09, + 1.1315383074972374e-09 + ], + "bp_grad_F": [ + 0.15142236649990082, + 4.2183397454209626e-05, + 7.309424887580462e-08, + 5.2962114693855256e-08, + 4.2337880756804225e-08 + ], + "gamma_dfa": 0.0013709207050851546, + "gamma_dfa_per_layer": [ + 0.0023175266105681658, + 0.0016730788629502058, + 0.0018372924532741308, + -0.0003442151064518839 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.1280713081359863, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 22.48230743408203, + 3581296.5, + 4024996.25, + 6183271.0, + 11393130.0 + ], + "hidden_norms_avg": [ + 735.2485961914062, + 4017679.75, + 4751523.5, + 6215236.0, + 10366257.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018803548300638795, + 1.895784862426808e-09, + 1.1237420993737146e-09, + 1.0378963244406236e-09, + 1.0573794062551656e-09 + ], + "bp_grad_F": [ + 0.12878409028053284, + 4.194497887510806e-05, + 4.941083631138099e-08, + 3.9714532107382183e-08, + 3.994472663748638e-08 + ], + "gamma_dfa": 0.0012161588310846128, + "gamma_dfa_per_layer": [ + 0.0021385664585977793, + 0.0015012789517641068, + 0.0016565187834203243, + -0.0004317288694437593 + ], + "acc_eval": 0.2158203125, + "loss_eval": 2.1137895584106445, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 23.29258155822754, + 4616424.5, + 5061994.0, + 6831782.5, + 12437102.0 + ], + "hidden_norms_avg": [ + 768.5599975585938, + 4586839.5, + 5567332.5, + 6953557.0, + 11342041.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021542877948377281, + 1.9688994878919175e-09, + 1.0831572305747272e-09, + 9.59386015075836e-10, + 9.76972058808201e-10 + ], + "bp_grad_F": [ + 0.09346769750118256, + 4.979455843567848e-05, + 4.6927411290198506e-08, + 3.8312244043936516e-08, + 3.882623289541698e-08 + ], + "gamma_dfa": 0.0011904535058420151, + "gamma_dfa_per_layer": [ + 0.0024171490222215652, + 0.0012326111318543553, + 0.0015420420095324516, + -0.0004299881402403116 + ], + "acc_eval": 0.2333984375, + "loss_eval": 2.0970499515533447, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 24.054462432861328, + 5806660.5, + 6270370.0, + 7861086.0, + 14600824.0 + ], + "hidden_norms_avg": [ + 801.1851806640625, + 5855518.5, + 6747570.0, + 8137969.0, + 13373154.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012799039541278034, + 1.5442244150065676e-09, + 9.774002718287989e-10, + 8.729071909741037e-10, + 8.921305361120346e-10 + ], + "bp_grad_F": [ + 0.9552626609802246, + 1.163827892014524e-05, + 2.461903250150499e-07, + 3.4675800009154045e-08, + 3.4831803219503854e-08 + ], + "gamma_dfa": 0.0018355100764892995, + "gamma_dfa_per_layer": [ + 0.004604285582900047, + 0.00167210737708956, + 0.001404301729053259, + -0.0003386543830856681 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.11769700050354, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 24.826902389526367, + 6414338.0, + 6989573.0, + 8609765.0, + 15368301.0 + ], + "hidden_norms_avg": [ + 830.1490478515625, + 6946265.5, + 7916239.0, + 9224772.0, + 14431417.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015248128329403698, + 1.4729809594271615e-09, + 9.462167716023373e-10, + 8.629364445233989e-10, + 8.805687845558907e-10 + ], + "bp_grad_F": [ + 0.1705506592988968, + 0.00016797611897345632, + 4.810285503253908e-08, + 3.399246040203252e-08, + 3.436711182303043e-08 + ], + "gamma_dfa": 0.0015317398574552499, + "gamma_dfa_per_layer": [ + 0.004021936096251011, + 0.0012830595951527357, + 0.0012305387062951922, + -0.00040857496787793934 + ], + "acc_eval": 0.2236328125, + "loss_eval": 2.102954864501953, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 25.52900505065918, + 8152435.5, + 8736555.0, + 9881049.0, + 16997340.0 + ], + "hidden_norms_avg": [ + 858.3137817382812, + 7544203.0, + 8860779.0, + 10224814.0, + 15607154.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001363755582133308, + 1.2969386675720784e-09, + 9.174655479782245e-10, + 8.421383035361885e-10, + 8.538599827190296e-10 + ], + "bp_grad_F": [ + 0.07549053430557251, + 2.9420058126561344e-05, + 5.8904493727141016e-08, + 3.187446395713778e-08, + 3.1860317051268794e-08 + ], + "gamma_dfa": 0.0023631651129107922, + "gamma_dfa_per_layer": [ + 0.007739294320344925, + 0.0009300304809585214, + 0.001171439653262496, + -0.00038810400292277336 + ], + "acc_eval": 0.2080078125, + "loss_eval": 2.1162400245666504, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 26.122589111328125, + 9255466.0, + 9964734.0, + 11054792.0, + 18565818.0 + ], + "hidden_norms_avg": [ + 884.7098388671875, + 8814330.0, + 10177720.0, + 11552646.0, + 17489728.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014142012514639646, + 1.3653665975610352e-09, + 8.580440802319345e-10, + 7.922714151398225e-10, + 8.032630116616701e-10 + ], + "bp_grad_F": [ + 0.11926258355379105, + 1.2633940968953539e-05, + 3.893048727832138e-08, + 3.075604126934195e-08, + 3.043995278062539e-08 + ], + "gamma_dfa": 0.0013515961618395522, + "gamma_dfa_per_layer": [ + 0.0038036422338336706, + 0.0009011125075630844, + 0.0010650388430804014, + -0.0003634089371189475 + ], + "acc_eval": 0.201171875, + "loss_eval": 2.134256362915039, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 26.71797752380371, + 8691604.0, + 9652268.0, + 11413482.0, + 19342164.0 + ], + "hidden_norms_avg": [ + 908.3400268554688, + 9418884.0, + 11132975.0, + 12548590.0, + 18516546.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016020517796278, + 1.5232745065318909e-09, + 8.103306359252826e-10, + 7.392123024807518e-10, + 7.529800671868259e-10 + ], + "bp_grad_F": [ + 0.08055854588747025, + 1.5452902516699396e-05, + 3.9288735820264264e-08, + 3.091117406484045e-08, + 2.9865013573271426e-08 + ], + "gamma_dfa": 0.0012649961790884845, + "gamma_dfa_per_layer": [ + 0.0036856848746538162, + 0.0008738536853343248, + 0.0009324033162556589, + -0.00043195715988986194 + ], + "acc_eval": 0.216796875, + "loss_eval": 2.1074087619781494, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 27.27407455444336, + 9931691.0, + 10836582.0, + 12350148.0, + 20677670.0 + ], + "hidden_norms_avg": [ + 931.8362426757812, + 10575293.0, + 12476721.0, + 13979366.0, + 20145220.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002644142950884998, + 1.4137412351900025e-09, + 7.711813965194381e-10, + 7.245293809354791e-10, + 7.329452600401964e-10 + ], + "bp_grad_F": [ + 0.08752908557653427, + 3.3139032893814147e-05, + 4.584432744536571e-08, + 2.996421955003825e-08, + 2.8689356668110122e-08 + ], + "gamma_dfa": 0.0013240749976830557, + "gamma_dfa_per_layer": [ + 0.003940493334084749, + 0.0008323215297423303, + 0.0009093738626688719, + -0.0003858887357637286 + ], + "acc_eval": 0.2080078125, + "loss_eval": 2.1011557579040527, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 27.817367553710938, + 12253263.0, + 13105294.0, + 14345712.0, + 22455440.0 + ], + "hidden_norms_avg": [ + 953.0517578125, + 12373978.0, + 14141729.0, + 15597335.0, + 22309104.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014759604528080672, + 1.123480086739903e-09, + 7.102037291595309e-10, + 6.690955567378865e-10, + 6.791667228611686e-10 + ], + "bp_grad_F": [ + 0.05615593492984772, + 0.00010146480053663254, + 3.714368190799178e-08, + 2.748037175592799e-08, + 2.6385574614096186e-08 + ], + "gamma_dfa": 0.0012311612081248313, + "gamma_dfa_per_layer": [ + 0.003369898535311222, + 0.0009893677197396755, + 0.0009041082230396569, + -0.0003387296455912292 + ], + "acc_eval": 0.234375, + "loss_eval": 2.105236291885376, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 28.32236099243164, + 13643201.0, + 14611628.0, + 15764247.0, + 24160378.0 + ], + "hidden_norms_avg": [ + 973.9281616210938, + 13221320.0, + 15394035.0, + 16890642.0, + 23678466.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016657183005008847, + 9.720990679085162e-10, + 6.881580305595492e-10, + 6.496979620962406e-10, + 6.5528305004392e-10 + ], + "bp_grad_F": [ + 0.21266740560531616, + 1.0097430276800878e-05, + 5.8009760550703504e-08, + 2.5056060337647068e-08, + 2.5318335872270836e-08 + ], + "gamma_dfa": 0.0010233484499622136, + "gamma_dfa_per_layer": [ + 0.0030805980786681175, + 0.0005203179316595197, + 0.000822446309030056, + -0.00032996851950883865 + ], + "acc_eval": 0.212890625, + "loss_eval": 2.137085437774658, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 28.79292106628418, + 13177481.0, + 14299000.0, + 15555998.0, + 23304192.0 + ], + "hidden_norms_avg": [ + 992.415771484375, + 14624837.0, + 16826644.0, + 18325902.0, + 25292966.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020211696391925216, + 1.1425522750130312e-09, + 6.55300591567709e-10, + 6.094423854463571e-10, + 6.189129764244683e-10 + ], + "bp_grad_F": [ + 0.17359277606010437, + 1.2817296010325663e-05, + 7.396955936656013e-08, + 2.5667416636565576e-08, + 2.485118777428852e-08 + ], + "gamma_dfa": 0.0013693289074581116, + "gamma_dfa_per_layer": [ + 0.004313473589718342, + 0.0007373306434601545, + 0.000740988994948566, + -0.00031447759829461575 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.095831871032715, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 29.206546783447266, + 13026473.0, + 14086985.0, + 16207103.0, + 25752542.0 + ], + "hidden_norms_avg": [ + 1012.0676879882812, + 14977745.0, + 17788350.0, + 19459138.0, + 26297900.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002467916056048125, + 1.5415436704913077e-09, + 6.588643519656046e-10, + 6.053296752739357e-10, + 6.112412798131572e-10 + ], + "bp_grad_F": [ + 0.042935822159051895, + 9.192503966914956e-06, + 3.478140442325639e-08, + 2.366191687031005e-08, + 2.384759412166204e-08 + ], + "gamma_dfa": 0.0008732089045224711, + "gamma_dfa_per_layer": [ + 0.002771018771454692, + 0.00032788922544568777, + 0.0007068651611916721, + -0.0003129375400021672 + ], + "acc_eval": 0.2294921875, + "loss_eval": 2.0877132415771484, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 29.655010223388672, + 18104814.0, + 18959442.0, + 20352136.0, + 30115644.0 + ], + "hidden_norms_avg": [ + 1030.1336669921875, + 17704192.0, + 19945910.0, + 21540694.0, + 29199112.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00019920141494367272, + 8.472024748407136e-10, + 5.961620086480934e-10, + 5.578593698096768e-10, + 5.602495689593923e-10 + ], + "bp_grad_F": [ + 0.05658308416604996, + 2.5135868781944737e-05, + 4.3493169954444966e-08, + 2.1390142990185268e-08, + 2.1341643119399123e-08 + ], + "gamma_dfa": 0.0010463381186127663, + "gamma_dfa_per_layer": [ + 0.0027386434376239777, + 0.0009209397248923779, + 0.0007645037840120494, + -0.0002387344720773399 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.1298673152923584, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 30.063920974731445, + 20103628.0, + 20986630.0, + 22120356.0, + 31195618.0 + ], + "hidden_norms_avg": [ + 1046.1927490234375, + 18906620.0, + 21404482.0, + 23038508.0, + 30526688.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002040969266090542, + 9.528980937645315e-10, + 5.700001026731627e-10, + 5.158900528989818e-10, + 5.214851328538828e-10 + ], + "bp_grad_F": [ + 0.0816737711429596, + 5.908617822569795e-05, + 3.4592272157851767e-08, + 2.022995992945198e-08, + 2.0381063947638722e-08 + ], + "gamma_dfa": 0.001085347576008644, + "gamma_dfa_per_layer": [ + 0.0035934830084443092, + 0.0002959886915050447, + 0.0007062341319397092, + -0.0002543155278544873 + ], + "acc_eval": 0.2041015625, + "loss_eval": 2.116055965423584, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 30.392677307128906, + 21290946.0, + 22100456.0, + 23440498.0, + 32839040.0 + ], + "hidden_norms_avg": [ + 1062.797119140625, + 20072588.0, + 22866046.0, + 24608556.0, + 32259930.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00022883246128913015, + 1.3679187782500435e-09, + 5.444520945196984e-10, + 5.043216955158414e-10, + 5.114720313947885e-10 + ], + "bp_grad_F": [ + 0.2192479968070984, + 0.0001256070681847632, + 1.2757884348957305e-07, + 2.0006645229386777e-08, + 1.9971306386423748e-08 + ], + "gamma_dfa": 0.0019978012933279388, + "gamma_dfa_per_layer": [ + 0.0072806887328624725, + 0.0002412673202343285, + 0.000707695260643959, + -0.00023844614042900503 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.1034791469573975, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 30.711090087890625, + 22272344.0, + 23036462.0, + 24462584.0, + 35130192.0 + ], + "hidden_norms_avg": [ + 1082.3468017578125, + 20945452.0, + 23993758.0, + 25838460.0, + 33448582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005148049676790833, + 2.304462176638822e-09, + 5.340937136999457e-10, + 4.950916898671665e-10, + 5.010572512453848e-10 + ], + "bp_grad_F": [ + 0.15110087394714355, + 3.209088754374534e-05, + 1.0334197497741116e-07, + 2.0131187383753968e-08, + 1.9814510920923567e-08 + ], + "gamma_dfa": 0.003046433750569122, + "gamma_dfa_per_layer": [ + 0.011593285948038101, + 0.00019314857490826398, + 0.0006439671851694584, + -0.0002446667058393359 + ], + "acc_eval": 0.208984375, + "loss_eval": 2.112250328063965, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 31.0146427154541, + 29106790.0, + 29617952.0, + 31075512.0, + 42307980.0 + ], + "hidden_norms_avg": [ + 1102.4920654296875, + 22080922.0, + 25255976.0, + 27220448.0, + 35072796.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003266549902036786, + 3.0358568992028268e-09, + 4.893331295718895e-10, + 4.395950825575312e-10, + 4.4405815136094873e-10 + ], + "bp_grad_F": [ + 1.0139163732528687, + 1.6822159523144364e-05, + 1.2544650473955699e-07, + 1.6449900996917677e-08, + 1.5756539184508256e-08 + ], + "gamma_dfa": 0.004347974703705404, + "gamma_dfa_per_layer": [ + 0.016904333606362343, + -2.5271147023886442e-05, + 0.0006614690646529198, + -0.00014863270916976035 + ], + "acc_eval": 0.1806640625, + "loss_eval": 2.1869568824768066, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 31.282560348510742, + 30793450.0, + 31273076.0, + 33029836.0, + 44659544.0 + ], + "hidden_norms_avg": [ + 1120.8310546875, + 23223250.0, + 26597348.0, + 28740710.0, + 37219140.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004533866886049509, + 8.621259817154225e-10, + 4.717314872060285e-10, + 4.43607900413312e-10, + 4.492739236194865e-10 + ], + "bp_grad_F": [ + 0.8242164254188538, + 9.425415555597283e-06, + 6.696246401816097e-08, + 1.4385987512355314e-08, + 1.456661191667763e-08 + ], + "gamma_dfa": 0.004019053936644923, + "gamma_dfa_per_layer": [ + 0.015497363172471523, + 0.0001274545502383262, + 0.0006036070408299565, + -0.00015220901696011424 + ], + "acc_eval": 0.1396484375, + "loss_eval": 2.199540615081787, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 31.512802124023438, + 21969868.0, + 22884238.0, + 24682478.0, + 38405980.0 + ], + "hidden_norms_avg": [ + 1138.61962890625, + 23861642.0, + 27547416.0, + 29877192.0, + 38524416.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00065120670478791, + 1.8789774181016128e-09, + 5.075246334307337e-10, + 4.637440431665141e-10, + 4.687980004192127e-10 + ], + "bp_grad_F": [ + 0.22404567897319794, + 6.978048531891545e-06, + 5.974419536869391e-08, + 1.854446907145757e-08, + 1.8726453276940447e-08 + ], + "gamma_dfa": 0.0030916051182430238, + "gamma_dfa_per_layer": [ + 0.011011095717549324, + 0.0010498585179448128, + 0.0005736061139032245, + -0.00026813987642526627 + ], + "acc_eval": 0.20703125, + "loss_eval": 2.1297407150268555, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 31.728811264038086, + 29299954.0, + 29843046.0, + 31522240.0, + 44597740.0 + ], + "hidden_norms_avg": [ + 1154.2742919921875, + 26176784.0, + 29361794.0, + 31622036.0, + 40631524.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00057179294526577, + 8.620974489836897e-10, + 4.3859474385676833e-10, + 4.131678610352907e-10, + 4.158901834028228e-10 + ], + "bp_grad_F": [ + 0.1988120824098587, + 6.200312782311812e-06, + 7.633398269035752e-08, + 1.800971105581084e-08, + 1.6420651505200112e-08 + ], + "gamma_dfa": 0.0036353242212499026, + "gamma_dfa_per_layer": [ + 0.013258620165288448, + 0.0009053392568603158, + 0.0005595044931396842, + -0.00018216703028883785 + ], + "acc_eval": 0.193359375, + "loss_eval": 2.162503719329834, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 31.93093490600586, + 24153264.0, + 24958016.0, + 27164164.0, + 41821856.0 + ], + "hidden_norms_avg": [ + 1168.3504638671875, + 25251302.0, + 29331440.0, + 31888322.0, + 40732864.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007007869426161051, + 3.803806603031035e-09, + 4.6435830181046356e-10, + 4.2823591894780577e-10, + 4.335505288111108e-10 + ], + "bp_grad_F": [ + 0.23370306193828583, + 5.834654530190164e-06, + 4.249230300956697e-08, + 1.778762737103534e-08, + 1.7575523258983594e-08 + ], + "gamma_dfa": 0.003036663241800852, + "gamma_dfa_per_layer": [ + 0.010693107731640339, + 0.001166085829026997, + 0.0005278221797198057, + -0.00024036277318373322 + ], + "acc_eval": 0.2060546875, + "loss_eval": 2.145090103149414, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 32.11568069458008, + 30941254.0, + 31479742.0, + 33270594.0, + 46886708.0 + ], + "hidden_norms_avg": [ + 1180.89794921875, + 26732550.0, + 30676362.0, + 33269292.0, + 42382468.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006622264045290649, + 1.5328843749884413e-09, + 4.1302217201888425e-10, + 3.8878930630481534e-10, + 3.9369618676232676e-10 + ], + "bp_grad_F": [ + 0.7251601815223694, + 2.9320523026399314e-05, + 1.0578004605577007e-07, + 1.5190060764780355e-08, + 1.538120386612718e-08 + ], + "gamma_dfa": 0.0034242832334712148, + "gamma_dfa_per_layer": [ + 0.012806901708245277, + 0.0005313451401889324, + 0.0005365218385122716, + -0.00017763575306162238 + ], + "acc_eval": 0.1904296875, + "loss_eval": 2.1417269706726074, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 32.295955657958984, + 33935232.0, + 34368956.0, + 35934572.0, + 47697056.0 + ], + "hidden_norms_avg": [ + 1192.405517578125, + 27784236.0, + 31654758.0, + 34253712.0, + 43239588.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000609845039434731, + 1.1788049425476288e-09, + 4.4074988103659507e-10, + 3.883143528948807e-10, + 3.8990835560248627e-10 + ], + "bp_grad_F": [ + 0.3570167124271393, + 5.2556606533471495e-06, + 6.658066098452764e-08, + 1.6441132899558397e-08, + 1.5662063646004754e-08 + ], + "gamma_dfa": 0.0031971330136002507, + "gamma_dfa_per_layer": [ + 0.011760826222598553, + 0.000679977354593575, + 0.0005443703266791999, + -0.00019664184947032481 + ], + "acc_eval": 0.1962890625, + "loss_eval": 2.159468173980713, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 32.446258544921875, + 19652562.0, + 21036314.0, + 25921266.0, + 40927384.0 + ], + "hidden_norms_avg": [ + 1203.144287109375, + 31749304.0, + 34556376.0, + 36976868.0, + 47059032.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006137214368209243, + 8.001962981118993e-10, + 4.3686718131930036e-10, + 4.163595301864831e-10, + 4.1693556940280985e-10 + ], + "bp_grad_F": [ + 0.12317141890525818, + 1.0874373401748016e-05, + 3.419825134187704e-08, + 1.7081790204542813e-08, + 1.7078438219186864e-08 + ], + "gamma_dfa": 0.002385696723649744, + "gamma_dfa_per_layer": [ + 0.008561503142118454, + 0.000761325703933835, + 0.00044924806570634246, + -0.0002292900171596557 + ], + "acc_eval": 0.1943359375, + "loss_eval": 2.1486196517944336, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 32.65601348876953, + 18852588.0, + 20806824.0, + 26129350.0, + 41854136.0 + ], + "hidden_norms_avg": [ + 1211.216064453125, + 33512262.0, + 36150576.0, + 38488828.0, + 48876332.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041886867256835103, + 6.960994003435417e-10, + 3.895795075425923e-10, + 3.7316269518861134e-10, + 3.8092326515304364e-10 + ], + "bp_grad_F": [ + 0.14164908230304718, + 1.2379082363622729e-06, + 2.6289937338219715e-08, + 1.6158612226035984e-08, + 1.6345055087185756e-08 + ], + "gamma_dfa": 0.0026270662965544034, + "gamma_dfa_per_layer": [ + 0.009110232815146446, + 0.0011993220541626215, + 0.00041866287938319147, + -0.00021995256247464567 + ], + "acc_eval": 0.19140625, + "loss_eval": 2.1592655181884766, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 32.8077507019043, + 13604255.0, + 20737208.0, + 26201736.0, + 38498212.0 + ], + "hidden_norms_avg": [ + 1218.5357666015625, + 34337856.0, + 37186496.0, + 39492900.0, + 49837356.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00024631666019558907, + 7.821958081244418e-10, + 3.8121927836698433e-10, + 3.6691791271969976e-10, + 3.7013728193535655e-10 + ], + "bp_grad_F": [ + 0.16077305376529694, + 4.323472239775583e-06, + 3.772007772795405e-08, + 1.5986831414238623e-08, + 1.5948634413121e-08 + ], + "gamma_dfa": 0.002168099657865241, + "gamma_dfa_per_layer": [ + 0.007105600088834763, + 0.0013786349445581436, + 0.00041434637387283146, + -0.00022618277580477297 + ], + "acc_eval": 0.193359375, + "loss_eval": 2.1537227630615234, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 32.95870590209961, + 17278438.0, + 21010234.0, + 26451948.0, + 41976576.0 + ], + "hidden_norms_avg": [ + 1225.39501953125, + 36196112.0, + 38833272.0, + 41042520.0, + 51415488.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00017274360288865864, + 7.227461407133262e-10, + 3.619011756939017e-10, + 3.5793992769761473e-10, + 3.6092046018509905e-10 + ], + "bp_grad_F": [ + 0.9672663807868958, + 3.41643476531317e-06, + 5.25712664511957e-08, + 1.5481989024124232e-08, + 1.548605688128646e-08 + ], + "gamma_dfa": 0.001979457345441915, + "gamma_dfa_per_layer": [ + 0.006772718392312527, + 0.0009743775590322912, + 0.00037397228879854083, + -0.00020323885837569833 + ], + "acc_eval": 0.208984375, + "loss_eval": 2.1646997928619385, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 33.06986999511719, + 23368844.0, + 24521804.0, + 27230594.0, + 45358652.0 + ], + "hidden_norms_avg": [ + 1231.394287109375, + 38020996.0, + 40414464.0, + 42538228.0, + 53283596.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015840897685848176, + 6.067092384043349e-10, + 3.4933173020945674e-10, + 3.3962907486362326e-10, + 3.42745692938351e-10 + ], + "bp_grad_F": [ + 0.3695656955242157, + 2.3579739263368538e-06, + 5.5092176154403205e-08, + 1.777137192959799e-08, + 1.4559810246339566e-08 + ], + "gamma_dfa": 0.0020704490307252854, + "gamma_dfa_per_layer": [ + 0.007164421491324902, + 0.0009055124246515334, + 0.0003939281450584531, + -0.00018206593813374639 + ], + "acc_eval": 0.203125, + "loss_eval": 2.1666717529296875, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 33.164432525634766, + 29174184.0, + 30089798.0, + 32367896.0, + 48892740.0 + ], + "hidden_norms_avg": [ + 1237.1142578125, + 37470168.0, + 40219512.0, + 42356984.0, + 52772660.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00024464691523462534, + 5.441591066634999e-10, + 3.6414088411262924e-10, + 3.320065611323031e-10, + 3.387692348866267e-10 + ], + "bp_grad_F": [ + 0.20688536763191223, + 4.435638402355835e-06, + 8.288016317692382e-08, + 1.4215274291018432e-08, + 1.4331217101926086e-08 + ], + "gamma_dfa": 0.0017712319058773573, + "gamma_dfa_per_layer": [ + 0.006079941056668758, + 0.0008057263912633061, + 0.00038248312193900347, + -0.0001832229463616386 + ], + "acc_eval": 0.1806640625, + "loss_eval": 2.173765182495117, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 33.24842071533203, + 33830332.0, + 34499304.0, + 36673048.0, + 51963528.0 + ], + "hidden_norms_avg": [ + 1242.226318359375, + 38073352.0, + 40806512.0, + 42901500.0, + 53437180.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002524294250179082, + 5.388652302151797e-10, + 3.6845529405304944e-10, + 3.3760005901939394e-10, + 3.4174474361492457e-10 + ], + "bp_grad_F": [ + 0.12659014761447906, + 2.532647158659529e-06, + 5.97612910269163e-08, + 1.3431267653629675e-08, + 1.3499856343912597e-08 + ], + "gamma_dfa": 0.0021579467684205156, + "gamma_dfa_per_layer": [ + 0.007928929291665554, + 0.00047530903248116374, + 0.00039780279621481895, + -0.0001702540466794744 + ], + "acc_eval": 0.2099609375, + "loss_eval": 2.161896228790283, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 33.338741302490234, + 19795148.0, + 21916948.0, + 27189936.0, + 43588712.0 + ], + "hidden_norms_avg": [ + 1246.7552490234375, + 38983196.0, + 41658504.0, + 43769460.0, + 54177164.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002599447325337678, + 6.2289540192495e-10, + 3.6807956682594067e-10, + 3.4037242468976103e-10, + 3.472495624379235e-10 + ], + "bp_grad_F": [ + 0.11130323261022568, + 6.972830760787474e-06, + 5.447330764241087e-08, + 1.4756569299834155e-08, + 1.4917180379825368e-08 + ], + "gamma_dfa": 0.0021847522366442718, + "gamma_dfa_per_layer": [ + 0.007594278547912836, + 0.0009666476398706436, + 0.0003712670295499265, + -0.00019318427075631917 + ], + "acc_eval": 0.1904296875, + "loss_eval": 2.1626296043395996, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 33.42045974731445, + 24898126.0, + 26009376.0, + 28516464.0, + 47394980.0 + ], + "hidden_norms_avg": [ + 1250.1884765625, + 39632580.0, + 42285708.0, + 44390100.0, + 55233620.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001829452667152509, + 5.726033536213038e-10, + 3.5659752928296484e-10, + 3.292066619309253e-10, + 3.31846911061362e-10 + ], + "bp_grad_F": [ + 0.23442988097667694, + 3.2595114589639707e-06, + 1.0605135969399271e-07, + 1.4677630666426467e-08, + 1.445219677265186e-08 + ], + "gamma_dfa": 0.0021932553718215786, + "gamma_dfa_per_layer": [ + 0.007973091676831245, + 0.0006458763382397592, + 0.00032728860969655216, + -0.00017323513748124242 + ], + "acc_eval": 0.1923828125, + "loss_eval": 2.175835609436035, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 33.47613525390625, + 25550002.0, + 26776384.0, + 28507352.0, + 47268464.0 + ], + "hidden_norms_avg": [ + 1253.279541015625, + 39494300.0, + 42348356.0, + 44479368.0, + 55121100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012893354869447649, + 5.787402224122218e-10, + 3.341840137949248e-10, + 3.2919431069977634e-10, + 3.3201591476128556e-10 + ], + "bp_grad_F": [ + 0.10876749455928802, + 4.772132342623081e-06, + 7.90316647680811e-08, + 1.4042406348835357e-08, + 1.4153799909877307e-08 + ], + "gamma_dfa": 0.001727514507365413, + "gamma_dfa_per_layer": [ + 0.0062596434727311134, + 0.0004772312822751701, + 0.000357049866579473, + -0.0001838665921241045 + ], + "acc_eval": 0.1904296875, + "loss_eval": 2.164583444595337, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 33.52043914794922, + 28050636.0, + 29099278.0, + 31227182.0, + 49045872.0 + ], + "hidden_norms_avg": [ + 1255.7454833984375, + 40231008.0, + 42960368.0, + 45079784.0, + 55989944.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015386792074423283, + 5.41802436249128e-10, + 3.373940293815991e-10, + 3.3321326253776817e-10, + 3.361276257329848e-10 + ], + "bp_grad_F": [ + 0.2656819522380829, + 2.482481932020164e-06, + 8.287289432473699e-08, + 1.3792345932017724e-08, + 1.3917338392843703e-08 + ], + "gamma_dfa": 0.001938080065883696, + "gamma_dfa_per_layer": [ + 0.006978346034884453, + 0.0005946386372670531, + 0.00036033656215295196, + -0.00018100097076967359 + ], + "acc_eval": 0.1962890625, + "loss_eval": 2.176473379135132, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 33.55419921875, + 25508434.0, + 26505134.0, + 29051658.0, + 47339916.0 + ], + "hidden_norms_avg": [ + 1257.7822265625, + 40388772.0, + 43162480.0, + 45217960.0, + 55966100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018102869216818362, + 5.443374639924059e-10, + 3.9548594954474936e-10, + 3.679410942591943e-10, + 3.717116892065775e-10 + ], + "bp_grad_F": [ + 0.28429684042930603, + 3.3983885714405915e-06, + 8.993236377818903e-08, + 1.4510244561449781e-08, + 1.4562592021150067e-08 + ], + "gamma_dfa": 0.001642326584260445, + "gamma_dfa_per_layer": [ + 0.006192460190504789, + 0.00019942648941650987, + 0.00037004181649535894, + -0.0001926221593748778 + ], + "acc_eval": 0.2001953125, + "loss_eval": 2.1743006706237793, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 33.58127212524414, + 28540952.0, + 29607362.0, + 31472670.0, + 49191068.0 + ], + "hidden_norms_avg": [ + 1259.4189453125, + 40550800.0, + 43364984.0, + 45506960.0, + 56297104.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018638238543644547, + 5.299162220140374e-10, + 3.2437005859087265e-10, + 3.1624741714253446e-10, + 3.1920088794379353e-10 + ], + "bp_grad_F": [ + 0.21056434512138367, + 3.217361381757655e-06, + 5.1724125427199397e-08, + 1.390105897058902e-08, + 1.3961146017038573e-08 + ], + "gamma_dfa": 0.0018532263711676933, + "gamma_dfa_per_layer": [ + 0.006584585644304752, + 0.0006806463352404535, + 0.00032758695306256413, + -0.00017991344793699682 + ], + "acc_eval": 0.19921875, + "loss_eval": 2.167957067489624, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 33.60611343383789, + 27949698.0, + 28918304.0, + 31366946.0, + 48876736.0 + ], + "hidden_norms_avg": [ + 1260.694091796875, + 41001392.0, + 43744060.0, + 45853688.0, + 56636716.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021861983987037092, + 5.396287861003657e-10, + 3.377726154329963e-10, + 3.201852394330018e-10, + 3.237338452866112e-10 + ], + "bp_grad_F": [ + 0.12415990233421326, + 1.6796100226201816e-06, + 6.823196940786147e-08, + 1.384469427989643e-08, + 1.3965705036866893e-08 + ], + "gamma_dfa": 0.0017868579998321366, + "gamma_dfa_per_layer": [ + 0.006317156832665205, + 0.0006519090966321528, + 0.0003622731601353735, + -0.00018390709010418504 + ], + "acc_eval": 0.1953125, + "loss_eval": 2.178144931793213, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 33.620914459228516, + 27607036.0, + 28622492.0, + 31370470.0, + 48645068.0 + ], + "hidden_norms_avg": [ + 1261.64208984375, + 40948476.0, + 43773536.0, + 45888992.0, + 56623536.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002112231741193682, + 5.336073249928575e-10, + 3.533912051878474e-10, + 3.186636232666018e-10, + 3.226934830458106e-10 + ], + "bp_grad_F": [ + 0.1486925333738327, + 3.3336793876515003e-06, + 9.466339889740993e-08, + 1.4568017014937595e-08, + 1.4240884915750485e-08 + ], + "gamma_dfa": 0.0018792969822243322, + "gamma_dfa_per_layer": [ + 0.006730419583618641, + 0.000605170032940805, + 0.0003661802038550377, + -0.00018458189151715487 + ], + "acc_eval": 0.1982421875, + "loss_eval": 2.172356367111206, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 33.63143539428711, + 28410040.0, + 29532286.0, + 31697578.0, + 48914624.0 + ], + "hidden_norms_avg": [ + 1262.2918701171875, + 40698620.0, + 43622904.0, + 45764712.0, + 56531748.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002270409750053659, + 5.479600106994553e-10, + 3.2429942065093087e-10, + 3.150284755282229e-10, + 3.179212726411862e-10 + ], + "bp_grad_F": [ + 0.10118122398853302, + 2.5195840862579644e-06, + 8.798109263352671e-08, + 1.3570585544186997e-08, + 1.3736383586149259e-08 + ], + "gamma_dfa": 0.0017859039653558284, + "gamma_dfa_per_layer": [ + 0.006382801569998264, + 0.0005453285994008183, + 0.00039217708399519324, + -0.00017669139197096229 + ], + "acc_eval": 0.1943359375, + "loss_eval": 2.1648902893066406, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 33.63875961303711, + 31114778.0, + 32184654.0, + 34278688.0, + 50894352.0 + ], + "hidden_norms_avg": [ + 1262.7132568359375, + 40792528.0, + 43713536.0, + 45850224.0, + 56615416.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00019923689251299948, + 5.368823718931992e-10, + 3.306654117185559e-10, + 3.113070912164062e-10, + 3.1328556415743947e-10 + ], + "bp_grad_F": [ + 0.3573400378227234, + 1.249598790309392e-05, + 1.6106491784739774e-07, + 3.301076745287901e-08, + 1.3328084413899433e-08 + ], + "gamma_dfa": 0.0016940671957854647, + "gamma_dfa_per_layer": [ + 0.006114102900028229, + 0.0004918627091683447, + 0.00032346430816687644, + -0.00015316113422159106 + ], + "acc_eval": 0.201171875, + "loss_eval": 2.1634349822998047, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 33.642520904541016, + 31868976.0, + 32779660.0, + 35005740.0, + 51305220.0 + ], + "hidden_norms_avg": [ + 1262.9461669921875, + 41087592.0, + 43928832.0, + 46043268.0, + 56839576.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002181618328904733, + 5.162476557352136e-10, + 3.3206276617292474e-10, + 3.1130611977125966e-10, + 3.1441516057384433e-10 + ], + "bp_grad_F": [ + 0.12289460748434067, + 1.5301338862627745e-05, + 8.779379356838035e-08, + 1.4331889452989799e-08, + 1.318165843144925e-08 + ], + "gamma_dfa": 0.001529279034002684, + "gamma_dfa_per_layer": [ + 0.00539398193359375, + 0.0005496743833646178, + 0.00034435215638950467, + -0.00017089233733713627 + ], + "acc_eval": 0.2021484375, + "loss_eval": 2.164745807647705, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 33.6442756652832, + 31315430.0, + 32160978.0, + 34340796.0, + 51077484.0 + ], + "hidden_norms_avg": [ + 1263.062744140625, + 41015680.0, + 43882708.0, + 46002096.0, + 56770896.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021884885791223496, + 5.177114292820306e-10, + 3.350683897007656e-10, + 3.101042200803761e-10, + 3.12167347527037e-10 + ], + "bp_grad_F": [ + 0.11127890646457672, + 1.1515544429130387e-05, + 8.542571805492116e-08, + 1.319963871537766e-08, + 1.3264477516372608e-08 + ], + "gamma_dfa": 0.0016308917693095282, + "gamma_dfa_per_layer": [ + 0.005676542408764362, + 0.0006629846757277846, + 0.0003523063496686518, + -0.0001682663569226861 + ], + "acc_eval": 0.19921875, + "loss_eval": 2.1635866165161133, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 33.643985748291016, + 31097308.0, + 32052318.0, + 34155804.0, + 50803736.0 + ], + "hidden_norms_avg": [ + 1263.064208984375, + 40997444.0, + 43870400.0, + 45990872.0, + 56755540.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021703331731259823, + 5.1921633659191e-10, + 3.35882821556055e-10, + 3.102589296588576e-10, + 3.1300673164480486e-10 + ], + "bp_grad_F": [ + 0.1889268010854721, + 1.0328590178687591e-05, + 1.1096560825762936e-07, + 1.3215729843807367e-08, + 1.3306935997547953e-08 + ], + "gamma_dfa": 0.0016646812255203258, + "gamma_dfa_per_layer": [ + 0.005869406741112471, + 0.0006016636616550386, + 0.0003579354961402714, + -0.00017028099682647735 + ], + "acc_eval": 0.2021484375, + "loss_eval": 2.163691520690918, + "epoch": 60 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_vit_v1/snapshot_vit_s42.json b/results/snapshot_vit_v1/snapshot_vit_s42.json new file mode 100644 index 0000000..569af46 --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_vit_s42.json @@ -0,0 +1,4594 @@ +{ + "config": { + "output_dir": "results/snapshot_vit_v1", + "epochs": 60, + "lr": 0.001, + "wd": 0.05, + "seed": 42, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "hidden_norms_avg": [ + 6.008513927459717, + 7.034290313720703, + 7.942849636077881, + 8.915729522705078, + 9.635361671447754 + ], + "bp_grad_per_sample_l2_med": [ + 0.004442029166966677, + 0.0012008437188342214, + 0.0009976272704079747, + 0.0009104337659664452, + 0.0008558662957511842 + ], + "bp_grad_F": [ + 0.18535660207271576, + 0.03968670591711998, + 0.032604776322841644, + 0.029427478089928627, + 0.02746850810945034 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1376953125, + "loss_eval": 2.35188627243042, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.511958122253418, + 12.453446388244629, + 18.366989135742188, + 25.54116439819336, + 31.80699348449707 + ], + "hidden_norms_avg": [ + 4.10694694519043, + 10.166566848754883, + 14.66998291015625, + 19.93342399597168, + 25.32619857788086 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019771556835621595, + 0.00022324378369376063, + 0.00016308785416185856, + 0.00014621105219703168, + 0.0001451292191632092 + ], + "bp_grad_F": [ + 0.11066891252994537, + 0.01034498494118452, + 0.006372526753693819, + 0.0052248528227210045, + 0.005017552524805069 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4501953125, + "loss_eval": 1.5154438018798828, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.6518111824989319, + 13.549692153930664, + 20.607715606689453, + 27.90418243408203, + 32.70498275756836 + ], + "hidden_norms_avg": [ + 4.0909905433654785, + 11.942686080932617, + 17.39116096496582, + 22.200014114379883, + 26.230010986328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017800139030441642, + 0.00026728332159109414, + 0.0001720335567370057, + 0.0001423172070644796, + 0.00013423117343336344 + ], + "bp_grad_F": [ + 0.08781559765338898, + 0.010987765155732632, + 0.0064147054217755795, + 0.0050079175271093845, + 0.004637593869119883 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.494140625, + "loss_eval": 1.3824832439422607, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.755299985408783, + 11.224863052368164, + 19.053363800048828, + 27.303081512451172, + 33.078182220458984 + ], + "hidden_norms_avg": [ + 4.027151584625244, + 12.449769973754883, + 17.769508361816406, + 22.97556495666504, + 27.065759658813477 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018998769810423255, + 0.00030996452551335096, + 0.00018013815861195326, + 0.0001340982416877523, + 0.00012205552775412798 + ], + "bp_grad_F": [ + 0.09037011116743088, + 0.013488140888512135, + 0.007346263621002436, + 0.0051797907799482346, + 0.004589984193444252 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5439453125, + "loss_eval": 1.2540550231933594, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.844818651676178, + 13.648336410522461, + 20.277976989746094, + 28.240915298461914, + 33.095726013183594 + ], + "hidden_norms_avg": [ + 4.036877632141113, + 12.003630638122559, + 17.05451011657715, + 22.15869903564453, + 25.917491912841797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016167981084436178, + 0.00028610811568796635, + 0.0001777650322765112, + 0.00012878721463494003, + 0.0001112063619075343 + ], + "bp_grad_F": [ + 0.07410340011119843, + 0.012637714855372906, + 0.007633093744516373, + 0.005242784973233938, + 0.004431390203535557 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.1045944690704346, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.9051892161369324, + 12.476008415222168, + 19.24710464477539, + 27.6123046875, + 32.35737609863281 + ], + "hidden_norms_avg": [ + 4.138596057891846, + 12.409324645996094, + 17.427003860473633, + 22.245147705078125, + 25.471385955810547 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016044765943661332, + 0.00030248358962126076, + 0.00018807635933626443, + 0.00013626758300233632, + 0.00011398641800042242 + ], + "bp_grad_F": [ + 0.08322811126708984, + 0.01390017382800579, + 0.008505746722221375, + 0.005747759714722633, + 0.004776888992637396 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.1296963691711426, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.9687634110450745, + 11.625859260559082, + 18.38014793395996, + 26.869504928588867, + 31.455507278442383 + ], + "hidden_norms_avg": [ + 4.263001441955566, + 13.1234769821167, + 17.853057861328125, + 22.476547241210938, + 25.29656410217285 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015340449754148722, + 0.00033552697277627885, + 0.00021536082203965634, + 0.00015067037020344287, + 0.00012220896314829588 + ], + "bp_grad_F": [ + 0.07571946829557419, + 0.015132292173802853, + 0.009512492455542088, + 0.006373303942382336, + 0.005029390100389719 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.0963702201843262, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 1.0029383897781372, + 12.687585830688477, + 19.734830856323242, + 28.174379348754883, + 32.5982780456543 + ], + "hidden_norms_avg": [ + 4.357974052429199, + 13.182960510253906, + 17.720989227294922, + 21.832895278930664, + 24.934776306152344 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013370191445574164, + 0.00026788320974446833, + 0.00018144956266041845, + 0.00013219293032307178, + 0.00010196284711128101 + ], + "bp_grad_F": [ + 0.06996501982212067, + 0.013071151450276375, + 0.008477694354951382, + 0.0061036222614347935, + 0.004761465825140476 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 0.9737913012504578, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 1.043707013130188, + 12.487404823303223, + 18.845643997192383, + 26.870864868164062, + 31.145292282104492 + ], + "hidden_norms_avg": [ + 4.454991340637207, + 13.503378868103027, + 18.694488525390625, + 23.029804229736328, + 25.810880661010742 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013130803126841784, + 0.00029930632445029914, + 0.0002022052649408579, + 0.0001383959170198068, + 0.00010439592006150633 + ], + "bp_grad_F": [ + 0.0743240937590599, + 0.015402271412312984, + 0.009977605193853378, + 0.006877230014652014, + 0.005202346481382847 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.666015625, + "loss_eval": 0.9317076206207275, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 1.0887501239776611, + 12.662396430969238, + 18.622724533081055, + 26.599454879760742, + 31.788663864135742 + ], + "hidden_norms_avg": [ + 4.529710292816162, + 13.683384895324707, + 18.47463607788086, + 22.395898818969727, + 25.244558334350586 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012017677072435617, + 0.0002972102665808052, + 0.00019775003602262586, + 0.00013734954700339586, + 9.880279685603455e-05 + ], + "bp_grad_F": [ + 0.0661192312836647, + 0.01516024675220251, + 0.010001113638281822, + 0.006893018260598183, + 0.0051134442910552025 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6669921875, + "loss_eval": 0.9026263952255249, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 1.1163448095321655, + 12.711283683776855, + 18.790128707885742, + 26.846359252929688, + 31.663158416748047 + ], + "hidden_norms_avg": [ + 4.502295970916748, + 13.801639556884766, + 18.488975524902344, + 22.378704071044922, + 25.22056007385254 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011062510311603546, + 0.00029147896566428244, + 0.0001970102748600766, + 0.00013174059859011322, + 0.0001037597976392135 + ], + "bp_grad_F": [ + 0.06217500939965248, + 0.014721231535077095, + 0.00993143580853939, + 0.006723989732563496, + 0.005166618153452873 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6845703125, + "loss_eval": 0.8660677671432495, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 1.1505078077316284, + 12.160571098327637, + 18.15353012084961, + 25.762012481689453, + 31.478300094604492 + ], + "hidden_norms_avg": [ + 4.5605149269104, + 13.918573379516602, + 18.88881492614746, + 22.79344940185547, + 25.800094604492188 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009689349099062383, + 0.0002486997109372169, + 0.0001736732665449381, + 0.00011473154881969094, + 8.573567902203649e-05 + ], + "bp_grad_F": [ + 0.06455213576555252, + 0.01547171175479889, + 0.010573537088930607, + 0.0071961241774261, + 0.005212985444813967 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.71484375, + "loss_eval": 0.812907874584198, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 1.1844152212142944, + 11.332664489746094, + 16.57625961303711, + 23.82307243347168, + 28.492321014404297 + ], + "hidden_norms_avg": [ + 4.602160453796387, + 13.876313209533691, + 17.891036987304688, + 21.410982131958008, + 23.97108268737793 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009290817542932928, + 0.0002613075776025653, + 0.0001877332106232643, + 0.0001262558507733047, + 9.168039832729846e-05 + ], + "bp_grad_F": [ + 0.06392678618431091, + 0.01674485206604004, + 0.011727217584848404, + 0.007738997228443623, + 0.005730107892304659 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7197265625, + "loss_eval": 0.7641609907150269, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 1.2184560298919678, + 12.450925827026367, + 18.076860427856445, + 25.162586212158203, + 30.365047454833984 + ], + "hidden_norms_avg": [ + 4.7080278396606445, + 13.851634979248047, + 18.517131805419922, + 22.074214935302734, + 24.72054100036621 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009277731878682971, + 0.00024563330225646496, + 0.00017736255540512502, + 0.00012202116340631619, + 8.748921391088516e-05 + ], + "bp_grad_F": [ + 0.06389915198087692, + 0.016115156933665276, + 0.0110858753323555, + 0.0076499818824231625, + 0.005541808437556028 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.697265625, + "loss_eval": 0.8037601113319397, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 1.243064045906067, + 11.932015419006348, + 17.215856552124023, + 24.764291763305664, + 29.49314308166504 + ], + "hidden_norms_avg": [ + 4.651937961578369, + 13.890728950500488, + 18.2476749420166, + 21.80103302001953, + 24.145692825317383 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009111211402341723, + 0.000253814272582531, + 0.00018247529806103557, + 0.00011639296280918643, + 8.364167297258973e-05 + ], + "bp_grad_F": [ + 0.06324896216392517, + 0.016394753009080887, + 0.01153184287250042, + 0.007614497095346451, + 0.0056136660277843475 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.728515625, + "loss_eval": 0.7384279370307922, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 1.2652677297592163, + 11.532588005065918, + 16.7224178314209, + 23.326444625854492, + 28.03766441345215 + ], + "hidden_norms_avg": [ + 4.652615547180176, + 13.981542587280273, + 17.984512329101562, + 21.317432403564453, + 23.233760833740234 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008032417972572148, + 0.00022395161795429885, + 0.00016904002404771745, + 0.0001078559216693975, + 7.841538899810985e-05 + ], + "bp_grad_F": [ + 0.06386830657720566, + 0.016731705516576767, + 0.012135310098528862, + 0.008108492009341717, + 0.006046997383236885 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7333984375, + "loss_eval": 0.7387630939483643, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 1.2944419384002686, + 11.34481430053711, + 16.45362091064453, + 22.63861846923828, + 28.011232376098633 + ], + "hidden_norms_avg": [ + 4.738389015197754, + 13.769956588745117, + 17.63072395324707, + 21.14189338684082, + 23.455045700073242 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007927753031253815, + 0.0002345799293834716, + 0.00016934113227762282, + 0.00011508075840538368, + 7.966109114931896e-05 + ], + "bp_grad_F": [ + 0.0655454769730568, + 0.01815187744796276, + 0.013005951419472694, + 0.008820701390504837, + 0.006184164900332689 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7255859375, + "loss_eval": 0.7302451133728027, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 1.3085625171661377, + 11.323317527770996, + 15.866230964660645, + 21.746976852416992, + 27.081127166748047 + ], + "hidden_norms_avg": [ + 4.687533855438232, + 13.471115112304688, + 17.396968841552734, + 20.327377319335938, + 22.58539581298828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006625292589887977, + 0.00019486426026560366, + 0.00014659677981399, + 9.787825547391549e-05, + 6.321907130768523e-05 + ], + "bp_grad_F": [ + 0.07393868267536163, + 0.020178642123937607, + 0.014442694373428822, + 0.009784683585166931, + 0.00656729843467474 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7412109375, + "loss_eval": 0.7063955068588257, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 1.3433176279067993, + 10.762125968933105, + 15.129413604736328, + 21.06867790222168, + 26.1944522857666 + ], + "hidden_norms_avg": [ + 4.709607124328613, + 13.69739055633545, + 17.006061553955078, + 19.97213363647461, + 22.212177276611328 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006978239398449659, + 0.00021396303782239556, + 0.00016030693950597197, + 0.00010856003791559488, + 6.917239079484716e-05 + ], + "bp_grad_F": [ + 0.06653428077697754, + 0.019508732482790947, + 0.014456766657531261, + 0.010107609443366528, + 0.006681134924292564 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.75, + "loss_eval": 0.6990396976470947, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 1.3607734441757202, + 10.718966484069824, + 15.383923530578613, + 21.34387969970703, + 26.49329376220703 + ], + "hidden_norms_avg": [ + 4.7122907638549805, + 13.804581642150879, + 17.532636642456055, + 20.843929290771484, + 23.01592254638672 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007053805165924132, + 0.0002122409496223554, + 0.00016182110994122922, + 0.00011085433652624488, + 7.204789289971814e-05 + ], + "bp_grad_F": [ + 0.06105736270546913, + 0.017779415473341942, + 0.013269647024571896, + 0.009227588772773743, + 0.006410240661352873 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.6498311758041382, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 1.3752704858779907, + 10.530582427978516, + 14.803340911865234, + 20.217910766601562, + 25.20522689819336 + ], + "hidden_norms_avg": [ + 4.7595720291137695, + 13.601245880126953, + 17.491943359375, + 20.960437774658203, + 22.910301208496094 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006476694834418595, + 0.00020479912927839905, + 0.0001524801627965644, + 0.00010630583710735664, + 6.906194903422147e-05 + ], + "bp_grad_F": [ + 0.06572327762842178, + 0.019566379487514496, + 0.01484121847897768, + 0.010426007211208344, + 0.006943442393094301 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.763671875, + "loss_eval": 0.6451045274734497, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 1.394100546836853, + 9.805717468261719, + 14.102628707885742, + 19.18745231628418, + 24.205224990844727 + ], + "hidden_norms_avg": [ + 4.746951580047607, + 13.343804359436035, + 16.609134674072266, + 19.829851150512695, + 21.580671310424805 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006192427244968712, + 0.0002108582411892712, + 0.0001636892993701622, + 0.0001098570428439416, + 6.864540046080947e-05 + ], + "bp_grad_F": [ + 0.06809430569410324, + 0.02151457779109478, + 0.01606965810060501, + 0.011247958056628704, + 0.007375919260084629 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7705078125, + "loss_eval": 0.6522111892700195, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 1.4160058498382568, + 9.728543281555176, + 13.389554977416992, + 18.542705535888672, + 23.791994094848633 + ], + "hidden_norms_avg": [ + 4.738738536834717, + 13.15449333190918, + 16.28533172607422, + 19.581254959106445, + 21.488550186157227 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006278376094996929, + 0.00020051853789482266, + 0.00015803576388861984, + 0.0001043542506522499, + 6.271857273532078e-05 + ], + "bp_grad_F": [ + 0.07535671442747116, + 0.02472539246082306, + 0.01880054548382759, + 0.012977317906916142, + 0.007879889570176601 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.767578125, + "loss_eval": 0.6732022762298584, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 1.4301073551177979, + 9.656251907348633, + 13.501574516296387, + 18.518707275390625, + 23.49370574951172 + ], + "hidden_norms_avg": [ + 4.7338972091674805, + 12.90231704711914, + 15.899849891662598, + 18.982860565185547, + 20.785310745239258 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005697127780877054, + 0.00018775691569317132, + 0.00014216902491170913, + 9.182754729408771e-05, + 5.984708695905283e-05 + ], + "bp_grad_F": [ + 0.07130222022533417, + 0.023520665243268013, + 0.017786188051104546, + 0.012143870815634727, + 0.007813607342541218 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.6380050182342529, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 1.4623057842254639, + 10.028787612915039, + 13.687016487121582, + 18.426584243774414, + 23.602413177490234 + ], + "hidden_norms_avg": [ + 4.807516574859619, + 12.739899635314941, + 16.150466918945312, + 19.439754486083984, + 21.316791534423828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005416463245637715, + 0.00019103426893707365, + 0.00014568559709005058, + 9.899997530737892e-05, + 6.29485584795475e-05 + ], + "bp_grad_F": [ + 0.07191846519708633, + 0.023787740617990494, + 0.01782786287367344, + 0.012350695207715034, + 0.007955120876431465 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7841796875, + "loss_eval": 0.6439570784568787, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 1.4565976858139038, + 9.294268608093262, + 12.656200408935547, + 17.385971069335938, + 21.959299087524414 + ], + "hidden_norms_avg": [ + 4.774696350097656, + 12.394432067871094, + 15.230389595031738, + 18.10796356201172, + 19.88006591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005462650442495942, + 0.00019751323270611465, + 0.00015244862879626453, + 0.00010562407260295004, + 6.40779035165906e-05 + ], + "bp_grad_F": [ + 0.07698184996843338, + 0.026412304490804672, + 0.02022000029683113, + 0.013991317711770535, + 0.008763212710618973 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7568359375, + "loss_eval": 0.6531677842140198, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 1.4813296794891357, + 9.043482780456543, + 12.308734893798828, + 16.513948440551758, + 21.061283111572266 + ], + "hidden_norms_avg": [ + 4.7356462478637695, + 12.33294677734375, + 15.104657173156738, + 17.771398544311523, + 19.526002883911133 + ], + "bp_grad_per_sample_l2_med": [ + 0.000557436200324446, + 0.0002021614054683596, + 0.0001567570143379271, + 0.00010984922846546397, + 6.634221062995493e-05 + ], + "bp_grad_F": [ + 0.07777652144432068, + 0.027695877477526665, + 0.021396547555923462, + 0.015052770264446735, + 0.009372876025736332 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7744140625, + "loss_eval": 0.6539995074272156, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 1.4828969240188599, + 8.677760124206543, + 12.009501457214355, + 16.262908935546875, + 20.79404067993164 + ], + "hidden_norms_avg": [ + 4.744379043579102, + 12.125540733337402, + 14.89413833618164, + 17.47431182861328, + 18.953710556030273 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005026232684031129, + 0.00019721532589755952, + 0.00014348917466122657, + 0.00010225686855847016, + 5.8645866374718025e-05 + ], + "bp_grad_F": [ + 0.0830698236823082, + 0.03011341392993927, + 0.023107260465621948, + 0.016188694164156914, + 0.00968033168464899 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7744140625, + "loss_eval": 0.6444424390792847, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 1.5019822120666504, + 9.1107816696167, + 12.172623634338379, + 16.5975341796875, + 20.453947067260742 + ], + "hidden_norms_avg": [ + 4.741573333740234, + 12.045503616333008, + 14.836026191711426, + 17.666833877563477, + 19.175966262817383 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005040269461460412, + 0.00019225970027036965, + 0.0001496450131526217, + 0.00010478955664439127, + 6.137428135843948e-05 + ], + "bp_grad_F": [ + 0.07822537422180176, + 0.02863621897995472, + 0.022284477949142456, + 0.01552330981940031, + 0.009474868886172771 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.6074927449226379, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 1.5009087324142456, + 8.223862648010254, + 11.225082397460938, + 15.531359672546387, + 19.848068237304688 + ], + "hidden_norms_avg": [ + 4.69788122177124, + 11.848491668701172, + 14.342337608337402, + 16.882020950317383, + 18.197385787963867 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004685261519625783, + 0.00017912790644913912, + 0.00013862684136256576, + 9.223359666066244e-05, + 5.140554640092887e-05 + ], + "bp_grad_F": [ + 0.09127916395664215, + 0.03443564847111702, + 0.026544470340013504, + 0.01809101179242134, + 0.010493002831935883 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.6329880952835083, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 1.509100079536438, + 8.238924980163574, + 10.995248794555664, + 14.927000045776367, + 19.032428741455078 + ], + "hidden_norms_avg": [ + 4.678654193878174, + 11.513160705566406, + 14.12202262878418, + 16.704364776611328, + 18.131078720092773 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004594121128320694, + 0.00018182865460403264, + 0.000145129015436396, + 0.00010142508108401671, + 5.208289803704247e-05 + ], + "bp_grad_F": [ + 0.09080124646425247, + 0.03489048779010773, + 0.027099598199129105, + 0.018760183826088905, + 0.010796112939715385 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.625268816947937, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 1.503785252571106, + 7.896090030670166, + 10.495330810546875, + 14.530640602111816, + 18.728647232055664 + ], + "hidden_norms_avg": [ + 4.70166540145874, + 11.420204162597656, + 13.774767875671387, + 16.2652530670166, + 17.631481170654297 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043488750816322863, + 0.00017315168224740773, + 0.0001335645210929215, + 8.99006481631659e-05, + 5.126056930748746e-05 + ], + "bp_grad_F": [ + 0.10076858103275299, + 0.039271026849746704, + 0.0300181582570076, + 0.020545953884720802, + 0.011564387008547783 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.771484375, + "loss_eval": 0.6479744911193848, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 1.505173921585083, + 7.728392124176025, + 10.420252799987793, + 14.133453369140625, + 18.110719680786133 + ], + "hidden_norms_avg": [ + 4.7109880447387695, + 11.242951393127441, + 13.997397422790527, + 16.60598373413086, + 17.915313720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00040974540752358735, + 0.0001792571711121127, + 0.00014464404375758022, + 9.883226448437199e-05, + 5.038536983192898e-05 + ], + "bp_grad_F": [ + 0.09923475980758667, + 0.039516862481832504, + 0.03056514263153076, + 0.021311543881893158, + 0.011838918551802635 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7880859375, + "loss_eval": 0.6011433601379395, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 1.5013800859451294, + 7.8755106925964355, + 10.452071189880371, + 14.013816833496094, + 17.622900009155273 + ], + "hidden_norms_avg": [ + 4.662457466125488, + 11.018245697021484, + 13.179399490356445, + 15.56103515625, + 16.739452362060547 + ], + "bp_grad_per_sample_l2_med": [ + 0.00033098450512625277, + 0.0001421417691744864, + 0.00011021740647265688, + 7.645406731171533e-05, + 4.017115134047344e-05 + ], + "bp_grad_F": [ + 0.09463275969028473, + 0.03948793560266495, + 0.03067062795162201, + 0.021538278087973595, + 0.012101472355425358 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8076171875, + "loss_eval": 0.5846524238586426, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 1.5032685995101929, + 7.549060344696045, + 10.04562759399414, + 13.609556198120117, + 17.36180877685547 + ], + "hidden_norms_avg": [ + 4.688360214233398, + 11.03510856628418, + 13.660865783691406, + 16.024188995361328, + 17.242145538330078 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003352685598656535, + 0.0001500560319982469, + 0.000116633229481522, + 8.394405449507758e-05, + 4.0652244933880866e-05 + ], + "bp_grad_F": [ + 0.10540100187063217, + 0.044482193887233734, + 0.03421863541007042, + 0.023781608790159225, + 0.012753129936754704 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7861328125, + "loss_eval": 0.5960580110549927, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 1.5032752752304077, + 7.387601375579834, + 9.652260780334473, + 13.042936325073242, + 16.688335418701172 + ], + "hidden_norms_avg": [ + 4.644099235534668, + 10.739524841308594, + 13.165095329284668, + 15.435381889343262, + 16.59172248840332 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003447248600423336, + 0.0001518868375569582, + 0.00012246235564816743, + 8.41514120111242e-05, + 4.193704080535099e-05 + ], + "bp_grad_F": [ + 0.11063266545534134, + 0.04730832949280739, + 0.03743334487080574, + 0.02577192150056362, + 0.01377912238240242 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78515625, + "loss_eval": 0.652167797088623, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 1.4935848712921143, + 7.262828826904297, + 9.431328773498535, + 12.742668151855469, + 16.348758697509766 + ], + "hidden_norms_avg": [ + 4.6145453453063965, + 10.670759201049805, + 12.641580581665039, + 14.64714241027832, + 15.685794830322266 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003325030847918242, + 0.00014367286348715425, + 0.00011324919614708051, + 7.871988782426342e-05, + 4.058879494550638e-05 + ], + "bp_grad_F": [ + 0.11436768621206284, + 0.04893247410655022, + 0.03840672969818115, + 0.02707456797361374, + 0.014087510295212269 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7978515625, + "loss_eval": 0.6156834363937378, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 1.4897189140319824, + 7.156031608581543, + 9.365946769714355, + 12.499292373657227, + 15.942588806152344 + ], + "hidden_norms_avg": [ + 4.635710716247559, + 10.602685928344727, + 12.637743949890137, + 14.74621868133545, + 15.834792137145996 + ], + "bp_grad_per_sample_l2_med": [ + 0.000299928622553125, + 0.00013245265290606767, + 0.00010241761629004031, + 7.247657049447298e-05, + 3.780105180339888e-05 + ], + "bp_grad_F": [ + 0.11267601698637009, + 0.0501401461660862, + 0.03941003605723381, + 0.0279407799243927, + 0.014723201282322407 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.80078125, + "loss_eval": 0.5903886556625366, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 1.4791479110717773, + 7.027911186218262, + 9.0321044921875, + 12.123476028442383, + 15.987238883972168 + ], + "hidden_norms_avg": [ + 4.5436177253723145, + 10.157598495483398, + 12.115620613098145, + 14.023022651672363, + 15.130277633666992 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002464659046381712, + 0.00011603213351918384, + 9.401622082805261e-05, + 6.44488463876769e-05, + 2.8129303245805204e-05 + ], + "bp_grad_F": [ + 0.1319781094789505, + 0.05854209512472153, + 0.04639327526092529, + 0.03260229155421257, + 0.01578359492123127 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7841796875, + "loss_eval": 0.6532921195030212, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 1.4722236394882202, + 6.847982406616211, + 9.039284706115723, + 11.94421672821045, + 15.479789733886719 + ], + "hidden_norms_avg": [ + 4.536457538604736, + 10.0848388671875, + 11.944480895996094, + 13.931117057800293, + 15.018562316894531 + ], + "bp_grad_per_sample_l2_med": [ + 0.00023636725381948054, + 0.00011084756260970607, + 8.837366476655006e-05, + 6.370043411152437e-05, + 3.0101380616542883e-05 + ], + "bp_grad_F": [ + 0.1352969855070114, + 0.06069062277674675, + 0.04737559333443642, + 0.03317096084356308, + 0.016367904841899872 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.6675163507461548, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 1.4741134643554688, + 6.7887864112854, + 8.833945274353027, + 11.777705192565918, + 15.091635704040527 + ], + "hidden_norms_avg": [ + 4.546427249908447, + 10.082904815673828, + 11.992964744567871, + 14.035684585571289, + 15.085047721862793 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002497230307199061, + 0.00011889061715919524, + 9.627552208257839e-05, + 6.80557859595865e-05, + 3.187589391018264e-05 + ], + "bp_grad_F": [ + 0.13283543288707733, + 0.06097453087568283, + 0.047521013766527176, + 0.033583469688892365, + 0.016502397134900093 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7998046875, + "loss_eval": 0.6332878470420837, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 1.4732073545455933, + 6.690948009490967, + 8.623305320739746, + 11.383458137512207, + 14.868409156799316 + ], + "hidden_norms_avg": [ + 4.510478973388672, + 9.772372245788574, + 11.55829906463623, + 13.379657745361328, + 14.343344688415527 + ], + "bp_grad_per_sample_l2_med": [ + 0.00019870084361173213, + 0.00010116927296621725, + 8.329773845616728e-05, + 6.15280878264457e-05, + 2.8435944841476157e-05 + ], + "bp_grad_F": [ + 0.13917136192321777, + 0.06636927276849747, + 0.05231080949306488, + 0.0366261750459671, + 0.017451239749789238 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8017578125, + "loss_eval": 0.6271109580993652, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 1.4620546102523804, + 6.489831924438477, + 8.487679481506348, + 11.202116966247559, + 14.761962890625 + ], + "hidden_norms_avg": [ + 4.5009870529174805, + 9.717012405395508, + 11.480990409851074, + 13.235471725463867, + 14.178875923156738 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015383858408313245, + 8.131976937875152e-05, + 6.472255336120725e-05, + 4.378501034807414e-05, + 1.9541592337191105e-05 + ], + "bp_grad_F": [ + 0.1546960175037384, + 0.07402726262807846, + 0.058267489075660706, + 0.041084613651037216, + 0.018521569669246674 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.6767467260360718, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 1.4651520252227783, + 6.564362525939941, + 8.296653747558594, + 11.014183044433594, + 14.418519973754883 + ], + "hidden_norms_avg": [ + 4.483984470367432, + 9.593335151672363, + 11.23758316040039, + 13.036303520202637, + 14.015531539916992 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002037636877503246, + 0.00010235400259261951, + 8.395169425057247e-05, + 5.674947897205129e-05, + 2.5295201339758933e-05 + ], + "bp_grad_F": [ + 0.15471766889095306, + 0.07422170042991638, + 0.05941145122051239, + 0.04111991077661514, + 0.018912144005298615 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8037109375, + "loss_eval": 0.6682149171829224, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 1.457137107849121, + 6.368557929992676, + 8.152215957641602, + 10.783031463623047, + 14.167640686035156 + ], + "hidden_norms_avg": [ + 4.462830066680908, + 9.585762977600098, + 11.208064079284668, + 13.065739631652832, + 13.993027687072754 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016671593766659498, + 8.65811962285079e-05, + 7.217681559268385e-05, + 5.042032353230752e-05, + 2.1260022549540736e-05 + ], + "bp_grad_F": [ + 0.15730538964271545, + 0.07605564594268799, + 0.06052647903561592, + 0.04247846081852913, + 0.01923321560025215 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8134765625, + "loss_eval": 0.6757298111915588, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 1.4529122114181519, + 6.260828018188477, + 8.032843589782715, + 10.586301803588867, + 13.950445175170898 + ], + "hidden_norms_avg": [ + 4.4613800048828125, + 9.4591646194458, + 11.012088775634766, + 12.760184288024902, + 13.692852973937988 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001344321499345824, + 6.65406696498394e-05, + 5.5920852901181206e-05, + 3.9107719203457236e-05, + 1.5611329217790626e-05 + ], + "bp_grad_F": [ + 0.1660272479057312, + 0.08182978630065918, + 0.06507853418588638, + 0.046549297869205475, + 0.020592277869582176 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.806640625, + "loss_eval": 0.685518205165863, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 1.4509673118591309, + 6.163156032562256, + 7.82518196105957, + 10.378498077392578, + 13.96407699584961 + ], + "hidden_norms_avg": [ + 4.434635162353516, + 9.335474967956543, + 10.857998847961426, + 12.551763534545898, + 13.511585235595703 + ], + "bp_grad_per_sample_l2_med": [ + 0.00011230952804908156, + 5.540825441130437e-05, + 4.5063996367389336e-05, + 2.9814285881002434e-05, + 1.1903831364179496e-05 + ], + "bp_grad_F": [ + 0.1772848516702652, + 0.08942516893148422, + 0.07126298546791077, + 0.04956020042300224, + 0.021146513521671295 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7958984375, + "loss_eval": 0.69295334815979, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 1.4527415037155151, + 6.165233612060547, + 7.756027698516846, + 10.242467880249023, + 13.45471477508545 + ], + "hidden_norms_avg": [ + 4.438976287841797, + 9.343517303466797, + 10.836493492126465, + 12.435514450073242, + 13.287426948547363 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001074640967999585, + 5.268112363410182e-05, + 4.352951145847328e-05, + 3.164535519317724e-05, + 1.2792614143108949e-05 + ], + "bp_grad_F": [ + 0.17606250941753387, + 0.08888891339302063, + 0.07090400159358978, + 0.05056491121649742, + 0.021766021847724915 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.806640625, + "loss_eval": 0.6969807147979736, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 1.4455187320709229, + 6.104230880737305, + 7.606966972351074, + 10.056215286254883, + 13.531522750854492 + ], + "hidden_norms_avg": [ + 4.394144535064697, + 9.197455406188965, + 10.598797798156738, + 12.198134422302246, + 13.1181001663208 + ], + "bp_grad_per_sample_l2_med": [ + 9.084033081308007e-05, + 4.605063077178784e-05, + 3.957438457291573e-05, + 2.727917853917461e-05, + 1.0920393833657727e-05 + ], + "bp_grad_F": [ + 0.1919114887714386, + 0.09742862731218338, + 0.07786751538515091, + 0.05414625629782677, + 0.022070109844207764 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.810546875, + "loss_eval": 0.713995635509491, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 1.4383388757705688, + 6.067695617675781, + 7.595578670501709, + 9.960418701171875, + 13.367838859558105 + ], + "hidden_norms_avg": [ + 4.4121479988098145, + 9.207226753234863, + 10.62590217590332, + 12.186077117919922, + 13.054762840270996 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010577002831269056, + 5.2172203140798956e-05, + 4.119141885894351e-05, + 2.997498268086929e-05, + 1.1721556802513078e-05 + ], + "bp_grad_F": [ + 0.19711492955684662, + 0.09961695969104767, + 0.07941404730081558, + 0.05621125549077988, + 0.02285071834921837 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7998046875, + "loss_eval": 0.7457866668701172, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 1.438454270362854, + 6.097946643829346, + 7.5858659744262695, + 9.956851959228516, + 13.270756721496582 + ], + "hidden_norms_avg": [ + 4.392654895782471, + 9.144302368164062, + 10.536030769348145, + 12.092294692993164, + 12.985077857971191 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010758326970972121, + 5.274294744594954e-05, + 4.421125413500704e-05, + 3.0753104510949925e-05, + 1.1889996130776126e-05 + ], + "bp_grad_F": [ + 0.19883227348327637, + 0.1017213836312294, + 0.0807848572731018, + 0.056292060762643814, + 0.022987989708781242 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7998046875, + "loss_eval": 0.7402137517929077, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 1.4367005825042725, + 6.004332542419434, + 7.504194259643555, + 9.782310485839844, + 13.125389099121094 + ], + "hidden_norms_avg": [ + 4.3845720291137695, + 9.06988525390625, + 10.41169548034668, + 11.905806541442871, + 12.784433364868164 + ], + "bp_grad_per_sample_l2_med": [ + 9.236831829184666e-05, + 4.803440242540091e-05, + 3.901722448063083e-05, + 2.752364525804296e-05, + 1.1449340490798932e-05 + ], + "bp_grad_F": [ + 0.19664740562438965, + 0.10213448107242584, + 0.08124449104070663, + 0.05709528177976608, + 0.023260990157723427 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8017578125, + "loss_eval": 0.732274055480957, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 1.4371269941329956, + 5.965888500213623, + 7.401495933532715, + 9.748833656311035, + 13.274619102478027 + ], + "hidden_norms_avg": [ + 4.380629539489746, + 9.019668579101562, + 10.396828651428223, + 11.923394203186035, + 12.77461051940918 + ], + "bp_grad_per_sample_l2_med": [ + 7.760760490782559e-05, + 4.048245318699628e-05, + 3.216555342078209e-05, + 2.2310470740194432e-05, + 8.838631401886232e-06 + ], + "bp_grad_F": [ + 0.20731569826602936, + 0.10790340602397919, + 0.08557390421628952, + 0.059937626123428345, + 0.023827020078897476 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8046875, + "loss_eval": 0.7751725316047668, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 1.4341260194778442, + 5.9393768310546875, + 7.411903381347656, + 9.739734649658203, + 13.19786548614502 + ], + "hidden_norms_avg": [ + 4.378067493438721, + 8.986294746398926, + 10.316237449645996, + 11.792922019958496, + 12.673585891723633 + ], + "bp_grad_per_sample_l2_med": [ + 6.968516390770674e-05, + 3.471451054792851e-05, + 2.8814916731789708e-05, + 1.9318980776006356e-05, + 7.639268915227149e-06 + ], + "bp_grad_F": [ + 0.2137812376022339, + 0.11110929399728775, + 0.08847261965274811, + 0.06186935305595398, + 0.024307044222950935 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8056640625, + "loss_eval": 0.764312744140625, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 1.4324616193771362, + 5.883492469787598, + 7.319663047790527, + 9.547243118286133, + 13.008822441101074 + ], + "hidden_norms_avg": [ + 4.376597881317139, + 8.99113941192627, + 10.321625709533691, + 11.771256446838379, + 12.628817558288574 + ], + "bp_grad_per_sample_l2_med": [ + 7.972177991177887e-05, + 3.871036460623145e-05, + 3.142197601846419e-05, + 2.2371379600372165e-05, + 8.571933904022444e-06 + ], + "bp_grad_F": [ + 0.21534259617328644, + 0.11241323500871658, + 0.08915204554796219, + 0.06287811696529388, + 0.024627922102808952 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7958984375, + "loss_eval": 0.7731261253356934, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 1.4321078062057495, + 5.858248710632324, + 7.306819915771484, + 9.56387996673584, + 13.071084022521973 + ], + "hidden_norms_avg": [ + 4.371452808380127, + 8.94082260131836, + 10.26811695098877, + 11.765360832214355, + 12.617104530334473 + ], + "bp_grad_per_sample_l2_med": [ + 7.236401870613918e-05, + 3.8528516597580165e-05, + 3.0984694603830576e-05, + 2.1565809220192023e-05, + 7.989257937879302e-06 + ], + "bp_grad_F": [ + 0.2197490781545639, + 0.1155213937163353, + 0.09188564866781235, + 0.06453806161880493, + 0.024861471727490425 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7958984375, + "loss_eval": 0.7778797149658203, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 1.4319349527359009, + 5.846956253051758, + 7.283481121063232, + 9.520010948181152, + 13.023626327514648 + ], + "hidden_norms_avg": [ + 4.372097969055176, + 8.950923919677734, + 10.25277328491211, + 11.715353012084961, + 12.572748184204102 + ], + "bp_grad_per_sample_l2_med": [ + 6.399707490345463e-05, + 3.384953743079677e-05, + 2.7512824090081267e-05, + 1.8538266886025667e-05, + 7.2009356699709315e-06 + ], + "bp_grad_F": [ + 0.21942120790481567, + 0.11553706228733063, + 0.09221186488866806, + 0.06456339359283447, + 0.024819573387503624 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.798828125, + "loss_eval": 0.7808230519294739, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 1.4311723709106445, + 5.84969425201416, + 7.275974273681641, + 9.513206481933594, + 12.99256420135498 + ], + "hidden_norms_avg": [ + 4.37282133102417, + 8.946002006530762, + 10.248116493225098, + 11.702008247375488, + 12.54873275756836 + ], + "bp_grad_per_sample_l2_med": [ + 6.404191663023084e-05, + 3.509471571305767e-05, + 2.9476050258381292e-05, + 1.9310447896714322e-05, + 7.2306984293391e-06 + ], + "bp_grad_F": [ + 0.22379544377326965, + 0.11763197183609009, + 0.09364764392375946, + 0.06539658457040787, + 0.02503892220556736 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.80078125, + "loss_eval": 0.7862963080406189, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 1.4306355714797974, + 5.837501049041748, + 7.250905990600586, + 9.502866744995117, + 13.022948265075684 + ], + "hidden_norms_avg": [ + 4.368107795715332, + 8.927281379699707, + 10.20923900604248, + 11.650206565856934, + 12.504077911376953 + ], + "bp_grad_per_sample_l2_med": [ + 7.216054655145854e-05, + 3.7455520214280114e-05, + 3.0207094823708758e-05, + 2.1436455426737666e-05, + 7.401154562103329e-06 + ], + "bp_grad_F": [ + 0.22603340446949005, + 0.11918352544307709, + 0.0947541669011116, + 0.06624340265989304, + 0.02514214999973774 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8017578125, + "loss_eval": 0.7883187532424927, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 1.4303507804870605, + 5.833686351776123, + 7.24592399597168, + 9.48628044128418, + 12.962425231933594 + ], + "hidden_norms_avg": [ + 4.368690013885498, + 8.926249504089355, + 10.21507453918457, + 11.65561294555664, + 12.507142066955566 + ], + "bp_grad_per_sample_l2_med": [ + 6.914411642355844e-05, + 3.7666370189981535e-05, + 3.0613842682214454e-05, + 2.0578616386046633e-05, + 7.153785645641619e-06 + ], + "bp_grad_F": [ + 0.22665317356586456, + 0.1197197362780571, + 0.09526386857032776, + 0.06651060283184052, + 0.02521701157093048 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.798828125, + "loss_eval": 0.7879265546798706, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 1.430293083190918, + 5.832674026489258, + 7.243373394012451, + 9.484408378601074, + 12.968917846679688 + ], + "hidden_norms_avg": [ + 4.368374347686768, + 8.92542552947998, + 10.214056015014648, + 11.65438175201416, + 12.507084846496582 + ], + "bp_grad_per_sample_l2_med": [ + 6.862521695438772e-05, + 3.740868851309642e-05, + 3.050716986763291e-05, + 2.0533103452180512e-05, + 7.137502961995779e-06 + ], + "bp_grad_F": [ + 0.22697713971138, + 0.11988355964422226, + 0.09540446847677231, + 0.06659507006406784, + 0.025233659893274307 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.798828125, + "loss_eval": 0.7890625, + "epoch": 60 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "hidden_norms_avg": [ + 6.008513927459717, + 7.034290313720703, + 7.942849636077881, + 8.915729522705078, + 9.635361671447754 + ], + "bp_grad_per_sample_l2_med": [ + 0.004442029166966677, + 0.0012008437188342214, + 0.0009976272704079747, + 0.0009104337659664452, + 0.0008558662957511842 + ], + "bp_grad_F": [ + 0.18535660207271576, + 0.03968670591711998, + 0.032604776322841644, + 0.029427478089928627, + 0.02746850810945034 + ], + "gamma_dfa": 0.003905070887412876, + "gamma_dfa_per_layer": [ + 0.004920602310448885, + 0.005249542184174061, + 0.0038580193649977446, + 0.0015921196900308132 + ], + "acc_eval": 0.1376953125, + "loss_eval": 2.35188627243042, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.969543218612671, + 2409.528564453125, + 2965.8515625, + 5388.57568359375, + 10078.4892578125 + ], + "hidden_norms_avg": [ + 45.02196502685547, + 4042.294189453125, + 10780.892578125, + 14336.607421875, + 18185.720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021220046619419008, + 6.587009124814358e-07, + 6.152115474833408e-07, + 6.009134381201875e-07, + 6.002246095704322e-07 + ], + "bp_grad_F": [ + 0.327708899974823, + 5.584151222137734e-05, + 3.1912604754325e-05, + 2.0850193322985433e-05, + 2.061383202089928e-05 + ], + "gamma_dfa": 0.0062168055737856776, + "gamma_dfa_per_layer": [ + 0.0034891567192971706, + 0.014096655882894993, + 0.008750341832637787, + -0.0014689321396872401 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0569005012512207, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 4.063174247741699, + 6453.43212890625, + 10849.3359375, + 13374.7021484375, + 36052.8046875 + ], + "hidden_norms_avg": [ + 93.43009185791016, + 12578.36328125, + 48372.984375, + 57469.9609375, + 73801.421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015539559535682201, + 2.588524239399703e-07, + 1.9553621655177267e-07, + 1.8433813409046707e-07, + 1.781664309419284e-07 + ], + "bp_grad_F": [ + 0.09239349514245987, + 5.2396142564248294e-05, + 9.398144356964622e-06, + 6.586112704098923e-06, + 6.009819117025472e-06 + ], + "gamma_dfa": 0.009027999331010506, + "gamma_dfa_per_layer": [ + 0.010615326464176178, + 0.014681536704301834, + 0.012467417865991592, + -0.0016522837104275823 + ], + "acc_eval": 0.2236328125, + "loss_eval": 2.0732030868530273, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 6.139724254608154, + 13514.7626953125, + 22634.615234375, + 30011.625, + 105646.9140625 + ], + "hidden_norms_avg": [ + 140.93157958984375, + 27337.47265625, + 105659.2734375, + 131533.03125, + 178079.78125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013191952893976122, + 1.5711624712366756e-07, + 6.783211148331247e-08, + 6.273136676782087e-08, + 6.216072989673194e-08 + ], + "bp_grad_F": [ + 0.15658611059188843, + 2.8997201297897846e-05, + 2.6110699309356278e-06, + 2.0865154510829598e-06, + 2.029548568316386e-06 + ], + "gamma_dfa": 0.0068359210272319615, + "gamma_dfa_per_layer": [ + 0.01239929161965847, + 0.008297638036310673, + 0.009697571396827698, + -0.0030508169438689947 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.0859451293945312, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 8.060498237609863, + 26771.85546875, + 47700.99609375, + 65194.9375, + 243467.953125 + ], + "hidden_norms_avg": [ + 189.60569763183594, + 53537.2734375, + 224677.375, + 271932.0625, + 380665.78125 + ], + "bp_grad_per_sample_l2_med": [ + 6.88996515236795e-05, + 7.635610188572173e-08, + 3.178359264666142e-08, + 2.8310823907418126e-08, + 2.8113991135114702e-08 + ], + "bp_grad_F": [ + 0.18565885722637177, + 2.3117625460145064e-05, + 1.2200183618915617e-06, + 1.0046638863059343e-06, + 9.67514324656804e-07 + ], + "gamma_dfa": 0.00588334770873189, + "gamma_dfa_per_layer": [ + 0.012929551303386688, + 0.005936518311500549, + 0.009927853010594845, + -0.0052605317905545235 + ], + "acc_eval": 0.216796875, + "loss_eval": 2.1008124351501465, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 9.924980163574219, + 45836.29296875, + 86015.5546875, + 115240.734375, + 396649.5625 + ], + "hidden_norms_avg": [ + 236.08885192871094, + 94806.203125, + 447709.03125, + 539570.125, + 680795.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014524323341902345, + 3.066869780354864e-08, + 1.9569522891060842e-08, + 1.7725259482404e-08, + 1.7704602228718613e-08 + ], + "bp_grad_F": [ + 0.21425659954547882, + 1.3653657333634328e-05, + 6.662682494606997e-07, + 5.818570798510336e-07, + 5.813048460368009e-07 + ], + "gamma_dfa": 0.006635856116190553, + "gamma_dfa_per_layer": [ + 0.010879420675337315, + 0.013957185670733452, + 0.00779206957668066, + -0.006085251457989216 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.1039814949035645, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 11.746355056762695, + 70552.8046875, + 256103.15625, + 694951.625, + 808366.5625 + ], + "hidden_norms_avg": [ + 279.4807434082031, + 128343.046875, + 645095.375, + 810123.8125, + 959871.0 + ], + "bp_grad_per_sample_l2_med": [ + 6.159865733934566e-05, + 2.1975946395969004e-08, + 1.1060357074654803e-08, + 9.967390468546e-09, + 1.011228256686536e-08 + ], + "bp_grad_F": [ + 0.09021499752998352, + 5.0024723350361455e-06, + 4.539916176327097e-07, + 3.891582309734076e-07, + 3.9641980720261927e-07 + ], + "gamma_dfa": 0.003665695490781218, + "gamma_dfa_per_layer": [ + 0.009222292341291904, + 0.0031545532401651144, + 0.00775552075356245, + -0.005469584371894598 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.1214356422424316, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 13.500020980834961, + 102720.734375, + 194937.703125, + 291956.1875, + 801362.9375 + ], + "hidden_norms_avg": [ + 321.6004943847656, + 208601.421875, + 1002364.1875, + 1189027.25, + 1448220.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014696457947138697, + 1.642234792598174e-08, + 8.907985460382406e-09, + 8.127726935924784e-09, + 8.014287011803845e-09 + ], + "bp_grad_F": [ + 0.06841801106929779, + 4.044012712256517e-06, + 3.4213746857858496e-07, + 2.990170742123155e-07, + 2.988945198012516e-07 + ], + "gamma_dfa": 0.004651258233934641, + "gamma_dfa_per_layer": [ + 0.007132797501981258, + 0.010231958702206612, + 0.006907162256538868, + -0.0056668855249881744 + ], + "acc_eval": 0.2099609375, + "loss_eval": 2.0963404178619385, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 15.302024841308594, + 160872.96875, + 604043.4375, + 1296474.125, + 1546227.0 + ], + "hidden_norms_avg": [ + 359.47259521484375, + 298263.5, + 1317573.75, + 1553171.25, + 1878602.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000136460512294434, + 1.0422226637274434e-08, + 5.898865396147812e-09, + 5.4856741371622775e-09, + 5.4926698744850455e-09 + ], + "bp_grad_F": [ + 0.07932842522859573, + 2.1081664272060152e-06, + 2.560300345066935e-07, + 2.2075181504987995e-07, + 2.2043255398784822e-07 + ], + "gamma_dfa": 0.004627774120308459, + "gamma_dfa_per_layer": [ + 0.006024104077368975, + 0.01116865873336792, + 0.005747191607952118, + -0.004428857937455177 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.0744481086730957, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 17.009462356567383, + 204948.671875, + 405065.21875, + 549855.3125, + 1400973.875 + ], + "hidden_norms_avg": [ + 396.66558837890625, + 480022.3125, + 2019487.75, + 2350966.75, + 2708745.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.00026586122112348676, + 1.0135083883255902e-08, + 6.120911777429683e-09, + 5.8359819199438334e-09, + 5.662275093243352e-09 + ], + "bp_grad_F": [ + 0.37594228982925415, + 1.2430107744876295e-05, + 2.3164905371686473e-07, + 2.0265188993562333e-07, + 2.001279000296563e-07 + ], + "gamma_dfa": 0.004862090456299484, + "gamma_dfa_per_layer": [ + 0.006278482731431723, + 0.012495312839746475, + 0.005351733416318893, + -0.004677167162299156 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0641043186187744, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 18.669273376464844, + 316404.0625, + 619048.375, + 804163.5, + 1798441.0 + ], + "hidden_norms_avg": [ + 434.9389343261719, + 650998.25, + 2437815.25, + 2802479.0, + 3269810.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003605277743190527, + 6.009571951182124e-09, + 4.676837139783174e-09, + 4.657723096102018e-09, + 4.49635484400801e-09 + ], + "bp_grad_F": [ + 0.14846132695674896, + 4.3979816837236285e-06, + 1.7215310776919068e-07, + 1.581869213396203e-07, + 1.561998885790672e-07 + ], + "gamma_dfa": 0.004480502451770008, + "gamma_dfa_per_layer": [ + 0.006086423061788082, + 0.010957473888993263, + 0.004586817231029272, + -0.003708704374730587 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0591208934783936, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 20.326766967773438, + 443508.46875, + 899668.0625, + 1131299.375, + 2182177.5 + ], + "hidden_norms_avg": [ + 473.4957275390625, + 854388.9375, + 2926402.0, + 3295286.75, + 3825241.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005711699486710131, + 4.8561932253221585e-09, + 3.871160725310574e-09, + 3.833432238309342e-09, + 3.74674646863582e-09 + ], + "bp_grad_F": [ + 1.0882306098937988, + 3.257442813264788e-06, + 1.6311048511852277e-07, + 1.3397652764979284e-07, + 1.326638283671855e-07 + ], + "gamma_dfa": 0.00462920154677704, + "gamma_dfa_per_layer": [ + 0.008616073988378048, + 0.009468363597989082, + 0.003528183326125145, + -0.003095814725384116 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0471031665802, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 21.944751739501953, + 581616.1875, + 1205317.625, + 1456984.375, + 2587496.75 + ], + "hidden_norms_avg": [ + 511.203125, + 1119566.25, + 3562080.25, + 3992681.5, + 4538977.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009346234728582203, + 4.117307383921798e-09, + 3.257990321969828e-09, + 3.2349201095627222e-09, + 3.1638915931608835e-09 + ], + "bp_grad_F": [ + 0.42184242606163025, + 2.2249487301451154e-06, + 1.2586481545895367e-07, + 1.1919513553948491e-07, + 1.181974553787768e-07 + ], + "gamma_dfa": 0.0034259117674082518, + "gamma_dfa_per_layer": [ + 0.00526365265250206, + 0.008116653189063072, + 0.0030386103317141533, + -0.0027152691036462784 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.0867815017700195, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 23.46192741394043, + 733909.875, + 1508464.125, + 1841074.875, + 3055228.75 + ], + "hidden_norms_avg": [ + 546.8953247070312, + 1235037.0, + 3742642.75, + 4200378.0, + 4892382.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009773626225069165, + 3.5754739169391314e-09, + 2.9525657474493983e-09, + 2.9297144710227485e-09, + 2.8955173814182444e-09 + ], + "bp_grad_F": [ + 0.15538839995861053, + 2.0067516288690967e-06, + 1.1871279781416888e-07, + 1.046255491132797e-07, + 1.0416235340926505e-07 + ], + "gamma_dfa": 0.002340688748518005, + "gamma_dfa_per_layer": [ + 0.0019294173689559102, + 0.007100729271769524, + 0.0026949853636324406, + -0.0023623770102858543 + ], + "acc_eval": 0.232421875, + "loss_eval": 2.088564872741699, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 24.94734764099121, + 1151802.75, + 3671404.25, + 4625593.5, + 5052590.0 + ], + "hidden_norms_avg": [ + 582.0977172851562, + 1475600.75, + 4403784.0, + 5008330.0, + 5801902.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007562927203252912, + 2.676908916754428e-09, + 2.2055020032496486e-09, + 2.179777247590664e-09, + 2.173634161550808e-09 + ], + "bp_grad_F": [ + 0.36642539501190186, + 3.967601060139714e-06, + 8.444904864290947e-08, + 7.993684647544796e-08, + 7.900475651467787e-08 + ], + "gamma_dfa": 0.0017957038653548807, + "gamma_dfa_per_layer": [ + 0.0019046596717089415, + 0.005139546003192663, + 0.001759346341714263, + -0.0016207365551963449 + ], + "acc_eval": 0.2109375, + "loss_eval": 2.08038330078125, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 26.36701011657715, + 2210167.25, + 6804633.5, + 7592304.0, + 7772230.0 + ], + "hidden_norms_avg": [ + 615.4749145507812, + 1852637.875, + 5297662.0, + 6054509.0, + 6940769.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009053644607774913, + 2.014937106054049e-09, + 1.6813730407960747e-09, + 1.63718916201816e-09, + 1.6135126568173064e-09 + ], + "bp_grad_F": [ + 0.15154746174812317, + 3.760401341423858e-06, + 6.479213254806382e-08, + 6.350511227992683e-08, + 6.00040195308793e-08 + ], + "gamma_dfa": 0.00026495405472815037, + "gamma_dfa_per_layer": [ + -0.0023696955759078264, + 0.0033954931423068047, + 0.0012687842827290297, + -0.0012347656302154064 + ], + "acc_eval": 0.2333984375, + "loss_eval": 2.0685791969299316, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 27.747814178466797, + 2020373.25, + 6352088.0, + 7372759.0, + 7751557.0 + ], + "hidden_norms_avg": [ + 647.8715209960938, + 2166255.0, + 5964871.0, + 6820316.0, + 7888183.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.000535959261469543, + 1.8833379300531305e-09, + 1.6251041623505103e-09, + 1.5936774122593533e-09, + 1.5920619267362213e-09 + ], + "bp_grad_F": [ + 0.06977186352014542, + 4.2289293560315855e-06, + 5.94431135425566e-08, + 5.634814925770115e-08, + 5.626874255426628e-08 + ], + "gamma_dfa": 0.0009004889943753369, + "gamma_dfa_per_layer": [ + 1.3074517482891679e-05, + 0.003544538514688611, + 0.0012792267370969057, + -0.0012348837917670608 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0676896572113037, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 29.053590774536133, + 3083884.0, + 8692576.0, + 10024582.0, + 10278143.0 + ], + "hidden_norms_avg": [ + 679.1322021484375, + 2750560.0, + 7205648.0, + 8204248.5, + 9336888.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006835769745521247, + 1.5781399520520267e-09, + 1.3378861352109084e-09, + 1.2995797771253592e-09, + 1.2820219330578198e-09 + ], + "bp_grad_F": [ + 0.25767308473587036, + 1.6246455061263987e-06, + 6.349461756371966e-08, + 6.242527206268278e-08, + 4.5665522918625356e-08 + ], + "gamma_dfa": 0.0003357882087584585, + "gamma_dfa_per_layer": [ + -0.001319598057307303, + 0.002733789850026369, + 0.0008947808528319001, + -0.0009658198105171323 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.0777204036712646, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 30.246440887451172, + 3200014.0, + 8626485.0, + 9743865.0, + 10146681.0 + ], + "hidden_norms_avg": [ + 708.5135498046875, + 2989787.0, + 7458187.5, + 8607358.0, + 10070516.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005841738311573863, + 1.4247033552905464e-09, + 1.2406603522308046e-09, + 1.21434362565509e-09, + 1.217411615961339e-09 + ], + "bp_grad_F": [ + 0.08999939262866974, + 1.7538721976961824e-06, + 4.803559150445835e-08, + 4.36282370230856e-08, + 4.3068951072200434e-08 + ], + "gamma_dfa": -2.2506676032207906e-05, + "gamma_dfa_per_layer": [ + -0.002581980312243104, + 0.002518225461244583, + 0.0009317069780081511, + -0.0009579788311384618 + ], + "acc_eval": 0.2392578125, + "loss_eval": 2.0627658367156982, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 31.42615509033203, + 4556513.5, + 10711725.0, + 11956874.0, + 12318100.0 + ], + "hidden_norms_avg": [ + 737.157958984375, + 3520006.5, + 8303534.5, + 9571905.0, + 11293369.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007374613196589053, + 1.2111865954622658e-09, + 1.0633514069269268e-09, + 1.0194807220642588e-09, + 1.0034837405470398e-09 + ], + "bp_grad_F": [ + 0.12247106432914734, + 2.740941681622644e-06, + 4.6019909660799385e-08, + 4.372383344275477e-08, + 3.6865596797497346e-08 + ], + "gamma_dfa": 0.0005736843086197041, + "gamma_dfa_per_layer": [ + 0.0002251334663014859, + 0.0021776340436190367, + 0.0006795942317694426, + -0.0007876245072111487 + ], + "acc_eval": 0.22265625, + "loss_eval": 2.062939167022705, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 32.559165954589844, + 4224958.5, + 10227904.0, + 11507743.0, + 12041642.0 + ], + "hidden_norms_avg": [ + 765.5013427734375, + 3988012.5, + 8953060.0, + 10431809.0, + 12380471.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006474430556409061, + 1.179957687114097e-09, + 1.0031043773395254e-09, + 9.744786089171953e-10, + 9.782840093564005e-10 + ], + "bp_grad_F": [ + 0.12209221720695496, + 1.616509621271689e-06, + 3.8821241332698264e-08, + 3.6648025059093925e-08, + 3.527756931021031e-08 + ], + "gamma_dfa": -0.00019280995184089988, + "gamma_dfa_per_layer": [ + -0.002911232877522707, + 0.0022857212461531162, + 0.0006594176520593464, + -0.0008051458280533552 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0555338859558105, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 33.59370040893555, + 5323277.5, + 11855673.0, + 13697022.0, + 14246667.0 + ], + "hidden_norms_avg": [ + 789.9629516601562, + 4634178.0, + 10205192.0, + 11930021.0, + 13993152.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006352875498123467, + 1.0036302899862903e-09, + 8.794808215029093e-10, + 8.579849608558732e-10, + 8.574586596310496e-10 + ], + "bp_grad_F": [ + 0.09745635837316513, + 5.127232043378172e-07, + 3.342180221466151e-08, + 3.173540363832217e-08, + 3.091372491326183e-08 + ], + "gamma_dfa": -0.0006959605379961431, + "gamma_dfa_per_layer": [ + -0.004454955458641052, + 0.0018251645378768444, + 0.0005447655566968024, + -0.000698816787917167 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.056840181350708, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 34.583858489990234, + 6778143.0, + 13401385.0, + 15847366.0, + 16344266.0 + ], + "hidden_norms_avg": [ + 814.3038330078125, + 5395352.5, + 11137891.0, + 13094203.0, + 15406614.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006492820102721453, + 8.925201688825268e-10, + 7.777718469270667e-10, + 7.627384279729199e-10, + 7.601627105557895e-10 + ], + "bp_grad_F": [ + 0.08801906555891037, + 1.8660392697711359e-06, + 3.472371190582635e-08, + 2.7845679539950652e-08, + 2.7135749647300145e-08 + ], + "gamma_dfa": -0.0012016263353871182, + "gamma_dfa_per_layer": [ + -0.006280785892158747, + 0.001651690574362874, + 0.0004266214673407376, + -0.0006040314910933375 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.0746021270751953, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 35.516666412353516, + 6985935.5, + 14020116.0, + 16575473.0, + 17109272.0 + ], + "hidden_norms_avg": [ + 838.5614013671875, + 6365095.0, + 12448551.0, + 14566203.0, + 16943832.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007437304593622684, + 8.387662786546457e-10, + 7.299132409599451e-10, + 7.170505300635455e-10, + 7.115786293532267e-10 + ], + "bp_grad_F": [ + 0.1540054827928543, + 1.4262270724429982e-06, + 2.9031822279534936e-08, + 2.776059560005706e-08, + 2.5270722403547552e-08 + ], + "gamma_dfa": -0.00010950746218441054, + "gamma_dfa_per_layer": [ + -0.0017721566837280989, + 0.0015054477844387293, + 0.0003872170636896044, + -0.000558538013137877 + ], + "acc_eval": 0.2392578125, + "loss_eval": 2.065904140472412, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 36.39850997924805, + 7861434.0, + 14415042.0, + 16660478.0, + 17496562.0 + ], + "hidden_norms_avg": [ + 862.4805297851562, + 6600421.5, + 12694272.0, + 15043836.0, + 17968980.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005834798794239759, + 7.558619286029966e-10, + 6.530426754913776e-10, + 6.420492471015393e-10, + 6.389526685524061e-10 + ], + "bp_grad_F": [ + 0.09943251311779022, + 1.4788431599299656e-06, + 2.582997993272329e-08, + 2.3754548550414256e-08, + 2.322415859623561e-08 + ], + "gamma_dfa": -0.0009345750440843403, + "gamma_dfa_per_layer": [ + -0.005123761482536793, + 0.0015550897223874927, + 0.0003447675844654441, + -0.0005143960006535053 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.041043758392334, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 37.283199310302734, + 8933519.0, + 15359962.0, + 17441364.0, + 18346258.0 + ], + "hidden_norms_avg": [ + 883.0538330078125, + 7354756.0, + 13721222.0, + 16105006.0, + 19368310.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00026283934130333364, + 6.873029922971341e-10, + 6.058342161274766e-10, + 6.000055452481945e-10, + 5.98545990548871e-10 + ], + "bp_grad_F": [ + 0.11474847048521042, + 2.4628958271932788e-05, + 1.3788282160476228e-07, + 2.199209525599599e-08, + 2.15279509774291e-08 + ], + "gamma_dfa": -0.0014451614988502115, + "gamma_dfa_per_layer": [ + -0.006978219375014305, + 0.0013526652473956347, + 0.0002992081572301686, + -0.0004543000250123441 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.0492172241210938, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 38.11500930786133, + 10836846.0, + 17507178.0, + 19929002.0, + 20726542.0 + ], + "hidden_norms_avg": [ + 901.960205078125, + 8138403.5, + 14552406.0, + 17157852.0, + 20773122.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005291851703077555, + 6.35470620569123e-10, + 5.6208532273061e-10, + 5.496996191567405e-10, + 5.433966054901873e-10 + ], + "bp_grad_F": [ + 0.07972504198551178, + 1.2489309710872476e-06, + 2.2593511062041216e-08, + 2.1460177634935462e-08, + 1.941634231172884e-08 + ], + "gamma_dfa": -0.000788729106716346, + "gamma_dfa_per_layer": [ + -0.00451657734811306, + 0.0015372345224022865, + 0.00024382121046073735, + -0.00041939481161534786 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0669429302215576, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 38.87166213989258, + 11480826.0, + 18077316.0, + 20884150.0, + 22098916.0 + ], + "hidden_norms_avg": [ + 920.577880859375, + 8893063.0, + 15579717.0, + 18401958.0, + 22225722.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005104477168060839, + 5.858571405781277e-10, + 5.198571018105724e-10, + 5.114682011253535e-10, + 5.120092128052534e-10 + ], + "bp_grad_F": [ + 0.13577552139759064, + 2.0482397303567268e-05, + 2.1394010119024642e-08, + 2.0649670418038113e-08, + 1.8286096192809964e-08 + ], + "gamma_dfa": -0.0004262418224243447, + "gamma_dfa_per_layer": [ + -0.0029134145006537437, + 0.0013950758147984743, + 0.00018188939429819584, + -0.0003685179981403053 + ], + "acc_eval": 0.2490234375, + "loss_eval": 2.053382396697998, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 39.6179313659668, + 10591964.0, + 16346992.0, + 18847678.0, + 21847726.0 + ], + "hidden_norms_avg": [ + 937.9719848632812, + 9576851.0, + 16784906.0, + 19828342.0, + 23673520.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00023470228188671172, + 5.629120503058971e-10, + 5.04818964408571e-10, + 4.974847200855947e-10, + 4.968530586957343e-10 + ], + "bp_grad_F": [ + 0.03459252789616585, + 8.028884622035548e-06, + 1.9716548393944322e-08, + 1.807922522800709e-08, + 1.7913645677936074e-08 + ], + "gamma_dfa": -0.0018089709192281589, + "gamma_dfa_per_layer": [ + -0.008484212681651115, + 0.0014374498277902603, + 0.00020184949971735477, + -0.00039097032276913524 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0604443550109863, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 40.344242095947266, + 10467030.0, + 15235544.0, + 17027748.0, + 23281082.0 + ], + "hidden_norms_avg": [ + 954.3844604492188, + 10038487.0, + 16584430.0, + 19613710.0, + 24505476.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015729073493275791, + 5.36418076624301e-10, + 4.5378717450361705e-10, + 4.4796202858243817e-10, + 4.477457571372412e-10 + ], + "bp_grad_F": [ + 0.04820869117975235, + 2.3596087430632906e-06, + 1.7855482425943592e-08, + 1.7340139990551506e-08, + 1.672622929049794e-08 + ], + "gamma_dfa": -0.0013171448226785287, + "gamma_dfa_per_layer": [ + -0.006438364274799824, + 0.0013229507021605968, + 0.00020032597240060568, + -0.00035349169047549367 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.061581611633301, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 41.04903793334961, + 12235056.0, + 17721728.0, + 19784938.0, + 25024272.0 + ], + "hidden_norms_avg": [ + 969.5825805664062, + 11940616.0, + 19401350.0, + 22468846.0, + 26879212.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00035265026963315904, + 5.423251847602728e-10, + 4.4247547292819434e-10, + 4.358849947649901e-10, + 4.3593659238005955e-10 + ], + "bp_grad_F": [ + 0.0735621377825737, + 1.917086819958058e-06, + 1.9346130031294706e-08, + 1.5936171493535767e-08, + 1.5501758099389917e-08 + ], + "gamma_dfa": -0.001081134716514498, + "gamma_dfa_per_layer": [ + -0.005434883758425713, + 0.0012318368535488844, + 0.00019993717432953417, + -0.00032142913551069796 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0760293006896973, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 41.723567962646484, + 10562926.0, + 13746881.0, + 15736975.0, + 26354068.0 + ], + "hidden_norms_avg": [ + 984.3485717773438, + 12533570.0, + 19717132.0, + 22961588.0, + 28083302.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002546848263591528, + 4.777176432213537e-10, + 4.0483683072523036e-10, + 4.0072575813177025e-10, + 4.013349652609577e-10 + ], + "bp_grad_F": [ + 0.06879052519798279, + 1.7057992636182462e-06, + 1.6271217262442406e-08, + 1.4877675091895526e-08, + 1.484982270483215e-08 + ], + "gamma_dfa": -0.0015064112594700418, + "gamma_dfa_per_layer": [ + -0.007336798589676619, + 0.0013772943057119846, + 0.00022022609482519329, + -0.0002863668487407267 + ], + "acc_eval": 0.20703125, + "loss_eval": 2.078207492828369, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 42.342227935791016, + 13283171.0, + 17422292.0, + 19770980.0, + 28086972.0 + ], + "hidden_norms_avg": [ + 999.26123046875, + 13875387.0, + 21404830.0, + 24833206.0, + 29923332.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003442879824433476, + 4.4142753341525065e-10, + 3.8908712363117104e-10, + 3.845144203040718e-10, + 3.8369810106964053e-10 + ], + "bp_grad_F": [ + 0.10482411086559296, + 2.8695783385046525e-06, + 1.7273855235089286e-08, + 1.4195452813225984e-08, + 1.3857171410336377e-08 + ], + "gamma_dfa": -0.0009248298447346315, + "gamma_dfa_per_layer": [ + -0.004888010676950216, + 0.0012753453338518739, + 0.00017224671319127083, + -0.0002589007490314543 + ], + "acc_eval": 0.2373046875, + "loss_eval": 2.078000068664551, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 42.90097427368164, + 16870614.0, + 22116480.0, + 24442270.0, + 29665536.0 + ], + "hidden_norms_avg": [ + 1013.56396484375, + 14764026.0, + 21856036.0, + 25334308.0, + 30474444.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047380090109072626, + 4.22005735911668e-10, + 3.5831293487831317e-10, + 3.5505443030103834e-10, + 3.5614466931122024e-10 + ], + "bp_grad_F": [ + 0.1035437062382698, + 1.2711110457530594e-06, + 1.418432571398398e-08, + 1.2978671470875724e-08, + 1.2937439564097986e-08 + ], + "gamma_dfa": -0.00034118785697501153, + "gamma_dfa_per_layer": [ + -0.002568737603724003, + 0.001293556997552514, + 0.000137164635816589, + -0.00022673545754514635 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0730109214782715, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 43.419898986816406, + 18221210.0, + 22675590.0, + 24728546.0, + 30520888.0 + ], + "hidden_norms_avg": [ + 1027.6595458984375, + 16337822.0, + 23378412.0, + 26921720.0, + 31927994.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004629126051440835, + 4.106864293085266e-10, + 3.557905081663648e-10, + 3.536362591649578e-10, + 3.5421768296295397e-10 + ], + "bp_grad_F": [ + 0.08281872421503067, + 1.4263683851822861e-06, + 1.3245164076636229e-08, + 1.2740572152836194e-08, + 1.2752362721357713e-08 + ], + "gamma_dfa": -0.0006677984529233072, + "gamma_dfa_per_layer": [ + -0.0036979843862354755, + 0.0011370242573320866, + 0.00012192466238047928, + -0.00023215834517031908 + ], + "acc_eval": 0.23828125, + "loss_eval": 2.0669164657592773, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 43.868682861328125, + 18758150.0, + 23109030.0, + 25432404.0, + 31503354.0 + ], + "hidden_norms_avg": [ + 1040.644287109375, + 15512033.0, + 21965288.0, + 25882228.0, + 31813648.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00048007385339587927, + 4.271450415593847e-10, + 3.4119135294830016e-10, + 3.391489034054729e-10, + 3.387232438978316e-10 + ], + "bp_grad_F": [ + 0.36019906401634216, + 1.9220671674702317e-05, + 1.358929768713324e-08, + 1.2455363851415768e-08, + 1.2401786264604198e-08 + ], + "gamma_dfa": -0.00031488661625189707, + "gamma_dfa_per_layer": [ + -0.002551896497607231, + 0.001431336859241128, + 9.301750105805695e-05, + -0.00023200432769954205 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0609660148620605, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 44.293697357177734, + 21659484.0, + 26491946.0, + 29332332.0, + 32793040.0 + ], + "hidden_norms_avg": [ + 1051.83740234375, + 17567000.0, + 24049368.0, + 28083622.0, + 33467380.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043948061647824943, + 4.0486294872188466e-10, + 3.3493480211532756e-10, + 3.3453453895937457e-10, + 3.3604671823006527e-10 + ], + "bp_grad_F": [ + 0.10878865420818329, + 3.037727083210484e-06, + 1.2592222375928941e-08, + 1.2103843261002112e-08, + 1.2022392859023512e-08 + ], + "gamma_dfa": -0.00015630935013177805, + "gamma_dfa_per_layer": [ + -0.0019119374919682741, + 0.0014281735057011247, + 7.57485831854865e-05, + -0.00021722199744544923 + ], + "acc_eval": 0.2431640625, + "loss_eval": 2.0587897300720215, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 44.68658447265625, + 21628572.0, + 26077032.0, + 28336790.0, + 33305650.0 + ], + "hidden_norms_avg": [ + 1062.067138671875, + 18163602.0, + 24404446.0, + 28478594.0, + 34156064.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005865619168616831, + 4.0249623078914e-10, + 3.3121710929506776e-10, + 3.310392793220984e-10, + 3.318675056984688e-10 + ], + "bp_grad_F": [ + 0.20061102509498596, + 1.4544431223839638e-06, + 1.3441372459510603e-08, + 1.2418687411752671e-08, + 1.2016870165609816e-08 + ], + "gamma_dfa": -0.00039686575473751873, + "gamma_dfa_per_layer": [ + -0.0029668076895177364, + 0.0015295962803065777, + 6.985102663747966e-05, + -0.00022010263637639582 + ], + "acc_eval": 0.2275390625, + "loss_eval": 2.0569839477539062, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 45.062259674072266, + 25376026.0, + 30203382.0, + 32772746.0, + 35119040.0 + ], + "hidden_norms_avg": [ + 1071.6630859375, + 18637428.0, + 24671676.0, + 28819074.0, + 34739232.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005594053072854877, + 3.9023292930373543e-10, + 3.2509483993692356e-10, + 3.23913590394298e-10, + 3.250162639023557e-10 + ], + "bp_grad_F": [ + 0.13359014689922333, + 4.247889592079446e-06, + 1.4051211749688264e-08, + 1.2317144637563615e-08, + 1.1531787968976914e-08 + ], + "gamma_dfa": -0.0005283378432068275, + "gamma_dfa_per_layer": [ + -0.0037097278982400894, + 0.0017695487476885319, + 4.308431380195543e-05, + -0.000216256536077708 + ], + "acc_eval": 0.2666015625, + "loss_eval": 2.0476396083831787, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 45.38731384277344, + 24903830.0, + 30026926.0, + 33563200.0, + 35539932.0 + ], + "hidden_norms_avg": [ + 1080.0860595703125, + 20496828.0, + 26709690.0, + 30932660.0, + 36357072.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005004233680665493, + 3.8017103354270887e-10, + 3.1730867933177365e-10, + 3.167333340048373e-10, + 3.1768215835725755e-10 + ], + "bp_grad_F": [ + 0.24717594683170319, + 2.9436714612529613e-06, + 1.1934382371237007e-08, + 1.1459838411553847e-08, + 1.1365100860416533e-08 + ], + "gamma_dfa": -0.00022031009211787023, + "gamma_dfa_per_layer": [ + -0.0022991469595581293, + 0.0015725505072623491, + 4.821528273168951e-05, + -0.00020285919890739024 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0488319396972656, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 45.68830490112305, + 27470426.0, + 32688434.0, + 35418348.0, + 37778420.0 + ], + "hidden_norms_avg": [ + 1088.195068359375, + 19636778.0, + 25748976.0, + 30137794.0, + 36341748.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000507087679579854, + 3.7039282752004965e-10, + 3.106248036566228e-10, + 3.096240208666501e-10, + 3.10577202844442e-10 + ], + "bp_grad_F": [ + 0.247142493724823, + 5.3006801863375586e-06, + 1.5794508811950436e-08, + 1.5706817180216603e-08, + 1.0953104201405495e-08 + ], + "gamma_dfa": -0.00026929086834570626, + "gamma_dfa_per_layer": [ + -0.0025479549076408148, + 0.0016400209860876203, + 2.4549921363359317e-05, + -0.00019377947319298983 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0380632877349854, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 45.95172119140625, + 29219790.0, + 34751968.0, + 37645720.0, + 39363420.0 + ], + "hidden_norms_avg": [ + 1095.55908203125, + 20059094.0, + 26161532.0, + 30539128.0, + 36948852.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004415555449668318, + 3.578430884942918e-10, + 3.05192260352527e-10, + 3.046965735276075e-10, + 3.0560776131949297e-10 + ], + "bp_grad_F": [ + 0.1088763028383255, + 4.900910880678566e-06, + 1.1387745857405207e-08, + 1.0883239198733463e-08, + 1.0722531307294503e-08 + ], + "gamma_dfa": -0.0006201292017067317, + "gamma_dfa_per_layer": [ + -0.004000760614871979, + 0.0016785510815680027, + 3.265401755925268e-05, + -0.0001909612910822034 + ], + "acc_eval": 0.25, + "loss_eval": 2.041342258453369, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 46.1973876953125, + 29375584.0, + 34745100.0, + 38109944.0, + 40454424.0 + ], + "hidden_norms_avg": [ + 1102.340087890625, + 21066706.0, + 27296236.0, + 31874516.0, + 38108092.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00040148120024241507, + 3.579030682931972e-10, + 3.0047467292071417e-10, + 2.979275159908923e-10, + 2.9703536852387913e-10 + ], + "bp_grad_F": [ + 0.2525903582572937, + 8.925781003199518e-06, + 1.1219404072448924e-08, + 1.084880185686643e-08, + 1.0492501978376367e-08 + ], + "gamma_dfa": -0.00034770679030771134, + "gamma_dfa_per_layer": [ + -0.002933461917564273, + 0.001698363572359085, + 3.748677045223303e-05, + -0.0001932155864778906 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0345935821533203, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 46.42340087890625, + 27399134.0, + 31821602.0, + 34474508.0, + 38109560.0 + ], + "hidden_norms_avg": [ + 1108.236328125, + 21543940.0, + 27684760.0, + 32082502.0, + 38718660.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000570801377762109, + 3.5802838471710174e-10, + 2.990230563160168e-10, + 2.9852947891484405e-10, + 2.9978877713610075e-10 + ], + "bp_grad_F": [ + 0.173945352435112, + 2.9223572255432373e-06, + 1.2221713419080515e-08, + 1.1539666999738074e-08, + 1.0805790928714032e-08 + ], + "gamma_dfa": -5.9806044191645924e-05, + "gamma_dfa_per_layer": [ + -0.001857165014371276, + 0.0017762510105967522, + 3.49261645169463e-05, + -0.00019323633750900626 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.043308734893799, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 46.619728088378906, + 31052948.0, + 36542220.0, + 39935176.0, + 42316204.0 + ], + "hidden_norms_avg": [ + 1113.68896484375, + 22679808.0, + 29079456.0, + 33751472.0, + 40006012.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046165595995262265, + 3.339039600369631e-10, + 2.9132621315319795e-10, + 2.9080904351275194e-10, + 2.9134980539247124e-10 + ], + "bp_grad_F": [ + 0.08871550858020782, + 1.195927779917838e-05, + 1.2490571243972681e-08, + 1.2371740965022582e-08, + 1.015614703447909e-08 + ], + "gamma_dfa": -0.0003672020420708577, + "gamma_dfa_per_layer": [ + -0.002894133096560836, + 0.0016025153454393148, + 2.5333010853501037e-05, + -0.0002025234280154109 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.029773473739624, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 46.796348571777344, + 30912490.0, + 36281496.0, + 39245376.0, + 41656108.0 + ], + "hidden_norms_avg": [ + 1118.38134765625, + 23560890.0, + 29646840.0, + 34192144.0, + 40581760.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005251869442872703, + 3.3097524720915317e-10, + 2.891357153700369e-10, + 2.8932781170887267e-10, + 2.8904145743524623e-10 + ], + "bp_grad_F": [ + 0.09888254106044769, + 4.3903874029638246e-06, + 1.0815308648659538e-08, + 1.040402519691952e-08, + 1.0228043301196976e-08 + ], + "gamma_dfa": -0.00037046667421236634, + "gamma_dfa_per_layer": [ + -0.002757731592282653, + 0.0014231146778911352, + 3.9225356886163354e-05, + -0.00018647513934411108 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0383992195129395, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 46.95427322387695, + 31720426.0, + 37234788.0, + 40129424.0, + 42928428.0 + ], + "hidden_norms_avg": [ + 1122.57470703125, + 22583276.0, + 28617936.0, + 33269996.0, + 40462568.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004295881371945143, + 3.419305394380956e-10, + 2.8222821302215095e-10, + 2.8184321543278656e-10, + 2.8312005517783234e-10 + ], + "bp_grad_F": [ + 0.5366736650466919, + 2.256676998513285e-05, + 1.1914533359913548e-08, + 1.1219233542192342e-08, + 1.004730165732326e-08 + ], + "gamma_dfa": 0.00015619578334735706, + "gamma_dfa_per_layer": [ + -0.0010500183561816812, + 0.001834970898926258, + 3.652184386737645e-05, + -0.00019669125322252512 + ], + "acc_eval": 0.2431640625, + "loss_eval": 2.039337396621704, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 47.09259796142578, + 32824944.0, + 38341332.0, + 41754692.0, + 44005196.0 + ], + "hidden_norms_avg": [ + 1126.26953125, + 24313264.0, + 30669532.0, + 35293632.0, + 41785680.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005083036958239973, + 3.2607763711389737e-10, + 2.8033902976787317e-10, + 2.7943025671106625e-10, + 2.7980692762774595e-10 + ], + "bp_grad_F": [ + 0.06971772015094757, + 2.262569068989251e-06, + 1.0069017619684928e-08, + 9.845756210324907e-09, + 9.862499261714675e-09 + ], + "gamma_dfa": 0.0007457349984179018, + "gamma_dfa_per_layer": [ + 0.0015201317146420479, + 0.0016060702037066221, + 3.652479063021019e-05, + -0.00017978671530727297 + ], + "acc_eval": 0.25, + "loss_eval": 2.0368857383728027, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 47.21082305908203, + 33649040.0, + 39036836.0, + 42500816.0, + 44653764.0 + ], + "hidden_norms_avg": [ + 1129.5389404296875, + 24447482.0, + 30689206.0, + 35330028.0, + 42064012.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046678923536092043, + 3.204189136241098e-10, + 2.755325689829391e-10, + 2.7554050707756517e-10, + 2.7654081802275243e-10 + ], + "bp_grad_F": [ + 0.07496139407157898, + 2.2861270281282486e-06, + 9.997683569906712e-09, + 9.715622084627284e-09, + 9.736355721656764e-09 + ], + "gamma_dfa": 0.0006021281524226652, + "gamma_dfa_per_layer": [ + 0.0007927162805572152, + 0.001763419946655631, + 3.104796996922232e-05, + -0.000178671587491408 + ], + "acc_eval": 0.259765625, + "loss_eval": 2.0324196815490723, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 47.315826416015625, + 34514608.0, + 40222940.0, + 43606628.0, + 45508540.0 + ], + "hidden_norms_avg": [ + 1132.157958984375, + 24487910.0, + 30821460.0, + 35505456.0, + 42327908.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041785358916968107, + 3.3263317100740153e-10, + 2.696754763942266e-10, + 2.701733836651954e-10, + 2.71275196750409e-10 + ], + "bp_grad_F": [ + 0.08130628615617752, + 3.3661247016425477e-06, + 1.078094857831502e-08, + 9.643851939244996e-09, + 9.617946439277603e-09 + ], + "gamma_dfa": 0.0005021913366363151, + "gamma_dfa_per_layer": [ + 0.00036606384674087167, + 0.0017899572849273682, + 2.7483671146910638e-05, + -0.00017473945626989007 + ], + "acc_eval": 0.2626953125, + "loss_eval": 2.028841495513916, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 47.388946533203125, + 35118772.0, + 40722008.0, + 44347232.0, + 46331384.0 + ], + "hidden_norms_avg": [ + 1134.3621826171875, + 24821028.0, + 31074444.0, + 35754528.0, + 42627356.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043533919961191714, + 3.173189211391758e-10, + 2.687766953446413e-10, + 2.68161992611482e-10, + 2.690903055935223e-10 + ], + "bp_grad_F": [ + 0.09458157420158386, + 1.9965789306297665e-06, + 1.025628915130028e-08, + 9.58252854843522e-09, + 9.523047239667903e-09 + ], + "gamma_dfa": 0.00038969498109509004, + "gamma_dfa_per_layer": [ + -0.00010247333557344973, + 0.0018051008228212595, + 3.0877545214025304e-05, + -0.0001747251080814749 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0298049449920654, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 47.4621696472168, + 34836160.0, + 40469796.0, + 44120564.0, + 46361016.0 + ], + "hidden_norms_avg": [ + 1136.3079833984375, + 24152832.0, + 30436140.0, + 35273740.0, + 42621312.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000491869286634028, + 3.2774055691575654e-10, + 2.667974174919152e-10, + 2.669577336966711e-10, + 2.680060617876734e-10 + ], + "bp_grad_F": [ + 0.0854402706027031, + 1.6183460047614062e-06, + 9.980491100236577e-09, + 9.461099459429079e-09, + 9.473674289495193e-09 + ], + "gamma_dfa": 0.0005695745421689935, + "gamma_dfa_per_layer": [ + 0.0004214277723804116, + 0.001994946738705039, + 3.653779276646674e-05, + -0.00017461413517594337 + ], + "acc_eval": 0.23828125, + "loss_eval": 2.024928092956543, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 47.52342224121094, + 36446320.0, + 42468064.0, + 46175108.0, + 47947040.0 + ], + "hidden_norms_avg": [ + 1137.8057861328125, + 25400616.0, + 31703746.0, + 36432956.0, + 43307828.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00034005154157057405, + 3.121023717245208e-10, + 2.6523216956064743e-10, + 2.6489818671926457e-10, + 2.649658548126155e-10 + ], + "bp_grad_F": [ + 0.10125189274549484, + 4.0649438233231194e-06, + 9.830144698241838e-09, + 9.345456852827283e-09, + 9.317212779080819e-09 + ], + "gamma_dfa": 0.0005080709906906122, + "gamma_dfa_per_layer": [ + 0.00023581110872328281, + 0.0019333910895511508, + 3.0449831683654338e-05, + -0.00016736806719563901 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.0343496799468994, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 47.567466735839844, + 35483484.0, + 41150516.0, + 44742840.0, + 47102380.0 + ], + "hidden_norms_avg": [ + 1139.05029296875, + 25225282.0, + 31585082.0, + 36363108.0, + 43411416.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046872245729900897, + 3.1678357159670156e-10, + 2.6331647973165673e-10, + 2.64141680750285e-10, + 2.646937946604311e-10 + ], + "bp_grad_F": [ + 0.08037562668323517, + 2.9532295684475685e-06, + 9.44631484145475e-09, + 9.393840372240447e-09, + 9.41009226096412e-09 + ], + "gamma_dfa": 0.0005205844290685491, + "gamma_dfa_per_layer": [ + 0.0003642886003945023, + 0.0018537556752562523, + 3.766161171370186e-05, + -0.00017336817109026015 + ], + "acc_eval": 0.2392578125, + "loss_eval": 2.02734375, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 47.602928161621094, + 35582280.0, + 41200288.0, + 44686488.0, + 47126900.0 + ], + "hidden_norms_avg": [ + 1139.965087890625, + 25657812.0, + 31984420.0, + 36722060.0, + 43681628.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047245126916095614, + 3.1708738412739024e-10, + 2.6278745846042284e-10, + 2.6274540876336516e-10, + 2.6386243190401615e-10 + ], + "bp_grad_F": [ + 0.08141150325536728, + 1.0596501851978246e-05, + 1.0370135861137442e-08, + 1.0129613592368969e-08, + 9.407171930320146e-09 + ], + "gamma_dfa": 0.00048223476824205136, + "gamma_dfa_per_layer": [ + 0.00032963097328320146, + 0.00173661345615983, + 3.3767075365176424e-05, + -0.00017107243184000254 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.0290825366973877, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 47.62870788574219, + 36373308.0, + 42049216.0, + 45803868.0, + 47955172.0 + ], + "hidden_norms_avg": [ + 1140.6492919921875, + 25698864.0, + 31990548.0, + 36707920.0, + 43700336.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004157091898377985, + 3.1451533044624114e-10, + 2.6160756894100246e-10, + 2.62937283057596e-10, + 2.633904483406724e-10 + ], + "bp_grad_F": [ + 0.28710466623306274, + 2.876764028769685e-06, + 9.405439982401731e-09, + 9.308096515781017e-09, + 9.319982119393444e-09 + ], + "gamma_dfa": 0.00045457817577698734, + "gamma_dfa_per_layer": [ + 0.00011597995762713253, + 0.0018383568385615945, + 3.561873018043116e-05, + -0.00017164282326120883 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2.0309882164001465, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 47.646034240722656, + 35748556.0, + 41284136.0, + 44861788.0, + 47367128.0 + ], + "hidden_norms_avg": [ + 1141.1492919921875, + 25812252.0, + 32106642.0, + 36789100.0, + 43809728.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004877470782957971, + 3.1724206595029614e-10, + 2.6251881224403917e-10, + 2.627319750647672e-10, + 2.634734097561875e-10 + ], + "bp_grad_F": [ + 0.08355043828487396, + 2.428784682706464e-06, + 9.579466109244095e-09, + 9.378172016738517e-09, + 9.3862775329967e-09 + ], + "gamma_dfa": 0.0006408758436009521, + "gamma_dfa_per_layer": [ + 0.0009491340606473386, + 0.0017479720991104841, + 4.02485384256579e-05, + -0.00017385132377967238 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.030231475830078, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 47.65734100341797, + 35952124.0, + 41526152.0, + 45192104.0, + 47596588.0 + ], + "hidden_norms_avg": [ + 1141.4708251953125, + 25858530.0, + 32145604.0, + 36816776.0, + 43830904.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004684069426730275, + 3.1406693912217065e-10, + 2.6245111639511265e-10, + 2.628100792545496e-10, + 2.632017381820617e-10 + ], + "bp_grad_F": [ + 0.16165603697299957, + 3.1715710520074936e-06, + 1.017021755700398e-08, + 9.52006651289139e-09, + 9.360165087457517e-09 + ], + "gamma_dfa": 0.0005993541035422822, + "gamma_dfa_per_layer": [ + 0.0007396150031127036, + 0.0017993964720517397, + 3.345730510773137e-05, + -0.00017505236610304564 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.030412197113037, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 47.6636962890625, + 36249912.0, + 41976852.0, + 45623612.0, + 47785064.0 + ], + "hidden_norms_avg": [ + 1141.6495361328125, + 25785932.0, + 32065610.0, + 36745760.0, + 43805624.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047133295447565615, + 3.155541938859585e-10, + 2.617887573386213e-10, + 2.615481442536094e-10, + 2.6276933406954583e-10 + ], + "bp_grad_F": [ + 0.09146469831466675, + 1.8705788988881977e-06, + 9.432087999527994e-09, + 9.323818161988129e-09, + 9.325629157785897e-09 + ], + "gamma_dfa": 0.0005754136018367717, + "gamma_dfa_per_layer": [ + 0.0005892712506465614, + 0.0018461447907611728, + 3.762807318707928e-05, + -0.00017138970724772662 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.031130790710449, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 47.66678237915039, + 36057328.0, + 41647260.0, + 45391196.0, + 47626604.0 + ], + "hidden_norms_avg": [ + 1141.7391357421875, + 25717830.0, + 31995718.0, + 36684084.0, + 43781820.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047832890413701534, + 3.149952798597866e-10, + 2.614737593109595e-10, + 2.6173804790197153e-10, + 2.6257329643897265e-10 + ], + "bp_grad_F": [ + 0.16335515677928925, + 1.6483251101817586e-06, + 9.493151154060797e-09, + 9.393547273361946e-09, + 9.338456230523207e-09 + ], + "gamma_dfa": 0.0005906115802645218, + "gamma_dfa_per_layer": [ + 0.0007219060207717121, + 0.0017734188586473465, + 3.73886723536998e-05, + -0.00017026723071467131 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0293946266174316, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 47.666595458984375, + 36029164.0, + 41621316.0, + 45328004.0, + 47606828.0 + ], + "hidden_norms_avg": [ + 1141.736328125, + 25716872.0, + 31991962.0, + 36680384.0, + 43781988.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004811616672668606, + 3.1537170097628575e-10, + 2.6223428983840336e-10, + 2.6155200227861997e-10, + 2.6258059615535956e-10 + ], + "bp_grad_F": [ + 0.0951727032661438, + 1.623439857212361e-06, + 9.415242807619961e-09, + 9.343901652414388e-09, + 9.342033813197759e-09 + ], + "gamma_dfa": 0.000660182828141842, + "gamma_dfa_per_layer": [ + 0.0009655870962888002, + 0.0018112185643985868, + 3.598399052862078e-05, + -0.00017205833864863962 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.029409408569336, + "epoch": 60 + } + ] +} \ No newline at end of file diff --git a/results/snapshot_vit_v1/snapshot_vit_s456.json b/results/snapshot_vit_v1/snapshot_vit_s456.json new file mode 100644 index 0000000..1b43b92 --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_vit_s456.json @@ -0,0 +1,4594 @@ +{ + "config": { + "output_dir": "results/snapshot_vit_v1", + "epochs": 60, + "lr": 0.001, + "wd": 0.05, + "seed": 456, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.3042769432067871, + 3.2273340225219727, + 4.6926493644714355, + 6.003997802734375, + 6.652705669403076 + ], + "hidden_norms_avg": [ + 6.027750492095947, + 7.1044697761535645, + 7.910475730895996, + 8.79189682006836, + 9.458833694458008 + ], + "bp_grad_per_sample_l2_med": [ + 0.005248428788036108, + 0.0012287507997825742, + 0.0010387187357991934, + 0.0009678652859292924, + 0.0009174557635560632 + ], + "bp_grad_F": [ + 0.248850479722023, + 0.0424945093691349, + 0.0348997563123703, + 0.03202275559306145, + 0.030239813029766083 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.0791015625, + "loss_eval": 2.544933319091797, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.47296053171157837, + 11.65749454498291, + 18.3483943939209, + 24.296405792236328, + 29.94684410095215 + ], + "hidden_norms_avg": [ + 4.04442834854126, + 9.927255630493164, + 14.762720108032227, + 19.817049026489258, + 24.69188690185547 + ], + "bp_grad_per_sample_l2_med": [ + 0.0025219416711479425, + 0.00024655580637045205, + 0.00017099862452596426, + 0.0001493149611633271, + 0.00015047143097035587 + ], + "bp_grad_F": [ + 0.11354690045118332, + 0.00995445717126131, + 0.006139951758086681, + 0.005140931811183691, + 0.005088545847684145 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.458984375, + "loss_eval": 1.4817876815795898, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.6174129843711853, + 12.388140678405762, + 20.656904220581055, + 27.073535919189453, + 32.43647003173828 + ], + "hidden_norms_avg": [ + 3.8196825981140137, + 10.982677459716797, + 17.020437240600586, + 22.471168518066406, + 27.064218521118164 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020673249382525682, + 0.0002501676499377936, + 0.00015905944746918976, + 0.00013718422269448638, + 0.0001328626531176269 + ], + "bp_grad_F": [ + 0.09556808322668076, + 0.01051106583327055, + 0.005822391714900732, + 0.004766201134771109, + 0.004577947780489922 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.498046875, + "loss_eval": 1.356250286102295, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.7216586470603943, + 12.527997016906738, + 19.815393447875977, + 26.452791213989258, + 30.71564483642578 + ], + "hidden_norms_avg": [ + 3.8907485008239746, + 11.261369705200195, + 16.61492156982422, + 21.57110023498535, + 24.978900909423828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0021546317730098963, + 0.00030062923906371, + 0.00018509272194933146, + 0.00013865686196368188, + 0.00012920796871185303 + ], + "bp_grad_F": [ + 0.10040326416492462, + 0.012564396485686302, + 0.007171053439378738, + 0.005316051654517651, + 0.004880763124674559 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5263671875, + "loss_eval": 1.2655537128448486, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.8026084899902344, + 12.023736953735352, + 20.35123062133789, + 26.937381744384766, + 31.122047424316406 + ], + "hidden_norms_avg": [ + 3.9065797328948975, + 11.544925689697266, + 17.131011962890625, + 22.292007446289062, + 25.61225128173828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019258656539022923, + 0.00027825392317026854, + 0.00017385024693794549, + 0.0001323536125710234, + 0.00012172113929409534 + ], + "bp_grad_F": [ + 0.09238748997449875, + 0.01207020040601492, + 0.007036368828266859, + 0.005208354443311691, + 0.0047498126514256 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5673828125, + "loss_eval": 1.1375834941864014, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.8784403204917908, + 11.689644813537598, + 20.318578720092773, + 27.47210121154785, + 30.616111755371094 + ], + "hidden_norms_avg": [ + 3.991969585418701, + 11.499222755432129, + 17.010013580322266, + 21.869060516357422, + 24.784456253051758 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017466156277805567, + 0.00030884172883816063, + 0.00018451173673383892, + 0.00013519970525521785, + 0.00011779358464991674 + ], + "bp_grad_F": [ + 0.0881652981042862, + 0.014197942800819874, + 0.008167672902345657, + 0.00570154283195734, + 0.0048713223077356815 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.078152060508728, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.9501535892486572, + 12.59860610961914, + 20.491111755371094, + 27.280519485473633, + 30.350204467773438 + ], + "hidden_norms_avg": [ + 4.104201793670654, + 12.098063468933105, + 17.173715591430664, + 21.416263580322266, + 24.0885066986084 + ], + "bp_grad_per_sample_l2_med": [ + 0.001603498705662787, + 0.0003018827992491424, + 0.00017963100981432945, + 0.00013513887824956328, + 0.00010907831892836839 + ], + "bp_grad_F": [ + 0.08621370792388916, + 0.01517424639314413, + 0.008794959634542465, + 0.006117440760135651, + 0.0050094337202608585 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.0198562145233154, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 1.000899076461792, + 12.766633987426758, + 21.096908569335938, + 28.377235412597656, + 31.630756378173828 + ], + "hidden_norms_avg": [ + 4.143934726715088, + 13.046825408935547, + 18.295841217041016, + 23.147098541259766, + 25.70033836364746 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015043691964820027, + 0.00027919537387788296, + 0.0001850408734753728, + 0.0001339056616416201, + 0.00011227549111936241 + ], + "bp_grad_F": [ + 0.07296615093946457, + 0.012746848165988922, + 0.00809843186289072, + 0.005660817492753267, + 0.00492064468562603 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6357421875, + "loss_eval": 1.0125277042388916, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 1.0544841289520264, + 10.223775863647461, + 18.59557342529297, + 26.47129249572754, + 29.77008819580078 + ], + "hidden_norms_avg": [ + 4.213057994842529, + 13.021050453186035, + 18.172080993652344, + 22.743032455444336, + 25.225244522094727 + ], + "bp_grad_per_sample_l2_med": [ + 0.001364147407002747, + 0.0002890345931518823, + 0.00017917664081323892, + 0.000133156034280546, + 0.00011372177687007934 + ], + "bp_grad_F": [ + 0.07409710437059402, + 0.015113108791410923, + 0.00921319704502821, + 0.006366679444909096, + 0.005320113617926836 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6376953125, + "loss_eval": 0.9630928039550781, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 1.1071640253067017, + 12.073644638061523, + 19.524917602539062, + 26.858781814575195, + 30.318849563598633 + ], + "hidden_norms_avg": [ + 4.280055522918701, + 13.520170211791992, + 18.620624542236328, + 22.658164978027344, + 25.25646209716797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012990576215088367, + 0.00027366873109713197, + 0.00016998387582134455, + 0.00012336595682427287, + 9.77109739324078e-05 + ], + "bp_grad_F": [ + 0.07662060856819153, + 0.015166237019002438, + 0.0096206646412611, + 0.006477049086242914, + 0.005294579081237316 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.654296875, + "loss_eval": 0.9390516877174377, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 1.1426520347595215, + 12.005794525146484, + 20.33642578125, + 27.80829429626465, + 31.22698974609375 + ], + "hidden_norms_avg": [ + 4.328567981719971, + 13.725446701049805, + 19.644866943359375, + 23.91346549987793, + 26.409910202026367 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012125002685934305, + 0.00027867915923707187, + 0.00017298922466579825, + 0.0001231397909577936, + 0.00010014672443503514 + ], + "bp_grad_F": [ + 0.06728038191795349, + 0.014830472879111767, + 0.008772061206400394, + 0.006222804542630911, + 0.00518346531316638 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6708984375, + "loss_eval": 0.8987849950790405, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 1.182861089706421, + 11.343650817871094, + 19.158103942871094, + 26.537256240844727, + 29.248126983642578 + ], + "hidden_norms_avg": [ + 4.343320846557617, + 13.940053939819336, + 19.19382667541504, + 23.443157196044922, + 25.7342529296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012841055868193507, + 0.00029811219428665936, + 0.00019176788919139653, + 0.0001351374085061252, + 0.00010611475590849295 + ], + "bp_grad_F": [ + 0.07373103499412537, + 0.015750709921121597, + 0.010071114636957645, + 0.007257349323481321, + 0.00578929902985692 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6708984375, + "loss_eval": 0.9137783646583557, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 1.2363859415054321, + 11.583894729614258, + 18.828346252441406, + 26.30917739868164, + 29.363861083984375 + ], + "hidden_norms_avg": [ + 4.441896915435791, + 13.568662643432617, + 18.774181365966797, + 22.73027801513672, + 24.84675407409668 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011289563262835145, + 0.00029387036920525134, + 0.0001886928512249142, + 0.00013024669897276908, + 9.712533210404217e-05 + ], + "bp_grad_F": [ + 0.06850193440914154, + 0.016727343201637268, + 0.010432050563395023, + 0.00744031835347414, + 0.0057919141836464405 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6865234375, + "loss_eval": 0.8655319809913635, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 1.276246428489685, + 11.161674499511719, + 18.18111801147461, + 24.498512268066406, + 28.472366333007812 + ], + "hidden_norms_avg": [ + 4.438092231750488, + 13.71449089050293, + 18.358896255493164, + 21.998794555664062, + 24.44672966003418 + ], + "bp_grad_per_sample_l2_med": [ + 0.001100392546504736, + 0.0002873367629945278, + 0.00018384194117970765, + 0.0001337265275651589, + 9.951705578714609e-05 + ], + "bp_grad_F": [ + 0.06749056279659271, + 0.01716373674571514, + 0.010762249119579792, + 0.007881316356360912, + 0.005892573855817318 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6982421875, + "loss_eval": 0.8163608908653259, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 1.3131792545318604, + 11.034884452819824, + 17.936412811279297, + 24.541194915771484, + 28.02472496032715 + ], + "hidden_norms_avg": [ + 4.504117012023926, + 13.86273193359375, + 18.456012725830078, + 22.296085357666016, + 24.57513427734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010489820269867778, + 0.0002784461830742657, + 0.00018129698582924902, + 0.00013628850865643471, + 0.00010334269609302282 + ], + "bp_grad_F": [ + 0.06553377211093903, + 0.016712775453925133, + 0.010981550440192223, + 0.007675213273614645, + 0.006061363499611616 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.69921875, + "loss_eval": 0.8088906407356262, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 1.3631325960159302, + 10.72367000579834, + 17.147600173950195, + 23.750171661376953, + 26.97018051147461 + ], + "hidden_norms_avg": [ + 4.5338335037231445, + 13.55031967163086, + 17.503305435180664, + 21.003847122192383, + 23.168630599975586 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010022176429629326, + 0.0002914569922722876, + 0.00018890199135057628, + 0.00013593978655990213, + 0.00010251985804643482 + ], + "bp_grad_F": [ + 0.06372744590044022, + 0.017576243728399277, + 0.011715950444340706, + 0.008481587283313274, + 0.006441249046474695 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.701171875, + "loss_eval": 0.815929651260376, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 1.3926054239273071, + 10.609240531921387, + 17.234729766845703, + 23.659292221069336, + 27.24931526184082 + ], + "hidden_norms_avg": [ + 4.513574600219727, + 13.48448371887207, + 17.66766929626465, + 21.098644256591797, + 23.213909149169922 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008784966776147485, + 0.0002452125190757215, + 0.0001629967155167833, + 0.00012193062138976529, + 8.820713992463425e-05 + ], + "bp_grad_F": [ + 0.06515656411647797, + 0.017664309591054916, + 0.011493389494717121, + 0.008405888453125954, + 0.006338838487863541 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.71875, + "loss_eval": 0.7755489349365234, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 1.4288005828857422, + 9.991934776306152, + 16.30902671813965, + 22.53181266784668, + 25.98328971862793 + ], + "hidden_norms_avg": [ + 4.606818199157715, + 13.761014938354492, + 18.061887741088867, + 21.805465698242188, + 23.856918334960938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008885160204954445, + 0.00026409278507344425, + 0.0001749310758896172, + 0.00012756467913277447, + 8.965048618847504e-05 + ], + "bp_grad_F": [ + 0.07283030450344086, + 0.01973560079932213, + 0.013354410417377949, + 0.009586230851709843, + 0.006897584535181522 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.693359375, + "loss_eval": 0.8082709908485413, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 1.4623849391937256, + 9.794211387634277, + 16.102649688720703, + 21.62982940673828, + 25.186201095581055 + ], + "hidden_norms_avg": [ + 4.6317901611328125, + 13.527764320373535, + 17.6087589263916, + 21.295202255249023, + 23.361501693725586 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008634055848233402, + 0.0002727442770265043, + 0.00018466924666427076, + 0.00013278424739837646, + 8.995016105473042e-05 + ], + "bp_grad_F": [ + 0.06913765519857407, + 0.02126000076532364, + 0.014007972553372383, + 0.010056250728666782, + 0.00732502993196249 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.720703125, + "loss_eval": 0.7786685824394226, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 1.4771180152893066, + 9.776408195495605, + 15.485087394714355, + 21.054513931274414, + 25.07387351989746 + ], + "hidden_norms_avg": [ + 4.570744514465332, + 13.13935375213623, + 16.70624351501465, + 20.002471923828125, + 22.400487899780273 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008809147984720767, + 0.00026235057157464325, + 0.0001801249454729259, + 0.0001285924663534388, + 8.227767830248922e-05 + ], + "bp_grad_F": [ + 0.07356031239032745, + 0.02142982743680477, + 0.014684871770441532, + 0.010477974079549313, + 0.007170504424721003 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7412109375, + "loss_eval": 0.7548146843910217, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 1.4932866096496582, + 9.586905479431152, + 15.190006256103516, + 20.53044891357422, + 23.871917724609375 + ], + "hidden_norms_avg": [ + 4.640237808227539, + 13.333914756774902, + 16.603134155273438, + 19.70735740661621, + 21.712968826293945 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008201555465348065, + 0.00025074987206608057, + 0.00018013773660641164, + 0.0001373633131152019, + 8.871335012372583e-05 + ], + "bp_grad_F": [ + 0.07453557848930359, + 0.02180560864508152, + 0.015117364004254341, + 0.010920760221779346, + 0.007648298051208258 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7294921875, + "loss_eval": 0.7338082790374756, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 1.5380369424819946, + 8.941458702087402, + 14.383026123046875, + 19.64396858215332, + 23.333805084228516 + ], + "hidden_norms_avg": [ + 4.57804012298584, + 12.777068138122559, + 15.852535247802734, + 19.008466720581055, + 21.123043060302734 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007403296767733991, + 0.00023140048142522573, + 0.0001578826195327565, + 0.00011260491737630218, + 7.754044054308906e-05 + ], + "bp_grad_F": [ + 0.07555028051137924, + 0.024111615493893623, + 0.01656532846391201, + 0.01178746297955513, + 0.007888367399573326 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.744140625, + "loss_eval": 0.7344021201133728, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 1.5561290979385376, + 9.454068183898926, + 14.400370597839355, + 19.253843307495117, + 22.27718734741211 + ], + "hidden_norms_avg": [ + 4.687749862670898, + 12.994861602783203, + 15.969095230102539, + 18.976381301879883, + 20.873851776123047 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008383935783058405, + 0.0002680755569599569, + 0.000193025975022465, + 0.00013935549941379577, + 9.83258432825096e-05 + ], + "bp_grad_F": [ + 0.06634547561407089, + 0.021603766828775406, + 0.01579204760491848, + 0.011702721007168293, + 0.008362310007214546 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.734375, + "loss_eval": 0.7299590110778809, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 1.5774884223937988, + 8.741745948791504, + 13.803518295288086, + 18.90570831298828, + 22.218149185180664 + ], + "hidden_norms_avg": [ + 4.594933032989502, + 12.66419506072998, + 15.714310646057129, + 19.085254669189453, + 21.135629653930664 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006682098028250039, + 0.00022848948719911277, + 0.00016414522542618215, + 0.0001115989507525228, + 7.056116737658158e-05 + ], + "bp_grad_F": [ + 0.07456765323877335, + 0.024261610582470894, + 0.01710386760532856, + 0.012147205881774426, + 0.008177526295185089 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.699420154094696, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 1.576693058013916, + 8.762345314025879, + 13.443113327026367, + 18.230920791625977, + 22.07720375061035 + ], + "hidden_norms_avg": [ + 4.667433738708496, + 12.606098175048828, + 15.544108390808105, + 18.674053192138672, + 20.65712547302246 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006520473980344832, + 0.00022687950695399195, + 0.0001629517209948972, + 0.00011739470210159197, + 7.377319707302377e-05 + ], + "bp_grad_F": [ + 0.08037886768579483, + 0.026545122265815735, + 0.0190938338637352, + 0.013439938426017761, + 0.00869175884872675 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7353515625, + "loss_eval": 0.733207106590271, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 1.5915056467056274, + 8.431538581848145, + 13.075739860534668, + 17.782840728759766, + 20.799991607666016 + ], + "hidden_norms_avg": [ + 4.626980304718018, + 12.152971267700195, + 14.936114311218262, + 18.13477325439453, + 19.853097915649414 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007118558278307319, + 0.00024262107035610825, + 0.0001753592659952119, + 0.00012127246736781672, + 7.87421886343509e-05 + ], + "bp_grad_F": [ + 0.0734892264008522, + 0.025602566078305244, + 0.018658706918358803, + 0.013666817918419838, + 0.009108936414122581 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7578125, + "loss_eval": 0.6893049478530884, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 1.589570164680481, + 8.064777374267578, + 12.609880447387695, + 17.195837020874023, + 20.27288818359375 + ], + "hidden_norms_avg": [ + 4.651576995849609, + 12.02392578125, + 14.5856351852417, + 17.578563690185547, + 19.327190399169922 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006660808576270938, + 0.0002373493480263278, + 0.0001695255923550576, + 0.00012064678594470024, + 7.89113255450502e-05 + ], + "bp_grad_F": [ + 0.08072065562009811, + 0.02827218733727932, + 0.020335549488663673, + 0.014427169226109982, + 0.009556911885738373 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.755859375, + "loss_eval": 0.7047942876815796, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 1.6077263355255127, + 7.734760284423828, + 11.882841110229492, + 15.991426467895508, + 19.111549377441406 + ], + "hidden_norms_avg": [ + 4.672310829162598, + 11.994673728942871, + 14.48837661743164, + 16.922487258911133, + 18.498437881469727 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005716760642826557, + 0.00020494087948463857, + 0.0001548439176985994, + 0.00011144367454107851, + 6.537805165862665e-05 + ], + "bp_grad_F": [ + 0.08237622678279877, + 0.03036416694521904, + 0.022357620298862457, + 0.01651921682059765, + 0.010484294034540653 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7548828125, + "loss_eval": 0.6863161325454712, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 1.6167913675308228, + 7.661223411560059, + 11.857555389404297, + 16.11384391784668, + 19.207155227661133 + ], + "hidden_norms_avg": [ + 4.6568603515625, + 11.916447639465332, + 14.127670288085938, + 16.765464782714844, + 18.548715591430664 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006015675025992095, + 0.00022187062131706625, + 0.00015665855607949197, + 0.00011372221342753619, + 6.673130701528862e-05 + ], + "bp_grad_F": [ + 0.08522997796535492, + 0.03222256526350975, + 0.023626696318387985, + 0.01693013124167919, + 0.010611210018396378 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.75390625, + "loss_eval": 0.6998279094696045, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 1.6032800674438477, + 7.3315229415893555, + 11.458590507507324, + 15.827820777893066, + 19.03597640991211 + ], + "hidden_norms_avg": [ + 4.592748641967773, + 11.431793212890625, + 13.694733619689941, + 16.380725860595703, + 17.913341522216797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006015695980750024, + 0.00023376141325570643, + 0.00015724304830655456, + 0.00010976113844662905, + 6.412796210497618e-05 + ], + "bp_grad_F": [ + 0.09064542502164841, + 0.03456525132060051, + 0.02491987682878971, + 0.01721413992345333, + 0.010797572322189808 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7734375, + "loss_eval": 0.6845672130584717, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 1.6067036390304565, + 7.343894004821777, + 11.072548866271973, + 15.027584075927734, + 17.731834411621094 + ], + "hidden_norms_avg": [ + 4.656601428985596, + 11.393535614013672, + 13.465471267700195, + 15.975980758666992, + 17.53518295288086 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005384382093325257, + 0.00021189975086599588, + 0.0001552984758745879, + 0.00010658086830517277, + 6.326750008156523e-05 + ], + "bp_grad_F": [ + 0.08886278420686722, + 0.03500310331583023, + 0.025932280346751213, + 0.018638672307133675, + 0.011571940965950489 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7666015625, + "loss_eval": 0.6816176772117615, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 1.6034201383590698, + 7.28795051574707, + 10.777915000915527, + 14.885525703430176, + 17.61635398864746 + ], + "hidden_norms_avg": [ + 4.614856719970703, + 11.156272888183594, + 13.103291511535645, + 15.514464378356934, + 16.799636840820312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005928887985646725, + 0.0002398774668108672, + 0.00018353872292209417, + 0.00012629387492779642, + 8.196983981179073e-05 + ], + "bp_grad_F": [ + 0.09026212245225906, + 0.03624382242560387, + 0.027555860579013824, + 0.019604889675974846, + 0.012266743928194046 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7578125, + "loss_eval": 0.6996170878410339, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 1.611714243888855, + 7.183743953704834, + 10.724074363708496, + 14.5570650100708, + 17.022544860839844 + ], + "hidden_norms_avg": [ + 4.623075485229492, + 11.19589614868164, + 13.009132385253906, + 15.365489959716797, + 16.62962532043457 + ], + "bp_grad_per_sample_l2_med": [ + 0.00036223753704689443, + 0.00014417112106457353, + 0.00010984936670865864, + 8.023829286685213e-05, + 4.624977009370923e-05 + ], + "bp_grad_F": [ + 0.09605100005865097, + 0.03848516568541527, + 0.029046298936009407, + 0.021008647978305817, + 0.012804670259356499 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7666015625, + "loss_eval": 0.6707476377487183, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 1.6100214719772339, + 6.872183322906494, + 10.294036865234375, + 14.205705642700195, + 17.145418167114258 + ], + "hidden_norms_avg": [ + 4.6112518310546875, + 11.086106300354004, + 12.928976058959961, + 15.350056648254395, + 16.69057846069336 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041789902024902403, + 0.00017518684035167098, + 0.0001297849084949121, + 8.867425640346482e-05, + 4.886053648078814e-05 + ], + "bp_grad_F": [ + 0.10439282655715942, + 0.04290134832262993, + 0.03223341330885887, + 0.02269606664776802, + 0.013486144132912159 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.759765625, + "loss_eval": 0.7303465604782104, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 1.5996708869934082, + 6.756699085235596, + 9.930717468261719, + 13.55428695678711, + 16.25560188293457 + ], + "hidden_norms_avg": [ + 4.561036109924316, + 10.72261905670166, + 12.331817626953125, + 14.622406005859375, + 16.10407829284668 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004882134380750358, + 0.0002138838026439771, + 0.00016901774506550282, + 0.0001125320850405842, + 6.579834007425234e-05 + ], + "bp_grad_F": [ + 0.10555483400821686, + 0.043922487646341324, + 0.03336327522993088, + 0.02399253286421299, + 0.013897648081183434 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7744140625, + "loss_eval": 0.71100252866745, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 1.5904232263565063, + 6.662050247192383, + 9.66409683227539, + 13.113885879516602, + 15.527644157409668 + ], + "hidden_norms_avg": [ + 4.5454936027526855, + 10.621905326843262, + 12.306397438049316, + 14.576898574829102, + 15.954529762268066 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004819612659048289, + 0.00020982844580430537, + 0.00015760491078253835, + 0.00010895934246946126, + 5.958566543995403e-05 + ], + "bp_grad_F": [ + 0.10991083830595016, + 0.047212228178977966, + 0.03634340688586235, + 0.02575613744556904, + 0.014786512590944767 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7705078125, + "loss_eval": 0.7015272378921509, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 1.5926766395568848, + 6.752022743225098, + 9.809683799743652, + 13.14870548248291, + 15.66618537902832 + ], + "hidden_norms_avg": [ + 4.554390907287598, + 10.59433650970459, + 12.38070011138916, + 14.597192764282227, + 15.870081901550293 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043442551395855844, + 0.0001767174544511363, + 0.0001353291590930894, + 9.88640749710612e-05, + 5.115106250741519e-05 + ], + "bp_grad_F": [ + 0.11412353813648224, + 0.04936130344867706, + 0.03786878660321236, + 0.027230119332671165, + 0.015144454315304756 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7734375, + "loss_eval": 0.7246569395065308, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 1.5873360633850098, + 6.424077987670898, + 9.43139934539795, + 12.677597999572754, + 15.172491073608398 + ], + "hidden_norms_avg": [ + 4.4964070320129395, + 10.287262916564941, + 11.751147270202637, + 13.867583274841309, + 15.24795150756836 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004166838189121336, + 0.0001985515555134043, + 0.00014922211994417012, + 0.0001073441599146463, + 5.765057721873745e-05 + ], + "bp_grad_F": [ + 0.11522030830383301, + 0.05126715078949928, + 0.039791759103536606, + 0.028239542618393898, + 0.015849631279706955 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.76953125, + "loss_eval": 0.7268451452255249, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 1.5890607833862305, + 6.295929431915283, + 9.119135856628418, + 12.20608901977539, + 14.642122268676758 + ], + "hidden_norms_avg": [ + 4.5021796226501465, + 10.095436096191406, + 11.7933988571167, + 13.924290657043457, + 15.25149917602539 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004105751868337393, + 0.00017681249300949275, + 0.00014306302182376385, + 9.77686358965002e-05, + 5.147796036908403e-05 + ], + "bp_grad_F": [ + 0.12662801146507263, + 0.057947222143411636, + 0.044759348034858704, + 0.03212600201368332, + 0.017064588144421577 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7587890625, + "loss_eval": 0.7464388012886047, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 1.5761758089065552, + 6.18004846572876, + 9.069403648376465, + 12.180702209472656, + 14.516327857971191 + ], + "hidden_norms_avg": [ + 4.492326736450195, + 9.971968650817871, + 11.50478744506836, + 13.5086669921875, + 14.760706901550293 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003273288893979043, + 0.00015071693633217365, + 0.00011665018246276304, + 8.30927092465572e-05, + 4.371673639980145e-05 + ], + "bp_grad_F": [ + 0.1212363913655281, + 0.055609479546546936, + 0.04309426248073578, + 0.0311796423047781, + 0.016882745549082756 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.7176246643066406, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 1.5679142475128174, + 6.109372615814209, + 8.818140029907227, + 11.853668212890625, + 14.200343132019043 + ], + "hidden_norms_avg": [ + 4.478363037109375, + 9.777668952941895, + 11.217857360839844, + 13.170299530029297, + 14.35566520690918 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003435175749473274, + 0.00015563883061986417, + 0.00011927648301934823, + 8.298752072732896e-05, + 4.157157673034817e-05 + ], + "bp_grad_F": [ + 0.13136376440525055, + 0.06076597049832344, + 0.046719472855329514, + 0.033368490636348724, + 0.01777712069451809 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78125, + "loss_eval": 0.7149413228034973, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 1.5576080083847046, + 6.149768829345703, + 8.711091041564941, + 11.498035430908203, + 13.903903007507324 + ], + "hidden_norms_avg": [ + 4.435859680175781, + 9.742182731628418, + 10.966800689697266, + 12.826833724975586, + 13.987249374389648 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002820935333147645, + 0.00013546310947276652, + 0.00010691316856537014, + 7.935341272968799e-05, + 4.027710747322999e-05 + ], + "bp_grad_F": [ + 0.1424364149570465, + 0.0660286620259285, + 0.05190045386552811, + 0.037452246993780136, + 0.019488148391246796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.759765625, + "loss_eval": 0.7794969081878662, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 1.55929696559906, + 6.027406215667725, + 8.56254768371582, + 11.315313339233398, + 13.816405296325684 + ], + "hidden_norms_avg": [ + 4.444095611572266, + 9.598461151123047, + 11.017721176147461, + 12.939472198486328, + 14.150469779968262 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028881963226012886, + 0.00014081982953939587, + 0.00010864014620892704, + 7.903494406491518e-05, + 3.460505831753835e-05 + ], + "bp_grad_F": [ + 0.14435029029846191, + 0.06792720407247543, + 0.05288391932845116, + 0.03809889778494835, + 0.0192741546779871 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.7500836253166199, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 1.5569288730621338, + 5.83992338180542, + 8.285759925842285, + 11.15902328491211, + 13.44404125213623 + ], + "hidden_norms_avg": [ + 4.416918754577637, + 9.525116920471191, + 10.900503158569336, + 12.753186225891113, + 13.810358047485352 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003584402147680521, + 0.00016757070261519402, + 0.000135006892378442, + 8.858168439473957e-05, + 4.690655987360515e-05 + ], + "bp_grad_F": [ + 0.14751866459846497, + 0.07057010382413864, + 0.05518123507499695, + 0.039941366761922836, + 0.019994540140032768 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.783203125, + "loss_eval": 0.7740926146507263, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 1.5507482290267944, + 5.7182297706604, + 8.143424034118652, + 10.900334358215332, + 13.179159164428711 + ], + "hidden_norms_avg": [ + 4.415921688079834, + 9.42380142211914, + 10.672327995300293, + 12.439417839050293, + 13.481410026550293 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002743537479545921, + 0.00013802653120364994, + 0.00010440178448334336, + 7.395831926260144e-05, + 3.546295192791149e-05 + ], + "bp_grad_F": [ + 0.15799099206924438, + 0.0763181671500206, + 0.060047682374715805, + 0.043460771441459656, + 0.02125636488199234 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78125, + "loss_eval": 0.7693630456924438, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 1.5424573421478271, + 5.688177585601807, + 7.995815753936768, + 10.642090797424316, + 12.71364688873291 + ], + "hidden_norms_avg": [ + 4.399099349975586, + 9.228434562683105, + 10.541167259216309, + 12.30521297454834, + 13.311983108520508 + ], + "bp_grad_per_sample_l2_med": [ + 0.00024789522285573184, + 0.0001290303043788299, + 9.614775626687333e-05, + 6.680067599518225e-05, + 3.041914533241652e-05 + ], + "bp_grad_F": [ + 0.16617916524410248, + 0.08274275809526443, + 0.06457101553678513, + 0.04608331620693207, + 0.02214660868048668 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.77734375, + "loss_eval": 0.7963705062866211, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 1.5373201370239258, + 5.651702880859375, + 7.870075702667236, + 10.383352279663086, + 12.742950439453125 + ], + "hidden_norms_avg": [ + 4.359274387359619, + 9.120989799499512, + 10.328361511230469, + 11.979691505432129, + 13.047332763671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020789829432033002, + 0.00010236673551844433, + 8.31241559353657e-05, + 5.5589163821423426e-05, + 2.5046059818123467e-05 + ], + "bp_grad_F": [ + 0.1711728274822235, + 0.08452030271291733, + 0.06641850620508194, + 0.048034753650426865, + 0.022233933210372925 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796875, + "loss_eval": 0.787158727645874, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 1.534119725227356, + 5.64213752746582, + 7.87826681137085, + 10.351583480834961, + 12.802285194396973 + ], + "hidden_norms_avg": [ + 4.381091594696045, + 9.210761070251465, + 10.374320030212402, + 12.017292976379395, + 13.094472885131836 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020434240286704153, + 9.69645261648111e-05, + 7.39863608032465e-05, + 5.592328670900315e-05, + 2.489626240276266e-05 + ], + "bp_grad_F": [ + 0.17339713871479034, + 0.08632633090019226, + 0.06861955672502518, + 0.05006933584809303, + 0.022428762167692184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7919921875, + "loss_eval": 0.7851632833480835, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 1.5289297103881836, + 5.52672004699707, + 7.675796985626221, + 10.204718589782715, + 12.873387336730957 + ], + "hidden_norms_avg": [ + 4.3382954597473145, + 8.994754791259766, + 10.112909317016602, + 11.741432189941406, + 12.863862037658691 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001689869095571339, + 8.723067730898038e-05, + 6.962454062886536e-05, + 4.9918842705665156e-05, + 2.0077559383935295e-05 + ], + "bp_grad_F": [ + 0.1893138736486435, + 0.09529414772987366, + 0.07472710311412811, + 0.053626082837581635, + 0.023708311840891838 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7802734375, + "loss_eval": 0.8306612968444824, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 1.5282790660858154, + 5.412533760070801, + 7.559310436248779, + 10.040712356567383, + 12.344849586486816 + ], + "hidden_norms_avg": [ + 4.344850063323975, + 8.943357467651367, + 10.036619186401367, + 11.63318157196045, + 12.690427780151367 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015994974819477648, + 8.589095523348078e-05, + 6.632162694586441e-05, + 4.7776728024473414e-05, + 1.923311901919078e-05 + ], + "bp_grad_F": [ + 0.19004860520362854, + 0.09673094749450684, + 0.07585947215557098, + 0.05484768748283386, + 0.02464146539568901 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7880859375, + "loss_eval": 0.8193543553352356, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 1.5247719287872314, + 5.414742469787598, + 7.496610164642334, + 9.884673118591309, + 12.301740646362305 + ], + "hidden_norms_avg": [ + 4.334397792816162, + 8.873777389526367, + 9.937097549438477, + 11.524014472961426, + 12.564128875732422 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016137116472236812, + 8.459146192763001e-05, + 7.113611354725435e-05, + 4.750298467115499e-05, + 1.9900418919860385e-05 + ], + "bp_grad_F": [ + 0.1871533840894699, + 0.09687218815088272, + 0.0768747329711914, + 0.05509059876203537, + 0.024593451991677284 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.80078125, + "loss_eval": 0.810278058052063, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 1.5175530910491943, + 5.423762798309326, + 7.493518352508545, + 9.848480224609375, + 12.152653694152832 + ], + "hidden_norms_avg": [ + 4.333771228790283, + 8.846830368041992, + 9.895172119140625, + 11.470880508422852, + 12.51230239868164 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018688049749471247, + 9.502686589257792e-05, + 7.833576091798022e-05, + 5.505367516889237e-05, + 2.1109613953740336e-05 + ], + "bp_grad_F": [ + 0.19925038516521454, + 0.10273440927267075, + 0.08146088570356369, + 0.05800405889749527, + 0.025326546281576157 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.79296875, + "loss_eval": 0.8315975069999695, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 1.5154390335083008, + 5.332769870758057, + 7.351593971252441, + 9.726226806640625, + 12.217824935913086 + ], + "hidden_norms_avg": [ + 4.312089443206787, + 8.77189826965332, + 9.80828857421875, + 11.376079559326172, + 12.424320220947266 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001625730947125703, + 8.300685294670984e-05, + 6.064521585358307e-05, + 4.498598718782887e-05, + 1.878884904726874e-05 + ], + "bp_grad_F": [ + 0.20003639161586761, + 0.10495735704898834, + 0.08297032862901688, + 0.059033025056123734, + 0.02547283098101616 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8281288146972656, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 1.5136713981628418, + 5.367674827575684, + 7.355134963989258, + 9.682082176208496, + 12.047696113586426 + ], + "hidden_norms_avg": [ + 4.316784381866455, + 8.783827781677246, + 9.812792778015137, + 11.395760536193848, + 12.420063018798828 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016071743448264897, + 7.887884567026049e-05, + 6.097723598941229e-05, + 4.243743751430884e-05, + 1.8102018657373264e-05 + ], + "bp_grad_F": [ + 0.20199808478355408, + 0.10541712492704391, + 0.0835103914141655, + 0.05967256799340248, + 0.025771932676434517 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8389135599136353, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 1.5129119157791138, + 5.326069355010986, + 7.275172233581543, + 9.633310317993164, + 12.064473152160645 + ], + "hidden_norms_avg": [ + 4.308472633361816, + 8.717856407165527, + 9.717677116394043, + 11.28734016418457, + 12.3176851272583 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015608215471729636, + 8.108095789793879e-05, + 6.294465129030868e-05, + 4.2116138502024114e-05, + 1.7733293134369887e-05 + ], + "bp_grad_F": [ + 0.20727074146270752, + 0.10958535224199295, + 0.08667060732841492, + 0.06113011762499809, + 0.026037005707621574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.787109375, + "loss_eval": 0.8504288792610168, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 1.5120813846588135, + 5.313214302062988, + 7.253427982330322, + 9.583664894104004, + 12.01283073425293 + ], + "hidden_norms_avg": [ + 4.303354263305664, + 8.709893226623535, + 9.714727401733398, + 11.287162780761719, + 12.301621437072754 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014261712203733623, + 8.006545249372721e-05, + 6.104232306824997e-05, + 4.1361305193277076e-05, + 1.670202073000837e-05 + ], + "bp_grad_F": [ + 0.20587928593158722, + 0.10970292240381241, + 0.0869779959321022, + 0.06163511052727699, + 0.02630491554737091 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7919921875, + "loss_eval": 0.8500803709030151, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 1.5113301277160645, + 5.33270263671875, + 7.255039215087891, + 9.560588836669922, + 11.935233116149902 + ], + "hidden_norms_avg": [ + 4.311485767364502, + 8.737537384033203, + 9.710383415222168, + 11.27385425567627, + 12.309149742126465 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014448253205046058, + 7.629570609424263e-05, + 6.040706284693442e-05, + 4.236707536620088e-05, + 1.7641770682530478e-05 + ], + "bp_grad_F": [ + 0.20638784766197205, + 0.10957971960306168, + 0.08719436824321747, + 0.06181200593709946, + 0.026369713246822357 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8525989055633545, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 1.5115892887115479, + 5.313480377197266, + 7.247244834899902, + 9.550230979919434, + 11.989883422851562 + ], + "hidden_norms_avg": [ + 4.3022141456604, + 8.688987731933594, + 9.685582160949707, + 11.234566688537598, + 12.270132064819336 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001483379164710641, + 7.948598067741841e-05, + 6.1946535424795e-05, + 4.4680935388896614e-05, + 1.6852744010975584e-05 + ], + "bp_grad_F": [ + 0.21088635921478271, + 0.11181779950857162, + 0.08855349570512772, + 0.06269123405218124, + 0.026410162448883057 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8474454879760742, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 1.5110703706741333, + 5.306856632232666, + 7.230412483215332, + 9.542105674743652, + 11.942556381225586 + ], + "hidden_norms_avg": [ + 4.305404186248779, + 8.697504997253418, + 9.679413795471191, + 11.226194381713867, + 12.25047492980957 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014003549586050212, + 7.460260530933738e-05, + 6.204132660059258e-05, + 3.912465035682544e-05, + 1.6441039406345226e-05 + ], + "bp_grad_F": [ + 0.20991134643554688, + 0.11143218725919724, + 0.08832813799381256, + 0.06269684433937073, + 0.026480402797460556 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.8496487140655518, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 1.5111491680145264, + 5.304075717926025, + 7.234795093536377, + 9.53318977355957, + 11.964473724365234 + ], + "hidden_norms_avg": [ + 4.304405689239502, + 8.697833061218262, + 9.683843612670898, + 11.22890853881836, + 12.259684562683105 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014237761206459254, + 7.472094148397446e-05, + 5.683211929863319e-05, + 4.049929339089431e-05, + 1.4964447473175824e-05 + ], + "bp_grad_F": [ + 0.21009324491024017, + 0.11155029386281967, + 0.08846566081047058, + 0.06290413439273834, + 0.026488499715924263 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.8498167395591736, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 1.5111573934555054, + 5.304897785186768, + 7.23397970199585, + 9.53254508972168, + 11.969621658325195 + ], + "hidden_norms_avg": [ + 4.304327964782715, + 8.696623802185059, + 9.681411743164062, + 11.225934982299805, + 12.255182266235352 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001376860454911366, + 7.4876043072436e-05, + 5.8659916248871014e-05, + 4.048796836286783e-05, + 1.5446972611243837e-05 + ], + "bp_grad_F": [ + 0.210032656788826, + 0.11159469932317734, + 0.08847951143980026, + 0.06288634985685349, + 0.02649829164147377 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.8496516942977905, + "epoch": 60 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.3042769432067871, + 3.2273340225219727, + 4.6926493644714355, + 6.003997802734375, + 6.652705669403076 + ], + "hidden_norms_avg": [ + 6.027750492095947, + 7.1044697761535645, + 7.910475730895996, + 8.79189682006836, + 9.458833694458008 + ], + "bp_grad_per_sample_l2_med": [ + 0.005248428788036108, + 0.0012287507997825742, + 0.0010387187357991934, + 0.0009678652859292924, + 0.0009174557635560632 + ], + "bp_grad_F": [ + 0.248850479722023, + 0.0424945093691349, + 0.0348997563123703, + 0.03202275559306145, + 0.030239813029766083 + ], + "gamma_dfa": -0.0027123973850393668, + "gamma_dfa_per_layer": [ + -0.0010305923642590642, + -0.01111956313252449, + 0.0014823779929429293, + -0.00018181203631684184 + ], + "acc_eval": 0.0791015625, + "loss_eval": 2.544933319091797, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.8898234367370605, + 1755.5985107421875, + 3812.865966796875, + 4063.967529296875, + 6749.62646484375 + ], + "hidden_norms_avg": [ + 48.02373504638672, + 2610.970458984375, + 7442.5693359375, + 13001.9443359375, + 19569.59765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006367825553752482, + 1.061867237694969e-06, + 9.113553005590802e-07, + 8.042399599617056e-07, + 7.901451226643985e-07 + ], + "bp_grad_F": [ + 0.11358296871185303, + 5.570299981627613e-05, + 4.605366484611295e-05, + 3.752685370272957e-05, + 3.027659113286063e-05 + ], + "gamma_dfa": 0.007312511210329831, + "gamma_dfa_per_layer": [ + 0.01007317565381527, + 0.008024577051401138, + 0.008248038589954376, + 0.0029042535461485386 + ], + "acc_eval": 0.2333984375, + "loss_eval": 2.0879125595092773, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 3.704786777496338, + 7219.806640625, + 19592.4140625, + 21808.44921875, + 46117.11328125 + ], + "hidden_norms_avg": [ + 97.33866882324219, + 9787.240234375, + 35216.66015625, + 64377.67578125, + 97116.8125 + ], + "bp_grad_per_sample_l2_med": [ + 9.637367475079373e-05, + 1.6794896851024532e-07, + 1.5954641696680483e-07, + 1.4061814113119908e-07, + 1.445507677999558e-07 + ], + "bp_grad_F": [ + 0.04642009362578392, + 2.128358573827427e-05, + 2.0123250578762963e-05, + 6.922710781509522e-06, + 6.6381039687257726e-06 + ], + "gamma_dfa": 0.007922766148112714, + "gamma_dfa_per_layer": [ + 0.016379408538341522, + 0.005931380204856396, + 0.007020577322691679, + 0.0023596985265612602 + ], + "acc_eval": 0.205078125, + "loss_eval": 2.1287283897399902, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 5.554904937744141, + 16081.3388671875, + 48028.96875, + 51717.93359375, + 100197.7265625 + ], + "hidden_norms_avg": [ + 147.4190216064453, + 22860.939453125, + 90670.5078125, + 172520.15625, + 247624.09375 + ], + "bp_grad_per_sample_l2_med": [ + 3.051399289688561e-05, + 9.248702070863146e-08, + 7.303499671706959e-08, + 6.487525183729304e-08, + 6.620962977876843e-08 + ], + "bp_grad_F": [ + 0.034720927476882935, + 1.6823112673591822e-05, + 1.1384844583517406e-05, + 3.0318508379423292e-06, + 2.624829903652426e-06 + ], + "gamma_dfa": 0.0067759081866825, + "gamma_dfa_per_layer": [ + 0.014651123434305191, + 0.004187515936791897, + 0.007594288792461157, + 0.0006707045831717551 + ], + "acc_eval": 0.20703125, + "loss_eval": 2.107574462890625, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 7.38655424118042, + 30113.763671875, + 92815.4375, + 102848.4453125, + 183389.40625 + ], + "hidden_norms_avg": [ + 194.20396423339844, + 39156.78515625, + 166144.453125, + 360300.25, + 500574.96875 + ], + "bp_grad_per_sample_l2_med": [ + 2.7757007046602666e-05, + 6.177719313882335e-08, + 4.3474216226968565e-08, + 3.8972562066419414e-08, + 3.9463689205376795e-08 + ], + "bp_grad_F": [ + 0.03289186581969261, + 5.563175363931805e-06, + 2.151713033526903e-06, + 1.463158696424216e-06, + 1.3795681752526434e-06 + ], + "gamma_dfa": 0.006396490931365406, + "gamma_dfa_per_layer": [ + 0.015158161520957947, + 0.0035972977057099342, + 0.006714952643960714, + 0.00011555185483302921 + ], + "acc_eval": 0.203125, + "loss_eval": 2.1379737854003906, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 9.15835189819336, + 53591.8984375, + 170615.734375, + 181427.171875, + 289063.5625 + ], + "hidden_norms_avg": [ + 238.28347778320312, + 61062.31640625, + 250187.6875, + 548101.3125, + 724058.1875 + ], + "bp_grad_per_sample_l2_med": [ + 2.960537312901579e-05, + 4.670241438020639e-08, + 3.080446120407032e-08, + 2.670985388419922e-08, + 2.6331489877406966e-08 + ], + "bp_grad_F": [ + 0.016260992735624313, + 4.766869551531272e-06, + 2.067620698653627e-06, + 9.787106591829797e-07, + 8.912123234949831e-07 + ], + "gamma_dfa": 0.0068261599517427385, + "gamma_dfa_per_layer": [ + 0.014116348698735237, + 0.003242844482883811, + 0.008411802351474762, + 0.0015336442738771439 + ], + "acc_eval": 0.1962890625, + "loss_eval": 2.1309733390808105, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 10.888343811035156, + 91755.1171875, + 249917.8125, + 274005.3125, + 444277.53125 + ], + "hidden_norms_avg": [ + 276.9202880859375, + 104021.7109375, + 349872.5, + 931915.875, + 1222273.75 + ], + "bp_grad_per_sample_l2_med": [ + 2.7342781322658993e-05, + 3.6854661544794e-08, + 2.4993127567540796e-08, + 1.8662358769461207e-08, + 1.7811659702715588e-08 + ], + "bp_grad_F": [ + 0.022468894720077515, + 3.493201802484691e-06, + 1.1520894531713566e-06, + 7.113425795068906e-07, + 6.108040793151304e-07 + ], + "gamma_dfa": 0.007193240569904447, + "gamma_dfa_per_layer": [ + 0.017048656940460205, + 0.002665129955857992, + 0.007390158250927925, + 0.001669017132371664 + ], + "acc_eval": 0.2109375, + "loss_eval": 2.1020355224609375, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 12.623483657836914, + 158915.890625, + 360070.6875, + 406906.3125, + 630641.3125 + ], + "hidden_norms_avg": [ + 315.0859680175781, + 172244.328125, + 490065.59375, + 1510240.375, + 1952914.5 + ], + "bp_grad_per_sample_l2_med": [ + 3.403881783015095e-05, + 2.7625405962794503e-08, + 1.651102543576144e-08, + 1.1742161909467086e-08, + 1.0927361238088906e-08 + ], + "bp_grad_F": [ + 0.024832597002387047, + 1.8080392010233481e-06, + 7.246239306368807e-07, + 4.936595132676302e-07, + 4.0145107504940825e-07 + ], + "gamma_dfa": 0.006596001767320558, + "gamma_dfa_per_layer": [ + 0.016851693391799927, + 0.001910479972139001, + 0.0058369822800159454, + 0.0017848514253273606 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.1312928199768066, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 14.368335723876953, + 243332.8125, + 525771.0, + 593291.75, + 875288.5 + ], + "hidden_norms_avg": [ + 351.16015625, + 247222.375, + 640658.75, + 1855662.75, + 2391194.25 + ], + "bp_grad_per_sample_l2_med": [ + 2.87416060018586e-05, + 1.8018790015617014e-08, + 1.2651691250198382e-08, + 9.33115984480537e-09, + 8.563736386690834e-09 + ], + "bp_grad_F": [ + 0.017871394753456116, + 9.426115070709784e-07, + 4.7217255882969766e-07, + 3.564711050785263e-07, + 3.2240865266430774e-07 + ], + "gamma_dfa": 0.006289168493822217, + "gamma_dfa_per_layer": [ + 0.013373943977057934, + 0.0037157258484512568, + 0.00672483816742897, + 0.001342165982350707 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.0829837322235107, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 16.041412353515625, + 385486.09375, + 776263.875, + 869037.0, + 1191002.25 + ], + "hidden_norms_avg": [ + 383.5213317871094, + 383708.40625, + 941498.0, + 2793651.25, + 3510556.5 + ], + "bp_grad_per_sample_l2_med": [ + 2.8917142117279582e-05, + 1.1363525231899985e-08, + 8.616331648170217e-09, + 5.602694308493028e-09, + 5.260086588521062e-09 + ], + "bp_grad_F": [ + 0.024791762232780457, + 6.833873840150773e-07, + 3.100701633229619e-07, + 2.26619619070334e-07, + 2.1342954426017968e-07 + ], + "gamma_dfa": 0.00652129843365401, + "gamma_dfa_per_layer": [ + 0.014406262896955013, + 0.004345592111349106, + 0.006529162637889385, + 0.0008041760884225368 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.1437277793884277, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 17.677919387817383, + 582942.5, + 1148260.75, + 1279834.25, + 1709270.625 + ], + "hidden_norms_avg": [ + 416.1814880371094, + 530246.375, + 1201761.5, + 2944394.0, + 3732565.75 + ], + "bp_grad_per_sample_l2_med": [ + 3.369058686075732e-05, + 6.623859238885643e-09, + 4.513381224313662e-09, + 3.933114278709127e-09, + 3.794405678547719e-09 + ], + "bp_grad_F": [ + 0.01620429754257202, + 3.022730652446626e-07, + 1.9097409165169665e-07, + 1.773983058228623e-07, + 1.593236333974346e-07 + ], + "gamma_dfa": 0.006082151841837913, + "gamma_dfa_per_layer": [ + 0.01578153669834137, + 0.002655572956427932, + 0.005509376525878906, + 0.00038212118670344353 + ], + "acc_eval": 0.197265625, + "loss_eval": 2.089698314666748, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 19.31073760986328, + 843820.0625, + 1587423.25, + 1759006.0, + 2222149.5 + ], + "hidden_norms_avg": [ + 448.93133544921875, + 796172.1875, + 1678321.375, + 3888912.0, + 4810418.0 + ], + "bp_grad_per_sample_l2_med": [ + 4.445635568117723e-05, + 3.5140981236025937e-09, + 2.8926525619255017e-09, + 2.65975419466713e-09, + 2.6499111793754082e-09 + ], + "bp_grad_F": [ + 0.020245229825377464, + 2.6993967594535206e-07, + 1.701987457636278e-07, + 1.3198047099649557e-07, + 1.2469256205349666e-07 + ], + "gamma_dfa": 0.005559869911849091, + "gamma_dfa_per_layer": [ + 0.015185668133199215, + 0.0025689376052469015, + 0.004468783736228943, + 1.6090172721305862e-05 + ], + "acc_eval": 0.2314453125, + "loss_eval": 2.0838193893432617, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 20.861183166503906, + 1157778.75, + 2054207.5, + 2289084.5, + 2841995.0 + ], + "hidden_norms_avg": [ + 479.8387145996094, + 981138.875, + 2112497.25, + 4439588.0, + 5517614.5 + ], + "bp_grad_per_sample_l2_med": [ + 3.176981772412546e-05, + 3.1782512177613853e-09, + 2.5456772245746606e-09, + 2.4393245201537184e-09, + 2.414718425214346e-09 + ], + "bp_grad_F": [ + 0.09368129819631577, + 9.166008680949744e-07, + 2.675243706562469e-07, + 1.0984689424731187e-07, + 1.0444787079677553e-07 + ], + "gamma_dfa": 0.004390636342577636, + "gamma_dfa_per_layer": [ + 0.011994147673249245, + 0.001997251994907856, + 0.003865728620439768, + -0.00029458291828632355 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0896079540252686, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 22.362810134887695, + 1504072.375, + 2527410.75, + 2870361.25, + 3557771.0 + ], + "hidden_norms_avg": [ + 510.81561279296875, + 1188843.375, + 2574796.25, + 5296089.0, + 6640932.5 + ], + "bp_grad_per_sample_l2_med": [ + 2.8154454412288032e-05, + 3.057065711686846e-09, + 2.121731013104977e-09, + 2.0999049166192663e-09, + 2.0892536589656174e-09 + ], + "bp_grad_F": [ + 0.011068353429436684, + 1.3467251847032458e-06, + 1.0581060649883511e-07, + 9.427417069218791e-08, + 9.197237460512042e-08 + ], + "gamma_dfa": 0.003989392673247494, + "gamma_dfa_per_layer": [ + 0.011822337284684181, + 0.001384879695251584, + 0.00329465395770967, + -0.0005443002446554601 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.077056407928467, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 23.812599182128906, + 1930070.0, + 2995981.75, + 3469627.0, + 4303896.0 + ], + "hidden_norms_avg": [ + 539.9255981445312, + 1589889.5, + 3066154.25, + 6015238.0, + 7540605.5 + ], + "bp_grad_per_sample_l2_med": [ + 3.170168929500505e-05, + 2.518652619798445e-09, + 1.924201020742089e-09, + 1.8520206479522017e-09, + 1.8417810609960839e-09 + ], + "bp_grad_F": [ + 0.032089244574308395, + 1.0142422297576559e-06, + 1.6566445992793888e-07, + 8.33219857554468e-08, + 7.640721122470495e-08 + ], + "gamma_dfa": 0.0029267592035466805, + "gamma_dfa_per_layer": [ + 0.008105762302875519, + 0.001629034522920847, + 0.0022919299080967903, + -0.000319689919706434 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0748229026794434, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 25.248563766479492, + 2452306.5, + 3664022.75, + 4168536.0, + 5106242.5 + ], + "hidden_norms_avg": [ + 570.19384765625, + 1965615.5, + 3710471.5, + 7372995.0, + 9239893.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.4190969270421192e-05, + 1.8390389211475622e-09, + 1.5613663695290825e-09, + 1.5359991056840272e-09, + 1.5388512686342892e-09 + ], + "bp_grad_F": [ + 0.015056902542710304, + 6.693913292110665e-06, + 1.241161982079575e-07, + 7.622224984515924e-08, + 6.743793790064956e-08 + ], + "gamma_dfa": 0.0022661721595795825, + "gamma_dfa_per_layer": [ + 0.006208081729710102, + 0.001149914925917983, + 0.0020575951784849167, + -0.0003509031957946718 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.0835204124450684, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 26.6426944732666, + 3107169.0, + 4381372.0, + 5027998.5, + 6065136.0 + ], + "hidden_norms_avg": [ + 596.7793579101562, + 2542559.0, + 4400625.5, + 8374831.5, + 10510773.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.787545781757217e-05, + 1.5701163702530607e-09, + 1.2841328000945396e-09, + 1.2669904014828148e-09, + 1.2700215323846464e-09 + ], + "bp_grad_F": [ + 0.006971500348299742, + 1.8619180991663598e-05, + 6.465826629664662e-08, + 5.84209978171657e-08, + 5.694714744208795e-08 + ], + "gamma_dfa": 0.0030232197314035147, + "gamma_dfa_per_layer": [ + 0.009539565071463585, + 0.0012945058988407254, + 0.0015697493217885494, + -0.0003109413664788008 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.058485507965088, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 27.95879364013672, + 3613966.25, + 5044349.0, + 5874924.0, + 7080756.0 + ], + "hidden_norms_avg": [ + 623.2052612304688, + 2844551.5, + 4942977.0, + 8742455.0, + 11094594.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8442762413760647e-05, + 1.629689605486817e-09, + 1.115437520127216e-09, + 1.0797144289753646e-09, + 1.0779978021346892e-09 + ], + "bp_grad_F": [ + 0.0072508929297327995, + 1.4132167507341364e-06, + 6.271753250075562e-08, + 4.991998281411725e-08, + 4.950436149897541e-08 + ], + "gamma_dfa": 0.001284227124415338, + "gamma_dfa_per_layer": [ + 0.00256139412522316, + 0.0014944188296794891, + 0.0013982560485601425, + -0.0003171605058014393 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0549392700195312, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 29.22184181213379, + 4211867.5, + 5636704.5, + 6891397.5, + 8559809.0 + ], + "hidden_norms_avg": [ + 647.4288330078125, + 3423908.25, + 5695376.5, + 10367815.0, + 13188250.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8086895326850936e-05, + 1.1501447572115353e-09, + 8.738501033889179e-10, + 8.528160400089746e-10, + 8.584906674435899e-10 + ], + "bp_grad_F": [ + 0.012267161160707474, + 1.591232035025314e-06, + 4.697067268466526e-08, + 4.271150899626264e-08, + 4.017679700041299e-08 + ], + "gamma_dfa": 0.0022953646985115483, + "gamma_dfa_per_layer": [ + 0.007007642649114132, + 0.0012370320037007332, + 0.0011846421984955668, + -0.0002478580572642386 + ], + "acc_eval": 0.228515625, + "loss_eval": 2.053128242492676, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 30.412078857421875, + 4986411.0, + 6504586.0, + 7889628.0, + 9783147.0 + ], + "hidden_norms_avg": [ + 670.3391723632812, + 3921667.0, + 6270645.0, + 10589857.0, + 13580617.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.768085505522322e-05, + 1.3132780418700918e-09, + 7.742924079678914e-10, + 7.418777814294231e-10, + 7.448673344789825e-10 + ], + "bp_grad_F": [ + 0.007575999945402145, + 1.7771724287740653e-06, + 5.529824420591467e-08, + 3.790939828718365e-08, + 3.6307092443621514e-08 + ], + "gamma_dfa": 0.0009071348831639625, + "gamma_dfa_per_layer": [ + 0.001273356145247817, + 0.001484773471020162, + 0.0010661636479198933, + -0.00019575373153202236 + ], + "acc_eval": 0.25390625, + "loss_eval": 2.0479414463043213, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 31.54771614074707, + 5502896.5, + 7070197.5, + 8994800.0, + 11604998.0 + ], + "hidden_norms_avg": [ + 692.4578247070312, + 4249610.0, + 6837255.0, + 11617683.0, + 15223152.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0367684303200804e-05, + 1.325711207478264e-09, + 6.525959217462685e-10, + 6.324714640904006e-10, + 6.32227936669949e-10 + ], + "bp_grad_F": [ + 0.0062190573662519455, + 1.129235442931531e-06, + 3.317861896334762e-08, + 3.131979653403505e-08, + 3.109861168582029e-08 + ], + "gamma_dfa": 0.0011510169642861001, + "gamma_dfa_per_layer": [ + 0.002568549243733287, + 0.0013005147920921445, + 0.0009535959688946605, + -0.00021859214757569134 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0359444618225098, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 32.638641357421875, + 6320697.0, + 7897073.5, + 10165307.0, + 13313912.0 + ], + "hidden_norms_avg": [ + 713.3525390625, + 4812640.5, + 7533297.5, + 12847435.0, + 16993420.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.871564695145935e-05, + 1.2221273992807369e-09, + 6.080098646776833e-10, + 5.917044632042234e-10, + 5.89539916884263e-10 + ], + "bp_grad_F": [ + 0.011915000155568123, + 6.25122083874885e-06, + 3.6603957198622084e-08, + 2.876341298474472e-08, + 2.8581927935533713e-08 + ], + "gamma_dfa": 0.0002986440376844257, + "gamma_dfa_per_layer": [ + -0.0004627959569916129, + 0.0009951044339686632, + 0.0008257199660874903, + -0.00016345229232683778 + ], + "acc_eval": 0.2626953125, + "loss_eval": 2.059875965118408, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 33.6330451965332, + 7264995.5, + 8758988.0, + 11785280.0, + 15874132.0 + ], + "hidden_norms_avg": [ + 732.8869018554688, + 5982206.0, + 8454064.0, + 14846262.0, + 19834080.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.5420635211048648e-05, + 7.56205986718328e-10, + 5.169706884800007e-10, + 5.026724592127607e-10, + 5.024383686880185e-10 + ], + "bp_grad_F": [ + 0.014803220517933369, + 4.478873961488716e-06, + 4.4555019229619575e-08, + 2.4910459472948787e-08, + 2.4745437698925343e-08 + ], + "gamma_dfa": 0.001046390665578656, + "gamma_dfa_per_layer": [ + 0.0027164756320416927, + 0.0009058329742401838, + 0.0007253356743603945, + -0.00016208161832764745 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0538365840911865, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 34.621524810791016, + 8089090.5, + 9671455.0, + 13086530.0, + 17616980.0 + ], + "hidden_norms_avg": [ + 751.2442016601562, + 6699752.5, + 9159771.0, + 15622865.0, + 21214146.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.7939373467233963e-05, + 7.656756340068682e-10, + 5.061054908495066e-10, + 4.837483191799663e-10, + 4.820439047925618e-10 + ], + "bp_grad_F": [ + 0.008210284635424614, + 3.91981393477181e-06, + 2.727725245676993e-08, + 2.349457695061119e-08, + 2.2768137597495297e-08 + ], + "gamma_dfa": 0.0013028495595790446, + "gamma_dfa_per_layer": [ + 0.0034610098227858543, + 0.0012297509238123894, + 0.0006837932160124183, + -0.00016315572429448366 + ], + "acc_eval": 0.2646484375, + "loss_eval": 2.0430214405059814, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 35.54478454589844, + 9145767.0, + 10558942.0, + 14636200.0, + 19721632.0 + ], + "hidden_norms_avg": [ + 768.5211791992188, + 7473006.0, + 10093548.0, + 17775052.0, + 24159262.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.364618532941677e-05, + 8.066202705769854e-10, + 4.5619852340195166e-10, + 4.4121445386124947e-10, + 4.323804370098827e-10 + ], + "bp_grad_F": [ + 0.09167197346687317, + 4.855019597016508e-06, + 2.689265521382822e-08, + 2.1627007740221416e-08, + 2.0867716443717654e-08 + ], + "gamma_dfa": 0.0001647558601689525, + "gamma_dfa_per_layer": [ + -0.0005364040262065828, + 0.0007433416321873665, + 0.0005910456529818475, + -0.00013895981828682125 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.0427517890930176, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 36.43881607055664, + 10216266.0, + 11478190.0, + 16476424.0, + 22393992.0 + ], + "hidden_norms_avg": [ + 785.1990966796875, + 8300483.0, + 10872433.0, + 18667924.0, + 25447926.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0938736017560586e-05, + 7.561202219896757e-10, + 4.2832748459176173e-10, + 4.0923736621678586e-10, + 4.0218126051705383e-10 + ], + "bp_grad_F": [ + 0.013463743962347507, + 1.9222785340389237e-05, + 2.2825457079989064e-08, + 1.9977358434175585e-08, + 1.9259800865256693e-08 + ], + "gamma_dfa": 0.0005702937960450072, + "gamma_dfa_per_layer": [ + 0.0011116554960608482, + 0.0007594762137159705, + 0.0005430461023934186, + -0.00013300262799020857 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0594615936279297, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 37.30263137817383, + 11623684.0, + 12776919.0, + 18306868.0, + 24740858.0 + ], + "hidden_norms_avg": [ + 800.9972534179688, + 9603253.0, + 12104963.0, + 20835068.0, + 28405318.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.261065648985095e-05, + 6.65525801135658e-10, + 3.838940831890625e-10, + 3.742672838313865e-10, + 3.7395189722566613e-10 + ], + "bp_grad_F": [ + 0.007853930816054344, + 1.2899076864414383e-06, + 1.9278010299217385e-08, + 1.8154999281705386e-08, + 1.7368931182204506e-08 + ], + "gamma_dfa": 0.00021361159815569408, + "gamma_dfa_per_layer": [ + -0.00034064118517562747, + 0.0008438127697445452, + 0.0004718025156762451, + -0.00012052770762238652 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0433781147003174, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 38.06776428222656, + 12599130.0, + 13703165.0, + 19834172.0, + 26867468.0 + ], + "hidden_norms_avg": [ + 816.2463989257812, + 10421772.0, + 12873138.0, + 21321398.0, + 29452538.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.774638414848596e-05, + 6.227232618449818e-10, + 3.566741624272396e-10, + 3.4781866276034634e-10, + 3.45437983773067e-10 + ], + "bp_grad_F": [ + 0.013920681551098824, + 3.4208371744171018e-06, + 2.1883508338760294e-08, + 1.7128741092165e-08, + 1.6603545205384762e-08 + ], + "gamma_dfa": 0.0008690126524015795, + "gamma_dfa_per_layer": [ + 0.0021882583387196064, + 0.0009064457844942808, + 0.0004841286572627723, + -0.00010278217087034136 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.0433974266052246, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 38.7847785949707, + 14429584.0, + 15438086.0, + 21566880.0, + 29267340.0 + ], + "hidden_norms_avg": [ + 830.9344482421875, + 11436777.0, + 13832175.0, + 22913616.0, + 32026754.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8682481570285745e-05, + 5.758302168423768e-10, + 3.3607527871737375e-10, + 3.304233830991876e-10, + 3.2846284026000205e-10 + ], + "bp_grad_F": [ + 0.012251574546098709, + 2.996052717207931e-05, + 2.7452134787608884e-08, + 1.577506480998636e-08, + 1.5141546683139495e-08 + ], + "gamma_dfa": 0.0004505918041104451, + "gamma_dfa_per_layer": [ + 0.00026967719895765185, + 0.001212525530718267, + 0.0004131481982767582, + -9.298371151089668e-05 + ], + "acc_eval": 0.2607421875, + "loss_eval": 2.039923667907715, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 39.49647521972656, + 15523604.0, + 16504434.0, + 23236370.0, + 31306890.0 + ], + "hidden_norms_avg": [ + 844.8562622070312, + 12856661.0, + 15124535.0, + 23633704.0, + 32995118.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.6219468054478057e-05, + 5.519696366640403e-10, + 3.2825916984613457e-10, + 3.235848811122821e-10, + 3.2190172749579915e-10 + ], + "bp_grad_F": [ + 0.012884745374321938, + 1.8329246813664213e-05, + 1.8323355277516384e-08, + 1.5584015855552025e-08, + 1.4755748622974352e-08 + ], + "gamma_dfa": 0.0006857650478195865, + "gamma_dfa_per_layer": [ + 0.0016966589028015733, + 0.0007126724813133478, + 0.0003994358121417463, + -6.570700497832149e-05 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.0533735752105713, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 40.16881561279297, + 16141660.0, + 17137856.0, + 24286464.0, + 32903152.0 + ], + "hidden_norms_avg": [ + 857.8116455078125, + 12895693.0, + 15492559.0, + 23745768.0, + 33843860.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.2289473892888054e-05, + 6.340856728570543e-10, + 3.264067627295475e-10, + 3.149370209065694e-10, + 3.097411216401724e-10 + ], + "bp_grad_F": [ + 0.006337009835988283, + 1.7065680367522873e-05, + 5.785592804841144e-08, + 1.519365788738014e-08, + 1.464850551968766e-08 + ], + "gamma_dfa": 0.0005419648223323748, + "gamma_dfa_per_layer": [ + 0.00038546844734810293, + 0.0014093497302383184, + 0.0004054713645018637, + -3.243025275878608e-05 + ], + "acc_eval": 0.265625, + "loss_eval": 2.0390102863311768, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 40.790164947509766, + 18768648.0, + 19610716.0, + 26926266.0, + 36060360.0 + ], + "hidden_norms_avg": [ + 869.6182861328125, + 15248417.0, + 17480158.0, + 26928640.0, + 37555876.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.939497062470764e-05, + 5.127394064885493e-10, + 3.1137872835707014e-10, + 3.074558663218596e-10, + 3.04990144250894e-10 + ], + "bp_grad_F": [ + 0.03832927718758583, + 8.881174835551064e-06, + 2.5206949416656244e-08, + 1.4185034480362901e-08, + 1.3504863893842867e-08 + ], + "gamma_dfa": 0.0005767397606177838, + "gamma_dfa_per_layer": [ + 0.00058704090770334, + 0.0013887862442061305, + 0.0003486467176117003, + -1.751482705003582e-05 + ], + "acc_eval": 0.232421875, + "loss_eval": 2.055915117263794, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 41.36415481567383, + 20590018.0, + 21418164.0, + 28674892.0, + 38102536.0 + ], + "hidden_norms_avg": [ + 880.8012084960938, + 15857472.0, + 18200580.0, + 27607590.0, + 38905496.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.6930878448183648e-05, + 5.041319584009329e-10, + 3.0716035270828e-10, + 2.9963459491355593e-10, + 2.9755845010193127e-10 + ], + "bp_grad_F": [ + 0.01052916795015335, + 1.7662874597590417e-05, + 1.8223250464188823e-08, + 1.4229329714510186e-08, + 1.2928855319671584e-08 + ], + "gamma_dfa": 0.0005623552362976625, + "gamma_dfa_per_layer": [ + 0.0005056762602180243, + 0.00140343327075243, + 0.0003372218052390963, + 3.0896089810994454e-06 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.054579734802246, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 41.9267578125, + 21995458.0, + 22701258.0, + 30227660.0, + 40381468.0 + ], + "hidden_norms_avg": [ + 891.6727294921875, + 17925388.0, + 19924592.0, + 29375846.0, + 41265952.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.4433691325830296e-05, + 4.786913088139499e-10, + 3.083476807219654e-10, + 3.030005690796145e-10, + 3.0202479406327143e-10 + ], + "bp_grad_F": [ + 0.006410651374608278, + 9.426087672181893e-06, + 1.748733602369157e-08, + 1.330249954634155e-08, + 1.2548162509062877e-08 + ], + "gamma_dfa": 0.0005204869294175296, + "gamma_dfa_per_layer": [ + 0.0004088875139132142, + 0.001322226831689477, + 0.00032363145146518946, + 2.7201920602237806e-05 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0504493713378906, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 42.43289566040039, + 23788478.0, + 24547006.0, + 32122702.0, + 42524392.0 + ], + "hidden_norms_avg": [ + 902.5420532226562, + 19126440.0, + 21210522.0, + 30872922.0, + 43207040.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8793765523005277e-05, + 4.69506655775831e-10, + 2.9882180063722785e-10, + 2.9027436010409247e-10, + 2.88086998700976e-10 + ], + "bp_grad_F": [ + 0.02046363614499569, + 1.535968840471469e-05, + 1.9181511490273806e-08, + 1.3211375105015577e-08, + 1.2052867148781843e-08 + ], + "gamma_dfa": 0.0005800028211524477, + "gamma_dfa_per_layer": [ + 0.0005789051647298038, + 0.001365642063319683, + 0.0003222030645702034, + 5.326099199010059e-05 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.056929349899292, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 42.88957595825195, + 24876160.0, + 25665632.0, + 33698024.0, + 44433192.0 + ], + "hidden_norms_avg": [ + 912.5694580078125, + 20388924.0, + 22492538.0, + 32293406.0, + 44758584.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.043079595954623e-05, + 4.6556239419182077e-10, + 3.0177585430557485e-10, + 2.9259758504984745e-10, + 2.8850585809259144e-10 + ], + "bp_grad_F": [ + 0.018651673570275307, + 8.0938043538481e-06, + 2.600621051840335e-08, + 1.3419185762586494e-08, + 1.200509913701353e-08 + ], + "gamma_dfa": 0.0008372370848519495, + "gamma_dfa_per_layer": [ + 0.001413366524502635, + 0.0015261531807482243, + 0.0003260627272538841, + 8.336590690305457e-05 + ], + "acc_eval": 0.2353515625, + "loss_eval": 2.060340404510498, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 43.32978057861328, + 25917158.0, + 26720118.0, + 34948196.0, + 46313048.0 + ], + "hidden_norms_avg": [ + 921.58642578125, + 21474648.0, + 23549474.0, + 33572188.0, + 46615396.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.262757672928274e-05, + 4.5062673037499223e-10, + 2.984587021970242e-10, + 2.923088993078693e-10, + 2.888300987269332e-10 + ], + "bp_grad_F": [ + 0.01846941001713276, + 2.4291131921927445e-05, + 2.994345393858566e-08, + 1.4564162320596097e-08, + 1.1765412644137996e-08 + ], + "gamma_dfa": 0.0007057133989292197, + "gamma_dfa_per_layer": [ + 0.0011925556464120746, + 0.0012432597577571869, + 0.0002897845406550914, + 9.725365089252591e-05 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.0591180324554443, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 43.74128341674805, + 27200966.0, + 27911578.0, + 36161972.0, + 47854788.0 + ], + "hidden_norms_avg": [ + 930.2008666992188, + 22529414.0, + 24601434.0, + 34829948.0, + 48238220.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.328157981741242e-05, + 4.659617691693541e-10, + 2.8960928100119077e-10, + 2.8687860420539835e-10, + 2.800103759970085e-10 + ], + "bp_grad_F": [ + 0.004556785803288221, + 9.644008059694897e-06, + 1.5685751364458156e-08, + 1.2929571191477862e-08, + 1.1707988356590704e-08 + ], + "gamma_dfa": 0.0005315981106832623, + "gamma_dfa_per_layer": [ + 0.0004304055473767221, + 0.0012520912569016218, + 0.0003118191962130368, + 0.0001320764422416687 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.049736738204956, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 44.10750198364258, + 28860724.0, + 29566448.0, + 37605440.0, + 49767188.0 + ], + "hidden_norms_avg": [ + 938.7098999023438, + 24297102.0, + 26192510.0, + 36561148.0, + 49957968.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.900460640375968e-05, + 4.445998014190877e-10, + 2.888302930159625e-10, + 2.855987946137617e-10, + 2.818917876901139e-10 + ], + "bp_grad_F": [ + 0.013354518450796604, + 6.135221156000625e-06, + 1.780158420672251e-08, + 1.3947193622243503e-08, + 1.161484952660885e-08 + ], + "gamma_dfa": 0.0005519518890650943, + "gamma_dfa_per_layer": [ + 0.0005505518638528883, + 0.001156628131866455, + 0.00033354441984556615, + 0.0001670831406954676 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.0527162551879883, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 44.42500305175781, + 30085758.0, + 30793664.0, + 39317268.0, + 51773680.0 + ], + "hidden_norms_avg": [ + 946.3699340820312, + 24723960.0, + 26763662.0, + 37607688.0, + 51575988.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9910466764704324e-05, + 4.753269444712771e-10, + 2.936461906966059e-10, + 2.873846438600225e-10, + 2.8520716344182517e-10 + ], + "bp_grad_F": [ + 0.00976789090782404, + 1.76885150722228e-05, + 1.7970489096796882e-08, + 1.3952313970833075e-08, + 1.130456972475713e-08 + ], + "gamma_dfa": 0.0009108289959840477, + "gamma_dfa_per_layer": [ + 0.0019160081865265965, + 0.0012680008076131344, + 0.00030145354685373604, + 0.00015785344294272363 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.0550765991210938, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 44.73127746582031, + 30730856.0, + 31431762.0, + 40187116.0, + 53148352.0 + ], + "hidden_norms_avg": [ + 953.6856079101562, + 24778752.0, + 27014248.0, + 38275640.0, + 52795456.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8919872420374304e-05, + 4.755910110176842e-10, + 2.84101492331601e-10, + 2.7933383384137755e-10, + 2.7627339305169585e-10 + ], + "bp_grad_F": [ + 0.009574169293045998, + 4.757252463605255e-05, + 1.5709005651842745e-08, + 1.3778580054690792e-08, + 1.1154800638735196e-08 + ], + "gamma_dfa": 0.0003838329284917563, + "gamma_dfa_per_layer": [ + -0.0004134870832785964, + 0.001480170525610447, + 0.0002943193248938769, + 0.00017432894674129784 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0383803844451904, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 44.999107360839844, + 32617970.0, + 33381886.0, + 41663220.0, + 54853168.0 + ], + "hidden_norms_avg": [ + 960.5386962890625, + 27910628.0, + 29647900.0, + 40418716.0, + 54716684.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9992028430569917e-05, + 4.221052118946744e-10, + 2.9753777219809763e-10, + 2.8370578109004896e-10, + 2.813366484222257e-10 + ], + "bp_grad_F": [ + 0.015446176752448082, + 3.8060017686802894e-05, + 5.211516906911129e-08, + 1.3235438522940512e-08, + 1.116207481999254e-08 + ], + "gamma_dfa": 0.0005705733274226077, + "gamma_dfa_per_layer": [ + 0.0006168894469738007, + 0.0011725829681381583, + 0.00029753358103334904, + 0.00019528731354512274 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0557656288146973, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 45.25053024291992, + 33936992.0, + 34621240.0, + 42946580.0, + 56031144.0 + ], + "hidden_norms_avg": [ + 966.2922973632812, + 28239400.0, + 30055502.0, + 41338012.0, + 56048388.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0256345780799165e-05, + 4.424338395647709e-10, + 2.9891861208497517e-10, + 2.8403482343897224e-10, + 2.798661857816853e-10 + ], + "bp_grad_F": [ + 0.006179355084896088, + 8.527667887392454e-06, + 2.116273023489157e-08, + 1.2261468285146293e-08, + 1.1058569171495947e-08 + ], + "gamma_dfa": 0.0009438929373573046, + "gamma_dfa_per_layer": [ + 0.00216879416257143, + 0.0010916339233517647, + 0.0003159396001137793, + 0.00019920406339224428 + ], + "acc_eval": 0.2470703125, + "loss_eval": 2.0517942905426025, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 45.481727600097656, + 34746476.0, + 35397348.0, + 43639664.0, + 57119836.0 + ], + "hidden_norms_avg": [ + 971.5364379882812, + 28891962.0, + 30705540.0, + 42078288.0, + 57065612.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9764614737359807e-05, + 4.5060349895820195e-10, + 3.0148228358228835e-10, + 2.912529661891483e-10, + 2.8715479993834947e-10 + ], + "bp_grad_F": [ + 0.02291245572268963, + 1.3926567589805927e-05, + 3.118159241921603e-08, + 2.1897225366274142e-08, + 1.1063916893760961e-08 + ], + "gamma_dfa": 0.00046937728620832786, + "gamma_dfa_per_layer": [ + -0.00010078266495838761, + 0.0014219002332538366, + 0.0003067174111492932, + 0.00024967416538856924 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.054462432861328, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 45.68215560913086, + 35169816.0, + 35827116.0, + 44266788.0, + 58219984.0 + ], + "hidden_norms_avg": [ + 976.61279296875, + 29302304.0, + 31207594.0, + 42541932.0, + 57918596.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.18697166221682e-05, + 4.4465031656670817e-10, + 3.0559865749069104e-10, + 2.891223926937414e-10, + 2.8127278284273416e-10 + ], + "bp_grad_F": [ + 0.02285478264093399, + 5.0576767534948885e-05, + 2.966898726697309e-08, + 1.374073210769211e-08, + 1.1011787037773502e-08 + ], + "gamma_dfa": 0.0006015256294631399, + "gamma_dfa_per_layer": [ + 0.0005435256171040237, + 0.0013653798960149288, + 0.000284912355709821, + 0.0002122846490237862 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0539493560791016, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 45.86240005493164, + 36071220.0, + 36702996.0, + 45105948.0, + 59117940.0 + ], + "hidden_norms_avg": [ + 980.9766845703125, + 29250424.0, + 31315982.0, + 42895240.0, + 58632240.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0838917155051604e-05, + 4.517226037670241e-10, + 3.037594897836726e-10, + 2.95300450758873e-10, + 2.8246391337027887e-10 + ], + "bp_grad_F": [ + 0.009441024623811245, + 2.5670700779301114e-05, + 2.221704953342396e-08, + 1.750507294673298e-08, + 1.1021731971538884e-08 + ], + "gamma_dfa": 0.00038505904376506805, + "gamma_dfa_per_layer": [ + -0.0006303560803644359, + 0.0016098625492304564, + 0.00032150247716344893, + 0.00023922722903080285 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0488905906677246, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 46.00979995727539, + 36876176.0, + 37547776.0, + 45586304.0, + 59641656.0 + ], + "hidden_norms_avg": [ + 984.9158935546875, + 29720264.0, + 31840778.0, + 43341952.0, + 59202960.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8270042093936354e-05, + 4.981586254615422e-10, + 3.011032534416813e-10, + 2.830454204350019e-10, + 2.763113071679868e-10 + ], + "bp_grad_F": [ + 0.01947774738073349, + 4.3539188482100144e-05, + 2.1426325602647012e-08, + 1.4225844502391283e-08, + 1.0958768115187922e-08 + ], + "gamma_dfa": 0.0003295415808679536, + "gamma_dfa_per_layer": [ + -0.0008024196140468121, + 0.0015490652294829488, + 0.0003235205076634884, + 0.0002480002003721893 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0367085933685303, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 46.14581298828125, + 37542628.0, + 38211032.0, + 46396536.0, + 60543468.0 + ], + "hidden_norms_avg": [ + 988.5308837890625, + 31589698.0, + 33421126.0, + 44806960.0, + 60355708.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.7766556740971282e-05, + 4.28473617697378e-10, + 3.07322972625812e-10, + 2.9381372335102185e-10, + 2.797302944834712e-10 + ], + "bp_grad_F": [ + 0.06864868849515915, + 3.788271715166047e-05, + 2.1370066605186366e-08, + 1.4025233419090455e-08, + 1.1044066994259083e-08 + ], + "gamma_dfa": 9.462468733545393e-05, + "gamma_dfa_per_layer": [ + -0.0015880623832345009, + 0.0014036648208275437, + 0.0003099621389992535, + 0.00025293417274951935 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0631895065307617, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 46.26278305053711, + 38372568.0, + 39046204.0, + 47148944.0, + 61308416.0 + ], + "hidden_norms_avg": [ + 991.4658813476562, + 31279712.0, + 33238512.0, + 44902484.0, + 60826544.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.812536695273593e-05, + 4.3919237691092405e-10, + 3.053821084897379e-10, + 2.9203767182295337e-10, + 2.833127066281804e-10 + ], + "bp_grad_F": [ + 0.011117708869278431, + 2.0018645955133252e-05, + 1.9244726701117543e-08, + 1.4165241424279884e-08, + 1.090406964721069e-08 + ], + "gamma_dfa": 0.00016991631855489686, + "gamma_dfa_per_layer": [ + -0.0015358870150521398, + 0.0016542371595278382, + 0.0003059905138798058, + 0.00025532461586408317 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0491740703582764, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 46.36857223510742, + 38788812.0, + 39461172.0, + 47582644.0, + 61831224.0 + ], + "hidden_norms_avg": [ + 994.04541015625, + 32215950.0, + 34096260.0, + 45599356.0, + 61425516.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0041363061172888e-05, + 4.480187609789965e-10, + 3.0562316566395964e-10, + 2.9085803210371353e-10, + 2.820148004012424e-10 + ], + "bp_grad_F": [ + 0.03149434179067612, + 6.209969433257356e-05, + 2.1469357847081483e-08, + 1.3228349970972886e-08, + 1.092844392758252e-08 + ], + "gamma_dfa": 0.00010758559074020013, + "gamma_dfa_per_layer": [ + -0.0014505982398986816, + 0.001327117788605392, + 0.0002981229918077588, + 0.0002556998224463314 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0554656982421875, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 46.4505729675293, + 38845108.0, + 39504860.0, + 47660992.0, + 62097052.0 + ], + "hidden_norms_avg": [ + 996.2877807617188, + 32178676.0, + 34106748.0, + 45494312.0, + 61553340.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0276962206698954e-05, + 4.5564105266571175e-10, + 3.0059965627771135e-10, + 2.8785077099691136e-10, + 2.794499076586021e-10 + ], + "bp_grad_F": [ + 0.011724308133125305, + 1.9755616449401714e-05, + 2.1592299503936374e-08, + 1.3796129572085647e-08, + 1.0886693324607677e-08 + ], + "gamma_dfa": 0.0002330350544070825, + "gamma_dfa_per_layer": [ + -0.0009828422917053103, + 0.0013922813814133406, + 0.00027237151516601443, + 0.00025032961275428534 + ], + "acc_eval": 0.2578125, + "loss_eval": 2.0504729747772217, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 46.521934509277344, + 39260604.0, + 39906660.0, + 48073644.0, + 62524844.0 + ], + "hidden_norms_avg": [ + 998.1359252929688, + 32138106.0, + 34129788.0, + 45757544.0, + 61958428.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9659293431905098e-05, + 4.597033309572396e-10, + 3.0463259692581346e-10, + 2.893623118893629e-10, + 2.780784769118583e-10 + ], + "bp_grad_F": [ + 0.009033501148223877, + 1.7998809198616073e-05, + 2.5067617315244206e-08, + 1.8738653295713448e-08, + 1.087139978039886e-08 + ], + "gamma_dfa": 0.00016801172751002014, + "gamma_dfa_per_layer": [ + -0.0013465819647535682, + 0.0014174225507304072, + 0.00031502131605520844, + 0.00028618500800803304 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0473151206970215, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 46.57882308959961, + 39427768.0, + 40090548.0, + 48369740.0, + 62859588.0 + ], + "hidden_norms_avg": [ + 999.5881958007812, + 32546802.0, + 34502940.0, + 46179212.0, + 62426560.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0221139240893535e-05, + 4.495410987903625e-10, + 3.065779852207129e-10, + 2.9148336522233365e-10, + 2.8107866034687845e-10 + ], + "bp_grad_F": [ + 0.016372976824641228, + 2.868929186661262e-05, + 2.4158071099122935e-08, + 2.1377838166358742e-08, + 1.0851396226030374e-08 + ], + "gamma_dfa": 0.00012949823576491326, + "gamma_dfa_per_layer": [ + -0.0014246907085180283, + 0.0013606694992631674, + 0.0003105594660155475, + 0.0002714546862989664 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0468568801879883, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 46.621891021728516, + 39709320.0, + 40367452.0, + 48619224.0, + 63258040.0 + ], + "hidden_norms_avg": [ + 1000.7721557617188, + 33325650.0, + 35170832.0, + 47006208.0, + 63117408.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0193185011739843e-05, + 4.388156504830931e-10, + 3.137757831339627e-10, + 2.8996427481331466e-10, + 2.7836044580453745e-10 + ], + "bp_grad_F": [ + 0.020163528621196747, + 3.054905027966015e-05, + 2.3064796295102497e-08, + 1.4526934322134366e-08, + 1.0852998499899513e-08 + ], + "gamma_dfa": 0.00017183857562486082, + "gamma_dfa_per_layer": [ + -0.0013185564894229174, + 0.0014156483812257648, + 0.00031098624458536506, + 0.00027927616611123085 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.054586410522461, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 46.65864562988281, + 39798476.0, + 40463920.0, + 48764504.0, + 63346472.0 + ], + "hidden_norms_avg": [ + 1001.6641845703125, + 33379128.0, + 35239452.0, + 46955488.0, + 63122060.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.965362000395544e-05, + 4.4001230437018535e-10, + 3.0546970508638083e-10, + 2.8820767994375274e-10, + 2.777780505613947e-10 + ], + "bp_grad_F": [ + 0.048469845205545425, + 4.790218736161478e-05, + 2.6222814142329298e-08, + 2.4079582772174035e-08, + 1.0861339383438917e-08 + ], + "gamma_dfa": -6.432890222640708e-05, + "gamma_dfa_per_layer": [ + -0.002126228529959917, + 0.0012497524730861187, + 0.00034036440774798393, + 0.0002787960402201861 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2.0531256198883057, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 46.683528900146484, + 39922192.0, + 40544356.0, + 48855360.0, + 63435588.0 + ], + "hidden_norms_avg": [ + 1002.31494140625, + 33437468.0, + 35316604.0, + 47039952.0, + 63236136.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.79724281426752e-05, + 4.357196548010478e-10, + 3.0789479299464517e-10, + 2.8999944112761966e-10, + 2.7672003577450255e-10 + ], + "bp_grad_F": [ + 0.009082098491489887, + 6.448025487770792e-06, + 2.3372145108169207e-08, + 1.58603672417712e-08, + 1.0855457865943663e-08 + ], + "gamma_dfa": 8.819025242701173e-05, + "gamma_dfa_per_layer": [ + -0.0015805144794285297, + 0.0013432127889245749, + 0.000321696512401104, + 0.00026836618781089783 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.0517051219940186, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 46.70249938964844, + 40094040.0, + 40695052.0, + 48969004.0, + 63542232.0 + ], + "hidden_norms_avg": [ + 1002.7830810546875, + 33826664.0, + 35653116.0, + 47279168.0, + 63409756.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8208709409227595e-05, + 4.3868975119210063e-10, + 3.102354484418868e-10, + 2.8893865078316594e-10, + 2.794520170823489e-10 + ], + "bp_grad_F": [ + 0.012775770388543606, + 3.5907680285163224e-05, + 3.276610627267473e-08, + 1.9733393585852355e-08, + 1.0837335473468102e-08 + ], + "gamma_dfa": -7.604052370879799e-06, + "gamma_dfa_per_layer": [ + -0.0020841513760387897, + 0.001464233035221696, + 0.0003138828033115715, + 0.0002756193280220032 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2.053762912750244, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 46.71390914916992, + 39990840.0, + 40613704.0, + 48947088.0, + 63626668.0 + ], + "hidden_norms_avg": [ + 1003.0780639648438, + 33512400.0, + 35398544.0, + 47052320.0, + 63319172.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8852005925728008e-05, + 4.408986231663192e-10, + 3.0767774439333095e-10, + 2.8811911190196327e-10, + 2.780060626150771e-10 + ], + "bp_grad_F": [ + 0.017775027081370354, + 2.9518716473830864e-05, + 1.6785485001946654e-08, + 1.3991450664718741e-08, + 1.082214762249123e-08 + ], + "gamma_dfa": 0.0001292051310883835, + "gamma_dfa_per_layer": [ + -0.001528067048639059, + 0.0014583747833967209, + 0.0003044582554139197, + 0.0002820545341819525 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0512585639953613, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 46.72029495239258, + 40048976.0, + 40673908.0, + 49005780.0, + 63650516.0 + ], + "hidden_norms_avg": [ + 1003.2393188476562, + 33518072.0, + 35408260.0, + 47059300.0, + 63337588.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.040391493414063e-05, + 4.422071042675668e-10, + 3.0922153726464785e-10, + 2.885988392709038e-10, + 2.7767882437856883e-10 + ], + "bp_grad_F": [ + 0.05996337905526161, + 4.702213846030645e-05, + 2.0060964445178797e-08, + 1.6814832193290385e-08, + 1.0825355722943186e-08 + ], + "gamma_dfa": 6.977042357902974e-05, + "gamma_dfa_per_layer": [ + -0.0016858375165611506, + 0.001342209754511714, + 0.00032920570811256766, + 0.00029350374825298786 + ], + "acc_eval": 0.25390625, + "loss_eval": 2.0525753498077393, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 46.723426818847656, + 40078224.0, + 40696452.0, + 49005116.0, + 63676392.0 + ], + "hidden_norms_avg": [ + 1003.3213500976562, + 33528454.0, + 35420932.0, + 47084140.0, + 63362884.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9969949537189677e-05, + 4.438247824811725e-10, + 3.0574925924398144e-10, + 2.876155424935689e-10, + 2.772651552795935e-10 + ], + "bp_grad_F": [ + 0.015555496327579021, + 1.9468383470666595e-05, + 2.2645199493354085e-08, + 2.0153352764396004e-08, + 1.082723954937137e-08 + ], + "gamma_dfa": -2.766123361652717e-05, + "gamma_dfa_per_layer": [ + -0.0021022262517362833, + 0.0013793597463518381, + 0.0003187692491337657, + 0.0002934523217845708 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.05129337310791, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 46.72323226928711, + 40073516.0, + 40694276.0, + 48970848.0, + 63674696.0 + ], + "hidden_norms_avg": [ + 1003.3206176757812, + 33517796.0, + 35411552.0, + 47074216.0, + 63356572.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.986433173646219e-05, + 4.4209438887499175e-10, + 3.069269838285038e-10, + 2.8717661582078335e-10, + 2.7721389073143143e-10 + ], + "bp_grad_F": [ + 0.011835500597953796, + 1.2977254300494678e-05, + 2.7325663509714104e-08, + 2.23609397664859e-08, + 1.0828303587118171e-08 + ], + "gamma_dfa": 4.879416519543156e-05, + "gamma_dfa_per_layer": [ + -0.0018596879672259092, + 0.0014319919282570481, + 0.0003201703366357833, + 0.00030270236311480403 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.051326274871826, + "epoch": 60 + } + ] +} \ No newline at end of file diff --git a/results/structured_aux/structured_aux_t5_s42.json b/results/structured_aux/structured_aux_t5_s42.json new file mode 100644 index 0000000..d1e671b --- /dev/null +++ b/results/structured_aux/structured_aux_t5_s42.json @@ -0,0 +1,6481 @@ +{ + "args": { + "num_blocks": 4, + "d_hidden": 256, + "batch_size": 128, + "epochs": 100, + "t0": 5, + "alpha": 0.75, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "M": 4, + "seed": 42, + "gpu": 2, + "output_dir": "results/structured_aux" + }, + "dfa_ckpt_acc": 0.304, + "fresh_sigma": 48.45175752639771, + "continue_DFA": { + "test_acc": [ + 0.3055, + 0.3025, + 0.3224, + 0.2971, + 0.3011, + 0.3158, + 0.3148, + 0.2917, + 0.3128, + 0.3092, + 0.3117, + 0.3029, + 0.3018, + 0.2891, + 0.3079, + 0.294, + 0.3136, + 0.297, + 0.3097, + 0.3143, + 0.306, + 0.3011, + 0.3085, + 0.3112, + 0.3071, + 0.3216, + 0.306, + 0.3039, + 0.3042, + 0.3179, + 0.3125, + 0.3099, + 0.3093, + 0.3114, + 0.303, + 0.3076, + 0.3098, + 0.3081, + 0.3176, + 0.306, + 0.3063, + 0.2957, + 0.3092, + 0.2989, + 0.3149, + 0.3091, + 0.3025, + 0.309, + 0.2979, + 0.3043, + 0.3122, + 0.3105, + 0.2994, + 0.3104, + 0.3163, + 0.3144, + 0.3072, + 0.3095, + 0.3116, + 0.3008, + 0.3108, + 0.3135, + 0.3144, + 0.3143, + 0.3155, + 0.3128, + 0.3122, + 0.3105, + 0.3091, + 0.3132, + 0.3027, + 0.3099, + 0.3087, + 0.3119, + 0.311, + 0.3091, + 0.3104, + 0.3129, + 0.3084, + 0.3121, + 0.3152, + 0.3123, + 0.3127, + 0.3107, + 0.3115, + 0.3096, + 0.3116, + 0.3104, + 0.3117, + 0.3122, + 0.312, + 0.3118, + 0.3117, + 0.3115, + 0.3115 + ], + "train_loss": [ + 1.991048743209839, + 1.9916367597198485, + 1.9883640994262695, + 1.9904318043518066, + 1.990765456390381, + 1.9885113190460204, + 1.988723781814575, + 1.9883269626617432, + 1.9865176509857179, + 1.986528792037964, + 1.9871076442718505, + 1.9852300271606445, + 1.9855789277648925, + 1.9873473043823242, + 1.9887369604873657, + 1.984825173187256, + 1.986682919845581, + 1.986023438949585, + 1.9879054671478271, + 1.984492504119873, + 1.9841545476531983, + 1.985333773574829, + 1.9837070235443115, + 1.9856928632354736, + 1.985661566505432, + 1.9854957870101928, + 1.9840560776138305, + 1.9859882206726074, + 1.9846108224487304, + 1.9859439390563964, + 1.985415450668335, + 1.985925768699646, + 1.9856847537231446, + 1.9866711866760254, + 1.9869563925552367, + 1.9871451406860352, + 1.9837623266601563, + 1.9858767760467528, + 1.9862659697723388, + 1.9852370281219482, + 1.9850765836334228, + 1.9856702326965332, + 1.986476949081421, + 1.9855420697784423, + 1.9845534466552734, + 1.9860719301605225, + 1.9862464963531494, + 1.985343392906189, + 1.985123703918457, + 1.9840784968566894, + 1.988379104537964, + 1.9863914632415771, + 1.9844388414001466, + 1.986172850189209, + 1.9863445208740234, + 1.9870363287734985, + 1.9851792503356933, + 1.9847805208587646, + 1.9851327020645142, + 1.984974264831543, + 1.9859494774627686, + 1.9863537815856933, + 1.9853967378234862, + 1.9863174615859986, + 1.985906039199829, + 1.9847168277359009, + 1.9855578246688843, + 1.9851220603942872, + 1.9855838941192627, + 1.9842845658874513, + 1.9864070181655884, + 1.9828656870269776, + 1.9845347036743164, + 1.9851781808853148, + 1.9849923505020142, + 1.9846813095474243, + 1.9840032190322876, + 1.9832153865814208, + 1.9829858123397828, + 1.9832415357971191, + 1.984812937889099, + 1.9836833013916015, + 1.9820556320953369, + 1.9829538493347167, + 1.9816045610046387, + 1.983920804977417, + 1.9816958462524414, + 1.9848244665145873, + 1.983539125366211, + 1.9812593657684325, + 1.98392430519104, + 1.982444817276001, + 1.9834877124404908, + 1.9847186293792725, + 1.9808635054016113 + ], + "gamma": [ + [ + 6, + 0.08111585443839431 + ], + [ + 7, + 0.08216675627045333 + ], + [ + 8, + 0.08403038466349244 + ], + [ + 9, + 0.08592397905886173 + ], + [ + 10, + 0.08453304693102837 + ], + [ + 13, + 0.08727108407765627 + ], + [ + 15, + 0.08908557938411832 + ], + [ + 20, + 0.09117648331448436 + ], + [ + 25, + 0.09268091293051839 + ], + [ + 35, + 0.09528384893201292 + ], + [ + 45, + 0.09749913006089628 + ], + [ + 55, + 0.09926950337830931 + ], + [ + 65, + 0.10043945582583547 + ], + [ + 75, + 0.10120803816244006 + ], + [ + 85, + 0.10144373204093426 + ], + [ + 95, + 0.10144099860917777 + ], + [ + 100, + 0.10145036247558892 + ] + ], + "rho": [ + [ + 6, + 0.02260437374934554 + ], + [ + 7, + 0.018085405696183443 + ], + [ + 8, + 0.003474419005215168 + ], + [ + 9, + 0.03226925013586879 + ], + [ + 10, + -0.006800428731366992 + ], + [ + 13, + 0.0110914102406241 + ], + [ + 15, + 0.005172164877876639 + ], + [ + 20, + -8.558854460716248e-06 + ], + [ + 25, + 0.007936288602650166 + ], + [ + 35, + 0.0030459770932793617 + ], + [ + 45, + 0.0008034338243305683 + ], + [ + 55, + -0.013237068429589272 + ], + [ + 65, + -0.0035184742882847786 + ], + [ + 75, + 0.0012920110020786524 + ], + [ + 85, + -0.0010051392018795013 + ], + [ + 95, + 0.003301333636045456 + ], + [ + 100, + -0.006845369935035706 + ] + ], + "alpha_eff": [ + [ + 6, + 0.0 + ], + [ + 7, + 0.0 + ], + [ + 8, + 0.0 + ], + [ + 9, + 0.0 + ], + [ + 10, + 0.0 + ], + [ + 11, + 0.0 + ], + [ + 12, + 0.0 + ], + [ + 13, + 0.0 + ], + [ + 14, + 0.0 + ], + [ + 15, + 0.0 + ], + [ + 16, + 0.0 + ], + [ + 17, + 0.0 + ], + [ + 18, + 0.0 + ], + [ + 19, + 0.0 + ], + [ + 20, + 0.0 + ], + [ + 21, + 0.0 + ], + [ + 22, + 0.0 + ], + [ + 23, + 0.0 + ], + [ + 24, + 0.0 + ], + [ + 25, + 0.0 + ], + [ + 26, + 0.0 + ], + [ + 27, + 0.0 + ], + [ + 28, + 0.0 + ], + [ + 29, + 0.0 + ], + [ + 30, + 0.0 + ], + [ + 31, + 0.0 + ], + [ + 32, + 0.0 + ], + [ + 33, + 0.0 + ], + [ + 34, + 0.0 + ], + [ + 35, + 0.0 + ], + [ + 36, + 0.0 + ], + [ + 37, + 0.0 + ], + [ + 38, + 0.0 + ], + [ + 39, + 0.0 + ], + [ + 40, + 0.0 + ], + [ + 41, + 0.0 + ], + [ + 42, + 0.0 + ], + [ + 43, + 0.0 + ], + [ + 44, + 0.0 + ], + [ + 45, + 0.0 + ], + [ + 46, + 0.0 + ], + [ + 47, + 0.0 + ], + [ + 48, + 0.0 + ], + [ + 49, + 0.0 + ], + [ + 50, + 0.0 + ], + [ + 51, + 0.0 + ], + [ + 52, + 0.0 + ], + [ + 53, + 0.0 + ], + [ + 54, + 0.0 + ], + [ + 55, + 0.0 + ], + [ + 56, + 0.0 + ], + [ + 57, + 0.0 + ], + [ + 58, + 0.0 + ], + [ + 59, + 0.0 + ], + [ + 60, + 0.0 + ], + [ + 61, + 0.0 + ], + [ + 62, + 0.0 + ], + [ + 63, + 0.0 + ], + [ + 64, + 0.0 + ], + [ + 65, + 0.0 + ], + [ + 66, + 0.0 + ], + [ + 67, + 0.0 + ], + [ + 68, + 0.0 + ], + [ + 69, + 0.0 + ], + [ + 70, + 0.0 + ], + [ + 71, + 0.0 + ], + [ + 72, + 0.0 + ], + [ + 73, + 0.0 + ], + [ + 74, + 0.0 + ], + [ + 75, + 0.0 + ], + [ + 76, + 0.0 + ], + [ + 77, + 0.0 + ], + [ + 78, + 0.0 + ], + [ + 79, + 0.0 + ], + [ + 80, + 0.0 + ], + [ + 81, + 0.0 + ], + [ + 82, + 0.0 + ], + [ + 83, + 0.0 + ], + [ + 84, + 0.0 + ], + [ + 85, + 0.0 + ], + [ + 86, + 0.0 + ], + [ + 87, + 0.0 + ], + [ + 88, + 0.0 + ], + [ + 89, + 0.0 + ], + [ + 90, + 0.0 + ], + [ + 91, + 0.0 + ], + [ + 92, + 0.0 + ], + [ + 93, + 0.0 + ], + [ + 94, + 0.0 + ], + [ + 95, + 0.0 + ], + [ + 96, + 0.0 + ], + [ + 97, + 0.0 + ], + [ + 98, + 0.0 + ], + [ + 99, + 0.0 + ], + [ + 100, + 0.0 + ] + ] + }, + "blend_random_trainable": { + "test_acc": [ + 0.3024, + 0.3133, + 0.3097, + 0.307, + 0.3116, + 0.3037, + 0.3014, + 0.2983, + 0.291, + 0.3055, + 0.3125, + 0.3139, + 0.3176, + 0.3088, + 0.3045, + 0.3023, + 0.3169, + 0.3117, + 0.3143, + 0.3083, + 0.3044, + 0.3178, + 0.31, + 0.3154, + 0.3085, + 0.3108, + 0.3147, + 0.3214, + 0.3137, + 0.3153, + 0.32, + 0.3137, + 0.3128, + 0.3133, + 0.3224, + 0.316, + 0.3188, + 0.3258, + 0.3181, + 0.3258, + 0.318, + 0.3162, + 0.3205, + 0.3186, + 0.3133, + 0.3192, + 0.3257, + 0.3151, + 0.3148, + 0.3225, + 0.3158, + 0.3179, + 0.3219, + 0.3152, + 0.3179, + 0.3174, + 0.324, + 0.3211, + 0.3156, + 0.3182, + 0.3209, + 0.3242, + 0.3204, + 0.3295, + 0.3139, + 0.3167, + 0.3243, + 0.3252, + 0.325, + 0.3206, + 0.3204, + 0.3258, + 0.3232, + 0.3239, + 0.3176, + 0.3245, + 0.3182, + 0.3243, + 0.3214, + 0.3223, + 0.3266, + 0.326, + 0.3262, + 0.3237, + 0.3235, + 0.3235, + 0.3225, + 0.3234, + 0.3228, + 0.3224, + 0.3233, + 0.3235, + 0.3238, + 0.3238, + 0.3239 + ], + "train_loss": [ + 1.9876464429473877, + 1.9871312660217286, + 1.98794667137146, + 1.979866360206604, + 1.9829724767303467, + 1.978883454246521, + 1.9780245680999755, + 1.9819539237213135, + 1.9816560133361816, + 1.9825326041412354, + 1.9787122887420654, + 1.973865717124939, + 1.9732693460845947, + 1.9691582153320313, + 1.9713216143035888, + 1.970405147857666, + 1.9690808911895752, + 1.9719929265975953, + 1.9672391814422607, + 1.9673247147369384, + 1.9670495735931397, + 1.9656842587280274, + 1.9644684192276, + 1.96691089553833, + 1.9685032133483886, + 1.9638118313980102, + 1.9630551633453368, + 1.965095313796997, + 1.9634219128036499, + 1.9641351106262206, + 1.9643780905151367, + 1.9637394803237915, + 1.9656481066131593, + 1.9634420028686523, + 1.9667505270385741, + 1.9628459647369385, + 1.9643579544830323, + 1.9633583740234375, + 1.9635034155273436, + 1.9661723876190185, + 1.9633576497650147, + 1.9618351065826416, + 1.9632835869598388, + 1.966858482017517, + 1.9653798733901977, + 1.9619794463348388, + 1.9633574157714844, + 1.9612697646713257, + 1.9618599697113037, + 1.9626816901016235, + 1.9624275286102295, + 1.960104427833557, + 1.9636346054458618, + 1.9611790425872804, + 1.9631773295593262, + 1.9610639614486693, + 1.9634941321563721, + 1.9607968753814697, + 1.960719214401245, + 1.9611839714813233, + 1.961498717956543, + 1.962079864730835, + 1.9621083187103272, + 1.9580735195159913, + 1.9596791373443603, + 1.9599584259796143, + 1.9578871935653686, + 1.9627594772338868, + 1.9603685702896119, + 1.9600560396575928, + 1.9598616068267822, + 1.9589437344360352, + 1.9607008143615723, + 1.9578518214416505, + 1.960224426651001, + 1.959071869430542, + 1.959806990737915, + 1.9606619339370728, + 1.958533956451416, + 1.956637857093811, + 1.9607464468765259, + 1.9562711632537841, + 1.959853370666504, + 1.9559039768218993, + 1.9549042249298096, + 1.9581724520492554, + 1.9576588166046143, + 1.9579018334960938, + 1.9578932962036133, + 1.9547549870300294, + 1.9586515881347657, + 1.9600395129776, + 1.957794129257202, + 1.9562179388809204, + 1.9606438481903077 + ], + "gamma": [ + [ + 6, + 0.023424091981723905 + ], + [ + 7, + 0.02299115271307528 + ], + [ + 8, + 0.018762043910101056 + ], + [ + 9, + 0.03282992116874084 + ], + [ + 10, + 0.0370270183775574 + ], + [ + 13, + 0.031177338445559144 + ], + [ + 15, + 0.03360762202646583 + ], + [ + 20, + 0.036809065961278975 + ], + [ + 25, + 0.027988859452307224 + ], + [ + 35, + 0.03813225851627067 + ], + [ + 45, + 0.026877354714088142 + ], + [ + 55, + 0.02659994421992451 + ], + [ + 65, + 0.03517918023862876 + ], + [ + 75, + 0.02342122921254486 + ], + [ + 85, + 0.024287903041113168 + ], + [ + 95, + 0.03690479922806844 + ], + [ + 100, + 0.03183859743876383 + ] + ], + "rho": [ + [ + 6, + 0.004794585169292986 + ], + [ + 7, + 0.01906854542903602 + ], + [ + 8, + 0.018232747446745634 + ], + [ + 9, + -0.006440505385398865 + ], + [ + 10, + 0.009400886483490467 + ], + [ + 13, + -0.006829604506492615 + ], + [ + 15, + 0.004158142954111099 + ], + [ + 20, + -0.0073410505428910255 + ], + [ + 25, + -0.015496937441639602 + ], + [ + 35, + 0.0030443017894867808 + ], + [ + 45, + 0.004381767328595743 + ], + [ + 55, + -0.002541719004511833 + ], + [ + 65, + 0.015656484989449382 + ], + [ + 75, + 0.014971858356148005 + ], + [ + 85, + 0.007261662278324366 + ], + [ + 95, + -0.004689584719017148 + ], + [ + 100, + -0.0020664925687015057 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499220049468636 + ], + [ + 7, + 0.7498469948386692 + ], + [ + 8, + 0.7497922943083747 + ], + [ + 9, + 0.7497436076690509 + ], + [ + 10, + 0.7497147271011655 + ], + [ + 11, + 0.7496373700685055 + ], + [ + 12, + 0.7495911377516936 + ], + [ + 13, + 0.7495591076923991 + ], + [ + 14, + 0.7495520259230328 + ], + [ + 15, + 0.7494965013090477 + ], + [ + 16, + 0.7494952091159308 + ], + [ + 17, + 0.7495059615860385 + ], + [ + 18, + 0.7494701363824298 + ], + [ + 19, + 0.7494422326147001 + ], + [ + 20, + 0.7494295847275737 + ], + [ + 21, + 0.7494258583416467 + ], + [ + 22, + 0.7494341580473979 + ], + [ + 23, + 0.749417299478136 + ], + [ + 24, + 0.7494054863689891 + ], + [ + 25, + 0.7494183335600948 + ], + [ + 26, + 0.7494062009469158 + ], + [ + 27, + 0.749386443815835 + ], + [ + 28, + 0.7493906387259565 + ], + [ + 29, + 0.7493977933561468 + ], + [ + 30, + 0.7494115413552965 + ], + [ + 31, + 0.74937497749007 + ], + [ + 32, + 0.7493738134103862 + ], + [ + 33, + 0.749387575031919 + ], + [ + 34, + 0.7493895790085617 + ], + [ + 35, + 0.7493779495658293 + ], + [ + 36, + 0.7493688614537896 + ], + [ + 37, + 0.7493811285321982 + ], + [ + 38, + 0.7493793503531336 + ], + [ + 39, + 0.7493793535783112 + ], + [ + 40, + 0.7493862838940486 + ], + [ + 41, + 0.7493963453482582 + ], + [ + 42, + 0.7493902605330259 + ], + [ + 43, + 0.7493899791972367 + ], + [ + 44, + 0.7493909907774019 + ], + [ + 45, + 0.7493882524314522 + ], + [ + 46, + 0.7493926965007238 + ], + [ + 47, + 0.7493777149605533 + ], + [ + 48, + 0.7493754540083309 + ], + [ + 49, + 0.74940470901309 + ], + [ + 50, + 0.7493888419454201 + ], + [ + 51, + 0.7493701886233235 + ], + [ + 52, + 0.7493823970078906 + ], + [ + 53, + 0.7493955027904773 + ], + [ + 54, + 0.7494067685560947 + ], + [ + 55, + 0.7494373228710867 + ], + [ + 56, + 0.749436131478882 + ], + [ + 57, + 0.7494092143251209 + ], + [ + 58, + 0.7493974854803174 + ], + [ + 59, + 0.7493886318130187 + ], + [ + 60, + 0.7493818393201509 + ], + [ + 61, + 0.7493855390419224 + ], + [ + 62, + 0.749397444060802 + ], + [ + 63, + 0.7493839866832109 + ], + [ + 64, + 0.7493896721443025 + ], + [ + 65, + 0.7493912184954649 + ], + [ + 66, + 0.749390525573084 + ], + [ + 67, + 0.7493892431315118 + ], + [ + 68, + 0.7493890806349718 + ], + [ + 69, + 0.7493942837137954 + ], + [ + 70, + 0.7493718437995105 + ], + [ + 71, + 0.7493855616542222 + ], + [ + 72, + 0.7493912184147061 + ], + [ + 73, + 0.7493976699937478 + ], + [ + 74, + 0.7494079082700383 + ], + [ + 75, + 0.7493938400148441 + ], + [ + 76, + 0.7494368868131648 + ], + [ + 77, + 0.749415196714498 + ], + [ + 78, + 0.7493968677634235 + ], + [ + 79, + 0.7493896917777243 + ], + [ + 80, + 0.7493831183029268 + ], + [ + 81, + 0.7493887478890309 + ], + [ + 82, + 0.749392078676077 + ], + [ + 83, + 0.7493897096223924 + ], + [ + 84, + 0.7493905341199444 + ], + [ + 85, + 0.7493948951239413 + ], + [ + 86, + 0.7493925549281948 + ], + [ + 87, + 0.7493985287550686 + ], + [ + 88, + 0.7493904891133867 + ], + [ + 89, + 0.7493750918006233 + ], + [ + 90, + 0.7493767894612435 + ], + [ + 91, + 0.7493757401805374 + ], + [ + 92, + 0.7493788542072656 + ], + [ + 93, + 0.7494012095815523 + ], + [ + 94, + 0.749389581481011 + ], + [ + 95, + 0.7493941822683292 + ], + [ + 96, + 0.7493976644324434 + ], + [ + 97, + 0.7493948974013512 + ], + [ + 98, + 0.749406639377133 + ], + [ + 99, + 0.7494037991022731 + ], + [ + 100, + 0.7493907136643728 + ] + ] + }, + "blend_shuffled_trainable": { + "test_acc": [ + 0.3041, + 0.3133, + 0.3185, + 0.3058, + 0.3077, + 0.3033, + 0.3036, + 0.3013, + 0.2961, + 0.3049, + 0.3163, + 0.3139, + 0.3183, + 0.3102, + 0.304, + 0.3033, + 0.315, + 0.3169, + 0.314, + 0.308, + 0.3079, + 0.3217, + 0.3104, + 0.3153, + 0.3091, + 0.3143, + 0.3154, + 0.3181, + 0.3142, + 0.3163, + 0.3215, + 0.3153, + 0.3146, + 0.314, + 0.3235, + 0.3162, + 0.3242, + 0.3246, + 0.3209, + 0.3233, + 0.3197, + 0.3186, + 0.3205, + 0.3202, + 0.3176, + 0.3207, + 0.3227, + 0.3143, + 0.3179, + 0.3208, + 0.3226, + 0.32, + 0.3256, + 0.3192, + 0.3207, + 0.3216, + 0.3266, + 0.3223, + 0.3171, + 0.3186, + 0.3239, + 0.3258, + 0.323, + 0.3309, + 0.3173, + 0.3182, + 0.3247, + 0.3253, + 0.326, + 0.3219, + 0.3234, + 0.3265, + 0.3231, + 0.3249, + 0.3185, + 0.3272, + 0.3219, + 0.3249, + 0.3233, + 0.3234, + 0.3277, + 0.327, + 0.3275, + 0.3245, + 0.3247, + 0.3249, + 0.3248, + 0.3242, + 0.3246, + 0.3247, + 0.325, + 0.3252, + 0.3252, + 0.3251, + 0.325 + ], + "train_loss": [ + 1.9882133629608154, + 1.9881019673919678, + 1.9891524069976807, + 1.9868328957366943, + 1.9891845949935913, + 1.9813592992782594, + 1.9801440045547485, + 1.9806723363494874, + 1.9786427125549317, + 1.9821630545806885, + 1.977519662437439, + 1.971266616859436, + 1.9723616131210326, + 1.968949783859253, + 1.9696260055541992, + 1.9699068839263916, + 1.9684647756958007, + 1.9725180642700195, + 1.9684360600280761, + 1.968059073562622, + 1.9673038653564454, + 1.9664155136871337, + 1.9645250603866578, + 1.9675670454406737, + 1.969709717025757, + 1.9648988067245483, + 1.9637554684448242, + 1.9651869311904908, + 1.9632979507064818, + 1.9634353633117676, + 1.963195507736206, + 1.9624330361557007, + 1.9649106032562256, + 1.96261977809906, + 1.965746845703125, + 1.96231167137146, + 1.9636095551300048, + 1.9628686709976195, + 1.9632325925064087, + 1.965823385925293, + 1.9639251545715333, + 1.9625721590423584, + 1.9632411141586303, + 1.9666285999298097, + 1.9646705523300172, + 1.9612812813568115, + 1.9628031824493408, + 1.9612671447372436, + 1.9614050133514405, + 1.9616153263092042, + 1.9616178183746338, + 1.9597780437850951, + 1.9633536209106446, + 1.961100555114746, + 1.9633056440734864, + 1.9609289096450806, + 1.9632993547821045, + 1.9602513189315796, + 1.9607367464828491, + 1.9611903679656983, + 1.9616722354507445, + 1.96167990234375, + 1.9621346522521972, + 1.9584645178222657, + 1.9602933213806153, + 1.960143120803833, + 1.9579744591522217, + 1.9633731325912476, + 1.9604005276107788, + 1.9604838925933838, + 1.960356443862915, + 1.9593083364868165, + 1.9605383354187012, + 1.958080934677124, + 1.9600851589584352, + 1.9594914280700684, + 1.959912822265625, + 1.9608478322982787, + 1.9587051663208008, + 1.956825029220581, + 1.9607854579162598, + 1.956131549911499, + 1.9600519333648683, + 1.9560367584991456, + 1.9549996364593505, + 1.9579589212799071, + 1.9576114078140259, + 1.9580341373062133, + 1.9579882822418213, + 1.9546271855926514, + 1.9580214026641847, + 1.9600323877334596, + 1.957533321609497, + 1.955910203552246, + 1.9606612694549561 + ], + "gamma": [ + [ + 6, + 0.016355152998585254 + ], + [ + 7, + 0.024427944561466575 + ], + [ + 8, + 0.03244515031110495 + ], + [ + 9, + 0.037574231857433915 + ], + [ + 10, + 0.02381341380532831 + ], + [ + 13, + 0.03183329018065706 + ], + [ + 15, + 0.039742537890560925 + ], + [ + 20, + 0.028106374549679458 + ], + [ + 25, + 0.023346851172391325 + ], + [ + 35, + 0.022161927772685885 + ], + [ + 45, + 0.02809242461808026 + ], + [ + 55, + 0.02980245597427711 + ], + [ + 65, + 0.02308708109194413 + ], + [ + 75, + 0.02955220313742757 + ], + [ + 85, + 0.036079382756724954 + ], + [ + 95, + 0.030997981084510684 + ], + [ + 100, + 0.03075875889044255 + ] + ], + "rho": [ + [ + 6, + 0.017404719023033977 + ], + [ + 7, + -0.007129559060558677 + ], + [ + 8, + -0.005894948495551944 + ], + [ + 9, + 0.003232832415960729 + ], + [ + 10, + -0.0037994354497641325 + ], + [ + 13, + 0.00012775661889463663 + ], + [ + 15, + 0.0049165410455316305 + ], + [ + 20, + 0.007058484945446253 + ], + [ + 25, + 0.003497648925986141 + ], + [ + 35, + 0.004558940418064594 + ], + [ + 45, + 0.0013113794848322868 + ], + [ + 55, + -0.006722114223521203 + ], + [ + 65, + 0.023264381452463567 + ], + [ + 75, + 0.009205496869981289 + ], + [ + 85, + 0.015811771620064974 + ], + [ + 95, + 0.002596069360151887 + ], + [ + 100, + 0.004170703352428973 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499203817126044 + ], + [ + 7, + 0.7498473926536209 + ], + [ + 8, + 0.7498067954424582 + ], + [ + 9, + 0.7497330329265922 + ], + [ + 10, + 0.7497022644111692 + ], + [ + 11, + 0.7497089800874237 + ], + [ + 12, + 0.749580267629901 + ], + [ + 13, + 0.7495483148022443 + ], + [ + 14, + 0.7494877798640726 + ], + [ + 15, + 0.7495237351049973 + ], + [ + 16, + 0.7495026151842156 + ], + [ + 17, + 0.7494681925269019 + ], + [ + 18, + 0.7494358266469395 + ], + [ + 19, + 0.7494331298572458 + ], + [ + 20, + 0.7494433294281939 + ], + [ + 21, + 0.7494393382691086 + ], + [ + 22, + 0.7494336879655699 + ], + [ + 23, + 0.7494508309427925 + ], + [ + 24, + 0.7494223317599271 + ], + [ + 25, + 0.7494121362855057 + ], + [ + 26, + 0.7494163679596605 + ], + [ + 27, + 0.7493960160775697 + ], + [ + 28, + 0.749390409223028 + ], + [ + 29, + 0.749390992617308 + ], + [ + 30, + 0.7493927307020445 + ], + [ + 31, + 0.7493766611360625 + ], + [ + 32, + 0.7493977801865833 + ], + [ + 33, + 0.7493917157028857 + ], + [ + 34, + 0.7493982176615227 + ], + [ + 35, + 0.749390067311929 + ], + [ + 36, + 0.7493826796278233 + ], + [ + 37, + 0.7493882938770885 + ], + [ + 38, + 0.7493950978303817 + ], + [ + 39, + 0.7494004245071493 + ], + [ + 40, + 0.7493957884956443 + ], + [ + 41, + 0.7494055237064294 + ], + [ + 42, + 0.7494023169006231 + ], + [ + 43, + 0.7493906380727359 + ], + [ + 44, + 0.7493832241801811 + ], + [ + 45, + 0.7493974674089477 + ], + [ + 46, + 0.7494142002768108 + ], + [ + 47, + 0.7493976151953635 + ], + [ + 48, + 0.7493915037172526 + ], + [ + 49, + 0.7494232293952092 + ], + [ + 50, + 0.7494189364938916 + ], + [ + 51, + 0.7494011521037299 + ], + [ + 52, + 0.7493943786563599 + ], + [ + 53, + 0.7493953434522991 + ], + [ + 54, + 0.7493984032912804 + ], + [ + 55, + 0.7494011344276886 + ], + [ + 56, + 0.7494025120058067 + ], + [ + 57, + 0.749399989966068 + ], + [ + 58, + 0.7494005554979026 + ], + [ + 59, + 0.7494070563576691 + ], + [ + 60, + 0.7493985346423274 + ], + [ + 61, + 0.7494018762471589 + ], + [ + 62, + 0.7494062978834193 + ], + [ + 63, + 0.7494025019737532 + ], + [ + 64, + 0.7494022031209248 + ], + [ + 65, + 0.749387289949488 + ], + [ + 66, + 0.7493899903292269 + ], + [ + 67, + 0.749382444034868 + ], + [ + 68, + 0.749384555546625 + ], + [ + 69, + 0.7493789641887715 + ], + [ + 70, + 0.7493899454910227 + ], + [ + 71, + 0.7493869980099057 + ], + [ + 72, + 0.7494041179491546 + ], + [ + 73, + 0.7493882349730862 + ], + [ + 74, + 0.7493931032889941 + ], + [ + 75, + 0.7493848343975982 + ], + [ + 76, + 0.7493753700321834 + ], + [ + 77, + 0.749390683112653 + ], + [ + 78, + 0.7493938601463527 + ], + [ + 79, + 0.7493921215605192 + ], + [ + 80, + 0.7494007935058512 + ], + [ + 81, + 0.7494058194317977 + ], + [ + 82, + 0.7493941038440329 + ], + [ + 83, + 0.749384788037309 + ], + [ + 84, + 0.7493802564428359 + ], + [ + 85, + 0.749381685825373 + ], + [ + 86, + 0.7493992416161968 + ], + [ + 87, + 0.7493822721108743 + ], + [ + 88, + 0.7493802332545368 + ], + [ + 89, + 0.7493812286084873 + ], + [ + 90, + 0.7494055120914692 + ], + [ + 91, + 0.7493854098891867 + ], + [ + 92, + 0.7493959012792147 + ], + [ + 93, + 0.7494048054970472 + ], + [ + 94, + 0.7493850305850241 + ], + [ + 95, + 0.7493791660549699 + ], + [ + 96, + 0.7493938625420236 + ], + [ + 97, + 0.7493986404581087 + ], + [ + 98, + 0.7493953739123228 + ], + [ + 99, + 0.7494022995179244 + ], + [ + 100, + 0.7494032432948281 + ] + ] + }, + "blend_zero_target_trainable": { + "test_acc": [ + 0.2776, + 0.2859, + 0.2805, + 0.2661, + 0.2658, + 0.2625, + 0.2518, + 0.2559, + 0.2367, + 0.2386, + 0.2522, + 0.257, + 0.272, + 0.254, + 0.2397, + 0.2066, + 0.2232, + 0.2022, + 0.2002, + 0.1872, + 0.2078, + 0.2154, + 0.195, + 0.2013, + 0.164, + 0.1929, + 0.1923, + 0.1889, + 0.2011, + 0.1976, + 0.1834, + 0.1939, + 0.2045, + 0.2035, + 0.2051, + 0.2083, + 0.2028, + 0.2012, + 0.2005, + 0.2037, + 0.2092, + 0.2123, + 0.2199, + 0.2173, + 0.2086, + 0.2149, + 0.2153, + 0.2067, + 0.2197, + 0.2205, + 0.2132, + 0.2176, + 0.1899, + 0.2031, + 0.203, + 0.2123, + 0.2189, + 0.2162, + 0.2138, + 0.2102, + 0.2251, + 0.2257, + 0.2202, + 0.2213, + 0.2029, + 0.2014, + 0.2309, + 0.2326, + 0.2125, + 0.2143, + 0.214, + 0.2285, + 0.2212, + 0.2184, + 0.2123, + 0.2223, + 0.2237, + 0.2171, + 0.2127, + 0.2241, + 0.2287, + 0.2289, + 0.2309, + 0.2232, + 0.2243, + 0.2193, + 0.2227, + 0.2184, + 0.2208, + 0.2206, + 0.2194, + 0.2202, + 0.2199, + 0.2208, + 0.2206 + ], + "train_loss": [ + 2.0023640447235107, + 2.040512075881958, + 2.0519314972686766, + 2.0638853752136233, + 2.072012276687622, + 2.0677214878082277, + 2.06886547164917, + 2.0694519245147704, + 2.067423739013672, + 2.0655289979553224, + 2.06629921081543, + 2.0631995821380613, + 2.0609045373153685, + 2.058683188858032, + 2.071466637496948, + 2.0982071717834474, + 2.1176902227783203, + 2.135855104904175, + 2.1459106968688966, + 2.1510271551513673, + 2.155086622314453, + 2.1585256716156005, + 2.15646563873291, + 2.161513948287964, + 2.164117654876709, + 2.166316808319092, + 2.1665096879577637, + 2.1655848853302, + 2.163163600769043, + 2.1617049073791503, + 2.1624610729980467, + 2.1621627906799317, + 2.1596954206085206, + 2.1561568085479736, + 2.1541545433044433, + 2.1522645554351807, + 2.147998229827881, + 2.1471784650421144, + 2.1451251698303224, + 2.1426290184020997, + 2.1404898113250734, + 2.1406173085021973, + 2.136187228088379, + 2.137960918197632, + 2.1342968878173827, + 2.1303375938415527, + 2.1304951375579835, + 2.1299390644836427, + 2.1318602128601074, + 2.1347230551147462, + 2.139710686645508, + 2.141014033355713, + 2.141334562149048, + 2.1429337422180175, + 2.1455739665222167, + 2.1454911710357667, + 2.146714199447632, + 2.1462488514709475, + 2.1462212409973143, + 2.1472820111846924, + 2.145705964202881, + 2.14649310295105, + 2.1461523735046386, + 2.1450838286590574, + 2.144278532180786, + 2.1443131462097167, + 2.1445733752441405, + 2.1462536781311035, + 2.1437386114501953, + 2.144259309768677, + 2.1427957734680176, + 2.1440535404205323, + 2.1424728871154786, + 2.140573755340576, + 2.1422169814300536, + 2.140773203048706, + 2.1420933238220217, + 2.1398540377044677, + 2.140619307861328, + 2.140531947479248, + 2.1405946379089356, + 2.140400583343506, + 2.1403809301757812, + 2.1384230867767333, + 2.1384307886505125, + 2.139088828277588, + 2.13851263961792, + 2.1375454248809813, + 2.1381795156860353, + 2.1372567707824706, + 2.138834800338745, + 2.1392871213531492, + 2.1383936073303222, + 2.1379687480163576, + 2.1397182269287107 + ], + "gamma": [ + [ + 6, + 0.030306661501526833 + ], + [ + 7, + 0.0225322386395419 + ], + [ + 8, + 0.02592305262805894 + ], + [ + 9, + 0.02201161568518728 + ], + [ + 10, + 0.027305484749376774 + ], + [ + 13, + 0.029643934220075607 + ], + [ + 15, + 0.03215414332225919 + ], + [ + 20, + 0.02044028788805008 + ], + [ + 25, + 0.020044114789925516 + ], + [ + 35, + 0.019949833513237536 + ], + [ + 45, + 0.018003164615947753 + ], + [ + 55, + 0.014312395825982094 + ], + [ + 65, + 0.01663823623675853 + ], + [ + 75, + 0.014795503608183935 + ], + [ + 85, + 0.00809670623857528 + ], + [ + 95, + 0.014231618042686023 + ], + [ + 100, + 0.01487609907053411 + ] + ], + "rho": [ + [ + 6, + 0.01702426071278751 + ], + [ + 7, + -0.009573296178132296 + ], + [ + 8, + 0.011328767170198262 + ], + [ + 9, + 0.0018548705847933888 + ], + [ + 10, + 0.008511126041412354 + ], + [ + 13, + -0.00647524930536747 + ], + [ + 15, + -0.0025810777442529798 + ], + [ + 20, + -0.003653603489510715 + ], + [ + 25, + -0.01230846531689167 + ], + [ + 35, + 0.005644407821819186 + ], + [ + 45, + 0.002691521542146802 + ], + [ + 55, + 0.0031679244711995125 + ], + [ + 65, + -0.012788467109203339 + ], + [ + 75, + 0.0022694955114275217 + ], + [ + 85, + 0.0019409467931836843 + ], + [ + 95, + -0.004382152110338211 + ], + [ + 100, + -0.000769294798374176 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7497362805693359 + ], + [ + 7, + 0.749581041647472 + ], + [ + 8, + 0.7493584059826238 + ], + [ + 9, + 0.7492339451117882 + ], + [ + 10, + 0.749340315582399 + ], + [ + 11, + 0.7492374924704412 + ], + [ + 12, + 0.749268120206403 + ], + [ + 13, + 0.7488045502174396 + ], + [ + 14, + 0.7490390551992111 + ], + [ + 15, + 0.7491335750242463 + ], + [ + 16, + 0.7485394191089099 + ], + [ + 17, + 0.749188013620795 + ], + [ + 18, + 0.7490501542138405 + ], + [ + 19, + 0.7494024164487249 + ], + [ + 20, + 0.7489704299304686 + ], + [ + 21, + 0.7482152964560599 + ], + [ + 22, + 0.7476362146506301 + ], + [ + 23, + 0.7473182194932083 + ], + [ + 24, + 0.7470924176076084 + ], + [ + 25, + 0.7469232675918307 + ], + [ + 26, + 0.7467048544817158 + ], + [ + 27, + 0.7481883180130917 + ], + [ + 28, + 0.7458056054316415 + ], + [ + 29, + 0.7449148521055118 + ], + [ + 30, + 0.7447975838552088 + ], + [ + 31, + 0.7451361479511207 + ], + [ + 32, + 0.7463947116893779 + ], + [ + 33, + 0.7483167771979659 + ], + [ + 34, + 0.746645246947765 + ], + [ + 35, + 0.7474467234429543 + ], + [ + 36, + 0.7463204594921183 + ], + [ + 37, + 0.7457082718160046 + ], + [ + 38, + 0.7445172385580846 + ], + [ + 39, + 0.747980915036212 + ], + [ + 40, + 0.744528498161014 + ], + [ + 41, + 0.7478056033792548 + ], + [ + 42, + 0.7469712747506486 + ], + [ + 43, + 0.7471201332337015 + ], + [ + 44, + 0.7469539144734552 + ], + [ + 45, + 0.7471630825801321 + ], + [ + 46, + 0.7473871518768268 + ], + [ + 47, + 0.7471176624314386 + ], + [ + 48, + 0.743804909426897 + ], + [ + 49, + 0.7464271822022943 + ], + [ + 50, + 0.7457063004472081 + ], + [ + 51, + 0.7443068895341965 + ], + [ + 52, + 0.745908651516242 + ], + [ + 53, + 0.7477515538739072 + ], + [ + 54, + 0.7445847598211315 + ], + [ + 55, + 0.7436352794600138 + ], + [ + 56, + 0.7437537290894932 + ], + [ + 57, + 0.742756492732124 + ], + [ + 58, + 0.7429733408056187 + ], + [ + 59, + 0.741951651371069 + ], + [ + 60, + 0.7423943479210192 + ], + [ + 61, + 0.741484254779124 + ], + [ + 62, + 0.7410289125490176 + ], + [ + 63, + 0.7412163916214788 + ], + [ + 64, + 0.7415920425252699 + ], + [ + 65, + 0.7419986056818562 + ], + [ + 66, + 0.7440932156421496 + ], + [ + 67, + 0.7459786459484441 + ], + [ + 68, + 0.7438676156593648 + ], + [ + 69, + 0.7438779883301126 + ], + [ + 70, + 0.744394855639493 + ], + [ + 71, + 0.7449061219308878 + ], + [ + 72, + 0.7447229961625207 + ], + [ + 73, + 0.7438470911602947 + ], + [ + 74, + 0.7448100710654857 + ], + [ + 75, + 0.7446996377833014 + ], + [ + 76, + 0.7420718533734099 + ], + [ + 77, + 0.7427279224559526 + ], + [ + 78, + 0.7442672048736515 + ], + [ + 79, + 0.7428208040916006 + ], + [ + 80, + 0.7420642174954307 + ], + [ + 81, + 0.7433102963989435 + ], + [ + 82, + 0.7438790263942314 + ], + [ + 83, + 0.7438760150199217 + ], + [ + 84, + 0.7417600190910029 + ], + [ + 85, + 0.7432293351132631 + ], + [ + 86, + 0.744130491360313 + ], + [ + 87, + 0.7426509841574067 + ], + [ + 88, + 0.7430889500736941 + ], + [ + 89, + 0.7437418916670842 + ], + [ + 90, + 0.7436062592096674 + ], + [ + 91, + 0.7431842913178145 + ], + [ + 92, + 0.7439143371174419 + ], + [ + 93, + 0.7439819765655518 + ], + [ + 94, + 0.7437855115582399 + ], + [ + 95, + 0.743877112837538 + ], + [ + 96, + 0.7437099819636295 + ], + [ + 97, + 0.7440975147807718 + ], + [ + 98, + 0.7436722978532115 + ], + [ + 99, + 0.7437938121857754 + ], + [ + 100, + 0.7186698543225942 + ] + ] + }, + "blend_fresh_random_target": { + "test_acc": [ + 0.3079, + 0.315, + 0.3135, + 0.3101, + 0.3113, + 0.3055, + 0.3043, + 0.2983, + 0.2992, + 0.2994, + 0.3112, + 0.3159, + 0.3205, + 0.309, + 0.3107, + 0.3061, + 0.3132, + 0.3121, + 0.316, + 0.3082, + 0.3053, + 0.32, + 0.3076, + 0.3154, + 0.3078, + 0.3124, + 0.3146, + 0.3185, + 0.313, + 0.3142, + 0.3193, + 0.3094, + 0.3118, + 0.3147, + 0.322, + 0.3141, + 0.3219, + 0.3238, + 0.3178, + 0.3225, + 0.3169, + 0.3159, + 0.3197, + 0.3192, + 0.3118, + 0.3234, + 0.3254, + 0.3125, + 0.3126, + 0.3191, + 0.3196, + 0.3169, + 0.3234, + 0.3172, + 0.3182, + 0.3177, + 0.3229, + 0.3211, + 0.3166, + 0.3172, + 0.3203, + 0.3256, + 0.3228, + 0.3319, + 0.3142, + 0.3183, + 0.3254, + 0.3256, + 0.3262, + 0.3201, + 0.3216, + 0.3246, + 0.3229, + 0.3247, + 0.3192, + 0.3269, + 0.32, + 0.3241, + 0.3226, + 0.322, + 0.3258, + 0.3259, + 0.3264, + 0.3238, + 0.3243, + 0.3245, + 0.3241, + 0.3235, + 0.3234, + 0.3241, + 0.3244, + 0.3245, + 0.3248, + 0.3246, + 0.3247 + ], + "train_loss": [ + 1.9895956008148192, + 1.9871157150268555, + 1.9889365613555907, + 1.9874303811645508, + 1.9918496588897705, + 1.9849690564727782, + 1.9797383239746094, + 1.9821398335266114, + 1.980450602874756, + 1.982718380355835, + 1.980131506690979, + 1.9749598886871338, + 1.9776175240325928, + 1.9743317586898803, + 1.9755635387420654, + 1.9738460313415527, + 1.9721670236206055, + 1.976031579360962, + 1.9730562036895751, + 1.972999349899292, + 1.9716904864501954, + 1.971796060256958, + 1.9695869226074219, + 1.9704775234222411, + 1.97195292427063, + 1.9660728258514404, + 1.9655471087646483, + 1.966665030479431, + 1.9647278304672242, + 1.965036628112793, + 1.96549792137146, + 1.9644975103378295, + 1.9673720928192138, + 1.9650436472320556, + 1.967986387939453, + 1.9649243574523925, + 1.9669129509735108, + 1.9663866016387939, + 1.9665748501205444, + 1.9689803732681275, + 1.966659411315918, + 1.9652994158935546, + 1.9668769124984742, + 1.9698543347549438, + 1.968035751914978, + 1.9646889480590821, + 1.9669011117553712, + 1.9649674994277955, + 1.9647760410308839, + 1.9656365216445923, + 1.9660039056015015, + 1.9634289357757568, + 1.9663543716430665, + 1.9644216299057007, + 1.966054580230713, + 1.9641708936309814, + 1.966459882545471, + 1.9637008392333983, + 1.96356682346344, + 1.963944573287964, + 1.9648190647125243, + 1.9643907577514648, + 1.9645199195861816, + 1.960793134994507, + 1.9616555389404298, + 1.9615585623931884, + 1.9598950524139405, + 1.9651576745986938, + 1.9621147458648682, + 1.9626274981689453, + 1.9624529599380494, + 1.961181657485962, + 1.9628156858825683, + 1.9600841522216796, + 1.9619939487457276, + 1.9610844894790649, + 1.9621123931503295, + 1.9624303231811524, + 1.9605216361999511, + 1.9586425089263917, + 1.9624747284698487, + 1.9581730127716064, + 1.9616589535140991, + 1.9579475601959229, + 1.9571584579086303, + 1.960104623374939, + 1.9596380628204346, + 1.9596924450683593, + 1.9598581456756592, + 1.9566800785827636, + 1.9601387897491456, + 1.9619328371429443, + 1.959656799545288, + 1.9580980550765992, + 1.9627989617538453 + ], + "gamma": [ + [ + 6, + 0.017292891163378954 + ], + [ + 7, + 0.036347093526273966 + ], + [ + 8, + 0.03849387320224196 + ], + [ + 9, + 0.027741328405681998 + ], + [ + 10, + 0.021491852588951588 + ], + [ + 13, + 0.026236126199364662 + ], + [ + 15, + 0.025328890304081142 + ], + [ + 20, + 0.033093019970692694 + ], + [ + 25, + 0.031382174929603934 + ], + [ + 35, + 0.02521582809276879 + ], + [ + 45, + 0.029412550502456725 + ], + [ + 55, + 0.02664855885086581 + ], + [ + 65, + 0.02817878598580137 + ], + [ + 75, + 0.025164220336591825 + ], + [ + 85, + 0.02900500304531306 + ], + [ + 95, + 0.02672984590753913 + ], + [ + 100, + 0.02726486313622445 + ] + ], + "rho": [ + [ + 6, + 0.008813910884782672 + ], + [ + 7, + -0.0029148668982088566 + ], + [ + 8, + 0.026879789656959474 + ], + [ + 9, + 0.010234457906335592 + ], + [ + 10, + 0.02435486181639135 + ], + [ + 13, + 0.010708853835240006 + ], + [ + 15, + 0.006966336397454143 + ], + [ + 20, + 0.01967952074483037 + ], + [ + 25, + 0.0013518772320821881 + ], + [ + 35, + 0.01640128600411117 + ], + [ + 45, + 0.006852992926724255 + ], + [ + 55, + 0.02206423506140709 + ], + [ + 65, + 0.01695137156639248 + ], + [ + 75, + -0.010456086485646665 + ], + [ + 85, + 0.000875505618751049 + ], + [ + 95, + 0.0027324086986482143 + ], + [ + 100, + 0.0019112437730655074 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7499183675984715 + ], + [ + 7, + 0.7498580718404874 + ], + [ + 8, + 0.7498184614014324 + ], + [ + 9, + 0.7497375510676978 + ], + [ + 10, + 0.7496627172099697 + ], + [ + 11, + 0.7496257167184156 + ], + [ + 12, + 0.7495836037212643 + ], + [ + 13, + 0.7495750356463327 + ], + [ + 14, + 0.7495544696996854 + ], + [ + 15, + 0.7495137648838652 + ], + [ + 16, + 0.7494891249735052 + ], + [ + 17, + 0.7494626932817029 + ], + [ + 18, + 0.7495223934064319 + ], + [ + 19, + 0.7494750130017354 + ], + [ + 20, + 0.7494305373439367 + ], + [ + 21, + 0.7494377475191072 + ], + [ + 22, + 0.7494168348085465 + ], + [ + 23, + 0.7494110696282498 + ], + [ + 24, + 0.7493937961573321 + ], + [ + 25, + 0.7494024936440973 + ], + [ + 26, + 0.7493996146160407 + ], + [ + 27, + 0.749411104858257 + ], + [ + 28, + 0.7494145623168125 + ], + [ + 29, + 0.7494095625496254 + ], + [ + 30, + 0.7493938665475209 + ], + [ + 31, + 0.7493840179563203 + ], + [ + 32, + 0.7493590159715497 + ], + [ + 33, + 0.7493591914530261 + ], + [ + 34, + 0.7493842326098364 + ], + [ + 35, + 0.7493979958724923 + ], + [ + 36, + 0.7493944236339718 + ], + [ + 37, + 0.7494003491047037 + ], + [ + 38, + 0.7493888468259413 + ], + [ + 39, + 0.7493736761180659 + ], + [ + 40, + 0.7493549698919852 + ], + [ + 41, + 0.7493853133556705 + ], + [ + 42, + 0.749398322846658 + ], + [ + 43, + 0.749373823661955 + ], + [ + 44, + 0.7493814780112398 + ], + [ + 45, + 0.7493827812779604 + ], + [ + 46, + 0.7493957852421362 + ], + [ + 47, + 0.7493943278085832 + ], + [ + 48, + 0.7493840316609607 + ], + [ + 49, + 0.7493895244535708 + ], + [ + 50, + 0.7494209243375904 + ], + [ + 51, + 0.7494003427223144 + ], + [ + 52, + 0.7493912036305236 + ], + [ + 53, + 0.7493774334948415 + ], + [ + 54, + 0.7493705998545339 + ], + [ + 55, + 0.7493912803523951 + ], + [ + 56, + 0.7493862524979168 + ], + [ + 57, + 0.7493808633927121 + ], + [ + 58, + 0.749402714070985 + ], + [ + 59, + 0.7493970766262411 + ], + [ + 60, + 0.7493830753918892 + ], + [ + 61, + 0.749386443775214 + ], + [ + 62, + 0.7493818838348248 + ], + [ + 63, + 0.7493722809940843 + ], + [ + 64, + 0.7493679694670623 + ], + [ + 65, + 0.749386178299581 + ], + [ + 66, + 0.7493855593945847 + ], + [ + 67, + 0.7494739224494158 + ], + [ + 68, + 0.7494390666617322 + ], + [ + 69, + 0.7494310294839032 + ], + [ + 70, + 0.7494182732076973 + ], + [ + 71, + 0.7494000519643902 + ], + [ + 72, + 0.749392574531181 + ], + [ + 73, + 0.7493930338288214 + ], + [ + 74, + 0.7493969130682594 + ], + [ + 75, + 0.7493961390578522 + ], + [ + 76, + 0.7493879748280946 + ], + [ + 77, + 0.749386659807227 + ], + [ + 78, + 0.749393861964963 + ], + [ + 79, + 0.7493903064944849 + ], + [ + 80, + 0.7493894222732886 + ], + [ + 81, + 0.7493849652191917 + ], + [ + 82, + 0.7493878939906475 + ], + [ + 83, + 0.7494084649253259 + ], + [ + 84, + 0.7494049802813402 + ], + [ + 85, + 0.749403945577232 + ], + [ + 86, + 0.7493871750912952 + ], + [ + 87, + 0.7493875947506622 + ], + [ + 88, + 0.749400633475107 + ], + [ + 89, + 0.7494062220382451 + ], + [ + 90, + 0.7493935668980417 + ], + [ + 91, + 0.749402243979675 + ], + [ + 92, + 0.7493878218997805 + ], + [ + 93, + 0.7493876239118213 + ], + [ + 94, + 0.7494012793496149 + ], + [ + 95, + 0.7493987452877314 + ], + [ + 96, + 0.7493926918529484 + ], + [ + 97, + 0.749408920363831 + ], + [ + 98, + 0.7494054176455518 + ], + [ + 99, + 0.7493890317916441 + ], + [ + 100, + 0.7493907402290226 + ] + ] + }, + "blend_time_only_trainable": { + "test_acc": [ + 0.2968, + 0.3071, + 0.3016, + 0.2942, + 0.3056, + 0.3091, + 0.2983, + 0.3115, + 0.3031, + 0.3076, + 0.3122, + 0.3129, + 0.3144, + 0.2949, + 0.2949, + 0.3109, + 0.2999, + 0.3045, + 0.3097, + 0.3003, + 0.3261, + 0.3178, + 0.3094, + 0.3212, + 0.3227, + 0.3059, + 0.3066, + 0.3077, + 0.3134, + 0.3254, + 0.3147, + 0.3064, + 0.315, + 0.3169, + 0.3138, + 0.3085, + 0.3095, + 0.316, + 0.3201, + 0.315, + 0.3156, + 0.3099, + 0.3111, + 0.3199, + 0.3179, + 0.3181, + 0.3211, + 0.3176, + 0.3215, + 0.3202, + 0.3191, + 0.3143, + 0.3154, + 0.3202, + 0.3202, + 0.3125, + 0.3172, + 0.3184, + 0.3268, + 0.3217, + 0.3168, + 0.3137, + 0.3183, + 0.3233, + 0.3245, + 0.3225, + 0.3181, + 0.3201, + 0.3195, + 0.3136, + 0.3216, + 0.3186, + 0.3219, + 0.3215, + 0.3223, + 0.3215, + 0.3241, + 0.3196, + 0.3218, + 0.3213, + 0.3176, + 0.3195, + 0.3227, + 0.3202, + 0.3209, + 0.3219, + 0.3211, + 0.321, + 0.3208, + 0.3218, + 0.3216, + 0.3208, + 0.3209, + 0.321, + 0.321 + ], + "train_loss": [ + 1.9886227381896973, + 1.9827429238128662, + 1.9804512140655517, + 1.9798980695343018, + 1.9805296991348267, + 1.977417304725647, + 1.974860093536377, + 1.9769952285003662, + 1.9753232281112671, + 1.9729519940948486, + 1.9743930877685547, + 1.9746073372650146, + 1.974119525680542, + 1.9704522942733764, + 1.9700338676452638, + 1.9719092016601563, + 1.973803524208069, + 1.9692140093994142, + 1.970864155807495, + 1.9679285832977296, + 1.9677499777221679, + 1.968604490890503, + 1.967433316192627, + 1.9737133739852906, + 1.9710391773223876, + 1.967381762237549, + 1.9636189496612548, + 1.9688137311553955, + 1.9630879692077636, + 1.964395586013794, + 1.9672391658020019, + 1.967085045928955, + 1.9683808533477782, + 1.9686685515594482, + 1.9683083154678345, + 1.9649195724487305, + 1.9674741954040527, + 1.96513455078125, + 1.9665856964874266, + 1.9676008330535888, + 1.9649982983398437, + 1.9688120121002197, + 1.9681585739135743, + 1.9651886529541016, + 1.9651513041687012, + 1.964658903274536, + 1.965113462562561, + 1.9656871701812744, + 1.963506703338623, + 1.9635086895370484, + 1.9646611813735961, + 1.965419214439392, + 1.9622100240707399, + 1.9655747576904297, + 1.9645401123809814, + 1.9638557550811768, + 1.9656030306625367, + 1.9630318942260743, + 1.9633430401992797, + 1.9632549198150635, + 1.9656342436218261, + 1.9612906111145019, + 1.9649773630523681, + 1.961433423538208, + 1.9648060617446899, + 1.962691479949951, + 1.9623157412719727, + 1.9617682968521117, + 1.9638728455352783, + 1.9607208148956299, + 1.9633137642669678, + 1.9640166495132447, + 1.962754055747986, + 1.9637004630279542, + 1.9611902783966064, + 1.9633544604110718, + 1.9624716176605224, + 1.9580968730926513, + 1.9603176507949829, + 1.961276364479065, + 1.961574722137451, + 1.9626929391479493, + 1.960529104614258, + 1.9612769229507447, + 1.9601130446624755, + 1.9594660828018189, + 1.9633270732116699, + 1.960886742477417, + 1.960172682952881, + 1.9584505153656007, + 1.9622385289764404, + 1.9607479111480712, + 1.9632561265563966, + 1.960337890663147, + 1.9582083444976806 + ], + "gamma": [ + [ + 6, + 0.028835158329457045 + ], + [ + 7, + 0.027052901219576597 + ], + [ + 8, + 0.023494747059885412 + ], + [ + 9, + 0.01783509086817503 + ], + [ + 10, + 0.023978060635272413 + ], + [ + 13, + 0.033078035805374384 + ], + [ + 15, + 0.028882148093543947 + ], + [ + 20, + 0.038076453492976725 + ], + [ + 25, + 0.02922750887228176 + ], + [ + 35, + 0.02892274083569646 + ], + [ + 45, + 0.03040214753127657 + ], + [ + 55, + 0.027280541777145118 + ], + [ + 65, + 0.02700136008206755 + ], + [ + 75, + 0.03386293107178062 + ], + [ + 85, + 0.029299015528522432 + ], + [ + 95, + 0.02438629453536123 + ], + [ + 100, + 0.02840151885175146 + ] + ], + "rho": [ + [ + 6, + 0.020045978017151356 + ], + [ + 7, + 0.028075518901459873 + ], + [ + 8, + 0.004343734122812748 + ], + [ + 9, + -0.012429071473889053 + ], + [ + 10, + 0.018212675815448165 + ], + [ + 13, + 0.002771535189822316 + ], + [ + 15, + -0.0013614993076771498 + ], + [ + 20, + 0.007225814741104841 + ], + [ + 25, + 0.01997060887515545 + ], + [ + 35, + -0.0010430027032271028 + ], + [ + 45, + -0.01927056908607483 + ], + [ + 55, + 0.01598264859057963 + ], + [ + 65, + 0.0003244243562221527 + ], + [ + 75, + -0.008988905930891633 + ], + [ + 85, + -0.0020510986214503646 + ], + [ + 95, + 0.01564559619873762 + ], + [ + 100, + 0.016892846673727036 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7498882009566175 + ], + [ + 7, + 0.7497984738201007 + ], + [ + 8, + 0.7497484604477911 + ], + [ + 9, + 0.7497051138427109 + ], + [ + 10, + 0.7496591238246716 + ], + [ + 11, + 0.7496403825695535 + ], + [ + 12, + 0.7496081863730946 + ], + [ + 13, + 0.749569962328138 + ], + [ + 14, + 0.7495464701316163 + ], + [ + 15, + 0.7495313845850577 + ], + [ + 16, + 0.7495077609527684 + ], + [ + 17, + 0.7494939682039945 + ], + [ + 18, + 0.7494596863913463 + ], + [ + 19, + 0.7494542556912652 + ], + [ + 20, + 0.7494421229895855 + ], + [ + 21, + 0.7494211121616516 + ], + [ + 22, + 0.7494151826595754 + ], + [ + 23, + 0.7494095261072832 + ], + [ + 24, + 0.7494114239713908 + ], + [ + 25, + 0.7494028569990477 + ], + [ + 26, + 0.7494114251452957 + ], + [ + 27, + 0.7494005251340944 + ], + [ + 28, + 0.7493941172133661 + ], + [ + 29, + 0.7494099036627795 + ], + [ + 30, + 0.7494189837029221 + ], + [ + 31, + 0.749403710805218 + ], + [ + 32, + 0.7493835514498101 + ], + [ + 33, + 0.7493986115859782 + ], + [ + 34, + 0.7493892537734781 + ], + [ + 35, + 0.7493799657091523 + ], + [ + 36, + 0.7493929103624215 + ], + [ + 37, + 0.749392135133588 + ], + [ + 38, + 0.7493882166969528 + ], + [ + 39, + 0.7493849680986849 + ], + [ + 40, + 0.7493985919810099 + ], + [ + 41, + 0.7494020881991523 + ], + [ + 42, + 0.7494109207276094 + ], + [ + 43, + 0.7493794652168388 + ], + [ + 44, + 0.7494031802429594 + ], + [ + 45, + 0.7493990648166816 + ], + [ + 46, + 0.7493984620406952 + ], + [ + 47, + 0.7494144054470806 + ], + [ + 48, + 0.7493973840204821 + ], + [ + 49, + 0.7493976802506256 + ], + [ + 50, + 0.7493877922890425 + ], + [ + 51, + 0.7493718458066876 + ], + [ + 52, + 0.7493909285869184 + ], + [ + 53, + 0.7493949711375981 + ], + [ + 54, + 0.7494164331448312 + ], + [ + 55, + 0.749431435404787 + ], + [ + 56, + 0.7494219244917812 + ], + [ + 57, + 0.7494214302769182 + ], + [ + 58, + 0.7494130351618888 + ], + [ + 59, + 0.7494082658052762 + ], + [ + 60, + 0.7494077110138571 + ], + [ + 61, + 0.7493790412152981 + ], + [ + 62, + 0.7494181898768314 + ], + [ + 63, + 0.7493980372946877 + ], + [ + 64, + 0.7493909441797553 + ], + [ + 65, + 0.7493971148354409 + ], + [ + 66, + 0.7493889381657717 + ], + [ + 67, + 0.7493936954225355 + ], + [ + 68, + 0.7493900038395401 + ], + [ + 69, + 0.7494178118601867 + ], + [ + 70, + 0.7493853853804173 + ], + [ + 71, + 0.7493931562152367 + ], + [ + 72, + 0.7493988530900674 + ], + [ + 73, + 0.7494122157852626 + ], + [ + 74, + 0.7494146094890184 + ], + [ + 75, + 0.7494208011582342 + ], + [ + 76, + 0.7494050698938658 + ], + [ + 77, + 0.7494055599993505 + ], + [ + 78, + 0.7494059285128851 + ], + [ + 79, + 0.7493929029232673 + ], + [ + 80, + 0.749377186090891 + ], + [ + 81, + 0.7494000715183446 + ], + [ + 82, + 0.74940029120142 + ], + [ + 83, + 0.7494105884852755 + ], + [ + 84, + 0.749399848526255 + ], + [ + 85, + 0.7493994322680746 + ], + [ + 86, + 0.7493970703341848 + ], + [ + 87, + 0.7493847860839147 + ], + [ + 88, + 0.7493903081046276 + ], + [ + 89, + 0.7493824421770239 + ], + [ + 90, + 0.749410890924463 + ], + [ + 91, + 0.7493914349492756 + ], + [ + 92, + 0.7493911763245706 + ], + [ + 93, + 0.749396897074757 + ], + [ + 94, + 0.7493974736752277 + ], + [ + 95, + 0.7494033625548995 + ], + [ + 96, + 0.7493953665583865 + ], + [ + 97, + 0.7494132061763379 + ], + [ + 98, + 0.7493921745762918 + ], + [ + 99, + 0.7493799493323625 + ], + [ + 100, + 0.7494036375793924 + ] + ] + }, + "blend_constant_input": { + "test_acc": [ + 0.3095, + 0.2927, + 0.3152, + 0.3064, + 0.3074, + 0.3125, + 0.3162, + 0.3217, + 0.3136, + 0.3142, + 0.3136, + 0.315, + 0.3249, + 0.3132, + 0.3039, + 0.3117, + 0.3118, + 0.3065, + 0.3034, + 0.3145, + 0.3201, + 0.3066, + 0.3019, + 0.3041, + 0.301, + 0.2939, + 0.309, + 0.3114, + 0.3148, + 0.3116, + 0.3123, + 0.3073, + 0.3116, + 0.3158, + 0.3152, + 0.3133, + 0.3061, + 0.3231, + 0.3095, + 0.3212, + 0.3188, + 0.3074, + 0.3088, + 0.3033, + 0.308, + 0.3137, + 0.305, + 0.3078, + 0.3172, + 0.3093, + 0.3045, + 0.3027, + 0.3125, + 0.3152, + 0.3112, + 0.3128, + 0.3125, + 0.3096, + 0.3048, + 0.3121, + 0.3129, + 0.312, + 0.3152, + 0.3115, + 0.3099, + 0.3091, + 0.3142, + 0.3124, + 0.3069, + 0.3084, + 0.3122, + 0.3144, + 0.3147, + 0.3111, + 0.312, + 0.3121, + 0.3114, + 0.3122, + 0.3138, + 0.313, + 0.3111, + 0.3137, + 0.3106, + 0.3141, + 0.3113, + 0.3115, + 0.3115, + 0.3115, + 0.3124, + 0.3116, + 0.312, + 0.3117, + 0.3117, + 0.3117, + 0.3116 + ], + "train_loss": [ + 1.9875338983917237, + 1.9781464235687256, + 1.9745915028381347, + 1.9724161750030518, + 1.9703527437591553, + 1.9698648984527587, + 1.971249841003418, + 1.9712429263305664, + 1.9799304322052003, + 1.9778242485046387, + 1.9836121215820313, + 1.9883264628601074, + 1.9827331024932862, + 1.9819735743713378, + 1.9824169759368897, + 1.990514292755127, + 1.9945136283874512, + 1.995475414085388, + 1.9869946667861937, + 1.9829312426757812, + 1.9761786726379396, + 1.9753313485336303, + 1.9803643784332274, + 1.9841854313659668, + 1.9868849114990235, + 1.983912781600952, + 1.9798361653137206, + 1.978118487586975, + 1.9769819805908204, + 1.9753173876190186, + 1.9730472027969361, + 1.9742750312042237, + 1.975975908241272, + 1.9766003805541992, + 1.975649796600342, + 1.9733796028137207, + 1.9730736239624023, + 1.9763634573745728, + 1.9743109363174438, + 1.9727392714691163, + 1.9759128737640381, + 1.9758021099853516, + 1.9766102784729005, + 1.9757713250732423, + 1.9760345909881591, + 1.975186833267212, + 1.9701717514419557, + 1.9783073165130616, + 1.9799149188995362, + 1.976058423423767, + 1.9737729637908936, + 1.9780769903182984, + 1.971851884765625, + 1.9752169612121582, + 1.9761044771575929, + 1.9749460768890381, + 1.9757458843231201, + 1.9762586096191406, + 1.9757843294525146, + 1.9742973477554322, + 1.9754280879211426, + 1.9723532569122315, + 1.9717969180679322, + 1.9720607820129394, + 1.9751361526489257, + 1.9715440291595459, + 1.972982950820923, + 1.97191197265625, + 1.9730741275024415, + 1.9697976119232177, + 1.969512387123108, + 1.9704620248413085, + 1.9706119800186157, + 1.970843869895935, + 1.969023858947754, + 1.970489073753357, + 1.9707957164764405, + 1.9714748225402832, + 1.970333583908081, + 1.969499998321533, + 1.9728154964447022, + 1.9725122617340087, + 1.9686164707183837, + 1.9708904336547852, + 1.9692982942199706, + 1.9682558645629882, + 1.9676385024261474, + 1.9665554128265381, + 1.9685520446014404, + 1.9690102555084228, + 1.9706991818237305, + 1.9691560688018799, + 1.9693079661560058, + 1.969636968536377, + 1.9691142596817017 + ], + "gamma": [ + [ + 6, + 0.03311742760706693 + ], + [ + 7, + 0.028048108099028468 + ], + [ + 8, + 0.02896452709683217 + ], + [ + 9, + 0.031478883465752006 + ], + [ + 10, + 0.02344508725218475 + ], + [ + 13, + 0.024458521860651672 + ], + [ + 15, + 0.02667085622670129 + ], + [ + 20, + 0.03174502568435855 + ], + [ + 25, + 0.024454289814457297 + ], + [ + 35, + 0.025064532179385424 + ], + [ + 45, + 0.025748528307303786 + ], + [ + 55, + 0.02379508875310421 + ], + [ + 65, + 0.02414266101550311 + ], + [ + 75, + 0.0254881803994067 + ], + [ + 85, + 0.026983873452991247 + ], + [ + 95, + 0.01588204613653943 + ], + [ + 100, + 0.02812473534140736 + ] + ], + "rho": [ + [ + 6, + -0.009256488177925348 + ], + [ + 7, + -0.005333291715942323 + ], + [ + 8, + 0.024343792349100113 + ], + [ + 9, + 0.01545919943600893 + ], + [ + 10, + -0.0037216898053884506 + ], + [ + 13, + 0.006445262581110001 + ], + [ + 15, + 0.005032598739489913 + ], + [ + 20, + 0.005152330035343766 + ], + [ + 25, + 0.0013879609759896994 + ], + [ + 35, + -0.0005084157455712557 + ], + [ + 45, + -0.010277077089995146 + ], + [ + 55, + -0.0013219688553363085 + ], + [ + 65, + -0.00706016318872571 + ], + [ + 75, + 0.010231438325718045 + ], + [ + 85, + -0.00585735950153321 + ], + [ + 95, + -0.008048742078244686 + ], + [ + 100, + 0.012646065675653517 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7484106513263207 + ], + [ + 7, + 0.7493717186701357 + ], + [ + 8, + 0.749375857356196 + ], + [ + 9, + 0.749365078317222 + ], + [ + 10, + 0.7493864681557557 + ], + [ + 11, + 0.7493782179808761 + ], + [ + 12, + 0.7493562254885738 + ], + [ + 13, + 0.7493701979998898 + ], + [ + 14, + 0.7493732262742637 + ], + [ + 15, + 0.7493859856155834 + ], + [ + 16, + 0.7493801137028954 + ], + [ + 17, + 0.7493968515730436 + ], + [ + 18, + 0.7493865920427955 + ], + [ + 19, + 0.749369233728556 + ], + [ + 20, + 0.7493602552275802 + ], + [ + 21, + 0.7493635033527809 + ], + [ + 22, + 0.749371721733354 + ], + [ + 23, + 0.7493767283211062 + ], + [ + 24, + 0.7493810997744813 + ], + [ + 25, + 0.7493756990939394 + ], + [ + 26, + 0.7493523778935989 + ], + [ + 27, + 0.7493686187064469 + ], + [ + 28, + 0.7493555866914537 + ], + [ + 29, + 0.7493754313520443 + ], + [ + 30, + 0.7493895373621285 + ], + [ + 31, + 0.7493635118909127 + ], + [ + 32, + 0.749364527087908 + ], + [ + 33, + 0.7493709444425792 + ], + [ + 34, + 0.7493707801614627 + ], + [ + 35, + 0.7493651612681415 + ], + [ + 36, + 0.7493714776094735 + ], + [ + 37, + 0.7493673442828049 + ], + [ + 38, + 0.7493595623245222 + ], + [ + 39, + 0.74936136073031 + ], + [ + 40, + 0.749371822843851 + ], + [ + 41, + 0.7493670358897049 + ], + [ + 42, + 0.7493623165683013 + ], + [ + 43, + 0.7493678602210149 + ], + [ + 44, + 0.7493675602252929 + ], + [ + 45, + 0.7493665691080361 + ], + [ + 46, + 0.7493738502922623 + ], + [ + 47, + 0.7493562694557622 + ], + [ + 48, + 0.74934288725951 + ], + [ + 49, + 0.7493899037155466 + ], + [ + 50, + 0.7493644489260175 + ], + [ + 51, + 0.7493553400577623 + ], + [ + 52, + 0.7493727653378641 + ], + [ + 53, + 0.7493637200668858 + ], + [ + 54, + 0.7493784007644393 + ], + [ + 55, + 0.7493878835084044 + ], + [ + 56, + 0.7493926391945999 + ], + [ + 57, + 0.7493923963585047 + ], + [ + 58, + 0.7493964115422674 + ], + [ + 59, + 0.7493628329000167 + ], + [ + 60, + 0.7493843180349045 + ], + [ + 61, + 0.7493717207431344 + ], + [ + 62, + 0.7493938599658067 + ], + [ + 63, + 0.7493671735761203 + ], + [ + 64, + 0.749364996482394 + ], + [ + 65, + 0.7493521466954451 + ], + [ + 66, + 0.7493709974139263 + ], + [ + 67, + 0.7493721116666429 + ], + [ + 68, + 0.7493693271276669 + ], + [ + 69, + 0.7493736741513296 + ], + [ + 70, + 0.7493662216141617 + ], + [ + 71, + 0.7493765024832033 + ], + [ + 72, + 0.7493745193670395 + ], + [ + 73, + 0.7493649242419702 + ], + [ + 74, + 0.7493966243789978 + ], + [ + 75, + 0.7493959565525711 + ], + [ + 76, + 0.7493842283630113 + ], + [ + 77, + 0.7493826575990793 + ], + [ + 78, + 0.7493771928497606 + ], + [ + 79, + 0.7493694518659229 + ], + [ + 80, + 0.7493549627274159 + ], + [ + 81, + 0.7493761083199512 + ], + [ + 82, + 0.7493647890141059 + ], + [ + 83, + 0.749363323225991 + ], + [ + 84, + 0.7493727437759294 + ], + [ + 85, + 0.7493784333230321 + ], + [ + 86, + 0.7493660763696164 + ], + [ + 87, + 0.7493592969538754 + ], + [ + 88, + 0.7493700916492844 + ], + [ + 89, + 0.7493578736291281 + ], + [ + 90, + 0.7493669943472065 + ], + [ + 91, + 0.7493683110399325 + ], + [ + 92, + 0.7493635305152803 + ], + [ + 93, + 0.7493783224508156 + ], + [ + 94, + 0.7493629790427503 + ], + [ + 95, + 0.7493759327014129 + ], + [ + 96, + 0.7493891169149812 + ], + [ + 97, + 0.7493704727066623 + ], + [ + 98, + 0.7493684423255998 + ], + [ + 99, + 0.7493643425710621 + ], + [ + 100, + 0.749369694385133 + ] + ] + }, + "blend_prefit60_frozen": { + "test_acc": [ + 0.2043, + 0.1273, + 0.1202, + 0.124, + 0.1064, + 0.1037, + 0.1044, + 0.1378, + 0.1019, + 0.1119, + 0.1038, + 0.1202, + 0.1191, + 0.1212, + 0.1053, + 0.1005, + 0.1, + 0.1043, + 0.1128, + 0.1349, + 0.1, + 0.0942, + 0.1, + 0.1, + 0.1046, + 0.1229, + 0.1202, + 0.0961, + 0.1033, + 0.1348, + 0.1, + 0.1, + 0.1387, + 0.1, + 0.1011, + 0.1404, + 0.1261, + 0.1256, + 0.1245, + 0.1263, + 0.1, + 0.1411, + 0.1253, + 0.1, + 0.1354, + 0.101, + 0.1307, + 0.1241, + 0.1142, + 0.1164, + 0.1348, + 0.1275, + 0.1268, + 0.1254, + 0.1202, + 0.1299, + 0.1208, + 0.1427, + 0.1258, + 0.1291, + 0.1382, + 0.1267, + 0.1401, + 0.1411, + 0.1247, + 0.127, + 0.1255, + 0.1227, + 0.1376, + 0.1252, + 0.1287, + 0.1288, + 0.1284, + 0.1233, + 0.1239, + 0.1284, + 0.1171, + 0.1387, + 0.1323, + 0.1336, + 0.1281, + 0.1282, + 0.1192, + 0.1361, + 0.122, + 0.1421, + 0.1272, + 0.1191, + 0.1337, + 0.1189, + 0.1256, + 0.1259, + 0.1269, + 0.1273, + 0.1273 + ], + "train_loss": [ + 2.0830069789123535, + 2.2363857093811035, + 2.286753871307373, + 2.3021955226135256, + 2.307171946411133, + 2.306757819290161, + 2.308535819091797, + 2.3114971450042723, + 2.310006459350586, + 2.308248912963867, + 2.3091092628479, + 2.3101371949005127, + 2.3100573498535155, + 2.3091729637908935, + 2.3108024481201173, + 2.309446760787964, + 2.309663332901001, + 2.308393766937256, + 2.3079774335479737, + 2.308805708770752, + 2.308893244781494, + 2.3087623870849607, + 2.3080819446563723, + 2.3082434127807616, + 2.3073471446990967, + 2.308298185272217, + 2.3072395930480956, + 2.3067903547668456, + 2.306027341995239, + 2.305646753387451, + 2.304693531036377, + 2.305372020339966, + 2.306144116973877, + 2.304595169143677, + 2.3051424267578127, + 2.304107342147827, + 2.304104132614136, + 2.3047459492492677, + 2.3041023583984375, + 2.304119969787598, + 2.303680535202026, + 2.3037661632537842, + 2.303230378341675, + 2.303156194381714, + 2.3029407551574708, + 2.3039470793914796, + 2.3019987341308594, + 2.302603823928833, + 2.301570912399292, + 2.3022499572753907, + 2.301214624328613, + 2.3014222357177734, + 2.301103698272705, + 2.300695306549072, + 2.3011233628845216, + 2.300446473388672, + 2.3007079207611083, + 2.3002176605987548, + 2.300141312866211, + 2.299731453857422, + 2.2998401210021973, + 2.2995610164642333, + 2.299095908508301, + 2.2994387922668458, + 2.299033603668213, + 2.2988384745788575, + 2.298912456817627, + 2.298532929611206, + 2.298629486083984, + 2.298695648651123, + 2.298283136367798, + 2.298307420196533, + 2.2984528969573974, + 2.2981724449157714, + 2.2978037510681153, + 2.2978140604400634, + 2.2976280823516846, + 2.2976026635742186, + 2.2976952281188967, + 2.2973396068573, + 2.297480895614624, + 2.297378879394531, + 2.29748806388855, + 2.297339668197632, + 2.2973999842071535, + 2.29707500831604, + 2.297092576599121, + 2.2970709034729, + 2.296968642654419, + 2.29701911857605, + 2.2968643725585935, + 2.2971342435455324, + 2.2969509156799317, + 2.2969766483306886, + 2.296942285003662 + ], + "gamma": [ + [ + 6, + 0.02637748871347867 + ], + [ + 7, + 0.02395206643268466 + ], + [ + 8, + 0.020127142313867807 + ], + [ + 9, + 0.02275098697282374 + ], + [ + 10, + 0.019405266852118075 + ], + [ + 13, + 0.006674408679828048 + ], + [ + 15, + 0.00812907435465604 + ], + [ + 20, + 0.012263836681086104 + ], + [ + 25, + 0.009719834713905584 + ], + [ + 35, + 0.0076912970462217345 + ], + [ + 45, + 0.007174774635132053 + ], + [ + 55, + 0.0061106626299078926 + ], + [ + 65, + 0.004976394520781469 + ], + [ + 75, + 0.005896237093566015 + ], + [ + 85, + 0.005409017603824395 + ], + [ + 95, + 0.005116917479995209 + ], + [ + 100, + 0.005077318550547716 + ] + ], + "rho": [ + [ + 6, + -0.011525815818458796 + ], + [ + 7, + -0.004745047073811293 + ], + [ + 8, + -0.003275573253631592 + ], + [ + 9, + -0.0032713948749005795 + ], + [ + 10, + -0.00852298946119845 + ], + [ + 13, + -0.010459980345331132 + ], + [ + 15, + 0.014339560060761869 + ], + [ + 20, + -0.00014275737339630723 + ], + [ + 25, + -0.008080001920461655 + ], + [ + 35, + -0.006155483657494187 + ], + [ + 45, + 0.01036455383291468 + ], + [ + 55, + 0.005281219491735101 + ], + [ + 65, + 9.279907681047916e-05 + ], + [ + 75, + 0.001974701415747404 + ], + [ + 85, + 0.016728006303310394 + ], + [ + 95, + -0.002427483443170786 + ], + [ + 100, + -0.011901997029781342 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7494038553062852 + ], + [ + 7, + 0.749403834493919 + ], + [ + 8, + 0.7494038299291426 + ], + [ + 9, + 0.7494038277493726 + ], + [ + 10, + 0.7494038230211482 + ], + [ + 11, + 0.749403818386261 + ], + [ + 12, + 0.749403815334158 + ], + [ + 13, + 0.749403815441683 + ], + [ + 14, + 0.7494038145784992 + ], + [ + 15, + 0.7494038145368954 + ], + [ + 16, + 0.7494038142491459 + ], + [ + 17, + 0.7494038141915446 + ], + [ + 18, + 0.7494038139619765 + ], + [ + 19, + 0.7494038140938216 + ], + [ + 20, + 0.7494038139888102 + ], + [ + 21, + 0.7494038141685808 + ], + [ + 22, + 0.7494038142696579 + ], + [ + 23, + 0.7494038141109793 + ], + [ + 24, + 0.7494038141578092 + ], + [ + 25, + 0.7494038144616851 + ], + [ + 26, + 0.7494038139383039 + ], + [ + 27, + 0.7494038137592423 + ], + [ + 28, + 0.7494038141343298 + ], + [ + 29, + 0.7494038137862693 + ], + [ + 30, + 0.7494038141545194 + ], + [ + 31, + 0.7494038138845078 + ], + [ + 32, + 0.7494038144889699 + ], + [ + 33, + 0.7494038143814421 + ], + [ + 34, + 0.749403814120784 + ], + [ + 35, + 0.7494038142590151 + ], + [ + 36, + 0.749403814042864 + ], + [ + 37, + 0.7494038141441345 + ], + [ + 38, + 0.7494038142794627 + ], + [ + 39, + 0.749403814343708 + ], + [ + 40, + 0.7494038144018251 + ], + [ + 41, + 0.7494038139923577 + ], + [ + 42, + 0.7494038140260286 + ], + [ + 43, + 0.7494038144382057 + ], + [ + 44, + 0.7494038144623939 + ], + [ + 45, + 0.7494038141583892 + ], + [ + 46, + 0.749403814415242 + ], + [ + 47, + 0.7494038145163834 + ], + [ + 48, + 0.7494038138574164 + ], + [ + 49, + 0.749403814228634 + ], + [ + 50, + 0.7494038141881257 + ], + [ + 51, + 0.7494038144514936 + ], + [ + 52, + 0.7494038140393809 + ], + [ + 53, + 0.7494038141204619 + ], + [ + 54, + 0.7494038145699863 + ], + [ + 55, + 0.7494038142624337 + ], + [ + 56, + 0.7494038144853579 + ], + [ + 57, + 0.7494038144073734 + ], + [ + 58, + 0.7494038142826879 + ], + [ + 59, + 0.74940381437725 + ], + [ + 60, + 0.7494038141779343 + ], + [ + 61, + 0.7494038146679024 + ], + [ + 62, + 0.7494038143603501 + ], + [ + 63, + 0.7494038144176938 + ], + [ + 64, + 0.749403814438399 + ], + [ + 65, + 0.7494038146577109 + ], + [ + 66, + 0.7494038144045347 + ], + [ + 67, + 0.7494038145192865 + ], + [ + 68, + 0.7494038144010516 + ], + [ + 69, + 0.7494038144516869 + ], + [ + 70, + 0.7494038144718765 + ], + [ + 71, + 0.7494038144926463 + ], + [ + 72, + 0.7494038147289225 + ], + [ + 73, + 0.7494038149014046 + ], + [ + 74, + 0.7494038147894915 + ], + [ + 75, + 0.7494038145597947 + ], + [ + 76, + 0.7494038147965222 + ], + [ + 77, + 0.7494038147455646 + ], + [ + 78, + 0.7494038147258262 + ], + [ + 79, + 0.7494038149720361 + ], + [ + 80, + 0.74940381440776 + ], + [ + 81, + 0.7494038150091257 + ], + [ + 82, + 0.7494038150199617 + ], + [ + 83, + 0.7494038147490477 + ], + [ + 84, + 0.7494038148167762 + ], + [ + 85, + 0.7494038149455893 + ], + [ + 86, + 0.7494038148743777 + ], + [ + 87, + 0.7494038147429194 + ], + [ + 88, + 0.7494038149899673 + ], + [ + 89, + 0.7494038150609854 + ], + [ + 90, + 0.7494038151344555 + ], + [ + 91, + 0.7494038146208148 + ], + [ + 92, + 0.7494038151489036 + ], + [ + 93, + 0.7494038152729445 + ], + [ + 94, + 0.74940381507408 + ], + [ + 95, + 0.7494038149120472 + ], + [ + 96, + 0.7494038147498856 + ], + [ + 97, + 0.7494038152265659 + ], + [ + 98, + 0.7494038151347779 + ], + [ + 99, + 0.7494038153075823 + ], + [ + 100, + 0.7494038152466266 + ] + ] + }, + "blend_prefit60_trainable": { + "test_acc": [ + 0.3083, + 0.3096, + 0.3056, + 0.311, + 0.3054, + 0.3053, + 0.3122, + 0.3092, + 0.312, + 0.3037, + 0.3107, + 0.3116, + 0.3253, + 0.3111, + 0.3215, + 0.3103, + 0.3113, + 0.3133, + 0.3175, + 0.3174, + 0.3213, + 0.3171, + 0.3217, + 0.318, + 0.3082, + 0.324, + 0.3106, + 0.3084, + 0.3258, + 0.3144, + 0.3272, + 0.3182, + 0.326, + 0.3111, + 0.3273, + 0.3222, + 0.3236, + 0.3161, + 0.3134, + 0.3167, + 0.3133, + 0.3164, + 0.314, + 0.3138, + 0.321, + 0.3204, + 0.324, + 0.3099, + 0.3131, + 0.3171, + 0.3203, + 0.3055, + 0.3112, + 0.3258, + 0.3168, + 0.3215, + 0.3225, + 0.3149, + 0.3236, + 0.3212, + 0.3233, + 0.3258, + 0.3205, + 0.3235, + 0.3156, + 0.3192, + 0.3208, + 0.328, + 0.3228, + 0.3209, + 0.3204, + 0.3262, + 0.3194, + 0.3216, + 0.3188, + 0.319, + 0.3236, + 0.3218, + 0.3175, + 0.3216, + 0.321, + 0.3218, + 0.3215, + 0.3208, + 0.3231, + 0.3219, + 0.3214, + 0.3215, + 0.3213, + 0.3208, + 0.321, + 0.3213, + 0.3211, + 0.3212, + 0.3211 + ], + "train_loss": [ + 1.9869631629943847, + 1.982107442779541, + 1.9800773624038697, + 1.9818990044403075, + 1.975253528137207, + 1.9774205728149414, + 1.9751682382965088, + 1.9734763603973389, + 1.971316197052002, + 1.9686581175231934, + 1.9697350271606446, + 1.9697708779907226, + 1.9679039678192138, + 1.9665398016357423, + 1.9669920742034912, + 1.9624735032653808, + 1.9654020233535767, + 1.9674128352355957, + 1.9649122500610352, + 1.9671058654785156, + 1.968050679588318, + 1.9661344065093995, + 1.9655031778335572, + 1.965856990890503, + 1.9651026904678344, + 1.9633458019638061, + 1.9671223302841188, + 1.9679012558746338, + 1.9653001847839355, + 1.962793049545288, + 1.9672515293884278, + 1.9679883306884767, + 1.9659979307556152, + 1.967029616470337, + 1.965907823486328, + 1.9659454788970947, + 1.965747356300354, + 1.9647465851593018, + 1.96370748752594, + 1.9651040491104126, + 1.9665634396743774, + 1.9663065463256837, + 1.9650677017211915, + 1.9633804962921142, + 1.9627257344818114, + 1.9607258738708495, + 1.9627140160751342, + 1.9640110021972657, + 1.9638081337738038, + 1.9621095028305053, + 1.9615541821289062, + 1.9626792596054077, + 1.9610307932281494, + 1.9590073849487304, + 1.9610003355407715, + 1.9595879172134398, + 1.9591543670272826, + 1.960877984085083, + 1.9608802389526367, + 1.9572701121520997, + 1.959934578933716, + 1.9634374791717528, + 1.9611477459716797, + 1.9614908032226563, + 1.9595665050888063, + 1.9605130221939087, + 1.961020618019104, + 1.95984165184021, + 1.9602812258529663, + 1.9593161968994142, + 1.9606877487945558, + 1.9583045994567871, + 1.9585868435287475, + 1.9605323672103883, + 1.9587446689605712, + 1.9603156557846069, + 1.9589103647613526, + 1.9578054639434814, + 1.9590308611297607, + 1.9598375805282593, + 1.9584676153564453, + 1.9602760329818725, + 1.9589101021575928, + 1.9583418262481689, + 1.9600815436553956, + 1.9572944204330445, + 1.9606394169616699, + 1.9585626053237915, + 1.960242194519043, + 1.957658486289978, + 1.9579220495986938, + 1.9595472118377686, + 1.956711728553772, + 1.9555246179962158, + 1.9605165130615234 + ], + "gamma": [ + [ + 6, + 0.027149309520609677 + ], + [ + 7, + 0.028437960718292743 + ], + [ + 8, + 0.034789546742103994 + ], + [ + 9, + 0.022622307355049998 + ], + [ + 10, + 0.03235352906631306 + ], + [ + 13, + 0.02301677397917956 + ], + [ + 15, + 0.025688304798677564 + ], + [ + 20, + 0.027680203143972903 + ], + [ + 25, + 0.01849789312109351 + ], + [ + 35, + 0.031101900152862072 + ], + [ + 45, + 0.02937179930449929 + ], + [ + 55, + 0.030146236123982817 + ], + [ + 65, + 0.024986988748423755 + ], + [ + 75, + 0.023811903840396553 + ], + [ + 85, + 0.033509362605400383 + ], + [ + 95, + 0.03029970038915053 + ], + [ + 100, + 0.02625635568983853 + ] + ], + "rho": [ + [ + 6, + 0.020763279870152473 + ], + [ + 7, + -0.01829602080397308 + ], + [ + 8, + 0.03202603850513697 + ], + [ + 9, + 0.005786044057458639 + ], + [ + 10, + 0.025155132869258523 + ], + [ + 13, + 0.011773683363571763 + ], + [ + 15, + -0.010100261773914099 + ], + [ + 20, + -0.004275039536878467 + ], + [ + 25, + -0.004346607718616724 + ], + [ + 35, + -0.004164531943388283 + ], + [ + 45, + 0.008717172779142857 + ], + [ + 55, + 0.021293016499839723 + ], + [ + 65, + 0.007391993887722492 + ], + [ + 75, + 0.025975750293582678 + ], + [ + 85, + -0.02585920598357916 + ], + [ + 95, + 0.017909258254803717 + ], + [ + 100, + -0.004653664771467447 + ] + ], + "alpha_eff": [ + [ + 6, + 0.7494198855774478 + ], + [ + 7, + 0.7493945028864009 + ], + [ + 8, + 0.7494045543931235 + ], + [ + 9, + 0.7493988742149943 + ], + [ + 10, + 0.749409506439465 + ], + [ + 11, + 0.7493851544776187 + ], + [ + 12, + 0.7493931222874718 + ], + [ + 13, + 0.7494051439577297 + ], + [ + 14, + 0.7494143308644613 + ], + [ + 15, + 0.7493897442606672 + ], + [ + 16, + 0.749390242434998 + ], + [ + 17, + 0.7493832566522736 + ], + [ + 18, + 0.7493837943928502 + ], + [ + 19, + 0.7493764624723499 + ], + [ + 20, + 0.74938416701579 + ], + [ + 21, + 0.749394064849191 + ], + [ + 22, + 0.7494066318569547 + ], + [ + 23, + 0.7493839590126894 + ], + [ + 24, + 0.7493944212005683 + ], + [ + 25, + 0.7494086175230461 + ], + [ + 26, + 0.7493879019763686 + ], + [ + 27, + 0.7493887785759618 + ], + [ + 28, + 0.7493890992273776 + ], + [ + 29, + 0.7493921938446095 + ], + [ + 30, + 0.749392955277891 + ], + [ + 31, + 0.7494070060785534 + ], + [ + 32, + 0.7494018975461066 + ], + [ + 33, + 0.749390302470714 + ], + [ + 34, + 0.7493936958318456 + ], + [ + 35, + 0.7493847156329149 + ], + [ + 36, + 0.7493830615807119 + ], + [ + 37, + 0.7493959014510937 + ], + [ + 38, + 0.7493826145772485 + ], + [ + 39, + 0.7494004122947528 + ], + [ + 40, + 0.749390372331179 + ], + [ + 41, + 0.7493846509161871 + ], + [ + 42, + 0.7493945714806454 + ], + [ + 43, + 0.7493948280228023 + ], + [ + 44, + 0.7494010476809537 + ], + [ + 45, + 0.7493908627766896 + ], + [ + 46, + 0.7493879079302833 + ], + [ + 47, + 0.7493752931701734 + ], + [ + 48, + 0.7493746657364128 + ], + [ + 49, + 0.7493817363498273 + ], + [ + 50, + 0.7493954868582153 + ], + [ + 51, + 0.7494180908502441 + ], + [ + 52, + 0.7494128547280554 + ], + [ + 53, + 0.7494010229751693 + ], + [ + 54, + 0.7493916645250338 + ], + [ + 55, + 0.7493986710654272 + ], + [ + 56, + 0.7493859344989389 + ], + [ + 57, + 0.7493909396665319 + ], + [ + 58, + 0.7493882004138976 + ], + [ + 59, + 0.749399057726123 + ], + [ + 60, + 0.7494158935871307 + ], + [ + 61, + 0.7494089975920222 + ], + [ + 62, + 0.7493982538662999 + ], + [ + 63, + 0.7494030029314076 + ], + [ + 64, + 0.749399792622185 + ], + [ + 65, + 0.7494163832557151 + ], + [ + 66, + 0.749400623752514 + ], + [ + 67, + 0.7493899962477784 + ], + [ + 68, + 0.7493832026704041 + ], + [ + 69, + 0.7493755145942212 + ], + [ + 70, + 0.7493852732327845 + ], + [ + 71, + 0.749396029782683 + ], + [ + 72, + 0.7493985081308931 + ], + [ + 73, + 0.7493950887715348 + ], + [ + 74, + 0.7493878717853603 + ], + [ + 75, + 0.7493873475788589 + ], + [ + 76, + 0.7493865010832917 + ], + [ + 77, + 0.7493955297336615 + ], + [ + 78, + 0.7493856801895845 + ], + [ + 79, + 0.7493983698829365 + ], + [ + 80, + 0.749404937236268 + ], + [ + 81, + 0.749389356360739 + ], + [ + 82, + 0.7493913243999851 + ], + [ + 83, + 0.7494008850885872 + ], + [ + 84, + 0.7494028172064978 + ], + [ + 85, + 0.7494147534853167 + ], + [ + 86, + 0.7494104948005028 + ], + [ + 87, + 0.7494106429226236 + ], + [ + 88, + 0.7493989916786297 + ], + [ + 89, + 0.7493947275831284 + ], + [ + 90, + 0.749380560246787 + ], + [ + 91, + 0.7493890447050457 + ], + [ + 92, + 0.7493909601507237 + ], + [ + 93, + 0.7493811012400322 + ], + [ + 94, + 0.749397621126069 + ], + [ + 95, + 0.7493992755600606 + ], + [ + 96, + 0.749402396710577 + ], + [ + 97, + 0.7493987377379719 + ], + [ + 98, + 0.7493964994726998 + ], + [ + 99, + 0.7494097391707691 + ], + [ + 100, + 0.7493962720968325 + ] + ] + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/config.json b/results/synth_ladder_smoke/config.json new file mode 100644 index 0000000..d3102c3 --- /dev/null +++ b/results/synth_ladder_smoke/config.json @@ -0,0 +1,30 @@ +{ + "alphas": [ + 0.0, + 0.5, + 1.0 + ], + "depths": [ + 2, + 8 + ], + "seeds": [ + 42 + ], + "d_hidden": 128, + "num_classes": 10, + "n_train": 10000, + "n_test": 2000, + "batch_size": 256, + "epochs": 60, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "gpu": 0, + "output_dir": "results/synth_ladder_smoke" +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/summary.json b/results/synth_ladder_smoke/summary.json new file mode 100644 index 0000000..09ab8d7 --- /dev/null +++ b/results/synth_ladder_smoke/summary.json @@ -0,0 +1,782 @@ +{ + "a0.0_L2_s42": { + "bp": { + "test_acc": 0.9445, + "mean_bp_cosine": 0.8363544940948486, + "mean_rho": 0.9999966025352478, + "mean_nudge_001": -0.014867921359837055, + "mean_nudge_003": -0.038927674293518066, + "mean_nudge_01": -0.08314211666584015, + "bp_cosine_per_layer": [ + 0.841028094291687, + 0.8316808938980103 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999943971633911 + ], + "nudge_per_layer": [ + -0.10806188732385635, + -0.058222346007823944 + ] + }, + "dfa": { + "test_acc": 0.8905, + "mean_bp_cosine": 0.028207830036990345, + "mean_rho": -0.013231039047241211, + "mean_nudge_001": -0.0004544301191344857, + "mean_nudge_003": -0.0012695252080447972, + "mean_nudge_01": -0.003105040406808257, + "bp_cosine_per_layer": [ + -0.002617625752463937, + 0.059033285826444626 + ], + "rho_per_layer": [ + -0.03406350687146187, + 0.007601428776979446 + ], + "nudge_per_layer": [ + -0.0010169181041419506, + -0.005193162709474564 + ] + }, + "state_bridge": { + "test_acc": 0.825, + "mean_bp_cosine": 0.5880793333053589, + "mean_rho": 0.44639749079942703, + "mean_nudge_001": -0.01224998920224607, + "mean_nudge_003": -0.035131572745740414, + "mean_nudge_01": -0.10013834200799465, + "bp_cosine_per_layer": [ + 0.8860390186309814, + 0.29011964797973633 + ], + "rho_per_layer": [ + 0.729070782661438, + 0.16372419893741608 + ], + "nudge_per_layer": [ + -0.17900359630584717, + -0.021273087710142136 + ], + "state_pred_error_per_layer": [ + 33793.6875, + 17287.951171875 + ], + "mean_state_pred_error": 25540.8193359375 + }, + "credit_bridge": { + "test_acc": 0.656, + "mean_bp_cosine": 0.10665101930499077, + "mean_rho": 0.23030418902635574, + "mean_nudge_001": -0.006580323912203312, + "mean_nudge_003": -0.019663945073261857, + "mean_nudge_01": -0.06460809707641602, + "bp_cosine_per_layer": [ + 0.10150224715471268, + 0.11179979145526886 + ], + "rho_per_layer": [ + 0.24922937154769897, + 0.2113790065050125 + ], + "nudge_per_layer": [ + -0.10681234300136566, + -0.02240385115146637 + ], + "final_value_loss": 0.5207448813438416, + "final_term_loss": 0.20168962478637695, + "final_bridge_loss": 0.10483724861145019, + "final_tgrad_loss": 0.21421800775527955 + } + }, + "a0.0_L8_s42": { + "bp": { + "test_acc": 0.948, + "mean_bp_cosine": 0.6927967146039009, + "mean_rho": 0.9999185726046562, + "mean_nudge_001": -0.007844092877348885, + "mean_nudge_003": -0.021484591998159885, + "mean_nudge_01": -0.053326028981246054, + "bp_cosine_per_layer": [ + 0.7277177572250366, + 0.7186546921730042, + 0.7086087465286255, + 0.6982603073120117, + 0.686427116394043, + 0.6760239601135254, + 0.6675269603729248, + 0.6591541767120361 + ], + "rho_per_layer": [ + 0.999999463558197, + 0.999997615814209, + 0.9999939203262329, + 0.9999786019325256, + 0.9999496340751648, + 0.99991774559021, + 0.9998468160629272, + 0.9996647834777832 + ], + "nudge_per_layer": [ + -0.14217889308929443, + -0.10304947197437286, + -0.06661910563707352, + -0.04270746558904648, + -0.028325699269771576, + -0.019565371796488762, + -0.013980223797261715, + -0.010182000696659088 + ] + }, + "dfa": { + "test_acc": 0.9465, + "mean_bp_cosine": 0.012617309403140098, + "mean_rho": 0.13837066129781306, + "mean_nudge_001": -0.016161460865987465, + "mean_nudge_003": -0.04494552121468587, + "mean_nudge_01": -0.12098311571025988, + "bp_cosine_per_layer": [ + -0.003863303456455469, + 0.017664283514022827, + 0.01661803014576435, + 0.018178246915340424, + 0.015868376940488815, + 0.014126626774668694, + 0.014091677032411098, + 0.008254537358880043 + ], + "rho_per_layer": [ + -0.019435672089457512, + 0.2941593527793884, + 0.18103283643722534, + 0.20650765299797058, + 0.18732143938541412, + 0.13352911174297333, + 0.15822581946849823, + -0.03437525033950806 + ], + "nudge_per_layer": [ + 0.4985465407371521, + -0.834585428237915, + -0.4260305166244507, + -0.15289700031280518, + -0.03924320265650749, + -0.009715870022773743, + -0.002982086967676878, + -0.0009573615971021354 + ] + }, + "state_bridge": { + "test_acc": 0.167, + "mean_bp_cosine": -0.03321670075220595, + "mean_rho": -3.657315392047167e-05, + "mean_nudge_001": -146456576.0, + "mean_nudge_003": -383148544.0, + "mean_nudge_01": -1178039808.0, + "bp_cosine_per_layer": [ + 0.09916997700929642, + -0.0925145074725151, + -0.12530964612960815, + -0.051633648574352264, + -0.0899374783039093, + -0.005518035963177681, + 1.1753130820579827e-05, + -2.0197142021061154e-06 + ], + "rho_per_layer": [ + 0.0036257803440093994, + -0.0018100417219102383, + 0.0009338338859379292, + -0.0030421577394008636, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudge_per_layer": [ + -9628057600.0, + 254652416.0, + -49807360.0, + -1126400.0, + 20480.0, + 0.0, + 0.0, + 0.0 + ], + "state_pred_error_per_layer": [ + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33 + ], + "mean_state_pred_error": 3.788521752616758e+33 + }, + "credit_bridge": { + "test_acc": 0.0965, + "mean_bp_cosine": 0.10048330621793866, + "mean_rho": -0.022956646920647472, + "mean_nudge_001": -59174496.0, + "mean_nudge_003": -195268096.0, + "mean_nudge_01": -642210232.0, + "bp_cosine_per_layer": [ + 0.517741858959198, + 0.33828628063201904, + 0.4149113893508911, + 0.23560978472232819, + -0.15021789073944092, + -0.1476898193359375, + -0.3642715811729431, + -0.040503572672605515 + ], + "rho_per_layer": [ + -0.004317115992307663, + 9.15133859962225e-05, + 0.0010522708762437105, + 0.0034065949730575085, + -0.18388643860816956, + 0.0, + 0.0, + 0.0 + ], + "nudge_per_layer": [ + -5081367040.0, + -74964928.0, + 31930368.0, + -13346304.0, + 66048.0, + 0.0, + 0.0, + 0.0 + ], + "final_value_loss": 7.270963528184324e+22, + "final_term_loss": 7.270963401002671e+22, + "final_bridge_loss": 1784726332749172.0, + "final_tgrad_loss": 0.6689293840408325 + } + }, + "a0.5_L2_s42": { + "bp": { + "test_acc": 0.8905, + "mean_bp_cosine": 0.8927535116672516, + "mean_rho": 0.9999973773956299, + "mean_nudge_001": -0.017791217658668756, + "mean_nudge_003": -0.04914894513785839, + "mean_nudge_01": -0.12422022968530655, + "bp_cosine_per_layer": [ + 0.8970257639884949, + 0.8884812593460083 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999955892562866 + ], + "nudge_per_layer": [ + -0.16577741503715515, + -0.08266304433345795 + ] + }, + "dfa": { + "test_acc": 0.8565, + "mean_bp_cosine": 0.032235472928732634, + "mean_rho": -0.0014879778027534485, + "mean_nudge_001": -0.00016316675464622676, + "mean_nudge_003": -0.00043464876944199204, + "mean_nudge_01": -0.0008175973780453205, + "bp_cosine_per_layer": [ + -0.009920955635607243, + 0.07439190149307251 + ], + "rho_per_layer": [ + -0.054706037044525146, + 0.05173008143901825 + ], + "nudge_per_layer": [ + 0.004189381375908852, + -0.005824576131999493 + ] + }, + "state_bridge": { + "test_acc": 0.825, + "mean_bp_cosine": 0.645551860332489, + "mean_rho": 0.5210425555706024, + "mean_nudge_001": -0.012871089624240994, + "mean_nudge_003": -0.03697468154132366, + "mean_nudge_01": -0.10600546188652515, + "bp_cosine_per_layer": [ + 0.8819085955619812, + 0.4091951251029968 + ], + "rho_per_layer": [ + 0.761555552482605, + 0.28052955865859985 + ], + "nudge_per_layer": [ + -0.18185698986053467, + -0.03015393391251564 + ], + "state_pred_error_per_layer": [ + 7353.158203125, + 2627.8740234375 + ], + "mean_state_pred_error": 4990.51611328125 + }, + "credit_bridge": { + "test_acc": 0.692, + "mean_bp_cosine": 0.1708241105079651, + "mean_rho": 0.3076810836791992, + "mean_nudge_001": -0.0058031873777508736, + "mean_nudge_003": -0.017323508858680725, + "mean_nudge_01": -0.05672750808298588, + "bp_cosine_per_layer": [ + 0.14308685064315796, + 0.19856137037277222 + ], + "rho_per_layer": [ + 0.26277071237564087, + 0.35259145498275757 + ], + "nudge_per_layer": [ + -0.08629482984542847, + -0.02716018632054329 + ], + "final_value_loss": 0.28658444921970366, + "final_term_loss": 0.040962481904029846, + "final_bridge_loss": 0.0227132670879364, + "final_tgrad_loss": 0.22290869793891907 + } + }, + "a0.5_L8_s42": { + "bp": { + "test_acc": 0.8825, + "mean_bp_cosine": 0.7004428058862686, + "mean_rho": 0.9999219477176666, + "mean_nudge_001": -0.013686691803741269, + "mean_nudge_003": -0.03912358166417107, + "mean_nudge_01": -0.11077304021455348, + "bp_cosine_per_layer": [ + 0.7438379526138306, + 0.7323452234268188, + 0.723551869392395, + 0.7129155397415161, + 0.6892737746238708, + 0.6759694814682007, + 0.6671421527862549, + 0.658506453037262 + ], + "rho_per_layer": [ + 0.9999985694885254, + 0.9999985694885254, + 0.9999951720237732, + 0.9999872446060181, + 0.9999734163284302, + 0.9999377727508545, + 0.9998385310173035, + 0.9996463060379028 + ], + "nudge_per_layer": [ + -0.3025854229927063, + -0.20860256254673004, + -0.13888010382652283, + -0.09112250804901123, + -0.0598360076546669, + -0.039668694138526917, + -0.026830831542611122, + -0.018658190965652466 + ] + }, + "dfa": { + "test_acc": 0.8805, + "mean_bp_cosine": 0.030201979679986835, + "mean_rho": 0.14581625070422888, + "mean_nudge_001": -0.007218341752377455, + "mean_nudge_003": -0.021398383076302707, + "mean_nudge_01": -0.06869508739328012, + "bp_cosine_per_layer": [ + -0.0057187266647815704, + 0.03526674211025238, + 0.03511466830968857, + 0.043710630387067795, + 0.04474484175443649, + 0.03394380211830139, + 0.03243564814329147, + 0.022118231281638145 + ], + "rho_per_layer": [ + -0.08895743638277054, + 0.2165505439043045, + 0.14878079295158386, + 0.23983460664749146, + 0.23414158821105957, + 0.22946099936962128, + 0.044252023100852966, + 0.14246688783168793 + ], + "nudge_per_layer": [ + 0.20587505400180817, + -0.4487733840942383, + -0.17917752265930176, + -0.0796520859003067, + -0.03180943429470062, + -0.009406229481101036, + -0.004543165676295757, + -0.0020739310421049595 + ] + }, + "state_bridge": { + "test_acc": 0.1155, + "mean_bp_cosine": 0.04451697081094608, + "mean_rho": -0.013691710773855448, + "mean_nudge_001": -294302.75, + "mean_nudge_003": -880992.0, + "mean_nudge_01": -2656252.75, + "bp_cosine_per_layer": [ + 0.30725735425949097, + 0.12316203862428665, + -0.0629364550113678, + 0.007313757669180632, + -0.009149492718279362, + -0.008323092944920063, + -0.006843051873147488, + 0.005654708482325077 + ], + "rho_per_layer": [ + -0.0015011467039585114, + 0.0004240265116095543, + 0.0019385055638849735, + 0.0008086063899099827, + -0.11120367795228958, + 0.0, + 0.0, + 0.0 + ], + "nudge_per_layer": [ + -20625168.0, + -717604.0, + -58672.0, + 134824.0, + 16604.0, + -6.0, + 0.0, + 0.0 + ], + "state_pred_error_per_layer": [ + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29 + ], + "mean_state_pred_error": 1.2424051312422632e+29 + }, + "credit_bridge": { + "test_acc": 0.1095, + "mean_bp_cosine": 0.0375741989701055, + "mean_rho": 0.011375281232176349, + "mean_nudge_001": 64012.0, + "mean_nudge_003": 195061.0, + "mean_nudge_01": 1148873.0, + "bp_cosine_per_layer": [ + 0.04903252795338631, + 0.20776475965976715, + 0.12520574033260345, + -0.2015925794839859, + -0.03666269779205322, + 0.005083487834781408, + 0.13890880346298218, + 0.012853549793362617 + ], + "rho_per_layer": [ + 0.011465835385024548, + 0.00849771499633789, + 0.0009214465972036123, + -0.005531121976673603, + 0.07564837485551834, + 0.0, + 0.0, + 0.0 + ], + "nudge_per_layer": [ + 10792360.0, + -1553496.0, + -27560.0, + -69368.0, + 49144.0, + -96.0, + 0.0, + 0.0 + ], + "final_value_loss": 1.0739092229740712e+19, + "final_term_loss": 5.965625762330856e+18, + "final_bridge_loss": 4.773466424748804e+18, + "final_tgrad_loss": 0.753796951675415 + } + }, + "a1.0_L2_s42": { + "bp": { + "test_acc": 0.79, + "mean_bp_cosine": 0.9718506336212158, + "mean_rho": 0.9999988377094269, + "mean_nudge_001": -0.030717147514224052, + "mean_nudge_003": -0.08905789628624916, + "mean_nudge_01": -0.2628655806183815, + "bp_cosine_per_layer": [ + 0.977530300617218, + 0.9661709666252136 + ], + "rho_per_layer": [ + 0.9999992847442627, + 0.9999983906745911 + ], + "nudge_per_layer": [ + -0.3279687762260437, + -0.1977623850107193 + ] + }, + "dfa": { + "test_acc": 0.7575, + "mean_bp_cosine": 0.03516392147867009, + "mean_rho": -0.00011159107089042664, + "mean_nudge_001": -0.000253174692261382, + "mean_nudge_003": -0.0007429331817547791, + "mean_nudge_01": -0.0022771726071368903, + "bp_cosine_per_layer": [ + -0.0018995754653587937, + 0.07222741842269897 + ], + "rho_per_layer": [ + -0.03529410809278488, + 0.03507092595100403 + ], + "nudge_per_layer": [ + 0.00033701310167089105, + -0.004891358315944672 + ] + }, + "state_bridge": { + "test_acc": 0.7315, + "mean_bp_cosine": 0.6242872625589371, + "mean_rho": 0.576740100979805, + "mean_nudge_001": -0.013815624406561255, + "mean_nudge_003": -0.04068431770429015, + "mean_nudge_01": -0.12692053988575935, + "bp_cosine_per_layer": [ + 0.7724592089653015, + 0.47611531615257263 + ], + "rho_per_layer": [ + 0.7083259224891663, + 0.4451542794704437 + ], + "nudge_per_layer": [ + -0.2117496132850647, + -0.04209146648645401 + ], + "state_pred_error_per_layer": [ + 2210.423828125, + 264.2466125488281 + ], + "mean_state_pred_error": 1237.335220336914 + }, + "credit_bridge": { + "test_acc": 0.556, + "mean_bp_cosine": 0.1866571605205536, + "mean_rho": 0.2675167992711067, + "mean_nudge_001": -0.0047563593834638596, + "mean_nudge_003": -0.014220114797353745, + "mean_nudge_01": -0.04682535119354725, + "bp_cosine_per_layer": [ + 0.14650292694568634, + 0.22681139409542084 + ], + "rho_per_layer": [ + 0.22659505903720856, + 0.3084385395050049 + ], + "nudge_per_layer": [ + -0.06274554133415222, + -0.030905161052942276 + ], + "final_value_loss": 0.24172186150550842, + "final_term_loss": 0.06502777924537659, + "final_bridge_loss": 0.03994156485795975, + "final_tgrad_loss": 0.13675251703262328 + } + }, + "a1.0_L8_s42": { + "bp": { + "test_acc": 0.753, + "mean_bp_cosine": 0.8404746800661087, + "mean_rho": 0.9999860152602196, + "mean_nudge_001": -0.03076103754574433, + "mean_nudge_003": -0.08962251944467425, + "mean_nudge_01": -0.26998535776510835, + "bp_cosine_per_layer": [ + 0.8599272966384888, + 0.8556707501411438, + 0.8523739576339722, + 0.848276674747467, + 0.8402513265609741, + 0.8327686190605164, + 0.8243966698646545, + 0.8101321458816528 + ], + "rho_per_layer": [ + 0.9999995231628418, + 0.9999991059303284, + 0.9999986290931702, + 0.9999972581863403, + 0.999995231628418, + 0.999988853931427, + 0.999974250793457, + 0.9999352693557739 + ], + "nudge_per_layer": [ + -0.5608033537864685, + -0.46859920024871826, + -0.3716525733470917, + -0.2780599594116211, + -0.19847190380096436, + -0.13576632738113403, + -0.08930139243602753, + -0.057228151708841324 + ] + }, + "dfa": { + "test_acc": 0.7235, + "mean_bp_cosine": 0.04556959925685078, + "mean_rho": 0.048565957229584455, + "mean_nudge_001": -0.00017181782459374517, + "mean_nudge_003": -0.0005837090320710558, + "mean_nudge_01": -0.0014622680901084095, + "bp_cosine_per_layer": [ + -0.009654381312429905, + 0.06123851239681244, + 0.05049855262041092, + 0.06316959857940674, + 0.06684726476669312, + 0.04511053115129471, + 0.06236346811056137, + 0.024983247742056847 + ], + "rho_per_layer": [ + -0.04901190102100372, + 0.05014052242040634, + 0.041004884988069534, + 0.0795036256313324, + 0.11356800049543381, + 0.03488320857286453, + 0.06926114857196808, + 0.049178168177604675 + ], + "nudge_per_layer": [ + 0.009471571072936058, + -0.008436895906925201, + -0.0030148853547871113, + -0.002505694981664419, + -0.0025559633504599333, + -0.0017773781437426805, + -0.002164034638553858, + -0.0007148634176701307 + ] + }, + "state_bridge": { + "test_acc": 0.669, + "mean_bp_cosine": 0.17768670711666346, + "mean_rho": 0.1722423667088151, + "mean_nudge_001": -0.003032438595255371, + "mean_nudge_003": -0.009077076290850528, + "mean_nudge_01": -0.02989676801371388, + "bp_cosine_per_layer": [ + 0.4364655911922455, + 0.2538519501686096, + 0.12610256671905518, + 0.11331324279308319, + 0.12084640562534332, + 0.12215165793895721, + 0.1230584904551506, + 0.12570375204086304 + ], + "rho_per_layer": [ + 0.3833135962486267, + 0.2661164402961731, + 0.1022414043545723, + 0.0808584988117218, + 0.13698244094848633, + 0.1416344791650772, + 0.1372133493423462, + 0.12957872450351715 + ], + "nudge_per_layer": [ + -0.19196540117263794, + -0.024129249155521393, + -0.005033540539443493, + -0.0036849211901426315, + -0.003727084957063198, + -0.003625791519880295, + -0.0035160125698894262, + -0.003492143005132675 + ], + "state_pred_error_per_layer": [ + 10125.46875, + 4586.849609375, + 2924.994384765625, + 2696.109130859375, + 2272.20361328125, + 2131.38916015625, + 1861.77978515625, + 1746.7655029296875 + ], + "mean_state_pred_error": 3543.1949920654297 + }, + "credit_bridge": { + "test_acc": 0.574, + "mean_bp_cosine": 0.14715833496302366, + "mean_rho": 0.21127336705103517, + "mean_nudge_001": -0.0017491802136646584, + "mean_nudge_003": -0.005117673281347379, + "mean_nudge_01": -0.017382657038979232, + "bp_cosine_per_layer": [ + 0.034526653587818146, + 0.05641080439090729, + 0.10281616449356079, + 0.15385565161705017, + 0.18335095047950745, + 0.20484405755996704, + 0.21195781230926514, + 0.22950458526611328 + ], + "rho_per_layer": [ + 0.036690596491098404, + 0.08035410940647125, + 0.14528854191303253, + 0.19739355146884918, + 0.2672373652458191, + 0.3182218074798584, + 0.32729244232177734, + 0.3177085220813751 + ], + "nudge_per_layer": [ + -0.04240123927593231, + -0.01825123094022274, + -0.012862971983850002, + -0.012372580356895924, + -0.012917900457978249, + -0.01307743415236473, + -0.013364783488214016, + -0.013813115656375885 + ], + "final_value_loss": 0.5224067583084107, + "final_term_loss": 0.30657225689888, + "final_bridge_loss": 0.06283499038815499, + "final_tgrad_loss": 0.15299950742721558 + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/synth_a0.0_L2_s42.json b/results/synth_ladder_smoke/synth_a0.0_L2_s42.json new file mode 100644 index 0000000..7a42e31 --- /dev/null +++ b/results/synth_ladder_smoke/synth_a0.0_L2_s42.json @@ -0,0 +1,1172 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7533995316505433, + 0.7836601768493653, + 0.4336150965690613, + 0.3156591456890106, + 0.26115909841060636, + 0.21855008835792541, + 0.20245241773128508, + 0.1854707410812378, + 0.171177279484272, + 0.1577904580116272, + 0.16167830117940904, + 0.13525569295883177, + 0.15880949127674102, + 0.1267966023683548, + 0.135716259598732, + 0.12722588217258454, + 0.1248846586227417, + 0.12528773012161254, + 0.13043007722496985, + 0.10238944809436798, + 0.10000436370372773, + 0.09743008491992951, + 0.09774633845090866, + 0.0909515031337738, + 0.08864497351646423, + 0.09541612682342529, + 0.08492451270222665, + 0.07652511271238327, + 0.07194267210960388, + 0.0679610144495964, + 0.07048724781274796, + 0.06801209087371826, + 0.06563281005620956, + 0.06872930953502655, + 0.06238800450563431, + 0.06467725517749787, + 0.06289580785036088, + 0.05844259022772312, + 0.0557950256228447, + 0.05462282573878765, + 0.053031637322902676, + 0.05512283474802971, + 0.052326148790121076, + 0.051231220483779906, + 0.04978705406785011, + 0.049222904124856, + 0.04818815061151981, + 0.04727265299856663, + 0.04677308195531368, + 0.04608564888834953, + 0.0458140979886055, + 0.04530899636745453, + 0.045030354833602904, + 0.04478087300062179, + 0.044504375572502614, + 0.04426856064796448, + 0.04410454820394516, + 0.04398917088881135, + 0.04390392400026322, + 0.043855037939548494 + ], + "train_acc": [ + 0.4163, + 0.796, + 0.8972, + 0.9216, + 0.9325, + 0.9467, + 0.9423, + 0.9446, + 0.9512, + 0.9541, + 0.9472, + 0.9636, + 0.9431, + 0.96, + 0.9528, + 0.9593, + 0.9587, + 0.9555, + 0.9543, + 0.9691, + 0.9696, + 0.9704, + 0.9695, + 0.9739, + 0.9773, + 0.97, + 0.9778, + 0.9804, + 0.9834, + 0.9887, + 0.9839, + 0.9856, + 0.9865, + 0.9843, + 0.9888, + 0.9862, + 0.9877, + 0.9917, + 0.9918, + 0.9936, + 0.9945, + 0.9926, + 0.9938, + 0.9948, + 0.9954, + 0.9959, + 0.9962, + 0.9968, + 0.9973, + 0.9969, + 0.9976, + 0.9979, + 0.9975, + 0.9979, + 0.9978, + 0.9981, + 0.9981, + 0.9981, + 0.9981, + 0.9981 + ], + "test_acc": [ + 0.6825, + 0.841, + 0.888, + 0.904, + 0.909, + 0.9115, + 0.922, + 0.9275, + 0.921, + 0.924, + 0.916, + 0.9305, + 0.9225, + 0.928, + 0.917, + 0.925, + 0.9365, + 0.919, + 0.9295, + 0.9355, + 0.93, + 0.937, + 0.935, + 0.9365, + 0.932, + 0.932, + 0.938, + 0.937, + 0.9395, + 0.941, + 0.9415, + 0.9385, + 0.9405, + 0.9355, + 0.942, + 0.937, + 0.933, + 0.939, + 0.9395, + 0.941, + 0.944, + 0.9445, + 0.9425, + 0.9405, + 0.945, + 0.944, + 0.9435, + 0.9445, + 0.946, + 0.946, + 0.9445, + 0.9445, + 0.943, + 0.9445, + 0.946, + 0.9445, + 0.945, + 0.9445, + 0.9445, + 0.9445 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.841028094291687, + 0.8316808938980103 + ], + "perturbation_rho": [ + 0.9999988079071045, + 0.9999943971633911 + ], + "nudging": { + "0.001": [ + -0.02241116389632225, + -0.00732467882335186 + ], + "0.003": [ + -0.05696076154708862, + -0.02089458703994751 + ], + "0.01": [ + -0.10806188732385635, + -0.058222346007823944 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2681663370132448, + 1.5578918802261352, + 0.9035645442008973, + 0.5999464567184448, + 0.4491278485774994, + 0.3660543300151825, + 0.31826040496826175, + 0.28996203372478485, + 0.27258815791606905, + 0.258673814201355, + 0.2605429262816906, + 0.2453741048812866, + 0.2707838849082589, + 0.24489454474449157, + 0.2667243903636932, + 0.24532563347816466, + 0.2407766224384308, + 0.2794936346054077, + 0.23863817923367023, + 0.227928395652771, + 0.22128773531913756, + 0.24110795383453368, + 0.25780398631095885, + 0.23606836762428285, + 0.22999447169303894, + 0.21888184334039687, + 0.22170222326517106, + 0.20384172608852386, + 0.21664435220509767, + 0.18759276245832443, + 0.1907250598371029, + 0.19302489280700683, + 0.21028617808818817, + 0.18639517907500266, + 0.18032784458398818, + 0.17618319692611695, + 0.18565691118240357, + 0.17661046228408814, + 0.17732410440444946, + 0.17734829990416764, + 0.1658576126098633, + 0.18027312584370375, + 0.1593181769669056, + 0.1599530577659607, + 0.15934612050056457, + 0.15842962717413903, + 0.15354473167657853, + 0.15257517569065093, + 0.15343474090099335, + 0.15061425738334655, + 0.1513981466114521, + 0.14823738946914672, + 0.14945683048963546, + 0.14723094618320465, + 0.14593036649525165, + 0.14519548625946044, + 0.1448047935962677, + 0.14448406311944126, + 0.1441643814086914, + 0.14402359859347344 + ], + "train_acc": [ + 0.1713, + 0.4916, + 0.6924, + 0.7834, + 0.8324, + 0.8582, + 0.8748, + 0.885, + 0.8912, + 0.9011, + 0.8987, + 0.9039, + 0.9046, + 0.9101, + 0.9077, + 0.9128, + 0.915, + 0.9068, + 0.9177, + 0.9215, + 0.925, + 0.9222, + 0.9191, + 0.9216, + 0.9253, + 0.9266, + 0.9282, + 0.9318, + 0.9305, + 0.9359, + 0.9363, + 0.9367, + 0.9354, + 0.9373, + 0.9387, + 0.942, + 0.9376, + 0.941, + 0.9397, + 0.9416, + 0.9439, + 0.9414, + 0.946, + 0.9467, + 0.9471, + 0.9448, + 0.9478, + 0.9485, + 0.9475, + 0.9489, + 0.948, + 0.9483, + 0.9483, + 0.9498, + 0.9493, + 0.9501, + 0.9509, + 0.9508, + 0.9508, + 0.9507 + ], + "test_acc": [ + 0.3065, + 0.6105, + 0.7235, + 0.7705, + 0.8025, + 0.8175, + 0.8315, + 0.843, + 0.841, + 0.8485, + 0.855, + 0.849, + 0.865, + 0.867, + 0.858, + 0.8625, + 0.8545, + 0.8615, + 0.8605, + 0.872, + 0.8695, + 0.861, + 0.8765, + 0.874, + 0.8795, + 0.8765, + 0.878, + 0.882, + 0.8805, + 0.886, + 0.882, + 0.88, + 0.8805, + 0.8835, + 0.8875, + 0.8865, + 0.886, + 0.8825, + 0.8845, + 0.885, + 0.886, + 0.8895, + 0.8915, + 0.891, + 0.8915, + 0.888, + 0.886, + 0.8925, + 0.889, + 0.8865, + 0.887, + 0.889, + 0.889, + 0.89, + 0.891, + 0.891, + 0.891, + 0.891, + 0.8905, + 0.8905 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.002617625752463937, + 0.059033285826444626 + ], + "perturbation_rho": [ + -0.03406350687146187, + 0.007601428776979446 + ], + "nudging": { + "0.001": [ + -0.0003772574127651751, + -0.0005316028255037963 + ], + "0.003": [ + -0.0009525500936433673, + -0.001586500322446227 + ], + "0.01": [ + -0.0010169181041419506, + -0.005193162709474564 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0382345211029054, + 1.0948151384353637, + 0.6032020771503448, + 0.40623809757232665, + 0.33226056547164917, + 0.3133425868034363, + 0.30417577662467954, + 0.3053503430366516, + 0.31328839625120164, + 0.31271673035621644, + 0.3245254298210144, + 0.31218559067249296, + 0.3044342563152313, + 0.31126695098876955, + 0.3119384925365448, + 0.30271564536094664, + 0.30667407779693606, + 0.3065519708395004, + 0.30940110969543455, + 0.3272845676660538, + 0.3199685447216034, + 0.32677091150283816, + 0.32642143268585205, + 0.33318281002044675, + 0.36578635778427127, + 0.37762247943878174, + 0.39828639793396, + 0.3289969065666199, + 0.3450239597797394, + 0.358044877243042, + 0.36087529759407044, + 0.36222470116615296, + 0.33878248867988586, + 0.3413470969080925, + 0.3363194646835327, + 0.343668280172348, + 0.34620368288755415, + 0.32506093147993087, + 0.3287040949821472, + 0.32957409336566923, + 0.3357783727645874, + 0.33654043445587156, + 0.3232738302230835, + 0.3100067971229553, + 0.3171101568222046, + 0.3073707001209259, + 0.30577496590614317, + 0.313213066983223, + 0.29881200022697446, + 0.2981369870185852, + 0.30165741591453554, + 0.2990313836097717, + 0.29394608516693116, + 0.2944581679344177, + 0.2910430798530579, + 0.2914781629562378, + 0.2900803961753845, + 0.28867093825340273, + 0.28835845890045164, + 0.2879593663215637 + ], + "train_acc": [ + 0.2672, + 0.6388, + 0.7992, + 0.8588, + 0.879, + 0.8775, + 0.8801, + 0.8794, + 0.8784, + 0.8798, + 0.8755, + 0.8774, + 0.8824, + 0.8796, + 0.8779, + 0.8837, + 0.8817, + 0.8798, + 0.8804, + 0.873, + 0.8771, + 0.8717, + 0.8701, + 0.8727, + 0.8597, + 0.8592, + 0.8536, + 0.8736, + 0.8688, + 0.8657, + 0.8613, + 0.8636, + 0.8696, + 0.8708, + 0.8713, + 0.8673, + 0.8674, + 0.8758, + 0.8726, + 0.8733, + 0.8726, + 0.871, + 0.8732, + 0.8793, + 0.8785, + 0.8824, + 0.8814, + 0.8756, + 0.8846, + 0.885, + 0.8841, + 0.8847, + 0.8864, + 0.887, + 0.887, + 0.8879, + 0.8871, + 0.8875, + 0.8887, + 0.8889 + ], + "test_acc": [ + 0.504, + 0.7175, + 0.8095, + 0.8285, + 0.833, + 0.834, + 0.828, + 0.8205, + 0.8225, + 0.829, + 0.8275, + 0.8185, + 0.8205, + 0.825, + 0.8255, + 0.8325, + 0.831, + 0.8215, + 0.829, + 0.817, + 0.817, + 0.817, + 0.8235, + 0.818, + 0.7945, + 0.7985, + 0.8165, + 0.8215, + 0.7985, + 0.8005, + 0.8095, + 0.816, + 0.794, + 0.819, + 0.8165, + 0.8045, + 0.8145, + 0.805, + 0.8175, + 0.7915, + 0.807, + 0.8145, + 0.8265, + 0.8245, + 0.818, + 0.817, + 0.8295, + 0.8165, + 0.8215, + 0.817, + 0.827, + 0.8245, + 0.826, + 0.8275, + 0.8265, + 0.8235, + 0.825, + 0.826, + 0.8245, + 0.825 + ], + "state_pred_error": [ + 0.7940658317565918, + 0.3446289403915405, + 0.21205402789115907, + 0.18055613265037537, + 0.17316545538902284, + 0.16974504861831666, + 0.16455158114433288, + 0.1532918233156204, + 0.1344613233089447, + 0.11496315777301788, + 0.09990090398788452, + 0.0852064457654953, + 0.07807356501817703, + 0.06980399495363235, + 0.06664942329525947, + 0.06597541292905808, + 0.062055612790584566, + 0.06308431391716003, + 0.062131305885314944, + 0.06258162593841553, + 0.06345035761594772, + 0.06398923227190971, + 0.06478530389666558, + 0.06886953679323196, + 0.06948684022426606, + 0.0712984862446785, + 0.0716869054555893, + 0.07109182901382446, + 0.0715145544052124, + 0.07274168980121612, + 0.07417786152362824, + 0.07344579526185989, + 0.07273043178319931, + 0.07403365852832794, + 0.07517185529470444, + 0.07344330585598946, + 0.07345378184318542, + 0.07930274074077606, + 0.07390495628118515, + 0.0726435121536255, + 0.07187280968427658, + 0.07082273955345154, + 0.07124607337713242, + 0.06916670203208923, + 0.06908640279769898, + 0.06788007100820541, + 0.06682880482673645, + 0.06678611476421356, + 0.06645168607234955, + 0.0616137608230114, + 0.06136730970740318, + 0.06039532200098038, + 0.059799978923797605, + 0.05922998292446136, + 0.05737149256467819, + 0.05544037868976593, + 0.05257278437614441, + 0.05509069833755493, + 0.05201517162322998, + 0.05045925542712212 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8860390186309814, + 0.29011964797973633 + ], + "perturbation_rho": [ + 0.729070782661438, + 0.16372419893741608 + ], + "nudging": { + "0.001": [ + -0.0223261546343565, + -0.002173823770135641 + ], + "0.003": [ + -0.06377331912517548, + -0.006489826366305351 + ], + "0.01": [ + -0.17900359630584717, + -0.021273087710142136 + ] + }, + "state_pred_error_per_layer": [ + 33793.6875, + 17287.951171875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2692262367248537, + 1.5542793827056884, + 0.9020736213684082, + 0.596830725479126, + 0.4468186724662781, + 0.3618718198776245, + 0.31232853326797483, + 0.2787938956260681, + 0.2674659299373627, + 0.2642947849750519, + 0.2523771431446075, + 0.24515730214118958, + 0.2538480486392975, + 0.28014468059539793, + 0.31275188341140747, + 0.36153240275383, + 0.45546971778869627, + 0.470155521774292, + 0.49532660064697265, + 0.6091033678054809, + 0.6895332248687744, + 0.8440474328041077, + 0.9790623798370361, + 1.0800415994644166, + 1.2051820819854737, + 1.2633331064224242, + 1.2919290416717528, + 1.3715517765998841, + 1.3725673580169677, + 1.4548830583572387, + 1.4191310758590698, + 1.3940866708755493, + 1.4137959768295287, + 1.3491390239715577, + 1.3602781624317168, + 1.2946188051223755, + 1.3052873740196227, + 1.271211790084839, + 1.2458847396850585, + 1.221630898284912, + 1.2014152545928956, + 1.1802498739242553, + 1.1862596946716308, + 1.1738021017074585, + 1.149361166381836, + 1.146301950263977, + 1.123859150505066, + 1.1185205829620362, + 1.1123267906188965, + 1.101036505126953, + 1.088988446044922, + 1.079156160736084, + 1.0718450695037842, + 1.065549393081665, + 1.0595159755706787, + 1.0557796686172485, + 1.0525294914245606, + 1.0508896852493286, + 1.0492018606185913, + 1.0485244590759277 + ], + "train_acc": [ + 0.1678, + 0.4881, + 0.6916, + 0.7856, + 0.834, + 0.8604, + 0.8766, + 0.8891, + 0.8969, + 0.8957, + 0.9013, + 0.9053, + 0.9055, + 0.9019, + 0.8975, + 0.8912, + 0.8739, + 0.8689, + 0.8627, + 0.8466, + 0.8313, + 0.8064, + 0.7853, + 0.7715, + 0.7514, + 0.7433, + 0.7304, + 0.7127, + 0.7089, + 0.6894, + 0.6898, + 0.6898, + 0.6846, + 0.6929, + 0.6888, + 0.6896, + 0.6874, + 0.6922, + 0.6915, + 0.6901, + 0.6957, + 0.6928, + 0.689, + 0.6875, + 0.6931, + 0.6961, + 0.693, + 0.6958, + 0.6921, + 0.7, + 0.6966, + 0.6992, + 0.6993, + 0.7002, + 0.7014, + 0.7012, + 0.7017, + 0.7013, + 0.7013, + 0.7015 + ], + "test_acc": [ + 0.319, + 0.61, + 0.727, + 0.7705, + 0.8105, + 0.818, + 0.8355, + 0.8335, + 0.8395, + 0.8495, + 0.8565, + 0.8575, + 0.8595, + 0.8455, + 0.8455, + 0.834, + 0.817, + 0.813, + 0.793, + 0.783, + 0.7655, + 0.7445, + 0.73, + 0.721, + 0.7015, + 0.7085, + 0.6835, + 0.6705, + 0.661, + 0.65, + 0.662, + 0.652, + 0.6485, + 0.6565, + 0.6525, + 0.6585, + 0.6465, + 0.66, + 0.6535, + 0.648, + 0.647, + 0.649, + 0.6465, + 0.655, + 0.6475, + 0.65, + 0.653, + 0.6525, + 0.6485, + 0.653, + 0.6555, + 0.6525, + 0.656, + 0.654, + 0.654, + 0.6575, + 0.656, + 0.6565, + 0.656, + 0.656 + ], + "value_loss": [ + 2.909094351196289, + 0.7658272996902465, + 0.6340765568733215, + 0.5706955344200134, + 0.5016238324642182, + 0.43215153760910036, + 0.3868287033081055, + 0.35505294566154477, + 0.3537649361371994, + 0.3869753558635712, + 0.38371925399303436, + 0.3659987478256226, + 0.3994653451919556, + 0.4804273064136505, + 0.617082247543335, + 0.8328494649887085, + 1.19136689453125, + 1.1524452226638795, + 1.273973949432373, + 1.6705972339630126, + 1.947713963317871, + 2.429694472694397, + 2.9975417751312254, + 3.3247394645690918, + 4.073798774719238, + 4.177117526245117, + 4.067596185684204, + 4.233567604827881, + 3.9992895797729493, + 4.0748225051879885, + 3.6166735214233396, + 3.5715755424499513, + 3.170370510101318, + 2.6065550357818603, + 2.4747390007972716, + 2.096208452987671, + 1.974884965133667, + 1.788527022743225, + 1.615757702445984, + 1.4653602067947387, + 1.3991004487991332, + 1.2780299221038818, + 1.231626374053955, + 1.1686214462280273, + 1.0741170415878296, + 1.009229591178894, + 0.9554481613159179, + 0.9123099586486817, + 0.8534572563171386, + 0.8179267116546631, + 0.7517884971618652, + 0.7146735996246338, + 0.6941907648086548, + 0.6707411470413208, + 0.6082350830078125, + 0.6151707311630249, + 0.5768671339035034, + 0.5514906231880188, + 0.5400699325561523, + 0.5207448813438416 + ], + "term_loss": [ + 1.6756160216331482, + 0.3529724612236023, + 0.390537335395813, + 0.3742113214969635, + 0.33054120086431504, + 0.26847299547195436, + 0.22873805408477782, + 0.213564708507061, + 0.2188684166431427, + 0.2586360571861267, + 0.2644814089179039, + 0.2492242072761059, + 0.2802458667755127, + 0.35211685800552367, + 0.4764906127929687, + 0.6769205916404724, + 1.0035622982025147, + 0.9530633958816528, + 1.0660293413162232, + 1.427315857410431, + 1.6753887001037597, + 2.1101916246414185, + 2.6351540704727174, + 2.93334910736084, + 3.628789786529541, + 3.7103049926757814, + 3.5738488626480103, + 3.7151432455062867, + 3.4672480880737306, + 3.5043161994934082, + 3.0582513076782227, + 2.9907237396240234, + 2.609465662384033, + 2.0792490367889402, + 1.9462039555549622, + 1.6056369823455812, + 1.4855788904190064, + 1.3233418182373047, + 1.1531369215011598, + 1.010161297416687, + 0.9468067415237427, + 0.8260270189285278, + 0.7786426908493042, + 0.7235319651603699, + 0.6420190993309021, + 0.5773346517562866, + 0.5359861539840698, + 0.506299984741211, + 0.45566908836364745, + 0.4283084735870361, + 0.37325937843322754, + 0.3429936631202698, + 0.3306818127632141, + 0.31145757360458376, + 0.26386104679107664, + 0.27378877906799315, + 0.2430652662754059, + 0.22444696111679077, + 0.2165537470817566, + 0.20168962478637695 + ], + "bridge_loss": [ + 0.9061962479351089, + 0.11340018844604492, + 0.018831115587055684, + 0.006585106197744608, + 0.007741253206133843, + 0.01931276010274887, + 0.02597333793640137, + 0.020665125489234923, + 0.016416490584611892, + 0.00939844745695591, + 0.006557002264261246, + 0.007693992963433266, + 0.00838148719072342, + 0.010554035685956479, + 0.014100195910781621, + 0.019740482191741467, + 0.029861405584216117, + 0.03811971082091332, + 0.04297128603458405, + 0.05843619774580002, + 0.07096547927856445, + 0.09096145362854004, + 0.11484820014238357, + 0.13357684574127196, + 0.17190906581878662, + 0.1907400098323822, + 0.21238168239593505, + 0.22990054244995117, + 0.2459044690132141, + 0.2736733878135681, + 0.271633962059021, + 0.29980236659049986, + 0.28194295258522034, + 0.2610706382751465, + 0.26103880503177646, + 0.23405041053295136, + 0.23127240090370177, + 0.21618038527965547, + 0.21614487179517747, + 0.21264133446216582, + 0.2144686206102371, + 0.21590589094161988, + 0.21614528675079345, + 0.21047820831537248, + 0.20197302742004394, + 0.20249471414089204, + 0.19271916406154632, + 0.1802452743768692, + 0.17243436317443847, + 0.1680455225944519, + 0.1576254985809326, + 0.15183655140399932, + 0.1453061292052269, + 0.14224059772491454, + 0.1282794843673706, + 0.1261581906080246, + 0.11894494748115539, + 0.11249599847793579, + 0.10926979708671569, + 0.10483724861145019 + ], + "tgrad_loss": [ + 0.32728208103179934, + 0.2994546513557434, + 0.22470810203552247, + 0.18989910242557526, + 0.16334137752056122, + 0.14436578254699706, + 0.13211731100082397, + 0.12082311434745789, + 0.118480029129982, + 0.1189408509016037, + 0.1126808422088623, + 0.10908054541349411, + 0.11083799247741699, + 0.11775641236305237, + 0.12649144034385681, + 0.1361883921146393, + 0.15794320333003997, + 0.1612621042728424, + 0.16497332499027254, + 0.184845175075531, + 0.20135978260040283, + 0.22854138774871827, + 0.24753951168060304, + 0.2578135227203369, + 0.2730999213218689, + 0.27607250838279723, + 0.2813656562805176, + 0.2885238247871399, + 0.28613699531555176, + 0.29683294076919553, + 0.28678826389312745, + 0.2810494341850281, + 0.2789619082689285, + 0.26623538064956664, + 0.2674962314367294, + 0.25652106018066406, + 0.2580336720466614, + 0.2490048062801361, + 0.2464759041786194, + 0.24255758218765258, + 0.23782507863044738, + 0.2360969993829727, + 0.23683840417861937, + 0.23461127347946167, + 0.23012492628097533, + 0.22940022025108336, + 0.22674284510612489, + 0.22576470098495482, + 0.22535381288528442, + 0.22157270841598511, + 0.22090361948013307, + 0.2198433807373047, + 0.2182028178215027, + 0.21704297912120818, + 0.21609454655647278, + 0.21522376427650453, + 0.214856924533844, + 0.21454766092300415, + 0.214246386384964, + 0.21421800775527955 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.10150224715471268, + 0.11179979145526886 + ], + "perturbation_rho": [ + 0.24922937154769897, + 0.2113790065050125 + ], + "nudging": { + "0.001": [ + -0.010911274701356888, + -0.002249373123049736 + ], + "0.003": [ + -0.032585203647613525, + -0.006742686498910189 + ], + "0.01": [ + -0.10681234300136566, + -0.02240385115146637 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/synth_a0.0_L8_s42.json b/results/synth_ladder_smoke/synth_a0.0_L8_s42.json new file mode 100644 index 0000000..dab8eba --- /dev/null +++ b/results/synth_ladder_smoke/synth_a0.0_L8_s42.json @@ -0,0 +1,1298 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0280954638957978, + 0.5170450178146362, + 0.46660222864151, + 0.3860828907012939, + 0.3847982373714447, + 0.37869311784505844, + 0.3040668855667114, + 0.43982459917068484, + 0.3666351689338684, + 0.30392495489120486, + 0.3629165101528168, + 0.3360342849731445, + 0.3675597408294678, + 0.2872942142009735, + 0.2673515892028809, + 0.27461685419082643, + 0.2779176469087601, + 0.25853867259025576, + 0.30305951404571535, + 0.2197611361503601, + 0.2107482223033905, + 0.278306410741806, + 0.27574938082695005, + 0.277136362361908, + 0.23484622938632965, + 0.19353969383239747, + 0.22733799839019775, + 0.22033537466526032, + 0.17364222700595855, + 0.16525054998397828, + 0.1696811216711998, + 0.13102262905836104, + 0.12456847798824311, + 0.1238709403514862, + 0.1256138543844223, + 0.13760859820842744, + 0.11888999514579773, + 0.10369425783157349, + 0.1449669484615326, + 0.09903482309579849, + 0.08961749286651612, + 0.08136189094781876, + 0.06542902387678623, + 0.0602282164812088, + 0.0563331375837326, + 0.05991012490987778, + 0.05653515813350678, + 0.06136429299712181, + 0.048407906904816625, + 0.043913619375228884, + 0.042284037798829374, + 0.039931213203072545, + 0.03806337122917175, + 0.03679427447915077, + 0.03630924501419067, + 0.03573910497426987, + 0.034844432763755324, + 0.034415369933843615, + 0.03412407999634743, + 0.03397467752844095 + ], + "train_acc": [ + 0.6283, + 0.8046, + 0.8228, + 0.8463, + 0.8457, + 0.851, + 0.88, + 0.8359, + 0.8551, + 0.8784, + 0.8596, + 0.8648, + 0.858, + 0.8826, + 0.8913, + 0.8935, + 0.8925, + 0.8946, + 0.8815, + 0.9137, + 0.9155, + 0.8924, + 0.8921, + 0.8934, + 0.9096, + 0.9199, + 0.9091, + 0.9155, + 0.931, + 0.9328, + 0.9327, + 0.9494, + 0.9551, + 0.949, + 0.9489, + 0.9443, + 0.9525, + 0.9607, + 0.9447, + 0.9623, + 0.9664, + 0.9723, + 0.9808, + 0.9832, + 0.9863, + 0.9823, + 0.9842, + 0.9815, + 0.9907, + 0.994, + 0.9949, + 0.9958, + 0.9971, + 0.9981, + 0.998, + 0.9985, + 0.9987, + 0.9987, + 0.9989, + 0.9989 + ], + "test_acc": [ + 0.8035, + 0.813, + 0.8465, + 0.8505, + 0.853, + 0.8565, + 0.8505, + 0.8325, + 0.871, + 0.8755, + 0.863, + 0.877, + 0.8655, + 0.869, + 0.8865, + 0.8845, + 0.872, + 0.8835, + 0.8815, + 0.8925, + 0.8935, + 0.8835, + 0.8675, + 0.9055, + 0.9075, + 0.904, + 0.8925, + 0.896, + 0.917, + 0.921, + 0.9155, + 0.9275, + 0.9265, + 0.9165, + 0.92, + 0.921, + 0.9215, + 0.9315, + 0.922, + 0.9335, + 0.9315, + 0.9345, + 0.942, + 0.944, + 0.945, + 0.9465, + 0.949, + 0.941, + 0.9485, + 0.947, + 0.947, + 0.949, + 0.9495, + 0.948, + 0.9485, + 0.947, + 0.9475, + 0.948, + 0.9475, + 0.948 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7277177572250366, + 0.7186546921730042, + 0.7086087465286255, + 0.6982603073120117, + 0.686427116394043, + 0.6760239601135254, + 0.6675269603729248, + 0.6591541767120361 + ], + "perturbation_rho": [ + 0.999999463558197, + 0.999997615814209, + 0.9999939203262329, + 0.9999786019325256, + 0.9999496340751648, + 0.99991774559021, + 0.9998468160629272, + 0.9996647834777832 + ], + "nudging": { + "0.001": [ + -0.0279630608856678, + -0.014471527189016342, + -0.00800193939357996, + -0.0047535281628370285, + -0.003030599094927311, + -0.002047237241640687, + -0.0014431248418986797, + -0.0010417262092232704 + ], + "0.003": [ + -0.07214734703302383, + -0.04029766097664833, + -0.023058053106069565, + -0.013927915133535862, + -0.008957058191299438, + -0.00608035596087575, + -0.004299057647585869, + -0.0031092879362404346 + ], + "0.01": [ + -0.14217889308929443, + -0.10304947197437286, + -0.06661910563707352, + -0.04270746558904648, + -0.028325699269771576, + -0.019565371796488762, + -0.013980223797261715, + -0.010182000696659088 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.120793573760986, + 1.1692349800109862, + 4.318221380615235, + 11.969316799926759, + 7.433457641983032, + 6.906938210105896, + 5.740281340026855, + 4.8412636898040775, + 4.507975682801008, + 3.7150641967773437, + 4.818854993438721, + 4.81442878112793, + 20.13569976043701, + 8.72026117067337, + 6.009071774291992, + 8.157103067016601, + 8.301325323486328, + 5.596079114532471, + 5.222048434448242, + 4.3211271118164065, + 6.586086061096191, + 7.058012394714355, + 7.975131286621094, + 4.45829043045044, + 6.86703256225586, + 5.461534704589844, + 4.5320643615722656, + 9.255783943176269, + 5.773329333496093, + 6.4948376953840254, + 3.3313274047851564, + 4.754503839111329, + 2.9795879699707033, + 2.045443130493164, + 1.6959571681976318, + 4.3149334289550785, + 2.6201193557739257, + 3.423483766937256, + 3.6280470642089844, + 1.005617715549469, + 0.6395519275665283, + 0.7112416195869445, + 0.5932440514087505, + 0.3480766498327255, + 0.22201839945018279, + 0.10360232348032086, + 0.07467308974369516, + 0.0435215163884204, + 0.01338290655186513, + 0.005486118838652374, + 0.0007142521263321178, + 9.912207722550193e-07, + 1.192092824453539e-11, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "train_acc": [ + 0.2294, + 0.6006, + 0.5854, + 0.6087, + 0.7444, + 0.7746, + 0.8255, + 0.8538, + 0.8616, + 0.8829, + 0.8721, + 0.8787, + 0.8112, + 0.8775, + 0.9052, + 0.8905, + 0.8932, + 0.9182, + 0.9206, + 0.9299, + 0.9097, + 0.9155, + 0.9093, + 0.9347, + 0.9187, + 0.9291, + 0.934, + 0.9141, + 0.9285, + 0.93, + 0.9466, + 0.9384, + 0.9501, + 0.9621, + 0.9649, + 0.9431, + 0.9575, + 0.9503, + 0.9522, + 0.9747, + 0.9804, + 0.9788, + 0.9829, + 0.9877, + 0.9907, + 0.9941, + 0.9956, + 0.9967, + 0.9986, + 0.9992, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.467, + 0.5225, + 0.368, + 0.651, + 0.7435, + 0.694, + 0.744, + 0.8385, + 0.831, + 0.849, + 0.8375, + 0.77, + 0.816, + 0.8785, + 0.875, + 0.8375, + 0.8675, + 0.9025, + 0.898, + 0.8805, + 0.8725, + 0.8845, + 0.891, + 0.892, + 0.9035, + 0.9075, + 0.8945, + 0.887, + 0.9035, + 0.9035, + 0.9075, + 0.913, + 0.9235, + 0.9195, + 0.92, + 0.9115, + 0.9165, + 0.9255, + 0.924, + 0.9355, + 0.9335, + 0.932, + 0.936, + 0.936, + 0.943, + 0.9405, + 0.9415, + 0.9445, + 0.9455, + 0.947, + 0.948, + 0.947, + 0.9465, + 0.9465, + 0.9465, + 0.9465, + 0.9465, + 0.9465, + 0.9465, + 0.9465 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.003863303456455469, + 0.017664283514022827, + 0.01661803014576435, + 0.018178246915340424, + 0.015868376940488815, + 0.014126626774668694, + 0.014091677032411098, + 0.008254537358880043 + ], + "perturbation_rho": [ + -0.019435672089457512, + 0.2941593527793884, + 0.18103283643722534, + 0.20650765299797058, + 0.18732143938541412, + 0.13352911174297333, + 0.15822581946849823, + -0.03437525033950806 + ], + "nudging": { + "0.001": [ + 0.036526963114738464, + -0.0999140739440918, + -0.04491303116083145, + -0.01566406711935997, + -0.003947979770600796, + -0.0009792994242161512, + -0.0003040542942471802, + -9.614432929083705e-05 + ], + "0.003": [ + 0.12329098582267761, + -0.28696703910827637, + -0.13323917984962463, + -0.04670665040612221, + -0.011821148917078972, + -0.0029212406370788813, + -0.0009074252448044717, + -0.0002924713771790266 + ], + "0.01": [ + 0.4985465407371521, + -0.834585428237915, + -0.4260305166244507, + -0.15289700031280518, + -0.03924320265650749, + -0.009715870022773743, + -0.002982086967676878, + -0.0009573615971021354 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0005249774932863, + 2.6273609729766845, + 8.55051524810791, + 28.19482956542969, + 494.44503037109376, + 145970.183125, + 38351053.152, + 783867611.5456, + 5883874551.3984, + 27799864927.8464, + 85124742643.712, + 195224481536.4096, + 442692943845.7856, + 842439712990.8224, + 1651162470993.1008, + 2556945754803.405, + 3782613268221.133, + 5426827993337.037, + 8994248014063.207, + 10276278090543.924, + 12815248601487.77, + 16660498968530.125, + 22318331472537.19, + 27810257342300.16, + 29551719156075.727, + 51621289471560.91, + 45316131817888.16, + 43844487198067.914, + 57194053893724.57, + 73896788449925.53, + 61295718724062.414, + 82310528867133.03, + 93415520025024.92, + 61149932904303.82, + 68502432536697.24, + 82411367948091.39, + 82084643933991.73, + 84632321762997.05, + 89683307751328.97, + 72435138440462.34, + 54397312468149.86, + 57919262188529.26, + 61994143401482.65, + 53247288374250.7, + 55559185813104.23, + 45703202357221.79, + 37343173069609.37, + 36908977404195.63, + 26988508651664.18, + 26102202092853.656, + 20915066426412.24, + 14917304209270.375, + 10353277576360.756, + 6941676885403.238, + 4919116560544.563, + 3041523188052.787, + 1825675577131.008, + 1313364471342.6943, + 730159227338.752, + 535084413327.7696 + ], + "train_acc": [ + 0.3619, + 0.4586, + 0.3937, + 0.2828, + 0.1952, + 0.145, + 0.107, + 0.1002, + 0.1046, + 0.1062, + 0.1073, + 0.1116, + 0.1045, + 0.1064, + 0.1039, + 0.1066, + 0.1115, + 0.1125, + 0.1037, + 0.1068, + 0.1111, + 0.1089, + 0.1009, + 0.1038, + 0.1045, + 0.1017, + 0.1071, + 0.1163, + 0.1042, + 0.1053, + 0.1051, + 0.1054, + 0.1021, + 0.1087, + 0.1069, + 0.1091, + 0.1108, + 0.1093, + 0.1076, + 0.1055, + 0.1184, + 0.1049, + 0.104, + 0.1111, + 0.1133, + 0.1057, + 0.1088, + 0.1193, + 0.1099, + 0.0994, + 0.1083, + 0.1094, + 0.116, + 0.1115, + 0.1125, + 0.1196, + 0.1318, + 0.1382, + 0.1583, + 0.1644 + ], + "test_acc": [ + 0.4745, + 0.4445, + 0.3525, + 0.1685, + 0.228, + 0.1435, + 0.1015, + 0.1125, + 0.1075, + 0.0965, + 0.115, + 0.1045, + 0.1165, + 0.089, + 0.1045, + 0.097, + 0.127, + 0.079, + 0.1315, + 0.098, + 0.105, + 0.128, + 0.1015, + 0.1335, + 0.1075, + 0.0925, + 0.068, + 0.1255, + 0.0695, + 0.1085, + 0.123, + 0.133, + 0.1015, + 0.1, + 0.097, + 0.0965, + 0.1085, + 0.076, + 0.123, + 0.112, + 0.098, + 0.109, + 0.1115, + 0.078, + 0.137, + 0.104, + 0.0905, + 0.102, + 0.134, + 0.1265, + 0.0885, + 0.126, + 0.119, + 0.0925, + 0.142, + 0.1215, + 0.137, + 0.1575, + 0.156, + 0.167 + ], + "state_pred_error": [ + 0.6850057603836059, + 0.468855588722229, + 0.719591781616211, + 0.9295594707489013, + 0.9863706101417542, + 0.9992992053031922, + 0.9999989013671875, + 1.0000000061035157, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 0.9999999999046326, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.09916997700929642, + -0.0925145074725151, + -0.12530964612960815, + -0.051633648574352264, + -0.0899374783039093, + -0.005518035963177681, + 1.1753130820579827e-05, + -2.0197142021061154e-06 + ], + "perturbation_rho": [ + 0.0036257803440093994, + -0.0018100417219102383, + 0.0009338338859379292, + -0.0030421577394008636, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -1124003840.0, + -22863872.0, + -26816512.0, + 2031616.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -3080515584.0, + 60985344.0, + -31789056.0, + -13869056.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -9628057600.0, + 254652416.0, + -49807360.0, + -1126400.0, + 20480.0, + 0.0, + 0.0, + 0.0 + ] + }, + "state_pred_error_per_layer": [ + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33, + 3.788521752616758e+33 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1233988201141356, + 1.162066788482666, + 6.497762945556641, + 7.657052541351319, + 7.195169696044922, + 8.47833557434082, + 9.642318778991699, + 5.338678979492188, + 7.198572373962402, + 11.581513494873047, + 6.664580947875977, + 10.820601950073241, + 41.76819462890625, + 25341.329733203125, + 989068.8966, + 20290034.592, + 327517565.184, + 2993445992.8576, + 19252386037.76, + 71484986648.1664, + 268552830346.8544, + 576653121552.384, + 1236291385766.7073, + 2171526277234.688, + 3708553561689.293, + 6411481239676.519, + 7886516879202.714, + 12247534797848.576, + 14733154332337.766, + 16258317710838.988, + 23497199149121.535, + 24087115828140.44, + 39647623746525.59, + 36765792046206.16, + 36509247690348.95, + 45728307340325.68, + 32588393748837.17, + 39329005865795.586, + 50793491846293.09, + 48569952628847.414, + 36464852586410.805, + 33697520137378.203, + 41922094853783.555, + 34577268358302.926, + 26970957053060.71, + 28872966972375.04, + 28294261609227.88, + 25690026637524.992, + 17515176864723.764, + 14857032527196.979, + 13097298348841.37, + 10537307935762.021, + 8655926777085.952, + 5209544274110.055, + 4970898223058.125, + 3055830361649.971, + 2162992193994.752, + 1569585720459.264, + 638252859208.4991, + 170934811387.4944 + ], + "train_acc": [ + 0.2277, + 0.5992, + 0.5395, + 0.653, + 0.7253, + 0.7552, + 0.7777, + 0.8482, + 0.8421, + 0.8272, + 0.8818, + 0.8542, + 0.7639, + 0.3423, + 0.1487, + 0.1153, + 0.1127, + 0.1017, + 0.0974, + 0.1009, + 0.1066, + 0.097, + 0.0976, + 0.1049, + 0.1024, + 0.1018, + 0.1017, + 0.1049, + 0.1032, + 0.1061, + 0.105, + 0.1095, + 0.1048, + 0.0993, + 0.0988, + 0.0961, + 0.1016, + 0.1035, + 0.0983, + 0.1016, + 0.0998, + 0.1062, + 0.1033, + 0.0971, + 0.1027, + 0.1041, + 0.1012, + 0.1046, + 0.0974, + 0.1008, + 0.1016, + 0.1064, + 0.1067, + 0.0981, + 0.097, + 0.1014, + 0.1002, + 0.102, + 0.0967, + 0.1007 + ], + "test_acc": [ + 0.4615, + 0.5575, + 0.454, + 0.684, + 0.665, + 0.699, + 0.786, + 0.781, + 0.754, + 0.8375, + 0.833, + 0.7865, + 0.59, + 0.1515, + 0.12, + 0.11, + 0.071, + 0.1075, + 0.0895, + 0.0835, + 0.087, + 0.125, + 0.115, + 0.113, + 0.109, + 0.11, + 0.107, + 0.1075, + 0.097, + 0.113, + 0.115, + 0.086, + 0.101, + 0.108, + 0.091, + 0.093, + 0.106, + 0.095, + 0.1025, + 0.1155, + 0.0985, + 0.1125, + 0.0905, + 0.1035, + 0.0875, + 0.1055, + 0.122, + 0.1115, + 0.0915, + 0.1115, + 0.0985, + 0.0875, + 0.098, + 0.109, + 0.1145, + 0.122, + 0.104, + 0.089, + 0.104, + 0.0965 + ], + "value_loss": [ + 2.9206485233306885, + 2.0991278984069823, + 153.16756047363282, + 262.89109077148436, + 301.8986732177734, + 495.5761693359375, + 753.0837014160156, + 342.91361103515624, + 623.1438095703126, + 1342.1768841796875, + 688.7091521484375, + 1468.21179375, + 13486.07113125, + 4533543333.752, + 4295295710527.488, + 1555069778667136.5, + 3.543898946818405e+17, + 2.835243663556606e+19, + 1.0096818054899128e+21, + 1.4048934563635221e+22, + 1.8293547075063784e+23, + 7.697987056110226e+23, + 3.54912064433393e+24, + 1.1125125750623107e+25, + 3.1799350153452077e+25, + 9.789950619326869e+25, + 1.420868244737442e+26, + 3.459160974195652e+26, + 5.1043215119493686e+26, + 6.537477195485665e+26, + 1.2926765559111974e+27, + 1.355836419967747e+27, + 3.857192822771172e+27, + 3.0881104638007575e+27, + 2.98728819026721e+27, + 4.973556844106116e+27, + 2.4829612427916363e+27, + 3.618593511782004e+27, + 5.909823532870358e+27, + 5.509981539949248e+27, + 3.062461172506452e+27, + 2.7797273823082046e+27, + 4.165363838841025e+27, + 2.921289151763202e+27, + 1.6917021233293298e+27, + 1.928555425022408e+27, + 1.875115507311143e+27, + 1.526313704196276e+27, + 6.898097075137517e+26, + 4.975919540275713e+26, + 4.097411489423477e+26, + 2.588628670357625e+26, + 1.833065029932479e+26, + 6.37755539204331e+25, + 5.804486747312932e+25, + 2.2065378859328795e+25, + 1.1536604072952298e+25, + 5.943531860139447e+24, + 1.0235238164400898e+24, + 7.270963528184324e+22 + ], + "term_loss": [ + 1.7422680698394775, + 1.8807483413696289, + 152.85236198730468, + 262.62057387695313, + 301.65136936035157, + 495.3016552734375, + 752.7325140625, + 342.58498349609374, + 622.7896586547852, + 1341.6220409179687, + 687.97834453125, + 1467.73975625, + 13347.8051, + 4533199027.5072, + 4295237151857.05, + 1555068234116366.2, + 3.543898843189434e+17, + 2.8352436632047624e+19, + 1.0096818054899128e+21, + 1.4048934563635221e+22, + 1.8293547075063784e+23, + 7.697987056110226e+23, + 3.54912064433393e+24, + 1.1125125750623107e+25, + 3.1799350153452077e+25, + 9.789950619326869e+25, + 1.420868244737442e+26, + 3.459160974195652e+26, + 5.1043215119493686e+26, + 6.537477195485665e+26, + 1.2926765559111974e+27, + 1.355836419967747e+27, + 3.857192822771172e+27, + 3.0881104638007575e+27, + 2.98728819026721e+27, + 4.973556844106116e+27, + 2.4829612427916363e+27, + 3.618593511782004e+27, + 5.909823532870358e+27, + 5.509981539949248e+27, + 3.062461172506452e+27, + 2.7797273823082046e+27, + 4.165363838841025e+27, + 2.921289151763202e+27, + 1.6917021233293298e+27, + 1.928555425022408e+27, + 1.875115507311143e+27, + 1.526313704196276e+27, + 6.898097075137517e+26, + 4.975919540275713e+26, + 4.097411489423477e+26, + 2.588628670357625e+26, + 1.833065029932479e+26, + 6.37755539204331e+25, + 5.804486747312932e+25, + 2.2065378859328795e+25, + 1.1536604072952298e+25, + 5.943531860139447e+24, + 1.0235238164400898e+24, + 7.270963401002671e+22 + ], + "bridge_loss": [ + 0.9007177171653835, + 0.03482201856076717, + 0.03401930815577507, + 0.044149079644680025, + 0.06504781594276428, + 0.10785873763561249, + 0.19907727756500243, + 0.22560245553255082, + 0.2465970028400421, + 0.43639145512580874, + 0.6498134763002396, + 0.37018338203430173, + 138.0976214126587, + 344382.48475625, + 58528349.0368, + 1544434832.9984, + 15424911215.8208, + 88761282487.9104, + 359884191904.5632, + 1146056050579.8655, + 3082334455516.3647, + 7280448903525.171, + 15563046603089.51, + 30748648594525.39, + 56933510534083.38, + 78527059769216.2, + 69464854150250.49, + 57126047046015.38, + 46248430805817.75, + 37585254076121.086, + 31106447176839.99, + 26525783025097.113, + 23478969605029.887, + 21575042935763.76, + 20503348559583.64, + 19995540443050.805, + 19841517164586.598, + 19924112197550.08, + 20125042417755.75, + 20383496081191.73, + 20669371822322.484, + 20946154892872.91, + 21198758720254.77, + 21420233960141.62, + 21622274828691.047, + 21798393734181.684, + 21954262076909.16, + 22072565790094.133, + 22186079490670.594, + 22270596729536.51, + 22344026181494.375, + 22409917999402.188, + 22516087621314.152, + 23653329912673.074, + 26443035151695.87, + 37578006567111.88, + 100635763783237.62, + 284677502217171.75, + 748937290699715.4, + 1784726332749172.0 + ], + "tgrad_loss": [ + 0.2776627652645111, + 0.18355755290985107, + 0.28117700395584105, + 0.22637253255844117, + 0.18225482790470124, + 0.16665410552024842, + 0.15210829964876174, + 0.10302361340522766, + 0.10755606596469879, + 0.11845469012856484, + 0.08099215364456176, + 0.1018688705444336, + 0.16829132108688355, + 0.4821447519302368, + 0.6398852281570434, + 0.67133180103302, + 0.6683558599472046, + 0.6734609581947326, + 0.675953857421875, + 0.6732820883750915, + 0.6747180856704712, + 0.6789773254394531, + 0.6800599794387817, + 0.6716786396980285, + 0.6725797680854797, + 0.6708943399429321, + 0.6656238901138306, + 0.6709495178222656, + 0.6712634092330932, + 0.6674262565612793, + 0.6604786745071412, + 0.6650773746490478, + 0.6686529180526734, + 0.6680105316162109, + 0.6736366228103637, + 0.6724730527877808, + 0.6645567403793335, + 0.6630275300979614, + 0.672146079826355, + 0.6698319987297058, + 0.6705549544334412, + 0.6641793041229248, + 0.6620641376495361, + 0.6850378318786621, + 0.671090496635437, + 0.6601127412796021, + 0.6603810975074768, + 0.6602658043861389, + 0.6775860306739807, + 0.6670328340530396, + 0.6655113603591919, + 0.661010055923462, + 0.6625628248214722, + 0.6739681219100953, + 0.6659061016082763, + 0.6693037282943726, + 0.6730936048507691, + 0.6696272415161133, + 0.6722038083076477, + 0.6689293840408325 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.517741858959198, + 0.33828628063201904, + 0.4149113893508911, + 0.23560978472232819, + -0.15021789073944092, + -0.1476898193359375, + -0.3642715811729431, + -0.040503572672605515 + ], + "perturbation_rho": [ + -0.004317115992307663, + 9.15133859962225e-05, + 0.0010522708762437105, + 0.0034065949730575085, + -0.18388643860816956, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -524155392.0, + 29052416.0, + 30197760.0, + -8481792.0, + -8960.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -1570021760.0, + -2878336.0, + 22212864.0, + -11307520.0, + -150016.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -5081367040.0, + -74964928.0, + 31930368.0, + -13346304.0, + 66048.0, + 0.0, + 0.0, + 0.0 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/synth_a0.5_L2_s42.json b/results/synth_ladder_smoke/synth_a0.5_L2_s42.json new file mode 100644 index 0000000..d6dbba5 --- /dev/null +++ b/results/synth_ladder_smoke/synth_a0.5_L2_s42.json @@ -0,0 +1,1172 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.8446357597351075, + 0.9337884250640869, + 0.5358327745437622, + 0.3911330166339874, + 0.32849840292930604, + 0.2850165479660034, + 0.2686881549835205, + 0.25319644589424134, + 0.23558919601440428, + 0.22118966565132142, + 0.2210680745959282, + 0.2016040184020996, + 0.20486357657909393, + 0.18903831100463866, + 0.18852734336853028, + 0.1785359749317169, + 0.17395910472869874, + 0.18103560156822204, + 0.17268380609750747, + 0.16011136660575867, + 0.1667647705078125, + 0.1562471776008606, + 0.1488836531996727, + 0.14291370005607604, + 0.1413789472579956, + 0.13651124601364137, + 0.13058673537671567, + 0.12447206282615661, + 0.12683574684858323, + 0.11880559389591216, + 0.12121504894495011, + 0.1152825408577919, + 0.11083448304533959, + 0.1080839204788208, + 0.10981180058121681, + 0.10525347989797593, + 0.10407337579727173, + 0.09992667212486267, + 0.10014419107437134, + 0.09764940270185471, + 0.09493863627910613, + 0.0940910838842392, + 0.09462859318256378, + 0.09235266934633254, + 0.08991062052249908, + 0.08853154343366623, + 0.08709892609715461, + 0.08601901152133942, + 0.08521206267476082, + 0.08447394663095474, + 0.08380048310756684, + 0.08328880717754364, + 0.08290200964212417, + 0.082516270506382, + 0.0820741615831852, + 0.08178826131820678, + 0.08155987080335617, + 0.08138326687812805, + 0.08128138109445572, + 0.08121294350624085 + ], + "train_acc": [ + 0.3769, + 0.7502, + 0.8602, + 0.8939, + 0.9048, + 0.9137, + 0.9118, + 0.9135, + 0.9168, + 0.9248, + 0.9194, + 0.9306, + 0.9246, + 0.9308, + 0.9319, + 0.9351, + 0.9394, + 0.9292, + 0.9379, + 0.9434, + 0.9388, + 0.9449, + 0.9479, + 0.9511, + 0.9505, + 0.9534, + 0.9574, + 0.9617, + 0.9569, + 0.9621, + 0.961, + 0.9652, + 0.9675, + 0.9694, + 0.9667, + 0.9689, + 0.9697, + 0.9724, + 0.9722, + 0.973, + 0.9748, + 0.976, + 0.9743, + 0.9768, + 0.9789, + 0.9789, + 0.9807, + 0.9809, + 0.9811, + 0.982, + 0.9821, + 0.9822, + 0.9829, + 0.9829, + 0.9828, + 0.9832, + 0.9831, + 0.9832, + 0.9833, + 0.9834 + ], + "test_acc": [ + 0.6305, + 0.8045, + 0.868, + 0.8805, + 0.878, + 0.884, + 0.8845, + 0.8855, + 0.882, + 0.882, + 0.886, + 0.8895, + 0.8845, + 0.89, + 0.894, + 0.8935, + 0.884, + 0.885, + 0.884, + 0.895, + 0.8865, + 0.8915, + 0.8855, + 0.8865, + 0.8875, + 0.8905, + 0.8955, + 0.8935, + 0.8885, + 0.891, + 0.8925, + 0.8935, + 0.8915, + 0.893, + 0.895, + 0.8905, + 0.891, + 0.8945, + 0.891, + 0.893, + 0.8935, + 0.8925, + 0.8905, + 0.887, + 0.886, + 0.8875, + 0.89, + 0.8895, + 0.8885, + 0.8885, + 0.888, + 0.89, + 0.89, + 0.891, + 0.89, + 0.89, + 0.89, + 0.8905, + 0.8905, + 0.8905 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8970257639884949, + 0.8884812593460083 + ], + "perturbation_rho": [ + 0.9999991655349731, + 0.9999955892562866 + ], + "nudging": { + "0.001": [ + -0.02583475597202778, + -0.009747679345309734 + ], + "0.003": [ + -0.07010301947593689, + -0.028194870799779892 + ], + "0.01": [ + -0.16577741503715515, + -0.08266304433345795 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.27625731010437, + 1.6932389553070069, + 1.0857321990966797, + 0.75010082654953, + 0.5716302475452423, + 0.4672969693660736, + 0.4043164154052734, + 0.3653347668647766, + 0.33810731897354124, + 0.32000629520416257, + 0.31557338215112685, + 0.306670289850235, + 0.3169789312839508, + 0.3090059988975525, + 0.3211127027988434, + 0.30841862708330153, + 0.3055117506980896, + 0.3295214436531067, + 0.34342247110009194, + 0.3109726100921631, + 0.31801784634590147, + 0.32870279140472414, + 0.32357279167175296, + 0.31220887575149536, + 0.33542337856292725, + 0.3194949890613556, + 0.3191724066019058, + 0.30960334286689756, + 0.3245603529512882, + 0.3087747444152832, + 0.3317766746044159, + 0.3014678807616234, + 0.2997256254792213, + 0.29870811405181885, + 0.3113420418739319, + 0.29615239515304564, + 0.3031815109014511, + 0.29484934725761414, + 0.29226981248855594, + 0.29299453842788936, + 0.28204461708068845, + 0.2941273021697998, + 0.2800413821220398, + 0.27800616981983184, + 0.2764166726350784, + 0.2763713481783867, + 0.27189454293251036, + 0.27382534552812576, + 0.269278941822052, + 0.27021434302330016, + 0.2698526949882507, + 0.2682139085292816, + 0.26725732135772706, + 0.2652432975292206, + 0.2637831997156143, + 0.2630580255508423, + 0.26260964117050173, + 0.2622452072620392, + 0.2619642446279526, + 0.2617356785297394 + ], + "train_acc": [ + 0.1661, + 0.4501, + 0.6451, + 0.7414, + 0.7921, + 0.8238, + 0.8427, + 0.8554, + 0.8672, + 0.8715, + 0.8749, + 0.8813, + 0.8786, + 0.8823, + 0.8803, + 0.8873, + 0.8881, + 0.88, + 0.8772, + 0.8859, + 0.8862, + 0.885, + 0.8879, + 0.8931, + 0.8854, + 0.8902, + 0.8914, + 0.8946, + 0.8913, + 0.892, + 0.8878, + 0.8958, + 0.8957, + 0.8977, + 0.8976, + 0.8976, + 0.894, + 0.8972, + 0.9001, + 0.9001, + 0.9037, + 0.8986, + 0.9026, + 0.9034, + 0.9026, + 0.9037, + 0.9039, + 0.9061, + 0.9049, + 0.9065, + 0.9056, + 0.9059, + 0.906, + 0.9069, + 0.907, + 0.9075, + 0.9073, + 0.9077, + 0.9081, + 0.908 + ], + "test_acc": [ + 0.29, + 0.5665, + 0.678, + 0.7465, + 0.7665, + 0.7995, + 0.81, + 0.8255, + 0.8285, + 0.8265, + 0.833, + 0.839, + 0.8275, + 0.8435, + 0.8295, + 0.841, + 0.84, + 0.832, + 0.8355, + 0.851, + 0.841, + 0.845, + 0.8355, + 0.838, + 0.843, + 0.848, + 0.854, + 0.8515, + 0.8445, + 0.8315, + 0.849, + 0.8445, + 0.841, + 0.843, + 0.847, + 0.8435, + 0.8545, + 0.853, + 0.8505, + 0.855, + 0.8465, + 0.8525, + 0.858, + 0.854, + 0.8535, + 0.858, + 0.856, + 0.8515, + 0.852, + 0.858, + 0.855, + 0.855, + 0.859, + 0.8545, + 0.8565, + 0.858, + 0.857, + 0.8565, + 0.8565, + 0.8565 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.009920955635607243, + 0.07439190149307251 + ], + "perturbation_rho": [ + -0.054706037044525146, + 0.05173008143901825 + ], + "nudging": { + "0.001": [ + 0.00026212679222226143, + -0.000588460301514715 + ], + "0.003": [ + 0.0008918952662497759, + -0.00176119280513376 + ], + "0.01": [ + 0.004189381375908852, + -0.005824576131999493 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0848215646743773, + 1.211621427154541, + 0.7053265221595764, + 0.4795488802909851, + 0.38192135109901426, + 0.34821708626747133, + 0.337696081662178, + 0.3322465687274933, + 0.33291667788028717, + 0.338371639585495, + 0.34170880966186523, + 0.342152866768837, + 0.3392792880296707, + 0.339041673374176, + 0.3449883652687073, + 0.3402249610185623, + 0.34081881189346314, + 0.33598546833992005, + 0.3371055328369141, + 0.3591313819885254, + 0.34564214142560956, + 0.3394580416202545, + 0.34311104855537417, + 0.33622951345443725, + 0.3556391622543335, + 0.3568912126541138, + 0.34955705823898314, + 0.3417039113998413, + 0.35299610414505006, + 0.3575472953557968, + 0.34411632428169253, + 0.35480775973796846, + 0.34226418747901916, + 0.357436913728714, + 0.3434531378746033, + 0.3444290014266968, + 0.3643165395140648, + 0.33347331820726395, + 0.3350465914726257, + 0.3356053658485413, + 0.34029814500808714, + 0.3406800155639648, + 0.33120009369850156, + 0.3287809826850891, + 0.32986082344055173, + 0.32653587369918824, + 0.325406661939621, + 0.3253041708946228, + 0.32081891207695007, + 0.32064156465530397, + 0.3223177612066269, + 0.3184559244155884, + 0.31674068355560303, + 0.3164571708202362, + 0.3151209916114807, + 0.3144640969753265, + 0.3136228200674057, + 0.31325989184379577, + 0.31308275623321535, + 0.3128601837158203 + ], + "train_acc": [ + 0.2498, + 0.6046, + 0.7683, + 0.8313, + 0.8632, + 0.8659, + 0.8672, + 0.87, + 0.8691, + 0.8699, + 0.8677, + 0.868, + 0.8675, + 0.8672, + 0.8658, + 0.8671, + 0.8653, + 0.8695, + 0.8688, + 0.8596, + 0.8654, + 0.8689, + 0.8632, + 0.8671, + 0.8573, + 0.8599, + 0.8633, + 0.8629, + 0.8589, + 0.8617, + 0.8637, + 0.8616, + 0.8635, + 0.8625, + 0.8659, + 0.8651, + 0.8582, + 0.8696, + 0.8683, + 0.8707, + 0.8656, + 0.8638, + 0.8697, + 0.8694, + 0.8709, + 0.8723, + 0.872, + 0.8734, + 0.8736, + 0.8742, + 0.8753, + 0.8756, + 0.8772, + 0.877, + 0.877, + 0.8784, + 0.8769, + 0.878, + 0.878, + 0.878 + ], + "test_acc": [ + 0.4745, + 0.682, + 0.7765, + 0.818, + 0.8365, + 0.8285, + 0.8275, + 0.828, + 0.8295, + 0.828, + 0.824, + 0.8335, + 0.8255, + 0.822, + 0.835, + 0.829, + 0.826, + 0.834, + 0.828, + 0.8275, + 0.8175, + 0.8185, + 0.8225, + 0.8245, + 0.8245, + 0.814, + 0.8245, + 0.8115, + 0.8205, + 0.821, + 0.8265, + 0.8275, + 0.8135, + 0.8205, + 0.823, + 0.813, + 0.8165, + 0.8215, + 0.8245, + 0.8225, + 0.823, + 0.827, + 0.826, + 0.8235, + 0.825, + 0.826, + 0.824, + 0.83, + 0.8245, + 0.8255, + 0.827, + 0.8215, + 0.826, + 0.8255, + 0.825, + 0.822, + 0.8245, + 0.825, + 0.825, + 0.825 + ], + "state_pred_error": [ + 0.8007919464111328, + 0.3660256730556488, + 0.21767480976581574, + 0.17657471108436584, + 0.16651829404830934, + 0.16410830841064453, + 0.1607012363433838, + 0.15436248441934586, + 0.14273409378528595, + 0.12546166217327118, + 0.10508068288564681, + 0.09174856995344162, + 0.07927782148122788, + 0.07130704913139344, + 0.06682584903240203, + 0.06470049023628235, + 0.059187446343898775, + 0.06052878065705299, + 0.055212487065792085, + 0.054425645017623904, + 0.054145838260650635, + 0.05300228137969971, + 0.055760251158475875, + 0.05360760774612427, + 0.055333372712135315, + 0.055942467188835145, + 0.057480208098888395, + 0.055890723019838336, + 0.05407774894237518, + 0.0541152871966362, + 0.056709947526454925, + 0.056150261449813846, + 0.05520617353320122, + 0.056996329259872434, + 0.057790105390548706, + 0.05606599482297897, + 0.056856753021478655, + 0.059714989024400714, + 0.05486650733947754, + 0.055311821693181995, + 0.05465262854099274, + 0.053158983314037324, + 0.05372279359102249, + 0.051694966912269595, + 0.05255660619735718, + 0.0502005146086216, + 0.049731254732608796, + 0.049252740573883055, + 0.05221502633690834, + 0.04587042521238327, + 0.04583015296459198, + 0.04525720854997635, + 0.04457337497472763, + 0.04612945556640625, + 0.042507706445455554, + 0.040471922528743744, + 0.03980488125681877, + 0.040267976915836334, + 0.038662106162309647, + 0.03791789541244507 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8819085955619812, + 0.4091951251029968 + ], + "perturbation_rho": [ + 0.761555552482605, + 0.28052955865859985 + ], + "nudging": { + "0.001": [ + -0.02264053374528885, + -0.00310164550319314 + ], + "0.003": [ + -0.0647020936012268, + -0.009247269481420517 + ], + "0.01": [ + -0.18185698986053467, + -0.03015393391251564 + ] + }, + "state_pred_error_per_layer": [ + 7353.158203125, + 2627.8740234375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2758026485443117, + 1.6885655117034912, + 1.08470324382782, + 0.7463973359584808, + 0.5717253586769104, + 0.46329988174438475, + 0.39801541891098025, + 0.3542559162139893, + 0.3321510377883911, + 0.32213094537258147, + 0.30751878271102906, + 0.31636517415046694, + 0.3064259076118469, + 0.3367045620918274, + 0.35580090804100034, + 0.3754026936531067, + 0.40374352722167967, + 0.43292674508094786, + 0.46699409065246583, + 0.5129571395874023, + 0.5549553430557251, + 0.6454820284843444, + 0.6873638281822204, + 0.7763219680786133, + 0.8179979449272156, + 0.8366187688827514, + 0.8139018608093261, + 0.7946758689880371, + 0.7822862171173096, + 0.8099772785186767, + 0.7882675226211547, + 0.8030387943267823, + 0.8235842838287354, + 0.8256282581329346, + 0.8351705140113831, + 0.8342797046661377, + 0.8355479052543641, + 0.8148316853523254, + 0.8180710522651672, + 0.8008527454376221, + 0.7904974743366241, + 0.7784066701889039, + 0.7801080569267272, + 0.7695643264770508, + 0.7619868974685668, + 0.7521709791183472, + 0.7479159229278565, + 0.7424602756500244, + 0.7412874538421631, + 0.7384739780426025, + 0.7354034683227539, + 0.7321881999969483, + 0.7304416828870773, + 0.7277423991203308, + 0.7266941992759705, + 0.7254751741409302, + 0.7244712076187134, + 0.7236532078742981, + 0.723047044467926, + 0.7228024994850158 + ], + "train_acc": [ + 0.1643, + 0.447, + 0.6451, + 0.7397, + 0.7886, + 0.8234, + 0.8475, + 0.8612, + 0.8717, + 0.873, + 0.8802, + 0.877, + 0.8796, + 0.8747, + 0.8718, + 0.8696, + 0.8602, + 0.853, + 0.8432, + 0.8316, + 0.8168, + 0.8, + 0.7828, + 0.7701, + 0.758, + 0.7589, + 0.7561, + 0.7565, + 0.7552, + 0.7491, + 0.7482, + 0.7481, + 0.7404, + 0.7413, + 0.7355, + 0.7367, + 0.7314, + 0.7339, + 0.7328, + 0.7344, + 0.7318, + 0.7354, + 0.7307, + 0.73, + 0.7304, + 0.7318, + 0.7299, + 0.7348, + 0.7319, + 0.7324, + 0.7316, + 0.7334, + 0.7326, + 0.7342, + 0.7331, + 0.7339, + 0.7345, + 0.7341, + 0.7341, + 0.7342 + ], + "test_acc": [ + 0.2905, + 0.569, + 0.68, + 0.7385, + 0.7775, + 0.7915, + 0.813, + 0.8245, + 0.831, + 0.831, + 0.8305, + 0.8425, + 0.8345, + 0.843, + 0.833, + 0.8295, + 0.8155, + 0.81, + 0.789, + 0.772, + 0.764, + 0.742, + 0.7525, + 0.724, + 0.733, + 0.7265, + 0.735, + 0.732, + 0.7265, + 0.7145, + 0.7215, + 0.7135, + 0.7125, + 0.704, + 0.7055, + 0.702, + 0.7, + 0.697, + 0.703, + 0.7005, + 0.698, + 0.691, + 0.697, + 0.696, + 0.695, + 0.6985, + 0.6995, + 0.694, + 0.6925, + 0.6915, + 0.695, + 0.6935, + 0.6915, + 0.6895, + 0.6895, + 0.69, + 0.69, + 0.6915, + 0.692, + 0.692 + ], + "value_loss": [ + 2.9288026363372803, + 0.7864144048690795, + 0.639929295539856, + 0.6204524069786072, + 0.5754725531578064, + 0.5040289174079895, + 0.4698821117401123, + 0.42889139366149903, + 0.40420380544662476, + 0.4028634844779968, + 0.3892712847232819, + 0.42402955713272095, + 0.4190965398788452, + 0.5044933345794678, + 0.5825771816253662, + 0.6768685617446899, + 0.7133742139816284, + 0.7950645107269287, + 0.8662869777679444, + 0.8996373329162598, + 1.0280699882507325, + 1.163149174976349, + 1.221600127506256, + 1.3104056980133056, + 1.2766916957855226, + 1.326834045124054, + 1.134784700345993, + 1.0404576797485352, + 0.9483049005508423, + 0.9540580884933472, + 0.8205204145908356, + 0.785475520324707, + 0.7712423495292664, + 0.7447103875160217, + 0.7290693919181823, + 0.7014289337158203, + 0.6762246777057648, + 0.6185135121822357, + 0.5984228439331055, + 0.5883202701568604, + 0.5178473577141762, + 0.49681459336280825, + 0.47928457641601563, + 0.4505615571975708, + 0.4401890376567841, + 0.4055981549263, + 0.3913276084661484, + 0.3749931034088135, + 0.36367860050201417, + 0.3544500424861908, + 0.3396661903381348, + 0.3323349492073059, + 0.3219338518619537, + 0.31491898312568667, + 0.31108326172828676, + 0.3048648599147797, + 0.3013700053215027, + 0.2964340720176697, + 0.2898823614120483, + 0.28658444921970366 + ], + "term_loss": [ + 1.680461615371704, + 0.318868265914917, + 0.35254693756103517, + 0.3742735361099243, + 0.3474857358932495, + 0.28915810022354127, + 0.2642122935295105, + 0.23409572947025298, + 0.21996172314882279, + 0.23002521407604218, + 0.22711438574790954, + 0.2580068214178085, + 0.2574511836051941, + 0.3300004418611526, + 0.40008525619506835, + 0.4885060411453247, + 0.5082338293075561, + 0.5783841617822647, + 0.6369189880371093, + 0.6535232496738433, + 0.7590381214141846, + 0.8601485894203186, + 0.894815693473816, + 0.9405028270721436, + 0.8813811222076416, + 0.9386566973686218, + 0.7575348546385765, + 0.6686955894470215, + 0.584379263305664, + 0.5871846159934998, + 0.4701783618569374, + 0.4340015830993652, + 0.4127886173248291, + 0.3876411557197571, + 0.36765715140104294, + 0.34130483388900756, + 0.3164654992282391, + 0.2649745005369186, + 0.24806257448196412, + 0.23591347963511944, + 0.18224032307416202, + 0.17264214125871657, + 0.16115299315452575, + 0.14498900377750396, + 0.13794133849143983, + 0.11381195783615113, + 0.10435335038900376, + 0.09480323598384857, + 0.08906670632362365, + 0.08353737684488297, + 0.07434089761972427, + 0.06973979330062866, + 0.062392609396576884, + 0.057668454825878145, + 0.05661035113334656, + 0.05194146478176117, + 0.050404521048069, + 0.04641184125840664, + 0.04249159356355667, + 0.040962481904029846 + ], + "bridge_loss": [ + 0.9235159797744243, + 0.14302324088811874, + 0.027366681298613547, + 0.007692705816030502, + 0.010395049159228802, + 0.019707173657417296, + 0.02507652835845947, + 0.02611555808186531, + 0.021296515330672262, + 0.013124176825582982, + 0.008141374707221986, + 0.007833877293765544, + 0.008524406471848487, + 0.010415069633722305, + 0.013049487066268921, + 0.016472193028777837, + 0.021332170206308364, + 0.026048093110322953, + 0.029016028451919557, + 0.034247407439351084, + 0.04159984835982323, + 0.050617339766025546, + 0.06549989938735962, + 0.09351733729839325, + 0.11405401186943054, + 0.11128878911733628, + 0.10870532690286637, + 0.10964111132621765, + 0.10776555414199829, + 0.106626724588871, + 0.09811114823818207, + 0.10090886116027832, + 0.10686962119936944, + 0.10767342432141304, + 0.11076187438368797, + 0.11315056962966918, + 0.11132480944395065, + 0.10967807099819184, + 0.1067829899072647, + 0.11111221095919609, + 0.09527428455650806, + 0.08718832828998566, + 0.07998935594558716, + 0.07022619643211364, + 0.06896837931275368, + 0.06022721946239471, + 0.0557270368874073, + 0.05167174000740051, + 0.04623512443304062, + 0.04293481481075287, + 0.038837641191482544, + 0.0364598036468029, + 0.03402813461869955, + 0.03277047674655914, + 0.030157368355989457, + 0.02910452802181244, + 0.02725501443147659, + 0.026727657391130925, + 0.024257883021235466, + 0.0227132670879364 + ], + "tgrad_loss": [ + 0.32482506103515624, + 0.3245229008197784, + 0.26001567754745486, + 0.23848616292476654, + 0.21759176819324494, + 0.19516364593505858, + 0.18059329314231873, + 0.1686801063299179, + 0.16294556813240052, + 0.15971409220695496, + 0.15401552100181579, + 0.1581888596534729, + 0.15312094755172728, + 0.16407781987190245, + 0.16944243593215944, + 0.17189033045768737, + 0.1838082096338272, + 0.19063225364685057, + 0.200351966047287, + 0.21186667006015777, + 0.22743201670646668, + 0.2523832549571991, + 0.2612845244407654, + 0.276385528755188, + 0.28125656070709226, + 0.2768885573148727, + 0.26854453350305557, + 0.26212098736763, + 0.2561600820541382, + 0.26024675402641295, + 0.25223090353012084, + 0.2505650712966919, + 0.2515841117858887, + 0.24939580075740814, + 0.2506503685951233, + 0.2469735339164734, + 0.24843437323570253, + 0.24386094369888306, + 0.24357727665901185, + 0.24129457442760469, + 0.2403327546596527, + 0.23698412399291993, + 0.2381422297000885, + 0.23534635643959045, + 0.23327932082414626, + 0.23155897912979126, + 0.23124722099304199, + 0.22851812629699708, + 0.2283767698287964, + 0.22797785167694093, + 0.22648765294551848, + 0.2261353533267975, + 0.2255131096124649, + 0.22448005208969116, + 0.22431554079055785, + 0.2238188648223877, + 0.2237104712486267, + 0.22329457123279572, + 0.22313288278579713, + 0.22290869793891907 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.14308685064315796, + 0.19856137037277222 + ], + "perturbation_rho": [ + 0.26277071237564087, + 0.35259145498275757 + ], + "nudging": { + "0.001": [ + -0.008868614211678505, + -0.002737760543823242 + ], + "0.003": [ + -0.026448238641023636, + -0.008198779076337814 + ], + "0.01": [ + -0.08629482984542847, + -0.02716018632054329 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/synth_a0.5_L8_s42.json b/results/synth_ladder_smoke/synth_a0.5_L8_s42.json new file mode 100644 index 0000000..4100509 --- /dev/null +++ b/results/synth_ladder_smoke/synth_a0.5_L8_s42.json @@ -0,0 +1,1298 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.136691594696045, + 0.46806032037734985, + 0.4316451009750366, + 0.4347771800994873, + 0.3343221833229065, + 0.3072679266691208, + 0.2860998099684715, + 0.2768943711280823, + 0.3112841864347458, + 0.25927799339294433, + 0.3529360438346863, + 0.25663795070648193, + 0.24724824962615966, + 0.21611351084709168, + 0.18648713210821152, + 0.15988158864974975, + 0.15585354483127595, + 0.18523548917770385, + 0.22896917595863342, + 0.2142798038750887, + 0.1302151912689209, + 0.16641850475668907, + 0.12069643893241883, + 0.08900030250549316, + 0.08987545764446259, + 0.10792131569385528, + 0.16137572979927062, + 0.1006333449959755, + 0.06665127108097077, + 0.08824220795631409, + 0.08165898373126984, + 0.06826103755831718, + 0.04620580951422453, + 0.028055201417207718, + 0.02063491685986519, + 0.01727813795208931, + 0.02019768879711628, + 0.01568793712258339, + 0.012248684544116258, + 0.010092336454987525, + 0.00976453013420105, + 0.009257472205534578, + 0.008108717930689454, + 0.007677602717280388, + 0.007419238343834877, + 0.0072768413543701175, + 0.006870861586928368, + 0.006650014963746071, + 0.006521989097818732, + 0.0062547821387648585, + 0.006135749720607419, + 0.00600387082695961, + 0.005926267157122493, + 0.005855366069078445, + 0.005777022970467806, + 0.0057358153447508815, + 0.005699658918380738, + 0.005675127564370632, + 0.005658907664567232, + 0.005650237935781479 + ], + "train_acc": [ + 0.5999, + 0.8146, + 0.8325, + 0.8321, + 0.8652, + 0.8786, + 0.8874, + 0.8888, + 0.8769, + 0.8976, + 0.8648, + 0.8974, + 0.9054, + 0.9145, + 0.9254, + 0.939, + 0.9408, + 0.9272, + 0.9121, + 0.9191, + 0.9485, + 0.9388, + 0.9548, + 0.9693, + 0.9681, + 0.9608, + 0.9414, + 0.9608, + 0.9771, + 0.9692, + 0.9699, + 0.9768, + 0.9856, + 0.9942, + 0.9977, + 0.9991, + 0.9986, + 0.9993, + 1.0, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.798, + 0.828, + 0.834, + 0.828, + 0.8475, + 0.849, + 0.863, + 0.838, + 0.8405, + 0.849, + 0.8435, + 0.8605, + 0.86, + 0.8595, + 0.8585, + 0.8665, + 0.8675, + 0.869, + 0.8575, + 0.8665, + 0.8715, + 0.861, + 0.87, + 0.884, + 0.8745, + 0.878, + 0.861, + 0.875, + 0.878, + 0.8755, + 0.876, + 0.8785, + 0.882, + 0.886, + 0.8875, + 0.8875, + 0.8875, + 0.8825, + 0.882, + 0.8835, + 0.8805, + 0.883, + 0.8825, + 0.881, + 0.884, + 0.8815, + 0.882, + 0.8805, + 0.8835, + 0.8815, + 0.8825, + 0.8825, + 0.8825, + 0.8825, + 0.8825, + 0.8825, + 0.8825, + 0.8825, + 0.8825, + 0.8825 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7438379526138306, + 0.7323452234268188, + 0.723551869392395, + 0.7129155397415161, + 0.6892737746238708, + 0.6759694814682007, + 0.6671421527862549, + 0.658506453037262 + ], + "perturbation_rho": [ + 0.9999985694885254, + 0.9999985694885254, + 0.9999951720237732, + 0.9999872446060181, + 0.9999734163284302, + 0.9999377727508545, + 0.9998385310173035, + 0.9996463060379028 + ], + "nudging": { + "0.001": [ + -0.04311143979430199, + -0.025736961513757706, + -0.015766380354762077, + -0.009858880192041397, + -0.006290047895163298, + -0.0040962668135762215, + -0.0027405626606196165, + -0.001892995205707848 + ], + "0.003": [ + -0.11948808282613754, + -0.07372619211673737, + -0.04599824547767639, + -0.02906736731529236, + -0.018663030117750168, + -0.012201843783259392, + -0.008183058351278305, + -0.005660833325237036 + ], + "0.01": [ + -0.3025854229927063, + -0.20860256254673004, + -0.13888010382652283, + -0.09112250804901123, + -0.0598360076546669, + -0.039668694138526917, + -0.026830831542611122, + -0.018658190965652466 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.179273973274231, + 1.1607816802024842, + 1.0248043842315673, + 3.511209108734131, + 6.032191545772553, + 3.914867709350586, + 3.949158609008789, + 5.983486985874176, + 4.987364087677002, + 5.680050399017334, + 7.099758061218262, + 5.354408818435669, + 4.76497013092041, + 4.123531845378876, + 2.0574048504590916, + 2.323176780796051, + 2.782958260065317, + 2.5619404708862303, + 3.480497920135781, + 3.101931768798828, + 3.8787393211364747, + 4.53973305053711, + 4.699173797607422, + 3.983302816152543, + 2.5256453704833985, + 2.8716179557800294, + 6.437423288345337, + 5.216130206298828, + 3.4424527400970457, + 2.7655251071929934, + 2.3487059077380605, + 1.864477375984192, + 2.0987041217803957, + 1.88752355449982, + 1.6080115905761718, + 2.913223678588867, + 2.908343041229248, + 2.2413818557739256, + 1.606345883178711, + 1.371524071931839, + 1.3019395248413086, + 1.273482549238205, + 1.2922779474943877, + 1.0599872829437256, + 1.1355560552597046, + 1.0550661331176758, + 0.8672094687118195, + 0.8589552932739258, + 0.8731966491699219, + 0.7816802364406933, + 0.726442290687561, + 0.6984855533599853, + 0.6792838054656982, + 0.6738904183980471, + 0.6512476387023926, + 0.6394786426544189, + 0.6294556060791016, + 0.6173530825614929, + 0.6136219739913941, + 0.6067015721155331 + ], + "train_acc": [ + 0.2084, + 0.5847, + 0.674, + 0.578, + 0.6114, + 0.7162, + 0.7505, + 0.7481, + 0.7826, + 0.7953, + 0.7895, + 0.8298, + 0.8505, + 0.8621, + 0.9028, + 0.8975, + 0.8895, + 0.8946, + 0.8819, + 0.8901, + 0.8856, + 0.874, + 0.8729, + 0.8867, + 0.9077, + 0.9028, + 0.8631, + 0.8812, + 0.9016, + 0.9094, + 0.9176, + 0.9257, + 0.9212, + 0.9291, + 0.9327, + 0.9092, + 0.9081, + 0.9217, + 0.9326, + 0.9422, + 0.9406, + 0.9399, + 0.9404, + 0.9463, + 0.9438, + 0.9485, + 0.954, + 0.955, + 0.9564, + 0.9593, + 0.9616, + 0.9631, + 0.9652, + 0.9652, + 0.9654, + 0.9658, + 0.9679, + 0.9675, + 0.9688, + 0.9688 + ], + "test_acc": [ + 0.4305, + 0.643, + 0.4325, + 0.5125, + 0.6255, + 0.678, + 0.5685, + 0.73, + 0.746, + 0.693, + 0.7235, + 0.697, + 0.7775, + 0.8565, + 0.8395, + 0.8115, + 0.8285, + 0.828, + 0.8635, + 0.8115, + 0.8095, + 0.8265, + 0.831, + 0.858, + 0.8555, + 0.821, + 0.826, + 0.8525, + 0.8595, + 0.85, + 0.873, + 0.873, + 0.8635, + 0.878, + 0.851, + 0.8725, + 0.8675, + 0.876, + 0.873, + 0.8765, + 0.873, + 0.8735, + 0.877, + 0.889, + 0.879, + 0.8815, + 0.881, + 0.876, + 0.876, + 0.879, + 0.8825, + 0.882, + 0.882, + 0.8805, + 0.8835, + 0.8805, + 0.8815, + 0.8815, + 0.881, + 0.8805 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.0057187266647815704, + 0.03526674211025238, + 0.03511466830968857, + 0.043710630387067795, + 0.04474484175443649, + 0.03394380211830139, + 0.03243564814329147, + 0.022118231281638145 + ], + "perturbation_rho": [ + -0.08895743638277054, + 0.2165505439043045, + 0.14878079295158386, + 0.23983460664749146, + 0.23414158821105957, + 0.22946099936962128, + 0.044252023100852966, + 0.14246688783168793 + ], + "nudging": { + "0.001": [ + 0.01978934183716774, + -0.046600837260484695, + -0.01815088465809822, + -0.00800597295165062, + -0.003184718545526266, + -0.0009393530781380832, + -0.0004502768279053271, + -0.00020403253438416868 + ], + "0.003": [ + 0.05996423214673996, + -0.13848936557769775, + -0.05431535094976425, + -0.023991748690605164, + -0.009551258757710457, + -0.002814686391502619, + -0.0013659803662449121, + -0.0006229060236364603 + ], + "0.01": [ + 0.20587505400180817, + -0.4487733840942383, + -0.17917752265930176, + -0.0796520859003067, + -0.03180943429470062, + -0.009406229481101036, + -0.004543165676295757, + -0.0020739310421049595 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7562337284088134, + 1.257188836669922, + 1.2758575519561768, + 1.4537065887451173, + 4.792724206542969, + 16.118391802978515, + 51.218969592285156, + 48.630170703125, + 67.82239494628907, + 283.23611538085936, + 290.38378896484375, + 2590.0150890625, + 189232.429075, + 11507255.3056, + 83814626.9184, + 556083459.6864, + 1844555113.2672, + 4752015027.4048, + 9102063837.184, + 15721989154.4064, + 22484995447.1936, + 47668534312.96, + 72129013573.2224, + 96852680389.4272, + 118100167544.0128, + 164099385982.976, + 233045719357.8496, + 258927479383.6544, + 289939393295.1552, + 320891180076.2368, + 355023569656.2176, + 426034706146.9184, + 458971803235.1232, + 431989108978.4832, + 568470620287.7952, + 535395968430.8992, + 482758674140.3648, + 466598119027.5072, + 584723043083.8784, + 447152531177.472, + 457150332456.1408, + 483606448989.7984, + 493444037135.5648, + 376356872074.0352, + 351529334525.1328, + 274896416879.4112, + 218886323568.64, + 218774933078.016, + 185821763783.8848, + 164821042043.2896, + 130335844388.0448, + 133878474814.2592, + 86565364930.9696, + 76351718686.72, + 42520756237.1072, + 42705961222.144, + 20059558078.0544, + 11325599613.7472, + 4514770222.2848, + 1008829087.0272 + ], + "train_acc": [ + 0.3685, + 0.5914, + 0.6448, + 0.6722, + 0.5488, + 0.4659, + 0.3427, + 0.2972, + 0.2839, + 0.2087, + 0.1858, + 0.1589, + 0.1279, + 0.1125, + 0.1096, + 0.1005, + 0.1171, + 0.1053, + 0.1049, + 0.1081, + 0.1082, + 0.1096, + 0.1077, + 0.1075, + 0.1022, + 0.1095, + 0.1022, + 0.111, + 0.1071, + 0.1092, + 0.1054, + 0.1141, + 0.103, + 0.1071, + 0.108, + 0.1053, + 0.1096, + 0.0984, + 0.1037, + 0.1036, + 0.1063, + 0.106, + 0.1069, + 0.11, + 0.1116, + 0.1099, + 0.1091, + 0.1007, + 0.109, + 0.1116, + 0.1059, + 0.1058, + 0.1044, + 0.1083, + 0.1069, + 0.1109, + 0.1098, + 0.1108, + 0.112, + 0.1261 + ], + "test_acc": [ + 0.565, + 0.5825, + 0.65, + 0.5875, + 0.371, + 0.344, + 0.3245, + 0.321, + 0.2305, + 0.2225, + 0.147, + 0.1465, + 0.0775, + 0.116, + 0.099, + 0.092, + 0.1165, + 0.096, + 0.0785, + 0.086, + 0.114, + 0.1155, + 0.0995, + 0.085, + 0.107, + 0.1245, + 0.107, + 0.113, + 0.1135, + 0.131, + 0.113, + 0.1115, + 0.082, + 0.0955, + 0.1185, + 0.12, + 0.11, + 0.075, + 0.0715, + 0.1145, + 0.0785, + 0.1215, + 0.0925, + 0.0995, + 0.056, + 0.1145, + 0.116, + 0.126, + 0.092, + 0.1085, + 0.1115, + 0.1025, + 0.1165, + 0.12, + 0.109, + 0.1105, + 0.114, + 0.1085, + 0.107, + 0.1155 + ], + "state_pred_error": [ + 0.6633167713165283, + 0.26668925323486325, + 0.26785421018600464, + 0.34208936038017274, + 0.5517430818557739, + 0.6263181097984314, + 0.706014741897583, + 0.7488139172554016, + 0.8344351757049561, + 0.8824913305282592, + 0.9566375088691711, + 0.9905429431915284, + 0.9992951532363892, + 0.9999922995567322, + 0.9999997146606445, + 1.0000000045776367, + 0.9999999969482422, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.30725735425949097, + 0.12316203862428665, + -0.0629364550113678, + 0.007313757669180632, + -0.009149492718279362, + -0.008323092944920063, + -0.006843051873147488, + 0.005654708482325077 + ], + "perturbation_rho": [ + -0.0015011467039585114, + 0.0004240265116095543, + 0.0019385055638849735, + 0.0008086063899099827, + -0.11120367795228958, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + -2189696.0, + -217512.0, + 46920.0, + 6430.0, + -564.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + -6324534.0, + -344800.0, + -455572.0, + 78020.0, + -1050.0, + 0.0, + 0.0, + 0.0 + ], + "0.01": [ + -20625168.0, + -717604.0, + -58672.0, + 134824.0, + 16604.0, + -6.0, + 0.0, + 0.0 + ] + }, + "state_pred_error_per_layer": [ + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29, + 1.2424051312422632e+29 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.180813762664795, + 1.15851598777771, + 0.9752382919311523, + 4.310234674072266, + 5.409528110504151, + 4.571157476806641, + 5.59428627319336, + 4.906880990600586, + 7.153588356018067, + 6.169279209899902, + 3.151282291030884, + 3.04000318069458, + 6.902088081359863, + 17.079356958007814, + 434.114821875, + 4274.5153546875, + 173495.374425, + 4126869.5424, + 45074575.5072, + 302295021.6704, + 1100553773.8752, + 3910569343.3856, + 9480743307.6736, + 16287986919.0144, + 29592091230.208, + 51855394812.7232, + 83006749854.9248, + 96506064981.1968, + 116092555807.9488, + 171146794840.8832, + 207085592064.8192, + 233484588574.3104, + 283273713837.6704, + 237359135195.136, + 259830706549.5552, + 291922276725.5552, + 370882607054.848, + 375864110035.7632, + 391053997349.2736, + 312687643538.2272, + 361586948204.1344, + 234246995286.4256, + 305559670934.7328, + 253578320569.9584, + 266700764951.3472, + 217946732442.4192, + 196479827797.6064, + 155095557891.6864, + 144038231710.1056, + 122997998983.5776, + 80291857511.2192, + 68673229920.6656, + 65797288237.4656, + 40392089901.4656, + 38889432743.936, + 24285740983.9104, + 15643154428.7232, + 7760484663.296, + 3768164856.6272, + 1482127218.2784 + ], + "train_acc": [ + 0.207, + 0.5837, + 0.6796, + 0.5624, + 0.626, + 0.7089, + 0.7231, + 0.7772, + 0.7578, + 0.7978, + 0.8542, + 0.8601, + 0.788, + 0.7148, + 0.4485, + 0.2829, + 0.1504, + 0.1176, + 0.108, + 0.1062, + 0.1079, + 0.1019, + 0.105, + 0.1026, + 0.105, + 0.1077, + 0.1098, + 0.1012, + 0.1017, + 0.1066, + 0.0997, + 0.1023, + 0.1045, + 0.0995, + 0.1, + 0.1057, + 0.1021, + 0.1046, + 0.1054, + 0.1032, + 0.1046, + 0.1034, + 0.1026, + 0.1062, + 0.1054, + 0.1081, + 0.1028, + 0.1015, + 0.1012, + 0.1019, + 0.1052, + 0.1001, + 0.1075, + 0.1084, + 0.1051, + 0.1085, + 0.1046, + 0.1054, + 0.0986, + 0.1106 + ], + "test_acc": [ + 0.434, + 0.6285, + 0.5345, + 0.3995, + 0.493, + 0.59, + 0.644, + 0.6435, + 0.6805, + 0.7895, + 0.8255, + 0.732, + 0.7095, + 0.532, + 0.216, + 0.193, + 0.1255, + 0.134, + 0.128, + 0.1135, + 0.103, + 0.1005, + 0.1055, + 0.113, + 0.107, + 0.1055, + 0.0975, + 0.109, + 0.1115, + 0.086, + 0.1005, + 0.1045, + 0.1045, + 0.1205, + 0.1045, + 0.117, + 0.074, + 0.11, + 0.09, + 0.0975, + 0.112, + 0.117, + 0.116, + 0.1095, + 0.1225, + 0.0945, + 0.103, + 0.0975, + 0.071, + 0.103, + 0.08, + 0.098, + 0.1, + 0.123, + 0.1145, + 0.0905, + 0.0995, + 0.1105, + 0.0855, + 0.1095 + ], + "value_loss": [ + 2.9669607288360598, + 1.0902458826065065, + 2.4584463294982912, + 73.88889157714844, + 108.27681814575195, + 115.91943471679687, + 184.67528198242186, + 185.08425294189453, + 366.67125908203127, + 319.5852258789063, + 108.21394526367187, + 110.3386819946289, + 347.8569515869141, + 1525.27198203125, + 856406.213575, + 47010726.9056, + 133654556568.7808, + 66485560641008.44, + 5601329709154566.0, + 2.5619643797350563e+17, + 2.6437525286434504e+18, + 3.759435327830707e+19, + 2.0967746443938254e+20, + 5.8249832460428005e+20, + 1.900429415713445e+21, + 5.965233893645854e+21, + 1.5141398248046291e+22, + 2.0838459753445628e+22, + 3.0155778903345744e+22, + 6.534392113196693e+22, + 9.49085397644098e+22, + 1.213205072102303e+23, + 1.7861691251715246e+23, + 1.2310981571846513e+23, + 1.5074213926386971e+23, + 1.8590761851447484e+23, + 3.03252706604308e+23, + 2.9249324086900395e+23, + 3.357804742753062e+23, + 2.1885845744735628e+23, + 2.9055369486406765e+23, + 1.2206187316440685e+23, + 2.033396564696724e+23, + 1.3890040725471885e+23, + 1.5181943868702285e+23, + 1.0498341258536981e+23, + 8.700237478106012e+22, + 5.5888224113303126e+22, + 4.543935391813068e+22, + 3.3037088316902575e+22, + 1.3904496443146646e+22, + 9.820491629311279e+21, + 9.319735665267294e+21, + 3.4896288732690126e+21, + 3.242478367096937e+21, + 1.2534107606733638e+21, + 5.020361207667576e+20, + 1.2250652965564804e+20, + 2.762850564012813e+19, + 1.0739092229740712e+19 + ], + "term_loss": [ + 1.7164982944488525, + 0.8336014386177063, + 2.2766597854614257, + 73.54188282470703, + 107.95569302368165, + 115.66435822753907, + 184.40134716796874, + 184.7544172607422, + 366.257100390625, + 319.2935396972656, + 107.97936694335938, + 109.77867339172363, + 344.50278088378906, + 1497.03217421875, + 850602.74975, + 45127585.504, + 133558798774.272, + 66483576837557.45, + 5601311970080640.0, + 2.5619634165628704e+17, + 2.643752139856139e+18, + 3.759435259924869e+19, + 2.0967746386235884e+20, + 5.8249832322505264e+20, + 1.900429415713445e+21, + 5.965233893645854e+21, + 1.5141398248046291e+22, + 2.0838459753445628e+22, + 3.0155778903345744e+22, + 6.534392111755541e+22, + 9.49085397644098e+22, + 1.213205072102303e+23, + 1.786169119983378e+23, + 1.2310981249028493e+23, + 1.507421335857313e+23, + 1.859076049964702e+23, + 3.032526846411533e+23, + 2.9249321106598305e+23, + 3.357804382465092e+23, + 2.1885840778526248e+23, + 2.9055362533569517e+23, + 1.2206178266006874e+23, + 2.0333954119193347e+23, + 1.3890026196499199e+23, + 1.518192558336722e+23, + 1.0498318148225422e+23, + 8.700208820170359e+22, + 5.58878513881922e+22, + 4.543886667909131e+22, + 3.303644348790505e+22, + 1.3903648404528173e+22, + 9.81934621260509e+21, + 9.318203673079891e+21, + 3.487588749168033e+21, + 3.2397836163048517e+21, + 1.2498825943945005e+21, + 4.9747612976701296e+20, + 1.1696705443212127e+20, + 2.209300562524519e+19, + 5.965625762330856e+18 + ], + "bridge_loss": [ + 0.9642023840372916, + 0.05619153835773468, + 0.005403100261092186, + 0.058217010986804964, + 0.05494740681946278, + 0.042279357314109804, + 0.0697695098221302, + 0.162632954120636, + 0.23094681215286256, + 0.13801171278953553, + 0.12224743638038635, + 0.452451789855957, + 3.1901706958770752, + 28.013733642578124, + 5803.01872421875, + 1883141.245, + 95755957.4144, + 1983570290.2784, + 17710332162.8672, + 96817318513.8688, + 390040245397.0944, + 1279194057775.5137, + 3592114526591.3857, + 9084595204626.842, + 20649508923978.547, + 43515842118916.51, + 86588981919927.5, + 168821964468020.84, + 315478200580833.25, + 569613611072435.0, + 998514458413026.5, + 1685223969845254.5, + 2790164946525513.5, + 4566915636675163.0, + 7302383131868057.0, + 1.1539139114325718e+16, + 1.792385532122649e+16, + 2.6165467718487532e+16, + 3.703484551294238e+16, + 5.036573563672792e+16, + 6.666833228308184e+16, + 8.993736963563118e+16, + 1.160181461275235e+17, + 1.4629456896849453e+17, + 1.839375407288156e+17, + 2.3162479642745126e+17, + 2.8634254129500176e+17, + 3.724947283800484e+17, + 4.8719852038305664e+17, + 6.446355790276814e+17, + 8.479242257230209e+17, + 1.1453916665696928e+18, + 1.5320334050146908e+18, + 2.0400817170051474e+18, + 2.694757338137747e+18, + 3.5281727448711936e+18, + 4.559988939699667e+18, + 5.539475408244719e+18, + 5.535499985855834e+18, + 4.773466424748804e+18 + ], + "tgrad_loss": [ + 0.2862600553512573, + 0.20045291225910186, + 0.1763834413051605, + 0.28879174451828005, + 0.26617846899032593, + 0.21279841418266296, + 0.20416503925323487, + 0.1672018569469452, + 0.18320466527938842, + 0.15367574200630188, + 0.11233035919070244, + 0.10755652726888656, + 0.16400148527622224, + 0.22606448984146119, + 0.44932379856109617, + 0.6031550155639649, + 0.7285950341224671, + 0.7613764246940613, + 0.7669176729202271, + 0.7755544228553772, + 0.761812369441986, + 0.7759272521972657, + 0.7649501113891601, + 0.7714386423110962, + 0.7607672102928161, + 0.7632091217041016, + 0.7585373802185058, + 0.7713048749923707, + 0.7605478080749511, + 0.7533323201179505, + 0.7780433281898499, + 0.7613308283805847, + 0.7529919390678406, + 0.7724364114761353, + 0.7689524433135987, + 0.7545342383384704, + 0.7692763340950012, + 0.7591918215751648, + 0.7541144882202149, + 0.7748589099884033, + 0.7660150268554687, + 0.7596425477027893, + 0.7580499425888062, + 0.7523354890823364, + 0.7643221777915955, + 0.7510903036117553, + 0.7648061880111694, + 0.7583307800292969, + 0.7644666131973267, + 0.7654717210769654, + 0.7569819689750671, + 0.7661532715797424, + 0.7553690487861633, + 0.7546149060249329, + 0.7635059030532837, + 0.7580290970802307, + 0.7618262603759766, + 0.7523887557983399, + 0.7711429117202758, + 0.753796951675415 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.04903252795338631, + 0.20776475965976715, + 0.12520574033260345, + -0.2015925794839859, + -0.03666269779205322, + 0.005083487834781408, + 0.13890880346298218, + 0.012853549793362617 + ], + "perturbation_rho": [ + 0.011465835385024548, + 0.00849771499633789, + 0.0009214465972036123, + -0.005531121976673603, + 0.07564837485551834, + 0.0, + 0.0, + 0.0 + ], + "nudging": { + "0.001": [ + 708984.0, + -55272.0, + -159328.0, + 5952.0, + 11760.0, + 0.0, + 0.0, + 0.0 + ], + "0.003": [ + 1608888.0, + -316624.0, + 189376.0, + 38104.0, + 40760.0, + -16.0, + 0.0, + 0.0 + ], + "0.01": [ + 10792360.0, + -1553496.0, + -27560.0, + -69368.0, + 49144.0, + -96.0, + 0.0, + 0.0 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/synth_a1.0_L2_s42.json b/results/synth_ladder_smoke/synth_a1.0_L2_s42.json new file mode 100644 index 0000000..8777ebc --- /dev/null +++ b/results/synth_ladder_smoke/synth_a1.0_L2_s42.json @@ -0,0 +1,1172 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.9491056894302368, + 1.1529242127418518, + 0.7467040473937988, + 0.5807420476913452, + 0.5123631197452545, + 0.4696790289878845, + 0.4497463710784912, + 0.429621799659729, + 0.41180882892608645, + 0.396394921875, + 0.38590312049388886, + 0.3658535495758057, + 0.36799508414268495, + 0.3456149130344391, + 0.33443590273857116, + 0.3238851601600647, + 0.31360859479904174, + 0.3038917881965637, + 0.2932293901443481, + 0.2798507716178894, + 0.2779016891479492, + 0.2641272247314453, + 0.25414685287475586, + 0.24580603408813476, + 0.23633735848665238, + 0.22347580795288086, + 0.2150943549990654, + 0.20704293329715728, + 0.20073787801265716, + 0.1922430892944336, + 0.18689737136363982, + 0.1811553675174713, + 0.174488536298275, + 0.1676148865222931, + 0.16302786118984222, + 0.1570287989139557, + 0.15195925567150115, + 0.14744717358350753, + 0.14354275007247924, + 0.14035524681806563, + 0.13632459359169005, + 0.1334148339509964, + 0.13127109580039978, + 0.12843341019153595, + 0.1255687529563904, + 0.12336780984401703, + 0.12139199416637421, + 0.11968175506591797, + 0.11819040449261665, + 0.11690922620296479, + 0.11574092161655426, + 0.11482840909957885, + 0.11413576412200928, + 0.1134418436050415, + 0.1129186130464077, + 0.11250319490432739, + 0.1122022265791893, + 0.11199904860854148, + 0.11187557553052903, + 0.11180531568527222 + ], + "train_acc": [ + 0.326, + 0.666, + 0.7775, + 0.8124, + 0.821, + 0.8339, + 0.8331, + 0.8403, + 0.8466, + 0.8518, + 0.8559, + 0.8653, + 0.8621, + 0.8726, + 0.8746, + 0.8799, + 0.8862, + 0.8891, + 0.893, + 0.9011, + 0.8995, + 0.908, + 0.9113, + 0.9184, + 0.9233, + 0.9295, + 0.9343, + 0.9367, + 0.9398, + 0.9434, + 0.9464, + 0.9497, + 0.9517, + 0.9563, + 0.96, + 0.9629, + 0.9651, + 0.9678, + 0.9685, + 0.9692, + 0.9726, + 0.9736, + 0.9744, + 0.9749, + 0.9766, + 0.9774, + 0.9796, + 0.9799, + 0.9802, + 0.9808, + 0.9817, + 0.982, + 0.9828, + 0.9832, + 0.9835, + 0.9837, + 0.9838, + 0.9838, + 0.9839, + 0.9839 + ], + "test_acc": [ + 0.551, + 0.7215, + 0.769, + 0.787, + 0.78, + 0.7825, + 0.779, + 0.7875, + 0.783, + 0.783, + 0.7885, + 0.791, + 0.7845, + 0.789, + 0.7875, + 0.7875, + 0.7905, + 0.783, + 0.78, + 0.79, + 0.785, + 0.7895, + 0.785, + 0.7875, + 0.783, + 0.789, + 0.794, + 0.793, + 0.795, + 0.792, + 0.788, + 0.7875, + 0.788, + 0.7905, + 0.79, + 0.7925, + 0.7915, + 0.791, + 0.791, + 0.791, + 0.791, + 0.792, + 0.793, + 0.7915, + 0.7935, + 0.7905, + 0.7925, + 0.792, + 0.7925, + 0.792, + 0.7915, + 0.7915, + 0.791, + 0.791, + 0.791, + 0.791, + 0.7905, + 0.79, + 0.79, + 0.79 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.977530300617218, + 0.9661709666252136 + ], + "perturbation_rho": [ + 0.9999992847442627, + 0.9999983906745911 + ], + "nudging": { + "0.001": [ + -0.039579540491104126, + -0.02185475453734398 + ], + "0.003": [ + -0.11397463828325272, + -0.0641411542892456 + ], + "0.01": [ + -0.3279687762260437, + -0.1977623850107193 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2824316204071047, + 1.8118354099273681, + 1.310678900718689, + 0.9875048950195312, + 0.802082624912262, + 0.6931869449615479, + 0.6263151250839233, + 0.583215159034729, + 0.5534961759567261, + 0.5339154810905457, + 0.524110235452652, + 0.516173376083374, + 0.5156016312360764, + 0.512758362197876, + 0.5118656126976013, + 0.5098454748153687, + 0.515489036655426, + 0.516552147102356, + 0.525282747721672, + 0.5107382669448852, + 0.5240657005310059, + 0.5196773475646973, + 0.5238636440277099, + 0.5113746579170227, + 0.5147426022052765, + 0.5082735379695892, + 0.5030142297744751, + 0.5007089898109436, + 0.5198602245807648, + 0.5054092597007751, + 0.5186554452896118, + 0.5035870767593383, + 0.5099767215251922, + 0.5068207990646363, + 0.5057487522125245, + 0.49573901596069336, + 0.49725718212127684, + 0.4981450731754303, + 0.5011708973884582, + 0.5046835836648941, + 0.4929028748512268, + 0.48766262950897216, + 0.48986145362854006, + 0.4863999965190887, + 0.4881520263671875, + 0.48129477083683014, + 0.47820149402618406, + 0.4828622418403625, + 0.47945194401741026, + 0.4764244254112244, + 0.47533812894821165, + 0.47597204813957217, + 0.47481061878204345, + 0.4737321941375732, + 0.4729536075592041, + 0.4717037543296814, + 0.47100696840286255, + 0.4707401922225952, + 0.4704310829162598, + 0.4702408764839172 + ], + "train_acc": [ + 0.1625, + 0.4015, + 0.5907, + 0.6668, + 0.7135, + 0.7441, + 0.762, + 0.7733, + 0.7858, + 0.7916, + 0.7968, + 0.7993, + 0.7998, + 0.8007, + 0.8051, + 0.8059, + 0.8025, + 0.7994, + 0.7962, + 0.8008, + 0.7975, + 0.7985, + 0.8012, + 0.8033, + 0.8026, + 0.8027, + 0.808, + 0.8064, + 0.7975, + 0.8053, + 0.8016, + 0.8046, + 0.807, + 0.8064, + 0.803, + 0.8084, + 0.8055, + 0.8085, + 0.805, + 0.8026, + 0.8094, + 0.811, + 0.8096, + 0.812, + 0.8104, + 0.8128, + 0.8129, + 0.8123, + 0.8132, + 0.8161, + 0.8158, + 0.8152, + 0.8148, + 0.8167, + 0.815, + 0.8162, + 0.8169, + 0.8174, + 0.8167, + 0.8173 + ], + "test_acc": [ + 0.263, + 0.5155, + 0.606, + 0.6685, + 0.7025, + 0.716, + 0.736, + 0.745, + 0.742, + 0.7485, + 0.749, + 0.753, + 0.7545, + 0.7515, + 0.7505, + 0.7475, + 0.745, + 0.749, + 0.7515, + 0.7355, + 0.744, + 0.753, + 0.746, + 0.7395, + 0.75, + 0.7485, + 0.757, + 0.747, + 0.7465, + 0.7305, + 0.746, + 0.755, + 0.755, + 0.7435, + 0.752, + 0.748, + 0.7455, + 0.7385, + 0.7475, + 0.7485, + 0.7525, + 0.7575, + 0.7535, + 0.751, + 0.758, + 0.752, + 0.7515, + 0.7515, + 0.758, + 0.7545, + 0.7605, + 0.758, + 0.755, + 0.7565, + 0.7585, + 0.757, + 0.7575, + 0.755, + 0.7585, + 0.7575 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.0018995754653587937, + 0.07222741842269897 + ], + "perturbation_rho": [ + -0.03529410809278488, + 0.03507092595100403 + ], + "nudging": { + "0.001": [ + -1.5221663488773629e-05, + -0.0004911277210339904 + ], + "0.003": [ + -1.3497992767952383e-05, + -0.0014723683707416058 + ], + "0.01": [ + 0.00033701310167089105, + -0.004891358315944672 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.1366306617736814, + 1.3788719619750978, + 0.8893764835357666, + 0.6547704791069031, + 0.5521520162582397, + 0.5176527221679688, + 0.5091254537582397, + 0.509008034992218, + 0.5123045497894287, + 0.5199989007949829, + 0.524878611278534, + 0.5291456949710845, + 0.536843958902359, + 0.5352446517944336, + 0.5378374597549439, + 0.5358052321434021, + 0.536317100429535, + 0.5289794270515442, + 0.5393810579776764, + 0.5359365615844727, + 0.5326271821022034, + 0.5334983486175537, + 0.5313910109758377, + 0.5330386216163635, + 0.5434488729476928, + 0.5396566688537597, + 0.5416565005540848, + 0.5412564635276794, + 0.5482967029571533, + 0.5540884985685348, + 0.5473237035751343, + 0.553294009923935, + 0.5513850021362304, + 0.5501684650421143, + 0.5599284547805786, + 0.5542884324073791, + 0.5526859965801239, + 0.54858907122612, + 0.5504395879745484, + 0.5546976717948914, + 0.5577109105110168, + 0.5555753686904907, + 0.5482306803703308, + 0.5521730173110961, + 0.5481728059768677, + 0.5459907444953919, + 0.5481118337631226, + 0.5456091236114502, + 0.5448256337881088, + 0.5454645185470581, + 0.5465922353744507, + 0.544160694026947, + 0.5431355364322662, + 0.5428927242279052, + 0.5422361792087554, + 0.5417640048980713, + 0.5416455334186554, + 0.5414225485801697, + 0.5411964197158814, + 0.5410834015846252 + ], + "train_acc": [ + 0.2285, + 0.547, + 0.7045, + 0.7719, + 0.7951, + 0.798, + 0.8014, + 0.8034, + 0.803, + 0.8021, + 0.8031, + 0.8011, + 0.7966, + 0.7982, + 0.7993, + 0.7976, + 0.798, + 0.8008, + 0.792, + 0.7937, + 0.7942, + 0.7963, + 0.7974, + 0.7912, + 0.7917, + 0.7929, + 0.794, + 0.7919, + 0.791, + 0.788, + 0.7909, + 0.7873, + 0.7846, + 0.7889, + 0.7863, + 0.786, + 0.7913, + 0.7893, + 0.789, + 0.7833, + 0.7849, + 0.786, + 0.7893, + 0.7867, + 0.7892, + 0.7901, + 0.7889, + 0.7912, + 0.7906, + 0.7891, + 0.7891, + 0.7905, + 0.7923, + 0.7905, + 0.7909, + 0.7922, + 0.7908, + 0.7905, + 0.791, + 0.7913 + ], + "test_acc": [ + 0.4125, + 0.6255, + 0.7095, + 0.7555, + 0.7665, + 0.7585, + 0.758, + 0.754, + 0.7575, + 0.751, + 0.748, + 0.7475, + 0.7495, + 0.7485, + 0.745, + 0.7415, + 0.7455, + 0.743, + 0.749, + 0.746, + 0.74, + 0.733, + 0.7365, + 0.7395, + 0.743, + 0.7285, + 0.739, + 0.7225, + 0.7335, + 0.7385, + 0.7345, + 0.734, + 0.7215, + 0.734, + 0.7305, + 0.7265, + 0.7275, + 0.728, + 0.732, + 0.7235, + 0.7245, + 0.7265, + 0.7305, + 0.7295, + 0.729, + 0.727, + 0.728, + 0.7275, + 0.724, + 0.727, + 0.725, + 0.729, + 0.727, + 0.7305, + 0.7325, + 0.7325, + 0.7315, + 0.7315, + 0.7315, + 0.7315 + ], + "state_pred_error": [ + 0.8065836928367615, + 0.39146546201705934, + 0.23437868328094483, + 0.18158424789905547, + 0.1659492648601532, + 0.165374738740921, + 0.16782979707717896, + 0.16855716466903686, + 0.16732614138126373, + 0.16346708936691284, + 0.15476743512153626, + 0.1457847490310669, + 0.13143579788208007, + 0.12530215060710906, + 0.11034695791006088, + 0.102148695230484, + 0.09918132054805756, + 0.09876347059011459, + 0.09330155829191208, + 0.08962574129104614, + 0.08644098112583161, + 0.08444308232069016, + 0.08924337093830109, + 0.08370417824983596, + 0.08257257657051087, + 0.0830527756690979, + 0.07959871637821198, + 0.08018354167938233, + 0.07715057510137557, + 0.07508554146289825, + 0.07615803725719451, + 0.07278824622035027, + 0.07192154746055603, + 0.07228410756587982, + 0.06885680447816848, + 0.06863646980524063, + 0.0701085786998272, + 0.06621884278059005, + 0.06437455928325653, + 0.06294822212457657, + 0.06241208130121231, + 0.0603535782456398, + 0.06039485886096954, + 0.058678721296787265, + 0.0627734629034996, + 0.05633028925061226, + 0.054364062464237216, + 0.05458668622970581, + 0.057001876127719876, + 0.05133199627399444, + 0.05066398676633835, + 0.05105280518531799, + 0.048901369220018386, + 0.04867930979728699, + 0.04660500448346138, + 0.04554321520328522, + 0.04535353593826294, + 0.04524428225755692, + 0.04350994995832443, + 0.042987993323802945 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7724592089653015, + 0.47611531615257263 + ], + "perturbation_rho": [ + 0.7083259224891663, + 0.4451542794704437 + ], + "nudging": { + "0.001": [ + -0.02335088513791561, + -0.0042803636752069 + ], + "0.003": [ + -0.06857505440711975, + -0.012793581001460552 + ], + "0.01": [ + -0.2117496132850647, + -0.04209146648645401 + ] + }, + "state_pred_error_per_layer": [ + 2210.423828125, + 264.2466125488281 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.280885036087036, + 1.8083742904663085, + 1.3096392322540282, + 0.9843997146606446, + 0.8018227068901062, + 0.6911002159118652, + 0.6208388906478882, + 0.5762016658782959, + 0.5495558090209961, + 0.5351255585193634, + 0.521960182762146, + 0.5177917494773865, + 0.5170808288574219, + 0.5229834615707397, + 0.5378183418750763, + 0.543828378534317, + 0.5555255395889283, + 0.5777033507347107, + 0.6048572025299073, + 0.6596059831619263, + 0.7269416851043701, + 0.7936675106048584, + 0.8489301277160645, + 0.894895606803894, + 0.9307584834098815, + 0.9389586345672607, + 0.9596725919723511, + 0.9730803798675537, + 0.97893427734375, + 0.993195873451233, + 1.0001418331146241, + 1.01285452003479, + 1.0197131780624389, + 1.034778191757202, + 1.041685494327545, + 1.0485894695281983, + 1.0534755035400392, + 1.05557954082489, + 1.0589550355911255, + 1.062454942703247, + 1.0662316680908204, + 1.0691890292644501, + 1.0679836296081544, + 1.0683391422271729, + 1.0701301013946534, + 1.0684261167526246, + 1.0693684279441833, + 1.0679564714431762, + 1.067317788696289, + 1.065644224357605, + 1.065113991165161, + 1.0640747312545777, + 1.062864318561554, + 1.0622759931564332, + 1.0614560607910157, + 1.0607545525550843, + 1.060345379447937, + 1.0600630114555358, + 1.059776364517212, + 1.0596500343322754 + ], + "train_acc": [ + 0.1626, + 0.4032, + 0.5948, + 0.6697, + 0.7145, + 0.7427, + 0.7638, + 0.779, + 0.7901, + 0.792, + 0.7958, + 0.7973, + 0.8003, + 0.7995, + 0.7923, + 0.793, + 0.7887, + 0.7841, + 0.7708, + 0.7467, + 0.7295, + 0.7074, + 0.6889, + 0.6705, + 0.6583, + 0.6541, + 0.6508, + 0.6462, + 0.6401, + 0.6374, + 0.6371, + 0.6305, + 0.6305, + 0.63, + 0.6271, + 0.6214, + 0.6242, + 0.6219, + 0.6193, + 0.6164, + 0.6166, + 0.6165, + 0.6156, + 0.6143, + 0.6187, + 0.6177, + 0.6181, + 0.6173, + 0.6175, + 0.6185, + 0.6185, + 0.6182, + 0.6184, + 0.6195, + 0.6181, + 0.6183, + 0.6172, + 0.6177, + 0.6175, + 0.6176 + ], + "test_acc": [ + 0.2655, + 0.5115, + 0.607, + 0.665, + 0.699, + 0.721, + 0.735, + 0.744, + 0.7445, + 0.7495, + 0.746, + 0.7435, + 0.7545, + 0.752, + 0.7465, + 0.744, + 0.731, + 0.719, + 0.711, + 0.6885, + 0.6685, + 0.6455, + 0.627, + 0.6115, + 0.608, + 0.6, + 0.5865, + 0.587, + 0.5895, + 0.5815, + 0.5805, + 0.5765, + 0.576, + 0.57, + 0.568, + 0.562, + 0.5625, + 0.5615, + 0.5595, + 0.56, + 0.563, + 0.56, + 0.5585, + 0.5575, + 0.556, + 0.5515, + 0.5555, + 0.559, + 0.5595, + 0.5565, + 0.558, + 0.5565, + 0.558, + 0.5545, + 0.556, + 0.556, + 0.5555, + 0.5555, + 0.556, + 0.556 + ], + "value_loss": [ + 2.9421537250518797, + 0.7975870166778565, + 0.6290085078239441, + 0.6890224185943603, + 0.7243394228935242, + 0.7203487901687622, + 0.6851132621765137, + 0.6520533827781677, + 0.6242853847503662, + 0.5676819869995117, + 0.5082380643844604, + 0.46420030603408813, + 0.4317733027458191, + 0.4148032331466675, + 0.42368859605789183, + 0.41361817846298216, + 0.404498645734787, + 0.42820386209487915, + 0.4646932671546936, + 0.49615267877578734, + 0.5365245307922363, + 0.60305582447052, + 0.6144193868637084, + 0.6435288933753968, + 0.6711149896621704, + 0.6648149871826172, + 0.6623215785980224, + 0.6906130850791932, + 0.6547210404396057, + 0.6582367699623108, + 0.6525213989257812, + 0.636179097366333, + 0.6109009315490722, + 0.6143948897361755, + 0.5951230112075806, + 0.5812291944503785, + 0.5685462500572205, + 0.5358655210494995, + 0.5175749897480011, + 0.4981157001018524, + 0.491326168346405, + 0.46913531432151795, + 0.45610346326828005, + 0.4415822687149048, + 0.43499350595474245, + 0.41386851291656496, + 0.39472350492477415, + 0.38443425817489624, + 0.37052898192405703, + 0.3712545476913452, + 0.34303374967575073, + 0.3286073633670807, + 0.3148073835849762, + 0.3157298050403595, + 0.2915987443447113, + 0.29081232733726503, + 0.26972808542251586, + 0.2690109848499298, + 0.25245738320350647, + 0.24172186150550842 + ], + "term_loss": [ + 1.6904042894363402, + 0.2855438080787659, + 0.29688326778411867, + 0.3748186621665955, + 0.41050878925323486, + 0.409766743850708, + 0.37635576343536375, + 0.34139811835289, + 0.311102571105957, + 0.2642718635082245, + 0.2312528870344162, + 0.19706957862377167, + 0.16916403424739837, + 0.15267400243282317, + 0.15790578067302705, + 0.1481425419330597, + 0.13407545802593232, + 0.1449426043510437, + 0.156369549536705, + 0.1508458754479885, + 0.1561945830821991, + 0.1846889454483986, + 0.16443501464128493, + 0.17366822769641876, + 0.18008243708610536, + 0.1709399109840393, + 0.15955905029773712, + 0.17902734649181365, + 0.14751170055866242, + 0.1511731291770935, + 0.1535642296075821, + 0.1460076296210289, + 0.1346515518426895, + 0.1449428592443466, + 0.1370476897954941, + 0.13113817830085756, + 0.1311385383963585, + 0.11210595957040786, + 0.10532034933567047, + 0.09617096209526062, + 0.10268295025229454, + 0.09031319347620011, + 0.08960143175125122, + 0.08745422222614288, + 0.09128843301534653, + 0.0811536382317543, + 0.07390678917169571, + 0.07607333833873271, + 0.0751576281785965, + 0.08278024282455444, + 0.07106895277500153, + 0.06941268212795258, + 0.07024301192462444, + 0.0796181839466095, + 0.06771385662257672, + 0.0745224772721529, + 0.06610622253417969, + 0.07373185048103333, + 0.06927853472232819, + 0.06502777924537659 + ], + "bridge_loss": [ + 0.9286653239635634, + 0.17183133554458618, + 0.03998481778204441, + 0.01001567878574133, + 0.009969949465990066, + 0.015016184416413307, + 0.024849868083000184, + 0.03629762133359909, + 0.04424135708212853, + 0.03887685165405273, + 0.02251410899758339, + 0.019279291635751723, + 0.02122289401292801, + 0.024350534307956695, + 0.026771693634986878, + 0.029644794487953187, + 0.03368165337443352, + 0.04201666583120823, + 0.05519947910308838, + 0.0729088222026825, + 0.08839097814559936, + 0.1063108127295971, + 0.12425719275474548, + 0.13326186714172364, + 0.14929705357551576, + 0.1520007657766342, + 0.15773920249938964, + 0.1658132124185562, + 0.16225691890716554, + 0.16371301856040954, + 0.15795323207378387, + 0.14942308008670807, + 0.1378128324508667, + 0.13277515301704407, + 0.1221957174539566, + 0.11507334886789322, + 0.10920816420316697, + 0.099838148355484, + 0.09326583639383317, + 0.08822717505693435, + 0.08127219996452331, + 0.07723046572208404, + 0.07338595504760742, + 0.0678777373790741, + 0.06394213989078999, + 0.06211670498847961, + 0.05893324030339718, + 0.05608555132746697, + 0.05505429896116257, + 0.05282158476114273, + 0.051606026875972745, + 0.04767316770553589, + 0.0467881379365921, + 0.04444693030118942, + 0.0429530450463295, + 0.04317285764813423, + 0.043168327283859255, + 0.03980205556154251, + 0.040649286246299744, + 0.03994156485795975 + ], + "tgrad_loss": [ + 0.32308411664962766, + 0.34021187663078306, + 0.29214042167663573, + 0.3041880838871002, + 0.3038606840133667, + 0.29556585988998413, + 0.28390763030052185, + 0.2743576454162598, + 0.2689414535522461, + 0.2645332676410675, + 0.2544710647583008, + 0.2478514326095581, + 0.24138637371063232, + 0.23777869787216185, + 0.23901112205982208, + 0.2358308396577835, + 0.2367415349960327, + 0.24124458963871, + 0.25312424030303954, + 0.2723979799747467, + 0.29193896837234495, + 0.31205606231689453, + 0.3257271741390228, + 0.33659879665374753, + 0.341735502576828, + 0.34187430839538574, + 0.34502332849502565, + 0.3457725248575211, + 0.3449524227142334, + 0.3433506235599518, + 0.3410039307594299, + 0.3407483920574188, + 0.33843654861450195, + 0.3366768836021423, + 0.3358796048641205, + 0.33501766514778136, + 0.3281995443820953, + 0.3239214171409607, + 0.3189888015270233, + 0.3137175616264343, + 0.3073710187911987, + 0.3015916561603546, + 0.2931160747528076, + 0.2862503114700317, + 0.2797629333496094, + 0.2705981719493866, + 0.2618834746837616, + 0.25227536766529085, + 0.2403170545101166, + 0.23565271859169007, + 0.22035877032279969, + 0.21152150876522063, + 0.19777623581886292, + 0.19166468963623046, + 0.18093183915615083, + 0.17311699080467224, + 0.16045353627204895, + 0.1554770776748657, + 0.1425295654296875, + 0.13675251703262328 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.14650292694568634, + 0.22681139409542084 + ], + "perturbation_rho": [ + 0.22659505903720856, + 0.3084385395050049 + ], + "nudging": { + "0.001": [ + -0.0063989125192165375, + -0.0031138062477111816 + ], + "0.003": [ + -0.01911432109773159, + -0.009325908496975899 + ], + "0.01": [ + -0.06274554133415222, + -0.030905161052942276 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_smoke/synth_a1.0_L8_s42.json b/results/synth_ladder_smoke/synth_a1.0_L8_s42.json new file mode 100644 index 0000000..84f6f53 --- /dev/null +++ b/results/synth_ladder_smoke/synth_a1.0_L8_s42.json @@ -0,0 +1,1298 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.3549648769378662, + 0.6442762393951416, + 0.5306558219909668, + 0.48609975258111954, + 0.36504030923843384, + 0.34034587018489837, + 0.2708170123100281, + 0.2531612884521484, + 0.2000002146959305, + 0.13551229400634765, + 0.13542884222269058, + 0.08572723088264465, + 0.08422799642086029, + 0.04283563904762268, + 0.02871562500782311, + 0.01670246643871069, + 0.011288518036901951, + 0.009128199395537377, + 0.007812268234789372, + 0.0068127627149224285, + 0.005905307191610336, + 0.005293884661793709, + 0.004605621902272105, + 0.0042049066483974456, + 0.003823694904893637, + 0.0035320142075419424, + 0.0032889791917055846, + 0.0030689228884875773, + 0.002866979796439409, + 0.002720682065561414, + 0.0025651114743202924, + 0.0024138968043029307, + 0.0023048722617328168, + 0.0022053348077461124, + 0.0021035693101584913, + 0.0020162027064710855, + 0.0019403529457747936, + 0.0018770673342049123, + 0.0018140029758214951, + 0.001762567887827754, + 0.0017115408962592484, + 0.001670302376151085, + 0.001631921947747469, + 0.001596466457284987, + 0.001566920978203416, + 0.0015393117513507605, + 0.0015165731955319643, + 0.0014953597854822874, + 0.0014767639184370637, + 0.0014608209997415543, + 0.0014476791420951485, + 0.0014363898681476713, + 0.001426739953830838, + 0.001419567819312215, + 0.001413508789241314, + 0.0014089626897126437, + 0.0014057869891636074, + 0.0014036820456385614, + 0.0014023557703010739, + 0.0014017068047076464 + ], + "train_acc": [ + 0.5249, + 0.7478, + 0.7964, + 0.811, + 0.8593, + 0.8695, + 0.9016, + 0.9085, + 0.9248, + 0.9598, + 0.9563, + 0.9787, + 0.9777, + 0.9941, + 0.9972, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.7155, + 0.744, + 0.754, + 0.753, + 0.7645, + 0.7615, + 0.757, + 0.7565, + 0.7515, + 0.7555, + 0.751, + 0.7615, + 0.749, + 0.756, + 0.7565, + 0.761, + 0.76, + 0.76, + 0.758, + 0.7585, + 0.7565, + 0.758, + 0.7565, + 0.7575, + 0.7565, + 0.755, + 0.756, + 0.755, + 0.7555, + 0.755, + 0.7545, + 0.7545, + 0.7555, + 0.7565, + 0.755, + 0.7525, + 0.753, + 0.7555, + 0.7525, + 0.7535, + 0.7535, + 0.752, + 0.752, + 0.7515, + 0.752, + 0.7535, + 0.7525, + 0.752, + 0.7515, + 0.7515, + 0.7525, + 0.7525, + 0.7525, + 0.7525, + 0.7525, + 0.753, + 0.753, + 0.753, + 0.753, + 0.753 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8599272966384888, + 0.8556707501411438, + 0.8523739576339722, + 0.848276674747467, + 0.8402513265609741, + 0.8327686190605164, + 0.8243966698646545, + 0.8101321458816528 + ], + "perturbation_rho": [ + 0.9999995231628418, + 0.9999991059303284, + 0.9999986290931702, + 0.9999972581863403, + 0.999995231628418, + 0.999988853931427, + 0.999974250793457, + 0.9999352693557739 + ], + "nudging": { + "0.001": [ + -0.06869316846132278, + -0.055045101791620255, + -0.04193408414721489, + -0.03029901161789894, + -0.021042225882411003, + -0.014109719544649124, + -0.009153226390480995, + -0.005811762530356646 + ], + "0.003": [ + -0.19696879386901855, + -0.15935087203979492, + -0.12249457091093063, + -0.08919193595647812, + -0.06231769919395447, + -0.041970327496528625, + -0.027310188859701157, + -0.01737576723098755 + ], + "0.01": [ + -0.5608033537864685, + -0.46859920024871826, + -0.3716525733470917, + -0.2780599594116211, + -0.19847190380096436, + -0.13576632738113403, + -0.08930139243602753, + -0.057228151708841324 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2318700828552247, + 1.406381654548645, + 0.95339030418396, + 0.8680307843208313, + 0.8229897514343262, + 0.7794928709030151, + 0.7778801984786987, + 0.782413025188446, + 0.7710376887798309, + 0.7573087496757507, + 0.7456204961776733, + 0.8025073329925537, + 0.8309173440933227, + 0.8010511989593506, + 0.8825912656784057, + 0.8369182188987732, + 0.8160124311447143, + 0.8535087263107299, + 0.8696415189743042, + 0.8184520126342774, + 0.8577543560028076, + 0.8529799373626709, + 0.8702422420501709, + 0.824615712928772, + 0.8162686037063599, + 0.8295847707748413, + 0.8639348524093627, + 0.8216630945205688, + 0.8430556495666504, + 0.8807237106323242, + 0.8641441562652588, + 0.7917474311351776, + 0.799493196105957, + 0.7866990953445434, + 0.7909674090385437, + 0.7694881486892701, + 0.7699867319107055, + 0.7733240715026856, + 0.7584297584533691, + 0.7648862591743469, + 0.7560698497772217, + 0.7396681387901306, + 0.7261051610946655, + 0.7199150282859802, + 0.7145794815063476, + 0.7221284794807434, + 0.707148173904419, + 0.7056992305755615, + 0.7101434396266937, + 0.7036544319152832, + 0.6999993465900421, + 0.6964569509506225, + 0.690802536535263, + 0.6862456171989441, + 0.6861504990577698, + 0.685116357254982, + 0.6811881905555726, + 0.6796620162963867, + 0.678962588262558, + 0.678569483089447 + ], + "train_acc": [ + 0.1825, + 0.5204, + 0.6469, + 0.6793, + 0.6954, + 0.7167, + 0.7183, + 0.7201, + 0.7257, + 0.7335, + 0.7398, + 0.7284, + 0.7277, + 0.7339, + 0.7151, + 0.7335, + 0.7359, + 0.7306, + 0.7303, + 0.7422, + 0.7368, + 0.7358, + 0.7367, + 0.7445, + 0.7465, + 0.7444, + 0.7377, + 0.7507, + 0.7428, + 0.7388, + 0.744, + 0.7531, + 0.7536, + 0.7596, + 0.7581, + 0.7618, + 0.7655, + 0.7594, + 0.7671, + 0.7637, + 0.765, + 0.7685, + 0.767, + 0.7729, + 0.7725, + 0.7682, + 0.772, + 0.7729, + 0.7753, + 0.7719, + 0.7767, + 0.7751, + 0.7758, + 0.777, + 0.7787, + 0.7792, + 0.7793, + 0.7819, + 0.7823, + 0.7822 + ], + "test_acc": [ + 0.3755, + 0.579, + 0.6165, + 0.642, + 0.6585, + 0.6655, + 0.678, + 0.689, + 0.6805, + 0.6945, + 0.666, + 0.6485, + 0.6615, + 0.64, + 0.6875, + 0.6825, + 0.6765, + 0.668, + 0.679, + 0.675, + 0.6945, + 0.6775, + 0.6985, + 0.681, + 0.6985, + 0.6785, + 0.6945, + 0.6945, + 0.674, + 0.6825, + 0.6925, + 0.6955, + 0.706, + 0.697, + 0.6935, + 0.6915, + 0.7035, + 0.709, + 0.7095, + 0.707, + 0.7075, + 0.712, + 0.7105, + 0.7105, + 0.7245, + 0.7165, + 0.715, + 0.714, + 0.717, + 0.7195, + 0.7245, + 0.724, + 0.72, + 0.725, + 0.7215, + 0.721, + 0.7245, + 0.7225, + 0.722, + 0.7235 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.009654381312429905, + 0.06123851239681244, + 0.05049855262041092, + 0.06316959857940674, + 0.06684726476669312, + 0.04511053115129471, + 0.06236346811056137, + 0.024983247742056847 + ], + "perturbation_rho": [ + -0.04901190102100372, + 0.05014052242040634, + 0.041004884988069534, + 0.0795036256313324, + 0.11356800049543381, + 0.03488320857286453, + 0.06926114857196808, + 0.049178168177604675 + ], + "nudging": { + "0.001": [ + 0.0007382960757240653, + -0.0008381383959203959, + -0.0003019912401214242, + -0.00025056113372556865, + -0.00025583984097465873, + -0.0001781730679795146, + -0.00021656398894265294, + -7.157100480981171e-05 + ], + "0.003": [ + 0.0016830505337566137, + -0.00252811168320477, + -0.0009058922296389937, + -0.0007522155065089464, + -0.0007675112574361265, + -0.0005343147786334157, + -0.0006497750291600823, + -0.00021490230574272573 + ], + "0.01": [ + 0.009471571072936058, + -0.008436895906925201, + -0.0030148853547871113, + -0.002505694981664419, + -0.0025559633504599333, + -0.0017773781437426805, + -0.002164034638553858, + -0.0007148634176701307 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8172380752563477, + 1.0125908603668212, + 0.8132157420158386, + 0.763969026184082, + 0.8119130191802979, + 0.8651832290649414, + 0.8795650399208069, + 0.8390799371719361, + 0.8750604623794556, + 0.9108563968658447, + 0.9423255216598511, + 0.9454748561859131, + 0.9387800750732422, + 0.9664641128540039, + 0.9676774660587311, + 0.9720300651550293, + 0.972385873222351, + 0.9552276044845581, + 0.9379316561698914, + 0.9411427532196045, + 0.9463931692123413, + 0.9267581472396851, + 0.9241247764587402, + 0.921794878578186, + 0.9066226318359375, + 0.9252418887138367, + 0.8958363393783569, + 0.8902327404975892, + 0.8794603199958801, + 0.8775459489822388, + 0.8668269435882568, + 0.8435388278961181, + 0.8464404319763184, + 0.8412695461273193, + 0.8285974182128907, + 0.8338440036773682, + 0.8191730420589447, + 0.808089348602295, + 0.8105339024543762, + 0.7986673656463623, + 0.8060823263168335, + 0.8041851411819458, + 0.7978612077713013, + 0.7954094837188721, + 0.7925621782302856, + 0.7874609822273254, + 0.7843514801025391, + 0.7868727991104126, + 0.7825984308719635, + 0.7754398143768311, + 0.7745126781463623, + 0.7730914865493774, + 0.7703591567993164, + 0.7687865433692932, + 0.7680869552612305, + 0.7666429103851319, + 0.7662865003585816, + 0.7655640112876893, + 0.7650162103652954, + 0.7647706716537476 + ], + "train_acc": [ + 0.3376, + 0.6277, + 0.7014, + 0.7221, + 0.7069, + 0.6933, + 0.6878, + 0.6881, + 0.6805, + 0.6703, + 0.6607, + 0.6553, + 0.6543, + 0.6502, + 0.6512, + 0.6492, + 0.6458, + 0.6579, + 0.6556, + 0.6565, + 0.6586, + 0.6661, + 0.662, + 0.6664, + 0.6733, + 0.6684, + 0.6759, + 0.6777, + 0.6829, + 0.683, + 0.6867, + 0.6906, + 0.6888, + 0.6915, + 0.6941, + 0.6932, + 0.6979, + 0.698, + 0.702, + 0.701, + 0.693, + 0.7013, + 0.7062, + 0.7023, + 0.7045, + 0.7069, + 0.7079, + 0.7062, + 0.7095, + 0.7113, + 0.7088, + 0.7086, + 0.7123, + 0.7128, + 0.7133, + 0.7143, + 0.7141, + 0.7135, + 0.7148, + 0.7151 + ], + "test_acc": [ + 0.528, + 0.671, + 0.694, + 0.69, + 0.6655, + 0.657, + 0.656, + 0.6575, + 0.649, + 0.6355, + 0.6235, + 0.6275, + 0.6205, + 0.6225, + 0.612, + 0.608, + 0.6215, + 0.6265, + 0.64, + 0.6315, + 0.6325, + 0.635, + 0.6375, + 0.627, + 0.62, + 0.6475, + 0.638, + 0.646, + 0.633, + 0.6415, + 0.6545, + 0.645, + 0.6495, + 0.6485, + 0.656, + 0.648, + 0.658, + 0.6485, + 0.6505, + 0.651, + 0.6585, + 0.6675, + 0.662, + 0.6625, + 0.6695, + 0.6675, + 0.6685, + 0.662, + 0.6685, + 0.665, + 0.667, + 0.6625, + 0.6645, + 0.6665, + 0.666, + 0.668, + 0.668, + 0.669, + 0.67, + 0.669 + ], + "state_pred_error": [ + 0.6994195578575134, + 0.22920655875205995, + 0.16802907910346984, + 0.16559766590595246, + 0.18445851514339448, + 0.21028385319709778, + 0.2191893015384674, + 0.21834363677501678, + 0.21849494242668152, + 0.21396265230178832, + 0.20434389827251434, + 0.19273596215248107, + 0.18696985533237456, + 0.18150037777423858, + 0.17128414888381957, + 0.16282646454572677, + 0.15897824714183809, + 0.15465531346797942, + 0.1488338336467743, + 0.14391191310882567, + 0.1379982359647751, + 0.1323638156414032, + 0.12555919518470765, + 0.12027550373077392, + 0.11485727074146271, + 0.11013496897220612, + 0.10653402326107025, + 0.10248540735244752, + 0.09892402567863465, + 0.09584726904630661, + 0.09310160474777222, + 0.09092893778085709, + 0.08776243501901626, + 0.08469328643083572, + 0.08289645419120789, + 0.0801550854563713, + 0.07860101690292358, + 0.0770820389509201, + 0.07482871805429459, + 0.07315796376466752, + 0.07184150853157044, + 0.07020361883640289, + 0.06892922757863998, + 0.06784615393877029, + 0.06689863914251327, + 0.0658311774611473, + 0.06467983536124229, + 0.06354528537988663, + 0.06249780519008637, + 0.06192109000682831, + 0.06163203666806221, + 0.060276210111379624, + 0.059241956239938734, + 0.058475232946872714, + 0.05833017838597298, + 0.05753721442222595, + 0.05705702358484268, + 0.057157775408029556, + 0.05591552573442459, + 0.054930789399147036 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.4364655911922455, + 0.2538519501686096, + 0.12610256671905518, + 0.11331324279308319, + 0.12084640562534332, + 0.12215165793895721, + 0.1230584904551506, + 0.12570375204086304 + ], + "perturbation_rho": [ + 0.3833135962486267, + 0.2661164402961731, + 0.1022414043545723, + 0.0808584988117218, + 0.13698244094848633, + 0.1416344791650772, + 0.1372133493423462, + 0.12957872450351715 + ], + "nudging": { + "0.001": [ + -0.0195440873503685, + -0.002403483958914876, + -0.0005046981386840343, + -0.00036888872273266315, + -0.00037333741784095764, + -0.0003630969440564513, + -0.00035216944525018334, + -0.0003497467841953039 + ], + "0.003": [ + -0.058456890285015106, + -0.007226475980132818, + -0.001513201161287725, + -0.0011065197177231312, + -0.0011195887345820665, + -0.0010890010744333267, + -0.0010560574010014534, + -0.0010488759726285934 + ], + "0.01": [ + -0.19196540117263794, + -0.024129249155521393, + -0.005033540539443493, + -0.0036849211901426315, + -0.003727084957063198, + -0.003625791519880295, + -0.0035160125698894262, + -0.003492143005132675 + ] + }, + "state_pred_error_per_layer": [ + 10125.46875, + 4586.849609375, + 2924.994384765625, + 2696.109130859375, + 2272.20361328125, + 2131.38916015625, + 1861.77978515625, + 1746.7655029296875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2328295001983642, + 1.4101718687057496, + 0.9575806739807129, + 0.8476838275909424, + 0.8366983779907227, + 0.796540838432312, + 0.7965328689575195, + 0.804645627784729, + 0.76351228017807, + 0.8332673097610473, + 0.8028367862701417, + 0.7686783805847168, + 0.8133863924980164, + 0.8388292132377625, + 0.8813985456466675, + 0.9070027080535888, + 0.9268054521560669, + 0.8929174848556518, + 0.9617136255264283, + 0.9518166580200196, + 0.9915473003387452, + 1.03904186668396, + 1.1187934215545654, + 1.1396577449798584, + 1.1753866115570069, + 1.2152013864517213, + 1.2781038455963134, + 1.2973245435714722, + 1.3062091507911682, + 1.330575175857544, + 1.3508051769256593, + 1.372145989227295, + 1.3418801939964295, + 1.313326547241211, + 1.2953170734405517, + 1.3397330959320068, + 1.3408296878814698, + 1.3446595726013184, + 1.3166897232055663, + 1.331870413017273, + 1.3017619667053222, + 1.294947805404663, + 1.3108612091064453, + 1.2846161266326905, + 1.2734370964050292, + 1.271145669746399, + 1.2568953948974608, + 1.26171327753067, + 1.249517316055298, + 1.2554497623443603, + 1.2432411881446839, + 1.2372928746461869, + 1.2344558517456055, + 1.2330647632598877, + 1.2286329887390137, + 1.228268436050415, + 1.227671130180359, + 1.2260378023147582, + 1.224634275817871, + 1.2242035968780518 + ], + "train_acc": [ + 0.1812, + 0.5161, + 0.649, + 0.6835, + 0.6927, + 0.7114, + 0.7115, + 0.715, + 0.728, + 0.7161, + 0.7231, + 0.7368, + 0.7278, + 0.7261, + 0.7201, + 0.7154, + 0.7159, + 0.7205, + 0.7079, + 0.7081, + 0.7033, + 0.6956, + 0.6831, + 0.6858, + 0.6772, + 0.6723, + 0.6625, + 0.6463, + 0.6444, + 0.6348, + 0.6273, + 0.6171, + 0.6224, + 0.6198, + 0.6225, + 0.6052, + 0.6068, + 0.6005, + 0.6053, + 0.6035, + 0.6058, + 0.6088, + 0.605, + 0.6071, + 0.6089, + 0.6084, + 0.6106, + 0.606, + 0.6094, + 0.6078, + 0.6118, + 0.6124, + 0.611, + 0.6097, + 0.6115, + 0.6089, + 0.6095, + 0.6096, + 0.6095, + 0.6094 + ], + "test_acc": [ + 0.3705, + 0.5695, + 0.6255, + 0.6375, + 0.6505, + 0.667, + 0.6705, + 0.686, + 0.661, + 0.6765, + 0.698, + 0.6695, + 0.6895, + 0.661, + 0.6625, + 0.6765, + 0.682, + 0.6525, + 0.657, + 0.6425, + 0.6565, + 0.6455, + 0.643, + 0.6395, + 0.6385, + 0.625, + 0.61, + 0.5985, + 0.5945, + 0.594, + 0.5835, + 0.581, + 0.597, + 0.598, + 0.59, + 0.5885, + 0.5745, + 0.582, + 0.5705, + 0.5845, + 0.582, + 0.568, + 0.574, + 0.5755, + 0.5725, + 0.584, + 0.5795, + 0.5745, + 0.5765, + 0.5785, + 0.57, + 0.5755, + 0.579, + 0.579, + 0.569, + 0.574, + 0.573, + 0.5735, + 0.574, + 0.574 + ], + "value_loss": [ + 3.0612864276885987, + 0.9298634000778199, + 1.0534765914916993, + 1.1624056129455567, + 1.287022685623169, + 1.2191282211303711, + 1.1473731142044068, + 1.2222970941543578, + 1.0844892554283143, + 1.2464203895568848, + 1.2315531982421875, + 1.0791297135353088, + 1.2645495239257813, + 1.326454645872116, + 1.3909792762756348, + 1.46472707157135, + 1.6084086065292358, + 1.4191848960876465, + 1.5598558122634887, + 1.4034530574798585, + 1.360558862876892, + 1.4974057355880737, + 1.5152985761642457, + 1.5459233176231384, + 1.6183912239074707, + 1.7463767976760864, + 1.6744214597702027, + 1.4573214498519897, + 1.4008925676345825, + 1.3678995864868164, + 1.3241787738800048, + 1.319063488006592, + 1.2433307300567626, + 1.0671293781280518, + 1.0261332641601562, + 1.0388721265792846, + 1.0011196897506713, + 0.9702223169326782, + 0.9575115978240967, + 0.9511522947311402, + 0.871139727306366, + 0.8162722229003906, + 0.8406558853149414, + 0.790790128326416, + 0.7439771286010742, + 0.7198011109590531, + 0.7005921336650849, + 0.6835938632965088, + 0.6486449011325837, + 0.6239403274536133, + 0.6149130923271179, + 0.6258885129511357, + 0.5848597867965698, + 0.5708261927604675, + 0.5448934956550598, + 0.5640273152351379, + 0.5487895909309387, + 0.5382195985794067, + 0.5229669218063354, + 0.5224067583084107 + ], + "term_loss": [ + 1.7380344909667969, + 0.5437232830047607, + 0.8284306915283203, + 0.9567685474395752, + 1.0802118640899658, + 0.9863194431304931, + 0.9126659242630005, + 1.0141376696586608, + 0.8975709108352661, + 1.0503646591186524, + 1.0410141807556152, + 0.8969525803565979, + 1.0739669722557068, + 1.1351874728679656, + 1.1846843212127685, + 1.226121760559082, + 1.353541067504883, + 1.1525111585140229, + 1.2433963447093963, + 1.1111729244232178, + 1.0706022632598877, + 1.1812005992889405, + 1.1949755194664002, + 1.241350096321106, + 1.317452368450165, + 1.4344143880844116, + 1.366858615756035, + 1.1617898447036743, + 1.1149580620765687, + 1.0898091663360596, + 1.0528370998382568, + 1.0468038051605224, + 0.9734418066978454, + 0.8105616062164307, + 0.7722046535491943, + 0.7813135403633118, + 0.7447025863647461, + 0.7173005515098572, + 0.7083561273574829, + 0.7011982561588287, + 0.6327509389877319, + 0.5813593649864197, + 0.607800398683548, + 0.5606256068229676, + 0.5164450220108032, + 0.49647570234537125, + 0.48213193352222444, + 0.4650268939375877, + 0.43274318981170656, + 0.4082659092903137, + 0.39861374917030334, + 0.4051392196834087, + 0.3712418370246887, + 0.3574744204521179, + 0.3357436392784119, + 0.35090364389419554, + 0.3320211359024048, + 0.32399859981536866, + 0.31227648725509644, + 0.30657225689888 + ], + "bridge_loss": [ + 1.033972427075947, + 0.1259313227057457, + 0.013127804318070412, + 0.0068917840205132965, + 0.01259806400835514, + 0.04915154292583466, + 0.054842041409015656, + 0.0279923313960433, + 0.01622686858177185, + 0.015008053582906723, + 0.015984716065227986, + 0.015876483254134655, + 0.019972576881945134, + 0.019738174071907998, + 0.03136125123798847, + 0.06120928807258606, + 0.078516369754076, + 0.09715313489437104, + 0.13975104311704636, + 0.11691163322329522, + 0.11400446672141552, + 0.1377958104610443, + 0.1374728867292404, + 0.1246106859445572, + 0.12149106123447419, + 0.1336177960038185, + 0.12678081693649293, + 0.11429111970663071, + 0.1066114503979683, + 0.09759099328517915, + 0.09151432385444641, + 0.0911779996395111, + 0.093770928388834, + 0.08366052788496017, + 0.08443067642450333, + 0.08428607819080353, + 0.08389535593986511, + 0.08062444943189621, + 0.0807857982158661, + 0.0812311357140541, + 0.07345293629169464, + 0.07137182642519474, + 0.06880553373098373, + 0.06860192837715148, + 0.067187957072258, + 0.06452970866262912, + 0.06065080301761627, + 0.06125029466152191, + 0.060076392430067065, + 0.05876207324266434, + 0.060951916396617886, + 0.06561451515704393, + 0.059012375992536545, + 0.05898748941421509, + 0.05535315696001053, + 0.0593130940079689, + 0.06311285648345948, + 0.06080557494163513, + 0.057529071378707886, + 0.06283499038815499 + ], + "tgrad_loss": [ + 0.28927949557304383, + 0.2602087851524353, + 0.21191810626983643, + 0.19874528608322142, + 0.19421276106834412, + 0.18365723705291748, + 0.1798651430130005, + 0.18016709561347963, + 0.17069146556854248, + 0.18104767799377441, + 0.17455429816246032, + 0.16630066150426864, + 0.17060998005867004, + 0.1715290092945099, + 0.1749337030172348, + 0.177396022939682, + 0.17635114104747773, + 0.16952060701847077, + 0.1767084276676178, + 0.17536849284172057, + 0.1759521385669708, + 0.1784093313217163, + 0.18285016713142396, + 0.17996254091262817, + 0.17944778304100037, + 0.17834460110664369, + 0.18078203921318053, + 0.18124049134254455, + 0.17932304699420928, + 0.1804994152545929, + 0.17982735419273377, + 0.1810816912651062, + 0.17611798644065857, + 0.17290724143981934, + 0.16949793553352355, + 0.17327251043319702, + 0.1725217536211014, + 0.17229731659889222, + 0.1683696664094925, + 0.16872289276123048, + 0.16493585252761842, + 0.16354102935791015, + 0.16404994721412658, + 0.16156259379386903, + 0.16034415247440337, + 0.15879569890499115, + 0.15780939960479737, + 0.15731667776107788, + 0.15582531983852385, + 0.1569123430252075, + 0.15534742782115937, + 0.15513477906584738, + 0.15460557351112367, + 0.1543642846226692, + 0.15379669663906098, + 0.15381058180332183, + 0.15365558917522432, + 0.1534154201745987, + 0.15316136314868928, + 0.15299950742721558 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.034526653587818146, + 0.05641080439090729, + 0.10281616449356079, + 0.15385565161705017, + 0.18335095047950745, + 0.20484405755996704, + 0.21195781230926514, + 0.22950458526611328 + ], + "perturbation_rho": [ + 0.036690596491098404, + 0.08035410940647125, + 0.14528854191303253, + 0.19739355146884918, + 0.2672373652458191, + 0.3182218074798584, + 0.32729244232177734, + 0.3177085220813751 + ], + "nudging": { + "0.001": [ + -0.004214188549667597, + -0.0019195483764633536, + -0.0012887499760836363, + -0.001240130397491157, + -0.0012948594521731138, + -0.0013112489832565188, + -0.0013397705042734742, + -0.0013849454699084163 + ], + "0.003": [ + -0.011589612811803818, + -0.005784940905869007, + -0.0038642820436507463, + -0.003718423191457987, + -0.003882676362991333, + -0.003930780105292797, + -0.004017728380858898, + -0.004152942448854446 + ], + "0.01": [ + -0.04240123927593231, + -0.01825123094022274, + -0.012862971983850002, + -0.012372580356895924, + -0.012917900457978249, + -0.01307743415236473, + -0.013364783488214016, + -0.013813115656375885 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/config.json b/results/synth_ladder_v2_hi/config.json new file mode 100644 index 0000000..a96090b --- /dev/null +++ b/results/synth_ladder_v2_hi/config.json @@ -0,0 +1,33 @@ +{ + "alphas": [ + 0.5, + 1.0 + ], + "depths": [ + 2, + 4, + 8, + 12 + ], + "seeds": [ + 42, + 123, + 456 + ], + "d_hidden": 128, + "num_classes": 10, + "n_train": 10000, + "n_test": 2000, + "batch_size": 256, + "epochs": 80, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "gpu": 0, + "output_dir": "results/synth_ladder_v2_hi" +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/summary.json b/results/synth_ladder_v2_hi/summary.json new file mode 100644 index 0000000..b7ad268 --- /dev/null +++ b/results/synth_ladder_v2_hi/summary.json @@ -0,0 +1,3590 @@ +{ + "a0.5_L2_s42": { + "bp": { + "test_acc": 0.8845, + "mean_bp_cosine": 0.9139105975627899, + "mean_rho": 0.9999974966049194, + "mean_nudge_001": -0.021973546594381332, + "mean_nudge_003": -0.061596330255270004, + "mean_nudge_01": -0.16279328987002373, + "bp_cosine_per_layer": [ + 0.9165740013122559, + 0.911247193813324 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999961853027344 + ], + "nudge_per_layer": [ + -0.21485117077827454, + -0.11073540896177292 + ] + }, + "dfa": { + "test_acc": 0.8185, + "mean_bp_cosine": 0.013388294260948896, + "mean_rho": -0.010654313489794731, + "mean_nudge_001": 0.00010355231643188745, + "mean_nudge_003": 0.00034307173336856067, + "mean_nudge_01": 0.0015135867288336158, + "bp_cosine_per_layer": [ + -0.008949288167059422, + 0.035725876688957214 + ], + "rho_per_layer": [ + -0.042064815759658813, + 0.02075618878006935 + ], + "nudge_per_layer": [ + 0.004335631616413593, + -0.0013084581587463617 + ] + }, + "state_bridge": { + "test_acc": 0.8125, + "mean_bp_cosine": 0.6582441031932831, + "mean_rho": 0.6169608980417252, + "mean_nudge_001": -0.013940556207671762, + "mean_nudge_003": -0.040253227576613426, + "mean_nudge_01": -0.11712449323385954, + "bp_cosine_per_layer": [ + 0.8927175402641296, + 0.4237706661224365 + ], + "rho_per_layer": [ + 0.8139950037002563, + 0.41992679238319397 + ], + "nudge_per_layer": [ + -0.20875152945518494, + -0.02549745701253414 + ], + "state_pred_error_per_layer": [ + 1690.90478515625, + 278.7707214355469 + ], + "mean_state_pred_error": 984.8377532958984 + }, + "credit_bridge": { + "test_acc": 0.6365, + "mean_bp_cosine": 0.23397326469421387, + "mean_rho": 0.31064942479133606, + "mean_nudge_001": -0.004609669325873256, + "mean_nudge_003": -0.013776597566902637, + "mean_nudge_01": -0.04530538059771061, + "bp_cosine_per_layer": [ + 0.12511783838272095, + 0.3428286910057068 + ], + "rho_per_layer": [ + 0.21235734224319458, + 0.40894150733947754 + ], + "nudge_per_layer": [ + -0.061930932104587555, + -0.028679829090833664 + ], + "final_value_loss": 0.48061015357971193, + "final_term_loss": 0.14492559936642646, + "final_bridge_loss": 0.020528473022580148, + "final_tgrad_loss": 0.31515607919692995 + } + }, + "a0.5_L2_s123": { + "bp": { + "test_acc": 0.895, + "mean_bp_cosine": 0.878325492143631, + "mean_rho": 0.9999979734420776, + "mean_nudge_001": -0.019721894524991512, + "mean_nudge_003": -0.055400675162672997, + "mean_nudge_01": -0.14613648504018784, + "bp_cosine_per_layer": [ + 0.8870643973350525, + 0.8695865869522095 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.9999968409538269 + ], + "nudge_per_layer": [ + -0.1920192688703537, + -0.10025370121002197 + ] + }, + "dfa": { + "test_acc": 0.8405, + "mean_bp_cosine": 0.08467924036085606, + "mean_rho": 0.07321365177631378, + "mean_nudge_001": -0.0010137155040865764, + "mean_nudge_003": -0.0030202887719497085, + "mean_nudge_01": -0.009814865421503782, + "bp_cosine_per_layer": [ + 0.05535196140408516, + 0.11400651931762695 + ], + "rho_per_layer": [ + 0.07898944616317749, + 0.06743785738945007 + ], + "nudge_per_layer": [ + -0.015302825719118118, + -0.004326905123889446 + ] + }, + "state_bridge": { + "test_acc": 0.8305, + "mean_bp_cosine": 0.659128725528717, + "mean_rho": 0.5701804161071777, + "mean_nudge_001": -0.012253106338903308, + "mean_nudge_003": -0.035399872343987226, + "mean_nudge_01": -0.10352936759591103, + "bp_cosine_per_layer": [ + 0.8879689574241638, + 0.43028849363327026 + ], + "rho_per_layer": [ + 0.7560213804244995, + 0.38433945178985596 + ], + "nudge_per_layer": [ + -0.18288554251194, + -0.02417319267988205 + ], + "state_pred_error_per_layer": [ + 1696.6031494140625, + 278.31060791015625 + ], + "mean_state_pred_error": 987.4568786621094 + }, + "credit_bridge": { + "test_acc": 0.634, + "mean_bp_cosine": 0.21542657166719437, + "mean_rho": 0.3815983682870865, + "mean_nudge_001": -0.004454661626368761, + "mean_nudge_003": -0.0132976695895195, + "mean_nudge_01": -0.04354145657271147, + "bp_cosine_per_layer": [ + 0.11650891602039337, + 0.31434422731399536 + ], + "rho_per_layer": [ + 0.23759987950325012, + 0.5255968570709229 + ], + "nudge_per_layer": [ + -0.05865050479769707, + -0.028432408347725868 + ], + "final_value_loss": 0.5198581983566284, + "final_term_loss": 0.1660363396883011, + "final_bridge_loss": 0.026915473002195357, + "final_tgrad_loss": 0.32690638537406924 + } + }, + "a0.5_L2_s456": { + "bp": { + "test_acc": 0.875, + "mean_bp_cosine": 0.8901284635066986, + "mean_rho": 0.9999979138374329, + "mean_nudge_001": -0.024593621492385864, + "mean_nudge_003": -0.06968314573168755, + "mean_nudge_01": -0.18856997787952423, + "bp_cosine_per_layer": [ + 0.8992727398872375, + 0.8809841871261597 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999969005584717 + ], + "nudge_per_layer": [ + -0.2502431571483612, + -0.12689679861068726 + ] + }, + "dfa": { + "test_acc": 0.816, + "mean_bp_cosine": 0.04272198863327503, + "mean_rho": 0.0372689850628376, + "mean_nudge_001": -0.0004823530907742679, + "mean_nudge_003": -0.0014278392773121595, + "mean_nudge_01": -0.004543605959042907, + "bp_cosine_per_layer": [ + 0.017043430358171463, + 0.0684005469083786 + ], + "rho_per_layer": [ + -0.039058439433574677, + 0.11359640955924988 + ], + "nudge_per_layer": [ + -0.005804130807518959, + -0.0032830811105668545 + ] + }, + "state_bridge": { + "test_acc": 0.807, + "mean_bp_cosine": 0.6757712662220001, + "mean_rho": 0.6000171899795532, + "mean_nudge_001": -0.01571581745520234, + "mean_nudge_003": -0.04562427382916212, + "mean_nudge_01": -0.13532716780900955, + "bp_cosine_per_layer": [ + 0.8896123766899109, + 0.46193015575408936 + ], + "rho_per_layer": [ + 0.8089620471000671, + 0.3910723328590393 + ], + "nudge_per_layer": [ + -0.23563425242900848, + -0.03502008318901062 + ], + "state_pred_error_per_layer": [ + 1470.6129150390625, + 266.84222412109375 + ], + "mean_state_pred_error": 868.7275695800781 + }, + "credit_bridge": { + "test_acc": 0.6605, + "mean_bp_cosine": 0.23513908684253693, + "mean_rho": 0.3664921522140503, + "mean_nudge_001": -0.005338509101420641, + "mean_nudge_003": -0.015948554500937462, + "mean_nudge_01": -0.052367652766406536, + "bp_cosine_per_layer": [ + 0.15452352166175842, + 0.31575465202331543 + ], + "rho_per_layer": [ + 0.26963475346565247, + 0.4633495509624481 + ], + "nudge_per_layer": [ + -0.07802344858646393, + -0.026711856946349144 + ], + "final_value_loss": 0.3851433990240097, + "final_term_loss": 0.10070284021273256, + "final_bridge_loss": 0.01744421122968197, + "final_tgrad_loss": 0.26699634662866595 + } + }, + "a0.5_L4_s42": { + "bp": { + "test_acc": 0.883, + "mean_bp_cosine": 0.8371244817972183, + "mean_rho": 0.9999875724315643, + "mean_nudge_001": -0.0205106531502679, + "mean_nudge_003": -0.05829396191984415, + "mean_nudge_01": -0.15927099250257015, + "bp_cosine_per_layer": [ + 0.8572149276733398, + 0.8503379821777344, + 0.8309497833251953, + 0.8099952340126038 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999980330467224, + 0.999992311000824, + 0.9999608993530273 + ], + "nudge_per_layer": [ + -0.29344552755355835, + -0.19200363755226135, + -0.10158533602952957, + -0.050049468874931335 + ] + }, + "dfa": { + "test_acc": 0.825, + "mean_bp_cosine": 0.08056101959664375, + "mean_rho": 0.07036433229222894, + "mean_nudge_001": -0.0004525305703282356, + "mean_nudge_003": -0.0013484152732416987, + "mean_nudge_01": -0.004391533322632313, + "bp_cosine_per_layer": [ + 0.0060789515264332294, + 0.09873200953006744, + 0.10723873972892761, + 0.1101943776011467 + ], + "rho_per_layer": [ + -0.012974856421351433, + 0.14552229642868042, + 0.08513970673084259, + 0.06377018243074417 + ], + "nudge_per_layer": [ + -0.0025177751667797565, + -0.006775799673050642, + -0.004219442140311003, + -0.00405311631038785 + ] + }, + "state_bridge": { + "test_acc": 0.7175, + "mean_bp_cosine": 0.389427974820137, + "mean_rho": 0.3547045961022377, + "mean_nudge_001": -0.006397623001248576, + "mean_nudge_003": -0.018759612808935344, + "mean_nudge_01": -0.05771041696425527, + "bp_cosine_per_layer": [ + 0.81822270154953, + 0.44441917538642883, + 0.15419423580169678, + 0.14087578654289246 + ], + "rho_per_layer": [ + 0.7556701302528381, + 0.42722654342651367, + 0.13306331634521484, + 0.10285839438438416 + ], + "nudge_per_layer": [ + -0.2031538337469101, + -0.01867133006453514, + -0.004740326199680567, + -0.00427617784589529 + ], + "state_pred_error_per_layer": [ + 6433.45703125, + 2426.59619140625, + 1950.234130859375, + 1929.63232421875 + ], + "mean_state_pred_error": 3184.9799194335938 + }, + "credit_bridge": { + "test_acc": 0.662, + "mean_bp_cosine": 0.2142251469194889, + "mean_rho": 0.3778097555041313, + "mean_nudge_001": -0.002453161054290831, + "mean_nudge_003": -0.007344013080000877, + "mean_nudge_01": -0.024294552858918905, + "bp_cosine_per_layer": [ + 0.08037468791007996, + 0.24492917954921722, + 0.2708122730255127, + 0.26078444719314575 + ], + "rho_per_layer": [ + 0.14874565601348877, + 0.4311285614967346, + 0.48388832807540894, + 0.44747647643089294 + ], + "nudge_per_layer": [ + -0.03933826461434364, + -0.020281529054045677, + -0.01922188699245453, + -0.018336530774831772 + ], + "final_value_loss": 0.4397273305892944, + "final_term_loss": 0.15641304728984834, + "final_bridge_loss": 0.03557699205875397, + "final_tgrad_loss": 0.24773729231357575 + } + }, + "a0.5_L4_s123": { + "bp": { + "test_acc": 0.882, + "mean_bp_cosine": 0.7865977436304092, + "mean_rho": 0.9999855011701584, + "mean_nudge_001": -0.019216455286368728, + "mean_nudge_003": -0.05414565000683069, + "mean_nudge_01": -0.14401183556765318, + "bp_cosine_per_layer": [ + 0.817541241645813, + 0.7992762923240662, + 0.7803024053573608, + 0.749271035194397 + ], + "rho_per_layer": [ + 0.9999992847442627, + 0.9999971389770508, + 0.9999915361404419, + 0.9999540448188782 + ], + "nudge_per_layer": [ + -0.25995129346847534, + -0.17589232325553894, + -0.09449617564678192, + -0.04570754989981651 + ] + }, + "dfa": { + "test_acc": 0.8045, + "mean_bp_cosine": 0.13894247123971581, + "mean_rho": 0.15608793403953314, + "mean_nudge_001": -0.0003833890805253759, + "mean_nudge_003": -0.0011389600113034248, + "mean_nudge_01": -0.0036781042581424117, + "bp_cosine_per_layer": [ + -0.027901431545615196, + 0.2837410271167755, + 0.17885790765285492, + 0.12107238173484802 + ], + "rho_per_layer": [ + -0.007988158613443375, + 0.25683730840682983, + 0.21096175909042358, + 0.1645408272743225 + ], + "nudge_per_layer": [ + 0.005267709027975798, + -0.009674372151494026, + -0.005893784575164318, + -0.0044119693338871 + ] + }, + "state_bridge": { + "test_acc": 0.7345, + "mean_bp_cosine": 0.3779419884085655, + "mean_rho": 0.3288300409913063, + "mean_nudge_001": -0.006349694755044766, + "mean_nudge_003": -0.018683148198761046, + "mean_nudge_01": -0.05818818649277091, + "bp_cosine_per_layer": [ + 0.8108769655227661, + 0.3922353684902191, + 0.15907782316207886, + 0.149577796459198 + ], + "rho_per_layer": [ + 0.6536975502967834, + 0.33696871995925903, + 0.15431806445121765, + 0.1703358292579651 + ], + "nudge_per_layer": [ + -0.2048409879207611, + -0.01618226245045662, + -0.006159749813377857, + -0.005569745786488056 + ], + "state_pred_error_per_layer": [ + 3474.9130859375, + 1348.3646240234375, + 1462.0654296875, + 924.672607421875 + ], + "mean_state_pred_error": 1802.5039367675781 + }, + "credit_bridge": { + "test_acc": 0.668, + "mean_bp_cosine": 0.16247223876416683, + "mean_rho": 0.2929591853171587, + "mean_nudge_001": -0.001968744763871655, + "mean_nudge_003": -0.005892619024962187, + "mean_nudge_01": -0.019490228034555912, + "bp_cosine_per_layer": [ + 0.05806349962949753, + 0.19388319551944733, + 0.1997416615486145, + 0.19820059835910797 + ], + "rho_per_layer": [ + 0.05481833964586258, + 0.3572811782360077, + 0.4186326265335083, + 0.3411045968532562 + ], + "nudge_per_layer": [ + -0.0286177359521389, + -0.01660466194152832, + -0.01654389500617981, + -0.016194619238376617 + ], + "final_value_loss": 0.4729928963661194, + "final_term_loss": 0.15622255086898804, + "final_bridge_loss": 0.034451057982444765, + "final_tgrad_loss": 0.28231928570270537 + } + }, + "a0.5_L4_s456": { + "bp": { + "test_acc": 0.8855, + "mean_bp_cosine": 0.7703797668218613, + "mean_rho": 0.999986544251442, + "mean_nudge_001": -0.017331300303339958, + "mean_nudge_003": -0.04883333737961948, + "mean_nudge_01": -0.13096668012440205, + "bp_cosine_per_layer": [ + 0.792909562587738, + 0.7804109454154968, + 0.7618845105171204, + 0.7463140487670898 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999976754188538, + 0.9999912977218628, + 0.9999581575393677 + ], + "nudge_per_layer": [ + -0.2336917370557785, + -0.1588592678308487, + -0.0874030739068985, + -0.04391264170408249 + ] + }, + "dfa": { + "test_acc": 0.817, + "mean_bp_cosine": 0.07182160578668118, + "mean_rho": 0.09282832965254784, + "mean_nudge_001": -0.0003612322652770672, + "mean_nudge_003": -0.0010782249155454338, + "mean_nudge_01": -0.0035168152826372534, + "bp_cosine_per_layer": [ + -0.010789386928081512, + 0.08449429273605347, + 0.10027095675468445, + 0.1133105605840683 + ], + "rho_per_layer": [ + -0.022197294980287552, + 0.02167895808815956, + 0.18905602395534515, + 0.18277563154697418 + ], + "nudge_per_layer": [ + -0.0005262043559923768, + -0.005684657022356987, + -0.003974507562816143, + -0.0038818921893835068 + ] + }, + "state_bridge": { + "test_acc": 0.7675, + "mean_bp_cosine": 0.4189938008785248, + "mean_rho": 0.348801476880908, + "mean_nudge_001": -0.006437422598537523, + "mean_nudge_003": -0.018775500764604658, + "mean_nudge_01": -0.056744852219708264, + "bp_cosine_per_layer": [ + 0.8223247528076172, + 0.5256583094596863, + 0.17289233207702637, + 0.1550998091697693 + ], + "rho_per_layer": [ + 0.7023045420646667, + 0.4341009259223938, + 0.10907860845327377, + 0.14972183108329773 + ], + "nudge_per_layer": [ + -0.19577056169509888, + -0.022263746708631516, + -0.004863455425947905, + -0.0040816450491547585 + ], + "state_pred_error_per_layer": [ + 6500.04248046875, + 2179.638671875, + 1695.392333984375, + 1466.414306640625 + ], + "mean_state_pred_error": 2960.3719482421875 + }, + "credit_bridge": { + "test_acc": 0.617, + "mean_bp_cosine": 0.19905064720660448, + "mean_rho": 0.27845675125718117, + "mean_nudge_001": -0.0017877554928418249, + "mean_nudge_003": -0.005349543411284685, + "mean_nudge_01": -0.017666283063590527, + "bp_cosine_per_layer": [ + 0.0613640733063221, + 0.23986753821372986, + 0.24101567268371582, + 0.25395530462265015 + ], + "rho_per_layer": [ + 0.07897584140300751, + 0.3258228003978729, + 0.35056060552597046, + 0.3584677577018738 + ], + "nudge_per_layer": [ + -0.019116222858428955, + -0.01759088784456253, + -0.016751645132899284, + -0.017206376418471336 + ], + "final_value_loss": 0.4424677228450775, + "final_term_loss": 0.12383701201379299, + "final_bridge_loss": 0.02319883658438921, + "final_tgrad_loss": 0.29543187527656556 + } + }, + "a0.5_L8_s42": { + "bp": { + "test_acc": 0.8715, + "mean_bp_cosine": 0.808967724442482, + "mean_rho": 0.999945156276226, + "mean_nudge_001": -0.011501751199830323, + "mean_nudge_003": -0.03289153927471489, + "mean_nudge_01": -0.09379934845492244, + "bp_cosine_per_layer": [ + 0.8294941186904907, + 0.823101282119751, + 0.815970778465271, + 0.8095235824584961, + 0.8066394329071045, + 0.8012610673904419, + 0.7956615686416626, + 0.7900899648666382 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.999997615814209, + 0.9999938011169434, + 0.9999845027923584, + 0.9999604225158691, + 0.9999330043792725, + 0.999873697757721, + 0.999819278717041 + ], + "nudge_per_layer": [ + -0.2528620958328247, + -0.17482446134090424, + -0.11384513974189758, + -0.07313278317451477, + -0.04917728155851364, + -0.03563641011714935, + -0.02781001478433609, + -0.02310660108923912 + ] + }, + "dfa": { + "test_acc": 0.804, + "mean_bp_cosine": 0.06822564313188195, + "mean_rho": 0.08298261812888086, + "mean_nudge_001": -5.095545566291548e-05, + "mean_nudge_003": -0.0001400069668306969, + "mean_nudge_01": -0.0003324677818454802, + "bp_cosine_per_layer": [ + -0.029147807508707047, + 0.09590217471122742, + 0.0916377604007721, + 0.10714393854141235, + 0.10661958158016205, + 0.05731643736362457, + 0.06447312980890274, + 0.05185993015766144 + ], + "rho_per_layer": [ + -0.08288859575986862, + 0.14039787650108337, + 0.1433517336845398, + 0.1548803746700287, + 0.09298646450042725, + 0.08800182491540909, + 0.09949750453233719, + 0.02763376198709011 + ], + "nudge_per_layer": [ + 0.019184602424502373, + -0.0062692309729754925, + -0.0031640869565308094, + -0.0033698435872793198, + -0.003262510057538748, + -0.0018756084609776735, + -0.0022803605534136295, + -0.0016227040905505419 + ] + }, + "state_bridge": { + "test_acc": 0.7265, + "mean_bp_cosine": 0.2766533959656954, + "mean_rho": 0.24636799190193415, + "mean_nudge_001": -0.003215807260858128, + "mean_nudge_003": -0.00946771033341065, + "mean_nudge_01": -0.029514338413719088, + "bp_cosine_per_layer": [ + 0.8188973069190979, + 0.4508240222930908, + 0.20906424522399902, + 0.16529136896133423, + 0.1612900048494339, + 0.1292058229446411, + 0.14780420064926147, + 0.1308501958847046 + ], + "rho_per_layer": [ + 0.7345798015594482, + 0.40806666016578674, + 0.18922817707061768, + 0.1360217034816742, + 0.11187596619129181, + 0.1472519189119339, + 0.12442155927419662, + 0.11949814856052399 + ], + "nudge_per_layer": [ + -0.19829359650611877, + -0.01426965557038784, + -0.005409521050751209, + -0.004344802349805832, + -0.0038992268964648247, + -0.0032464847899973392, + -0.003532196395099163, + -0.00311922375112772 + ], + "state_pred_error_per_layer": [ + 5640.76416015625, + 3768.9912109375, + 2209.80126953125, + 1863.6328125, + 1833.0330810546875, + 2052.747802734375, + 1687.1876220703125, + 1871.18310546875 + ], + "mean_state_pred_error": 2615.9176330566406 + }, + "credit_bridge": { + "test_acc": 0.5935, + "mean_bp_cosine": 0.12945402902550995, + "mean_rho": 0.20130334049463272, + "mean_nudge_001": -0.0008943625434767455, + "mean_nudge_003": -0.0026800249179359525, + "mean_nudge_01": -0.00888864736771211, + "bp_cosine_per_layer": [ + 0.014968650415539742, + 0.08219218999147415, + 0.12315872311592102, + 0.1350458562374115, + 0.16176681220531464, + 0.1692444086074829, + 0.17282617092132568, + 0.17642942070960999 + ], + "rho_per_layer": [ + 0.09865723550319672, + 0.1636437624692917, + 0.19447889924049377, + 0.2091381549835205, + 0.2243458330631256, + 0.23168572783470154, + 0.2512606978416443, + 0.23721641302108765 + ], + "nudge_per_layer": [ + -0.006006492767482996, + -0.006066862493753433, + -0.008294559083878994, + -0.008802486583590508, + -0.009770728647708893, + -0.010544568300247192, + -0.010718668811023235, + -0.010904812254011631 + ], + "final_value_loss": 0.3977136660575867, + "final_term_loss": 0.13710964921712876, + "final_bridge_loss": 0.018799800185859205, + "final_tgrad_loss": 0.24180421624183654 + } + }, + "a0.5_L8_s123": { + "bp": { + "test_acc": 0.868, + "mean_bp_cosine": 0.8070773705840111, + "mean_rho": 0.9999594464898109, + "mean_nudge_001": -0.01314116342109628, + "mean_nudge_003": -0.037657674751244485, + "mean_nudge_01": -0.10643287934362888, + "bp_cosine_per_layer": [ + 0.8442516326904297, + 0.8351782560348511, + 0.8238041400909424, + 0.811212420463562, + 0.800036609172821, + 0.789252519607544, + 0.7798817157745361, + 0.7730016708374023 + ], + "rho_per_layer": [ + 0.9999992251396179, + 0.9999983906745911, + 0.9999960660934448, + 0.99998939037323, + 0.9999715685844421, + 0.9999511241912842, + 0.9999076128005981, + 0.9998621940612793 + ], + "nudge_per_layer": [ + -0.281266987323761, + -0.2009655237197876, + -0.1321270614862442, + -0.08429376780986786, + -0.05586903542280197, + -0.039932381361722946, + -0.031076554208993912, + -0.025931723415851593 + ] + }, + "dfa": { + "test_acc": 0.8, + "mean_bp_cosine": 0.07366255111992359, + "mean_rho": 0.07397386711090803, + "mean_nudge_001": -8.963746586232446e-05, + "mean_nudge_003": -0.0002625839406391606, + "mean_nudge_01": -0.0007999172084964812, + "bp_cosine_per_layer": [ + -0.02832707017660141, + 0.13987571001052856, + 0.07857642322778702, + 0.061437755823135376, + 0.0877213403582573, + 0.09552451223134995, + 0.07042402029037476, + 0.08406771719455719 + ], + "rho_per_layer": [ + 0.034647777676582336, + 0.1467832326889038, + 0.036387018859386444, + 0.061308689415454865, + 0.1038040965795517, + 0.09023141860961914, + 0.03672575205564499, + 0.08190295100212097 + ], + "nudge_per_layer": [ + 0.012113340198993683, + -0.00537356361746788, + -0.0023620566353201866, + -0.001645779935643077, + -0.002037967788055539, + -0.0027765799313783646, + -0.001988787204027176, + -0.002327942755073309 + ] + }, + "state_bridge": { + "test_acc": 0.718, + "mean_bp_cosine": 0.2835564874112606, + "mean_rho": 0.2681517219170928, + "mean_nudge_001": -0.0027127867688250262, + "mean_nudge_003": -0.007993465682375245, + "mean_nudge_01": -0.025023294263519347, + "bp_cosine_per_layer": [ + 0.8429861068725586, + 0.3551006317138672, + 0.246289923787117, + 0.21019335091114044, + 0.17309927940368652, + 0.14295682311058044, + 0.15966862440109253, + 0.13815715909004211 + ], + "rho_per_layer": [ + 0.7732758522033691, + 0.2933464050292969, + 0.24295836687088013, + 0.22880345582962036, + 0.1602117419242859, + 0.11042392998933792, + 0.18763291835784912, + 0.14856110513210297 + ], + "nudge_per_layer": [ + -0.15847395360469818, + -0.010836342349648476, + -0.007060050964355469, + -0.005947217810899019, + -0.004753550048917532, + -0.004264200571924448, + -0.004713424481451511, + -0.0041376142762601376 + ], + "state_pred_error_per_layer": [ + 3389.93017578125, + 4477.634765625, + 1038.2586669921875, + 911.949951171875, + 702.6972045898438, + 659.9431762695312, + 824.164794921875, + 821.9293212890625 + ], + "mean_state_pred_error": 1603.3135070800781 + }, + "credit_bridge": { + "test_acc": 0.6185, + "mean_bp_cosine": 0.1525184395723045, + "mean_rho": 0.23177338391542435, + "mean_nudge_001": -0.0011540915293153375, + "mean_nudge_003": -0.0034589636488817632, + "mean_nudge_01": -0.01147624314762652, + "bp_cosine_per_layer": [ + 0.024487923830747604, + 0.1551763117313385, + 0.17440856993198395, + 0.18776318430900574, + 0.163284569978714, + 0.17855775356292725, + 0.162883460521698, + 0.17358574271202087 + ], + "rho_per_layer": [ + 0.024775028228759766, + 0.25605684518814087, + 0.2314496785402298, + 0.2697882056236267, + 0.24329833686351776, + 0.3152206242084503, + 0.23843368887901306, + 0.2751646637916565 + ], + "nudge_per_layer": [ + -0.010280786082148552, + -0.011451397091150284, + -0.01173271145671606, + -0.012431012466549873, + -0.01105603575706482, + -0.011893808841705322, + -0.011241357773542404, + -0.011722835712134838 + ], + "final_value_loss": 0.3728706964492798, + "final_term_loss": 0.12118487646579743, + "final_bridge_loss": 0.015310661105066539, + "final_tgrad_loss": 0.23637515988349914 + } + }, + "a0.5_L8_s456": { + "bp": { + "test_acc": 0.8555, + "mean_bp_cosine": 0.8527287542819977, + "mean_rho": 0.9999570250511169, + "mean_nudge_001": -0.01194569593644701, + "mean_nudge_003": -0.033871308725792915, + "mean_nudge_01": -0.09340489702299237, + "bp_cosine_per_layer": [ + 0.8810831904411316, + 0.8730225563049316, + 0.8656145334243774, + 0.8578245639801025, + 0.8490546345710754, + 0.8397257328033447, + 0.8311692476272583, + 0.8243355751037598 + ], + "rho_per_layer": [ + 0.9999987483024597, + 0.9999980330467224, + 0.9999955892562866, + 0.9999854564666748, + 0.9999719858169556, + 0.999948263168335, + 0.9998974204063416, + 0.9998607039451599 + ], + "nudge_per_layer": [ + -0.23731596767902374, + -0.17453062534332275, + -0.11795195937156677, + -0.07674264907836914, + -0.05135927349328995, + -0.036901768296957016, + -0.028667811304330826, + -0.02376912161707878 + ] + }, + "dfa": { + "test_acc": 0.7985, + "mean_bp_cosine": 0.09374871966429055, + "mean_rho": 0.12165694544091821, + "mean_nudge_001": -0.0004589786858559819, + "mean_nudge_003": -0.0013758796121692285, + "mean_nudge_01": -0.004529613710474223, + "bp_cosine_per_layer": [ + 0.027731137350201607, + 0.10604047030210495, + 0.13601002097129822, + 0.07596071809530258, + 0.0985877588391304, + 0.08992618322372437, + 0.1115533858537674, + 0.10418008267879486 + ], + "rho_per_layer": [ + -0.01300876960158348, + 0.12486347556114197, + 0.1899794042110443, + 0.08801613748073578, + 0.11934874951839447, + 0.15905101597309113, + 0.1374979466199875, + 0.167507603764534 + ], + "nudge_per_layer": [ + -0.011210349388420582, + -0.00580610241740942, + -0.004417200107127428, + -0.002277099061757326, + -0.003015844151377678, + -0.0030763214454054832, + -0.003333096392452717, + -0.003100896719843149 + ] + }, + "state_bridge": { + "test_acc": 0.7505, + "mean_bp_cosine": 0.25108483247458935, + "mean_rho": 0.22314902767539024, + "mean_nudge_001": -0.0032180442212847993, + "mean_nudge_003": -0.009445599382161163, + "mean_nudge_01": -0.029192803369369358, + "bp_cosine_per_layer": [ + 0.8145060539245605, + 0.39495280385017395, + 0.15602949261665344, + 0.14954066276550293, + 0.1189848780632019, + 0.14297258853912354, + 0.11834269762039185, + 0.11334948241710663 + ], + "rho_per_layer": [ + 0.7131592035293579, + 0.31938445568084717, + 0.13574811816215515, + 0.13510501384735107, + 0.12680554389953613, + 0.13444143533706665, + 0.1260460913181305, + 0.09450235962867737 + ], + "nudge_per_layer": [ + -0.20040717720985413, + -0.012472910806536674, + -0.003969438374042511, + -0.003768536727875471, + -0.0031205681152641773, + -0.00363306887447834, + -0.0031901695765554905, + -0.002980557270348072 + ], + "state_pred_error_per_layer": [ + 7208.7744140625, + 4043.077392578125, + 2431.6259765625, + 2036.907958984375, + 1977.547119140625, + 1708.2327880859375, + 1901.497314453125, + 1821.6331787109375 + ], + "mean_state_pred_error": 2891.1620178222656 + }, + "credit_bridge": { + "test_acc": 0.555, + "mean_bp_cosine": 0.12328627426177263, + "mean_rho": 0.16509935073554516, + "mean_nudge_001": -0.000985160811978858, + "mean_nudge_003": -0.002952177223050967, + "mean_nudge_01": -0.009791445219889283, + "bp_cosine_per_layer": [ + 0.03383665531873703, + 0.10378465056419373, + 0.1522345095872879, + 0.12050338089466095, + 0.12787620723247528, + 0.13963481783866882, + 0.14998120069503784, + 0.1584387719631195 + ], + "rho_per_layer": [ + 0.02018044888973236, + 0.14589767158031464, + 0.20607107877731323, + 0.18045580387115479, + 0.1894514560699463, + 0.16447019577026367, + 0.1924649477005005, + 0.2218032032251358 + ], + "nudge_per_layer": [ + -0.00981426052749157, + -0.00849075522273779, + -0.010712197050452232, + -0.009203735738992691, + -0.009092864580452442, + -0.00978156179189682, + -0.010470103472471237, + -0.010766083374619484 + ], + "final_value_loss": 0.5412774887084961, + "final_term_loss": 0.23150972747802734, + "final_bridge_loss": 0.02621319934129715, + "final_tgrad_loss": 0.28355456256866457 + } + }, + "a0.5_L12_s42": { + "bp": { + "test_acc": 0.8585, + "mean_bp_cosine": 0.8183901458978653, + "mean_rho": 0.9998798171679179, + "mean_nudge_001": -0.011188714299350977, + "mean_nudge_003": -0.03214278844340394, + "mean_nudge_01": -0.09301998885348439, + "bp_cosine_per_layer": [ + 0.8657882213592529, + 0.8541754484176636, + 0.8436384201049805, + 0.832263708114624, + 0.8208613991737366, + 0.8122134208679199, + 0.8057717084884644, + 0.8017721176147461, + 0.7986597418785095, + 0.7967146635055542, + 0.7952107787132263, + 0.7936121225357056 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999977350234985, + 0.9999939203262329, + 0.9999861121177673, + 0.9999700784683228, + 0.9999415874481201, + 0.9999051094055176, + 0.9998413324356079, + 0.9998086094856262, + 0.9997647404670715, + 0.9996839165687561, + 0.9996654987335205 + ], + "nudge_per_layer": [ + -0.3461707830429077, + -0.23528623580932617, + -0.151905819773674, + -0.0986800491809845, + -0.06758347898721695, + -0.04991145431995392, + -0.039162103086709976, + -0.032274406403303146, + -0.02771918475627899, + -0.024551689624786377, + -0.02231007255613804, + -0.020684588700532913 + ] + }, + "dfa": { + "test_acc": 0.791, + "mean_bp_cosine": 0.07122930279001594, + "mean_rho": 0.10592638049274683, + "mean_nudge_001": -0.00047647209915642935, + "mean_nudge_003": -0.0014203774189809337, + "mean_nudge_01": -0.004644906090106815, + "bp_cosine_per_layer": [ + 0.023988625034689903, + 0.0961650088429451, + 0.10208466649055481, + 0.07022920250892639, + 0.09604307264089584, + 0.07800711691379547, + 0.08064866811037064, + 0.015484225004911423, + 0.04617477208375931, + 0.10530653595924377, + 0.06217034161090851, + 0.07844939827919006 + ], + "rho_per_layer": [ + -0.021668296307325363, + 0.13302525877952576, + 0.14676621556282043, + 0.11482817679643631, + 0.09230026602745056, + 0.15572097897529602, + 0.084853395819664, + 0.06741442531347275, + 0.09585727006196976, + 0.17402535676956177, + 0.1249062716960907, + 0.10308724641799927 + ], + "nudge_per_layer": [ + -0.013704460114240646, + -0.009605048224329948, + -0.004514003172516823, + -0.00345102627761662, + -0.003412249032407999, + -0.0038682736922055483, + -0.0031317053362727165, + -0.0012646813411265612, + -0.002444072160869837, + -0.004538315813988447, + -0.0027466074097901583, + -0.0030584305059164762 + ] + }, + "state_bridge": { + "test_acc": 0.684, + "mean_bp_cosine": 0.17019233045478663, + "mean_rho": 0.14254611171782017, + "mean_nudge_001": -0.0020112845547070415, + "mean_nudge_003": -0.005932022473037553, + "mean_nudge_01": -0.01860854132488991, + "bp_cosine_per_layer": [ + 0.7669721841812134, + 0.3159201741218567, + 0.12931227684020996, + 0.11285121738910675, + 0.11607236415147781, + 0.09898597002029419, + 0.08882047981023788, + 0.08661012351512909, + 0.08416090905666351, + 0.07891363650560379, + 0.08571723103523254, + 0.07797139883041382 + ], + "rho_per_layer": [ + 0.6671731472015381, + 0.26826971769332886, + 0.10340800136327744, + 0.06843797862529755, + 0.0669264942407608, + 0.08176875114440918, + 0.10683348774909973, + 0.06641782820224762, + 0.09755225479602814, + 0.04477599635720253, + 0.0847611278295517, + 0.05422855541110039 + ], + "nudge_per_layer": [ + -0.18878120183944702, + -0.009807860478758812, + -0.003219514386728406, + -0.0027990485541522503, + -0.0029557342641055584, + -0.002479594200849533, + -0.0022394107654690742, + -0.0022681057453155518, + -0.0022236446384340525, + -0.0021239176858216524, + -0.002271223347634077, + -0.0021332399919629097 + ], + "state_pred_error_per_layer": [ + 11168.2578125, + 8443.55078125, + 4301.74609375, + 3486.31884765625, + 3134.353515625, + 2733.8369140625, + 2666.431640625, + 2571.673095703125, + 2489.172119140625, + 2732.81298828125, + 3179.04296875, + 3116.75927734375 + ], + "mean_state_pred_error": 4168.663004557292 + }, + "credit_bridge": { + "test_acc": 0.571, + "mean_bp_cosine": 0.08207109943032265, + "mean_rho": 0.14231220919949314, + "mean_nudge_001": -0.0008072109461257545, + "mean_nudge_003": -0.0024178701957377293, + "mean_nudge_01": -0.008001433801837265, + "bp_cosine_per_layer": [ + 0.009321734309196472, + 0.04962325841188431, + 0.06880976259708405, + 0.07808464020490646, + 0.08887439966201782, + 0.0946938544511795, + 0.09941184520721436, + 0.09979166835546494, + 0.10197117179632187, + 0.10147081315517426, + 0.09914548695087433, + 0.0936545580625534 + ], + "rho_per_layer": [ + -0.0036096302792429924, + 0.0626683160662651, + 0.10237888991832733, + 0.12722331285476685, + 0.138666570186615, + 0.14094725251197815, + 0.1720128357410431, + 0.18820315599441528, + 0.1971924901008606, + 0.19901405274868011, + 0.18742212653160095, + 0.1956271380186081 + ], + "nudge_per_layer": [ + -0.00799381174147129, + -0.0042757005430758, + -0.005744780879467726, + -0.006799482740461826, + -0.0076793828047811985, + -0.008442584425210953, + -0.008797119371592999, + -0.009013657458126545, + -0.009450232610106468, + -0.009471941739320755, + -0.009278533980250359, + -0.009069977328181267 + ], + "final_value_loss": 0.95497522315979, + "final_term_loss": 0.6288936994552612, + "final_bridge_loss": 0.0344168305516243, + "final_tgrad_loss": 0.2916646807193756 + } + }, + "a0.5_L12_s123": { + "bp": { + "test_acc": 0.873, + "mean_bp_cosine": 0.7415736317634583, + "mean_rho": 0.9999099324146906, + "mean_nudge_001": -0.010182377610666057, + "mean_nudge_003": -0.029109801825446386, + "mean_nudge_01": -0.08149818579355876, + "bp_cosine_per_layer": [ + 0.8060421943664551, + 0.7944625616073608, + 0.776944637298584, + 0.7588614821434021, + 0.7418972849845886, + 0.7322722673416138, + 0.724165678024292, + 0.7197043299674988, + 0.7152823209762573, + 0.7119243144989014, + 0.709496021270752, + 0.7078304886817932 + ], + "rho_per_layer": [ + 0.9999996423721313, + 0.9999984502792358, + 0.9999962449073792, + 0.999989926815033, + 0.9999754428863525, + 0.9999579191207886, + 0.999927818775177, + 0.999887228012085, + 0.9998751878738403, + 0.9997915029525757, + 0.9997637867927551, + 0.9997560381889343 + ], + "nudge_per_layer": [ + -0.2872876822948456, + -0.20931334793567657, + -0.13937950134277344, + -0.09144100546836853, + -0.06199805811047554, + -0.04483566805720329, + -0.03463221341371536, + -0.02817366272211075, + -0.023888790979981422, + -0.02094285935163498, + -0.01881779544055462, + -0.01726764440536499 + ] + }, + "dfa": { + "test_acc": 0.7975, + "mean_bp_cosine": 0.06331516286203016, + "mean_rho": 0.04216622615543505, + "mean_nudge_001": -0.00018036465129019538, + "mean_nudge_003": -0.0005390862012670065, + "mean_nudge_01": -0.0017679805799465005, + "bp_cosine_per_layer": [ + 0.004078918602317572, + 0.1059243381023407, + 0.07574640959501266, + 0.07308551669120789, + 0.066571444272995, + 0.056897446513175964, + 0.12165610492229462, + 0.06462406367063522, + 0.04925639182329178, + 0.04602370783686638, + 0.035759277641773224, + 0.06015833467245102 + ], + "rho_per_layer": [ + -0.011486321687698364, + 0.04376016557216644, + 0.037421341985464096, + 0.05220063030719757, + 0.09364941716194153, + -0.03169674053788185, + 0.15961039066314697, + 0.10634914040565491, + 0.03384825587272644, + 0.02390148863196373, + -0.010392685420811176, + 0.00882963091135025 + ], + "nudge_per_layer": [ + -0.0026711553800851107, + -0.003443576628342271, + -0.001918894238770008, + -0.0020233127288520336, + -0.0016027885721996427, + -0.0010300527792423964, + -0.002917288802564144, + -0.001525502186268568, + -0.0009703689720481634, + -0.0010098961647599936, + -0.0008095581433735788, + -0.0012933723628520966 + ] + }, + "state_bridge": { + "test_acc": 0.69, + "mean_bp_cosine": 0.17323703753451505, + "mean_rho": 0.15179013274610043, + "mean_nudge_001": -0.0019852635256635645, + "mean_nudge_003": -0.005834519392616737, + "mean_nudge_01": -0.018113662886510912, + "bp_cosine_per_layer": [ + 0.7613614797592163, + 0.3896995782852173, + 0.1309610903263092, + 0.10979019105434418, + 0.09164053201675415, + 0.07316795736551285, + 0.09407100081443787, + 0.08964815735816956, + 0.08292470127344131, + 0.08648289740085602, + 0.0870373547077179, + 0.08205951005220413 + ], + "rho_per_layer": [ + 0.6734859943389893, + 0.37621644139289856, + 0.08932416141033173, + 0.11710754036903381, + 0.07942430675029755, + 0.058268360793590546, + 0.05698401480913162, + 0.12727776169776917, + 0.03869014233350754, + 0.06775026768445969, + 0.0798446387052536, + 0.05710796266794205 + ], + "nudge_per_layer": [ + -0.1828688532114029, + -0.012644743546843529, + -0.003011793363839388, + -0.0024378912057727575, + -0.0020753229036927223, + -0.0017659795703366399, + -0.0021767604630440474, + -0.0021774054039269686, + -0.0019914493896067142, + -0.0021301559172570705, + -0.0020812181755900383, + -0.0020023814868181944 + ], + "state_pred_error_per_layer": [ + 12496.853515625, + 8106.66162109375, + 5059.9169921875, + 4050.405517578125, + 3454.0888671875, + 2936.005859375, + 2830.2294921875, + 2863.870361328125, + 3118.476806640625, + 3786.361083984375, + 3251.337890625, + 3255.708740234375 + ], + "mean_state_pred_error": 4600.826395670573 + }, + "credit_bridge": { + "test_acc": 0.6545, + "mean_bp_cosine": -0.010937775252386928, + "mean_rho": 0.02020453056320548, + "mean_nudge_001": 7.376461204936884e-05, + "mean_nudge_003": 0.00022662243100057822, + "mean_nudge_01": 0.0008031492385877451, + "bp_cosine_per_layer": [ + -0.022733785212039948, + -0.008966443128883839, + -0.020323125645518303, + -0.018136776983737946, + -0.01592089980840683, + -0.019174236804246902, + -0.014491843990981579, + -0.016727179288864136, + -0.008660020306706429, + -0.007111798040568829, + 0.0011803526431322098, + 0.019812453538179398 + ], + "rho_per_layer": [ + -0.05155084282159805, + 0.03821132332086563, + 0.07940525561571121, + 0.014752240851521492, + 0.016678672283887863, + 0.04385560005903244, + 0.03276895359158516, + -0.0006132312119007111, + -0.024450641125440598, + -0.029637619853019714, + 0.058109357953071594, + 0.06492529809474945 + ], + "nudge_per_layer": [ + 0.00777015183120966, + 0.00029987754533067346, + 0.00037500812322832644, + 0.00043640032527036965, + 0.0005594875547103584, + 0.0007026067469269037, + 0.00045700964983552694, + 0.000550219090655446, + 0.00020889028382953256, + 0.00013992507592774928, + -0.0004261335707269609, + -0.0014356517931446433 + ], + "final_value_loss": 1.470289986038208, + "final_term_loss": 0.35005189373493195, + "final_bridge_loss": 0.9054676934719086, + "final_tgrad_loss": 0.2147704033613205 + } + }, + "a0.5_L12_s456": { + "bp": { + "test_acc": 0.869, + "mean_bp_cosine": 0.74041115740935, + "mean_rho": 0.9998869399229685, + "mean_nudge_001": -0.007502871051353092, + "mean_nudge_003": -0.02132872895648082, + "mean_nudge_01": -0.05926296177009741, + "bp_cosine_per_layer": [ + 0.802544355392456, + 0.7848162055015564, + 0.7700465321540833, + 0.7570744752883911, + 0.7440193891525269, + 0.733696699142456, + 0.7256457805633545, + 0.7199540734291077, + 0.7157886028289795, + 0.7124584913253784, + 0.7102035284042358, + 0.7086857557296753 + ], + "rho_per_layer": [ + 0.9999985694885254, + 0.9999974966049194, + 0.9999951720237732, + 0.9999867677688599, + 0.9999691843986511, + 0.9999383687973022, + 0.9999032020568848, + 0.9998719692230225, + 0.9998380541801453, + 0.9998047351837158, + 0.9996931552886963, + 0.9996466040611267 + ], + "nudge_per_layer": [ + -0.20057430863380432, + -0.1480334997177124, + -0.10051561146974564, + -0.0672251284122467, + -0.04664912819862366, + -0.03438428044319153, + -0.026901239529252052, + -0.02211749367415905, + -0.018912356346845627, + -0.01670587807893753, + -0.015132123604416847, + -0.01400449313223362 + ] + }, + "dfa": { + "test_acc": 0.8, + "mean_bp_cosine": 0.11594532305995624, + "mean_rho": 0.11397512660672267, + "mean_nudge_001": -0.00042300097387245234, + "mean_nudge_003": -0.0012634664356786136, + "mean_nudge_01": -0.0041745746857486665, + "bp_cosine_per_layer": [ + 0.04262668639421463, + 0.2711353898048401, + 0.1898173838853836, + 0.1387583613395691, + 0.09531620889902115, + 0.1376194804906845, + 0.07653278112411499, + 0.08707999438047409, + 0.09030534327030182, + 0.10221391171216965, + 0.06503984332084656, + 0.09489849209785461 + ], + "rho_per_layer": [ + 0.0572824701666832, + 0.20349135994911194, + 0.20036441087722778, + 0.17148703336715698, + 0.0623050183057785, + 0.14095279574394226, + 0.05262026563286781, + 0.12087561190128326, + 0.10731191188097, + 0.061124786734580994, + 0.07995927333831787, + 0.10992658138275146 + ], + "nudge_per_layer": [ + -0.009360449388623238, + -0.00823313370347023, + -0.005617598537355661, + -0.004333253484219313, + -0.0029935596976429224, + -0.0036506117321550846, + -0.002341690007597208, + -0.002613792195916176, + -0.0027945097535848618, + -0.003059752518311143, + -0.002222315641120076, + -0.002874229568988085 + ] + }, + "state_bridge": { + "test_acc": 0.702, + "mean_bp_cosine": 0.18659504254659018, + "mean_rho": 0.1786113940179348, + "mean_nudge_001": -0.002035917636627952, + "mean_nudge_003": -0.0060201529073917, + "mean_nudge_01": -0.019059499570478994, + "bp_cosine_per_layer": [ + 0.7615377902984619, + 0.3628881573677063, + 0.1397334486246109, + 0.13061293959617615, + 0.11024273186922073, + 0.09393852204084396, + 0.10003305226564407, + 0.10794281214475632, + 0.10362739115953445, + 0.10100233554840088, + 0.1030983105301857, + 0.12448301911354065 + ], + "rho_per_layer": [ + 0.7019654512405396, + 0.3051794767379761, + 0.12004730850458145, + 0.11974964290857315, + 0.1315283179283142, + 0.11543487757444382, + 0.08415813744068146, + 0.14185138046741486, + 0.12905646860599518, + 0.0691840872168541, + 0.12997986376285553, + 0.09520171582698822 + ], + "nudge_per_layer": [ + -0.1852446049451828, + -0.011355580762028694, + -0.003981029614806175, + -0.0038526845164597034, + -0.0031567115802317858, + -0.0028176922351121902, + -0.0029711187817156315, + -0.0031051787082105875, + -0.0029434349853545427, + -0.002931142458692193, + -0.002905802335590124, + -0.0034490139223635197 + ], + "state_pred_error_per_layer": [ + 8110.80078125, + 4497.13623046875, + 2448.651123046875, + 2213.206298828125, + 2038.592041015625, + 2361.478515625, + 2122.5341796875, + 2178.11474609375, + 2310.2265625, + 2081.50390625, + 2114.170654296875, + 2407.947998046875 + ], + "mean_state_pred_error": 2907.0302530924478 + }, + "credit_bridge": { + "test_acc": 0.6375, + "mean_bp_cosine": 0.09317115658389714, + "mean_rho": 0.17472073963532844, + "mean_nudge_001": -0.000727248170733219, + "mean_nudge_003": -0.0021776299763587303, + "mean_nudge_01": -0.007225943821443555, + "bp_cosine_per_layer": [ + -0.0012992812553420663, + 0.028360359370708466, + 0.07222752273082733, + 0.06384990364313126, + 0.0745362713932991, + 0.10235601663589478, + 0.11958298832178116, + 0.12767711281776428, + 0.12978672981262207, + 0.13033980131149292, + 0.131376713514328, + 0.13925974071025848 + ], + "rho_per_layer": [ + -0.036700520664453506, + 0.08258875459432602, + 0.18529893457889557, + 0.1350553333759308, + 0.14971259236335754, + 0.23370781540870667, + 0.15428856015205383, + 0.2475280910730362, + 0.20684200525283813, + 0.26022571325302124, + 0.23770767450332642, + 0.24039392173290253 + ], + "nudge_per_layer": [ + 0.0004691533395089209, + -0.002260619541630149, + -0.007056917063891888, + -0.005040735937654972, + -0.005857650190591812, + -0.007526098750531673, + -0.008702869527041912, + -0.009377602487802505, + -0.009931675158441067, + -0.01026402972638607, + -0.010433407500386238, + -0.010728873312473297 + ], + "final_value_loss": 0.6376882638454437, + "final_term_loss": 0.3444120800256729, + "final_bridge_loss": 0.029638116455078124, + "final_tgrad_loss": 0.2636380691766739 + } + }, + "a1.0_L2_s42": { + "bp": { + "test_acc": 0.7915, + "mean_bp_cosine": 0.9376864433288574, + "mean_rho": 0.9999988675117493, + "mean_nudge_001": -0.040167851373553276, + "mean_nudge_003": -0.11654911190271378, + "mean_nudge_01": -0.34635232388973236, + "bp_cosine_per_layer": [ + 0.937772274017334, + 0.9376006126403809 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999986886978149 + ], + "nudge_per_layer": [ + -0.4167234003543854, + -0.27598124742507935 + ] + }, + "dfa": { + "test_acc": 0.7025, + "mean_bp_cosine": 0.007199164479970932, + "mean_rho": 0.005297745577991009, + "mean_nudge_001": -7.51367933844449e-05, + "mean_nudge_003": -0.00021808056044392288, + "mean_nudge_01": -0.000639150632196106, + "bp_cosine_per_layer": [ + -0.005922339856624603, + 0.020320668816566467 + ], + "rho_per_layer": [ + -0.003393532708287239, + 0.013989023864269257 + ], + "nudge_per_layer": [ + 5.659737507812679e-05, + -0.0013348986394703388 + ] + }, + "state_bridge": { + "test_acc": 0.6735, + "mean_bp_cosine": 0.5210442394018173, + "mean_rho": 0.48512911796569824, + "mean_nudge_001": -0.011768221855163574, + "mean_nudge_003": -0.034833950689062476, + "mean_nudge_01": -0.11062158830463886, + "bp_cosine_per_layer": [ + 0.6727198958396912, + 0.3693685829639435 + ], + "rho_per_layer": [ + 0.6028042435646057, + 0.36745399236679077 + ], + "nudge_per_layer": [ + -0.19608698785305023, + -0.025156188756227493 + ], + "state_pred_error_per_layer": [ + 4083.197509765625, + 262.47991943359375 + ], + "mean_state_pred_error": 2172.8387145996094 + }, + "credit_bridge": { + "test_acc": 0.5125, + "mean_bp_cosine": 0.5678956210613251, + "mean_rho": 0.5935650169849396, + "mean_nudge_001": -0.00795893557369709, + "mean_nudge_003": -0.023799872025847435, + "mean_nudge_01": -0.07842501997947693, + "bp_cosine_per_layer": [ + 0.39126425981521606, + 0.7445269823074341 + ], + "rho_per_layer": [ + 0.44417524337768555, + 0.7429547905921936 + ], + "nudge_per_layer": [ + -0.08887787163257599, + -0.06797216832637787 + ], + "final_value_loss": 0.6212269179344178, + "final_term_loss": 0.05304660900235176, + "final_bridge_loss": 0.010462266248464584, + "final_tgrad_loss": 0.5577180406570434 + } + }, + "a1.0_L2_s123": { + "bp": { + "test_acc": 0.809, + "mean_bp_cosine": 0.9559402465820312, + "mean_rho": 0.9999986886978149, + "mean_nudge_001": -0.03185446374118328, + "mean_nudge_003": -0.09129266440868378, + "mean_nudge_01": -0.258349284529686, + "bp_cosine_per_layer": [ + 0.9615377187728882, + 0.9503427743911743 + ], + "rho_per_layer": [ + 0.9999992847442627, + 0.9999980926513672 + ], + "nudge_per_layer": [ + -0.3078651428222656, + -0.20883342623710632 + ] + }, + "dfa": { + "test_acc": 0.7455, + "mean_bp_cosine": 0.05108090303838253, + "mean_rho": 0.05254313163459301, + "mean_nudge_001": -0.0008275873260572553, + "mean_nudge_003": -0.0024727254058234394, + "mean_nudge_01": -0.008127598091959953, + "bp_cosine_per_layer": [ + 0.057878345251083374, + 0.044283460825681686 + ], + "rho_per_layer": [ + 0.047237616032361984, + 0.057848647236824036 + ], + "nudge_per_layer": [ + -0.013432648032903671, + -0.0028225481510162354 + ] + }, + "state_bridge": { + "test_acc": 0.704, + "mean_bp_cosine": 0.5101080536842346, + "mean_rho": 0.45375654101371765, + "mean_nudge_001": -0.00980611308477819, + "mean_nudge_003": -0.02897635381668806, + "mean_nudge_01": -0.09152827039361, + "bp_cosine_per_layer": [ + 0.6596157550811768, + 0.3606003522872925 + ], + "rho_per_layer": [ + 0.5883278250694275, + 0.3191852569580078 + ], + "nudge_per_layer": [ + -0.16100725531578064, + -0.02204928547143936 + ], + "state_pred_error_per_layer": [ + 4266.72509765625, + 268.82733154296875 + ], + "mean_state_pred_error": 2267.7762145996094 + }, + "credit_bridge": { + "test_acc": 0.536, + "mean_bp_cosine": 0.5000061094760895, + "mean_rho": 0.5169470459222794, + "mean_nudge_001": -0.007283595856279135, + "mean_nudge_003": -0.0217662351205945, + "mean_nudge_01": -0.07154248096048832, + "bp_cosine_per_layer": [ + 0.3330497741699219, + 0.6669624447822571 + ], + "rho_per_layer": [ + 0.38148215413093567, + 0.652411937713623 + ], + "nudge_per_layer": [ + -0.08540114760398865, + -0.05768381431698799 + ], + "final_value_loss": 0.6294826040267945, + "final_term_loss": 0.06573917962312699, + "final_bridge_loss": 0.01474373927861452, + "final_tgrad_loss": 0.5489996829986572 + } + }, + "a1.0_L2_s456": { + "bp": { + "test_acc": 0.7905, + "mean_bp_cosine": 0.9266799688339233, + "mean_rho": 0.9999988377094269, + "mean_nudge_001": -0.03671902138739824, + "mean_nudge_003": -0.10590140148997307, + "mean_nudge_01": -0.30589545518159866, + "bp_cosine_per_layer": [ + 0.9291538000106812, + 0.9242061376571655 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.9999985694885254 + ], + "nudge_per_layer": [ + -0.36666756868362427, + -0.24512334167957306 + ] + }, + "dfa": { + "test_acc": 0.73, + "mean_bp_cosine": 0.03006170690059662, + "mean_rho": 0.039368635043501854, + "mean_nudge_001": -0.0004903670051135123, + "mean_nudge_003": -0.0014640121953561902, + "mean_nudge_01": -0.004785260884091258, + "bp_cosine_per_layer": [ + 0.02131858840584755, + 0.03880482539534569 + ], + "rho_per_layer": [ + 0.006325956434011459, + 0.07241131365299225 + ], + "nudge_per_layer": [ + -0.006775922141969204, + -0.002794599626213312 + ] + }, + "state_bridge": { + "test_acc": 0.6755, + "mean_bp_cosine": 0.5186701416969299, + "mean_rho": 0.48068559169769287, + "mean_nudge_001": -0.011591368587687612, + "mean_nudge_003": -0.03431171411648393, + "mean_nudge_01": -0.10901244357228279, + "bp_cosine_per_layer": [ + 0.669547975063324, + 0.3677923083305359 + ], + "rho_per_layer": [ + 0.6219363808631897, + 0.33943480253219604 + ], + "nudge_per_layer": [ + -0.19162335991859436, + -0.026401527225971222 + ], + "state_pred_error_per_layer": [ + 3936.27783203125, + 288.300537109375 + ], + "mean_state_pred_error": 2112.2891845703125 + }, + "credit_bridge": { + "test_acc": 0.544, + "mean_bp_cosine": 0.5161235481500626, + "mean_rho": 0.5938436686992645, + "mean_nudge_001": -0.0068406532518565655, + "mean_nudge_003": -0.020453338511288166, + "mean_nudge_01": -0.0673653893172741, + "bp_cosine_per_layer": [ + 0.35489675402641296, + 0.6773503422737122 + ], + "rho_per_layer": [ + 0.4646533727645874, + 0.7230339646339417 + ], + "nudge_per_layer": [ + -0.07572861015796661, + -0.059002168476581573 + ], + "final_value_loss": 0.6262330022811889, + "final_term_loss": 0.049621654653549195, + "final_bridge_loss": 0.011661755262315273, + "final_tgrad_loss": 0.5649495909690857 + } + }, + "a1.0_L4_s42": { + "bp": { + "test_acc": 0.7875, + "mean_bp_cosine": 0.882385790348053, + "mean_rho": 0.999995619058609, + "mean_nudge_001": -0.03646231605671346, + "mean_nudge_003": -0.10610398091375828, + "mean_nudge_01": -0.31568005308508873, + "bp_cosine_per_layer": [ + 0.8902335166931152, + 0.8886877298355103, + 0.8827626705169678, + 0.8678592443466187 + ], + "rho_per_layer": [ + 0.9999993443489075, + 0.9999990463256836, + 0.9999973773956299, + 0.9999867081642151 + ], + "nudge_per_layer": [ + -0.49256381392478943, + -0.4056996703147888, + -0.2497977763414383, + -0.11465895175933838 + ] + }, + "dfa": { + "test_acc": 0.7075, + "mean_bp_cosine": 0.060902527533471584, + "mean_rho": 0.052925301948562264, + "mean_nudge_001": -0.00048208528460236266, + "mean_nudge_003": -0.0014429198927246034, + "mean_nudge_01": -0.004763618926517665, + "bp_cosine_per_layer": [ + 0.026215966790914536, + 0.05776425451040268, + 0.07666948437690735, + 0.08296040445566177 + ], + "rho_per_layer": [ + 0.04998716711997986, + 0.09949691593647003, + 0.049676910042762756, + 0.012540214695036411 + ], + "nudge_per_layer": [ + -0.008544353768229485, + -0.0038241599686443806, + -0.0033461027778685093, + -0.003339859191328287 + ] + }, + "state_bridge": { + "test_acc": 0.6625, + "mean_bp_cosine": 0.3484594225883484, + "mean_rho": 0.3289090357720852, + "mean_nudge_001": -0.005907032289542258, + "mean_nudge_003": -0.01748002166277729, + "mean_nudge_01": -0.05545389896724373, + "bp_cosine_per_layer": [ + 0.6404350996017456, + 0.4214136302471161, + 0.18068093061447144, + 0.15130802989006042 + ], + "rho_per_layer": [ + 0.5499319434165955, + 0.368219256401062, + 0.21391229331493378, + 0.1835726499557495 + ], + "nudge_per_layer": [ + -0.18587297201156616, + -0.0235043503344059, + -0.00688221026211977, + -0.005556063260883093 + ], + "state_pred_error_per_layer": [ + 10066.107421875, + 1273.9140625, + 696.594482421875, + 612.3014526367188 + ], + "mean_state_pred_error": 3162.2293548583984 + }, + "credit_bridge": { + "test_acc": 0.558, + "mean_bp_cosine": 0.45794273912906647, + "mean_rho": 0.5322257168591022, + "mean_nudge_001": -0.003842960635665804, + "mean_nudge_003": -0.011505396338179708, + "mean_nudge_01": -0.038075629621744156, + "bp_cosine_per_layer": [ + 0.17809242010116577, + 0.5349531173706055, + 0.5522423982620239, + 0.5664830207824707 + ], + "rho_per_layer": [ + 0.22843755781650543, + 0.5910820364952087, + 0.6707864999771118, + 0.638596773147583 + ], + "nudge_per_layer": [ + -0.044362872838974, + -0.03722546622157097, + -0.03515344485640526, + -0.0355607345700264 + ], + "final_value_loss": 0.38718592133522034, + "final_term_loss": 0.06566130868196488, + "final_bridge_loss": 0.01777836950570345, + "final_tgrad_loss": 0.30374624242782594 + } + }, + "a1.0_L4_s123": { + "bp": { + "test_acc": 0.786, + "mean_bp_cosine": 0.8366721421480179, + "mean_rho": 0.9999945610761642, + "mean_nudge_001": -0.03740503964945674, + "mean_nudge_003": -0.1080933827906847, + "mean_nudge_01": -0.3170367181301117, + "bp_cosine_per_layer": [ + 0.8610074520111084, + 0.8541143536567688, + 0.8321727514266968, + 0.7993940114974976 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999986886978149, + 0.9999971389770508, + 0.9999833703041077 + ], + "nudge_per_layer": [ + -0.492245614528656, + -0.40577083826065063, + -0.25304561853408813, + -0.117084801197052 + ] + }, + "dfa": { + "test_acc": 0.682, + "mean_bp_cosine": 0.049554066732525826, + "mean_rho": 0.06381266703829169, + "mean_nudge_001": -0.00014734033902641386, + "mean_nudge_003": -0.0004330205119913444, + "mean_nudge_01": -0.001343857147730887, + "bp_cosine_per_layer": [ + -0.008613362908363342, + 0.039367884397506714, + 0.07619941979646683, + 0.0912623256444931 + ], + "rho_per_layer": [ + -0.007624803110957146, + 0.008791688829660416, + 0.13103844225406647, + 0.12304534018039703 + ], + "nudge_per_layer": [ + 0.005509334150701761, + -0.003195145633071661, + -0.0036095697432756424, + -0.004080047365278006 + ] + }, + "state_bridge": { + "test_acc": 0.6305, + "mean_bp_cosine": 0.3143155351281166, + "mean_rho": 0.30846646428108215, + "mean_nudge_001": -0.005087231853394769, + "mean_nudge_003": -0.015093521040398628, + "mean_nudge_01": -0.04834054387174547, + "bp_cosine_per_layer": [ + 0.5847928524017334, + 0.3501134514808655, + 0.17105570435523987, + 0.15130013227462769 + ], + "rho_per_layer": [ + 0.5387442708015442, + 0.3080189526081085, + 0.17941737174987793, + 0.20768526196479797 + ], + "nudge_per_layer": [ + -0.16164088249206543, + -0.01902196928858757, + -0.006823995150625706, + -0.005875328555703163 + ], + "state_pred_error_per_layer": [ + 10103.57421875, + 1132.8861083984375, + 636.5859375, + 537.355224609375 + ], + "mean_state_pred_error": 3102.600372314453 + }, + "credit_bridge": { + "test_acc": 0.502, + "mean_bp_cosine": 0.39079025387763977, + "mean_rho": 0.4630395397543907, + "mean_nudge_001": -0.0038928183494135737, + "mean_nudge_003": -0.011659935116767883, + "mean_nudge_01": -0.03865493927150965, + "bp_cosine_per_layer": [ + 0.1632033884525299, + 0.4602273404598236, + 0.4661305546760559, + 0.47359973192214966 + ], + "rho_per_layer": [ + 0.20324298739433289, + 0.5429707169532776, + 0.5653814077377319, + 0.5405630469322205 + ], + "nudge_per_layer": [ + -0.04415123537182808, + -0.037312425673007965, + -0.03657253086566925, + -0.036583565175533295 + ], + "final_value_loss": 0.5799021621704101, + "final_term_loss": 0.1424343505382538, + "final_bridge_loss": 0.03182844363451004, + "final_tgrad_loss": 0.4056393639087677 + } + }, + "a1.0_L4_s456": { + "bp": { + "test_acc": 0.792, + "mean_bp_cosine": 0.8552748262882233, + "mean_rho": 0.9999953359365463, + "mean_nudge_001": -0.03656455362215638, + "mean_nudge_003": -0.10595990065485239, + "mean_nudge_01": -0.31139715015888214, + "bp_cosine_per_layer": [ + 0.8668075799942017, + 0.8621845245361328, + 0.8550785779953003, + 0.8370286226272583 + ], + "rho_per_layer": [ + 0.9999995827674866, + 0.9999990463256836, + 0.999997615814209, + 0.9999850988388062 + ], + "nudge_per_layer": [ + -0.4802546799182892, + -0.3984469175338745, + -0.2503964900970459, + -0.11649051308631897 + ] + }, + "dfa": { + "test_acc": 0.68, + "mean_bp_cosine": 0.052356213971506804, + "mean_rho": 0.05650564655661583, + "mean_nudge_001": -0.0003577733878046274, + "mean_nudge_003": -0.0010662981367204338, + "mean_nudge_01": -0.0034739490947686136, + "bp_cosine_per_layer": [ + -0.001797341974452138, + 0.06668862700462341, + 0.05448886379599571, + 0.09004470705986023 + ], + "rho_per_layer": [ + -0.01287321001291275, + 0.007983170449733734, + 0.10568365454673767, + 0.12522897124290466 + ], + "nudge_per_layer": [ + -0.0016110537108033895, + -0.004868227988481522, + -0.0030549662187695503, + -0.004361548461019993 + ] + }, + "state_bridge": { + "test_acc": 0.651, + "mean_bp_cosine": 0.35348402336239815, + "mean_rho": 0.3312904089689255, + "mean_nudge_001": -0.005755784470238723, + "mean_nudge_003": -0.017025350069161505, + "mean_nudge_01": -0.05395022651646286, + "bp_cosine_per_layer": [ + 0.6501579284667969, + 0.4189426302909851, + 0.1800653487443924, + 0.1647701859474182 + ], + "rho_per_layer": [ + 0.5907484292984009, + 0.36159276962280273, + 0.19337056577205658, + 0.1794498711824417 + ], + "nudge_per_layer": [ + -0.1790994107723236, + -0.023556631058454514, + -0.006848426535725594, + -0.0062964376993477345 + ], + "state_pred_error_per_layer": [ + 7107.7138671875, + 890.22314453125, + 493.5357360839844, + 407.69677734375 + ], + "mean_state_pred_error": 2224.792381286621 + }, + "credit_bridge": { + "test_acc": 0.487, + "mean_bp_cosine": 0.5049829035997391, + "mean_rho": 0.5321159400045872, + "mean_nudge_001": -0.004336995130870491, + "mean_nudge_003": -0.012986946385353804, + "mean_nudge_01": -0.04301031678915024, + "bp_cosine_per_layer": [ + 0.20670706033706665, + 0.594096302986145, + 0.6002212762832642, + 0.6189069747924805 + ], + "rho_per_layer": [ + 0.24109239876270294, + 0.6317664384841919, + 0.6270265579223633, + 0.6285783648490906 + ], + "nudge_per_layer": [ + -0.03731346130371094, + -0.04525235667824745, + -0.044518306851387024, + -0.04495714232325554 + ], + "final_value_loss": 0.46226135368347165, + "final_term_loss": 0.049428026616573334, + "final_bridge_loss": 0.022721626716852187, + "final_tgrad_loss": 0.39011170201301576 + } + }, + "a1.0_L8_s42": { + "bp": { + "test_acc": 0.763, + "mean_bp_cosine": 0.8278333768248558, + "mean_rho": 0.9999853745102882, + "mean_nudge_001": -0.029990217997692525, + "mean_nudge_003": -0.08752790885046124, + "mean_nudge_01": -0.2652519349940121, + "bp_cosine_per_layer": [ + 0.85625159740448, + 0.8527897596359253, + 0.847720742225647, + 0.8408411145210266, + 0.831807017326355, + 0.8158122301101685, + 0.7960221171379089, + 0.7814224362373352 + ], + "rho_per_layer": [ + 0.999999463558197, + 0.9999992847442627, + 0.9999988079071045, + 0.9999978542327881, + 0.999994695186615, + 0.9999883770942688, + 0.9999692440032959, + 0.9999352693557739 + ], + "nudge_per_layer": [ + -0.5478029251098633, + -0.4737934172153473, + -0.3800549805164337, + -0.2769272029399872, + -0.18745023012161255, + -0.12213317304849625, + -0.07957549393177032, + -0.05427805706858635 + ] + }, + "dfa": { + "test_acc": 0.657, + "mean_bp_cosine": 0.046988741494715214, + "mean_rho": 0.0527694383636117, + "mean_nudge_001": -0.00015309322225220967, + "mean_nudge_003": -0.00045631649845745414, + "mean_nudge_01": -0.0014890892343828455, + "bp_cosine_per_layer": [ + -0.01574046164751053, + 0.07191511988639832, + 0.043905604630708694, + 0.07308061420917511, + 0.07518148422241211, + 0.026394926011562347, + 0.06854978203773499, + 0.03262286260724068 + ], + "rho_per_layer": [ + -0.02709903195500374, + 0.1010747104883194, + 0.06438975036144257, + 0.07812117040157318, + 0.0766223892569542, + 0.026489075273275375, + 0.09218208491802216, + 0.010375358164310455 + ], + "nudge_per_layer": [ + 0.007441862486302853, + -0.0052239359356462955, + -0.0022090799175202847, + -0.003076428547501564, + -0.0031523762736469507, + -0.0013899998739361763, + -0.0030318819917738438, + -0.0012708738213405013 + ] + }, + "state_bridge": { + "test_acc": 0.65, + "mean_bp_cosine": 0.2592074144631624, + "mean_rho": 0.23237370885908604, + "mean_nudge_001": -0.0031611585363862105, + "mean_nudge_003": -0.009385082448716275, + "mean_nudge_01": -0.030122902884613723, + "bp_cosine_per_layer": [ + 0.6320836544036865, + 0.4503885507583618, + 0.22882479429244995, + 0.17507168650627136, + 0.15456035733222961, + 0.15327030420303345, + 0.14079461991786957, + 0.1386653482913971 + ], + "rho_per_layer": [ + 0.5491607189178467, + 0.3870346248149872, + 0.23711450397968292, + 0.15141981840133667, + 0.12508505582809448, + 0.15914584696292877, + 0.13365353643894196, + 0.11637556552886963 + ], + "nudge_per_layer": [ + -0.18924641609191895, + -0.02186501771211624, + -0.007085676770657301, + -0.0053551034070551395, + -0.00462403055280447, + -0.004574076272547245, + -0.004170445259660482, + -0.004062457010149956 + ], + "state_pred_error_per_layer": [ + 9406.7255859375, + 1991.255126953125, + 1233.173095703125, + 996.4456787109375, + 824.75537109375, + 800.2864990234375, + 821.3734130859375, + 840.202392578125 + ], + "mean_state_pred_error": 2114.277145385742 + }, + "credit_bridge": { + "test_acc": 0.5165, + "mean_bp_cosine": 0.41811549477279186, + "mean_rho": 0.45575808361172676, + "mean_nudge_001": -0.002801764407195151, + "mean_nudge_003": -0.00839249708224088, + "mean_nudge_01": -0.02782702073454857, + "bp_cosine_per_layer": [ + 0.159218892455101, + 0.41163527965545654, + 0.4353415369987488, + 0.4608742594718933, + 0.46223077178001404, + 0.4579800069332123, + 0.4774817228317261, + 0.48016148805618286 + ], + "rho_per_layer": [ + 0.16694357991218567, + 0.4445253610610962, + 0.4925374388694763, + 0.48059922456741333, + 0.4989780783653259, + 0.5061379075050354, + 0.5181043148040771, + 0.5382387638092041 + ], + "nudge_per_layer": [ + -0.030580628663301468, + -0.027534715831279755, + -0.027298064902424812, + -0.027803048491477966, + -0.027431834489107132, + -0.02679138071835041, + -0.027646536007523537, + -0.02752995677292347 + ], + "final_value_loss": 0.35056146993637083, + "final_term_loss": 0.0784306697010994, + "final_bridge_loss": 0.0149920065253973, + "final_tgrad_loss": 0.25713879618644714 + } + }, + "a1.0_L8_s123": { + "bp": { + "test_acc": 0.7715, + "mean_bp_cosine": 0.8317327573895454, + "mean_rho": 0.9999875128269196, + "mean_nudge_001": -0.028257266676519066, + "mean_nudge_003": -0.08214446459896863, + "mean_nudge_01": -0.24747182056307793, + "bp_cosine_per_layer": [ + 0.8705248832702637, + 0.8637571334838867, + 0.8509291410446167, + 0.8393645286560059, + 0.8308560848236084, + 0.8178726434707642, + 0.800449013710022, + 0.780108630657196 + ], + "rho_per_layer": [ + 0.9999995231628418, + 0.9999995827674866, + 0.9999989867210388, + 0.9999984502792358, + 0.9999953508377075, + 0.9999901056289673, + 0.9999750852584839, + 0.9999430179595947 + ], + "nudge_per_layer": [ + -0.5067576169967651, + -0.4360688626766205, + -0.3518902063369751, + -0.26053690910339355, + -0.1787266880273819, + -0.1170111671090126, + -0.07650406658649445, + -0.052279047667980194 + ] + }, + "dfa": { + "test_acc": 0.67, + "mean_bp_cosine": 0.06255943619180471, + "mean_rho": 0.0582913524704054, + "mean_nudge_001": -0.00016377134670619853, + "mean_nudge_003": -0.00048249874453176744, + "mean_nudge_01": -0.0015042584564071149, + "bp_cosine_per_layer": [ + -0.006531993858516216, + 0.06646430492401123, + 0.03470785170793533, + 0.06075863167643547, + 0.08359120786190033, + 0.10361115634441376, + 0.07729409635066986, + 0.08058023452758789 + ], + "rho_per_layer": [ + -0.009454472921788692, + 0.027615420520305634, + 0.016344428062438965, + 0.07737872004508972, + 0.07998150587081909, + 0.10012705624103546, + 0.06766189634799957, + 0.10667626559734344 + ], + "nudge_per_layer": [ + 0.008429424837231636, + -0.004321999382227659, + -0.0012797827366739511, + -0.0022665630094707012, + -0.003274995367974043, + -0.0036867314483970404, + -0.0025471593253314495, + -0.0030862612184137106 + ] + }, + "state_bridge": { + "test_acc": 0.63, + "mean_bp_cosine": 0.2676183916628361, + "mean_rho": 0.249815184623003, + "mean_nudge_001": -0.0025806196208577603, + "mean_nudge_003": -0.007662267831619829, + "mean_nudge_01": -0.024620095442514867, + "bp_cosine_per_layer": [ + 0.6138853430747986, + 0.41074037551879883, + 0.25203365087509155, + 0.20834164321422577, + 0.16624599695205688, + 0.15929004549980164, + 0.15449269115924835, + 0.175917387008667 + ], + "rho_per_layer": [ + 0.5534218549728394, + 0.3554393947124481, + 0.28831934928894043, + 0.1869889795780182, + 0.14766299724578857, + 0.176305890083313, + 0.1294843554496765, + 0.16089865565299988 + ], + "nudge_per_layer": [ + -0.14630448818206787, + -0.017482426017522812, + -0.00796731747686863, + -0.006267632823437452, + -0.00492177763953805, + -0.00457757618278265, + -0.004429594613611698, + -0.00500995060428977 + ], + "state_pred_error_per_layer": [ + 7478.478515625, + 1555.7657470703125, + 846.884521484375, + 607.9534301757812, + 659.867919921875, + 614.796630859375, + 546.969482421875, + 518.796142578125 + ], + "mean_state_pred_error": 1603.6890487670898 + }, + "credit_bridge": { + "test_acc": 0.5695, + "mean_bp_cosine": 0.33955336920917034, + "mean_rho": 0.4137213062494993, + "mean_nudge_001": -0.002328026050236076, + "mean_nudge_003": -0.006974202115088701, + "mean_nudge_01": -0.023127662017941475, + "bp_cosine_per_layer": [ + 0.08390675485134125, + 0.2993828356266022, + 0.37482553720474243, + 0.3876585066318512, + 0.3966418504714966, + 0.3863479495048523, + 0.3938036561012268, + 0.39385986328125 + ], + "rho_per_layer": [ + 0.09506039321422577, + 0.3888479173183441, + 0.42724472284317017, + 0.5000925064086914, + 0.4708487391471863, + 0.47097086906433105, + 0.48436442017555237, + 0.4723408818244934 + ], + "nudge_per_layer": [ + -0.027181372046470642, + -0.02298363298177719, + -0.02282092720270157, + -0.022664468735456467, + -0.02277727797627449, + -0.02207607962191105, + -0.022199643775820732, + -0.02231789380311966 + ], + "final_value_loss": 0.32433377566337585, + "final_term_loss": 0.09466714213788509, + "final_bridge_loss": 0.018076158130913973, + "final_tgrad_loss": 0.21159047515392304 + } + }, + "a1.0_L8_s456": { + "bp": { + "test_acc": 0.753, + "mean_bp_cosine": 0.8595180436968803, + "mean_rho": 0.9999836012721062, + "mean_nudge_001": -0.029901663539931178, + "mean_nudge_003": -0.08636575657874346, + "mean_nudge_01": -0.25306460773572326, + "bp_cosine_per_layer": [ + 0.8814424872398376, + 0.8780966401100159, + 0.8716025352478027, + 0.8659577369689941, + 0.8611791133880615, + 0.8505971431732178, + 0.840730607509613, + 0.8265380859375 + ], + "rho_per_layer": [ + 0.9999989867210388, + 0.9999986886978149, + 0.9999985694885254, + 0.9999977350234985, + 0.9999950528144836, + 0.9999887943267822, + 0.9999659657478333, + 0.9999250173568726 + ], + "nudge_per_layer": [ + -0.4892617166042328, + -0.43737056851387024, + -0.36532458662986755, + -0.27772778272628784, + -0.1931857019662857, + -0.12626537680625916, + -0.08131371438503265, + -0.05406741425395012 + ] + }, + "dfa": { + "test_acc": 0.6545, + "mean_bp_cosine": 0.07594231329858303, + "mean_rho": 0.08383850008249283, + "mean_nudge_001": -0.00040534641811973415, + "mean_nudge_003": -0.0011938292009290308, + "mean_nudge_01": -0.0038653643568977714, + "bp_cosine_per_layer": [ + 0.025392260402441025, + 0.05978121981024742, + 0.09360896795988083, + 0.06215091794729233, + 0.08870920538902283, + 0.07948237657546997, + 0.10833052545785904, + 0.0900830328464508 + ], + "rho_per_layer": [ + -0.015408031642436981, + 0.08876338601112366, + 0.15722069144248962, + 0.07516318559646606, + 0.12132002413272858, + 0.08764688670635223, + 0.0905974954366684, + 0.06540436297655106 + ], + "nudge_per_layer": [ + -0.002068763133138418, + -0.004839141853153706, + -0.004507332108914852, + -0.002498403424397111, + -0.004324691370129585, + -0.004049480427056551, + -0.004787375684827566, + -0.0038477268535643816 + ] + }, + "state_bridge": { + "test_acc": 0.6315, + "mean_bp_cosine": 0.22162932250648737, + "mean_rho": 0.200162704102695, + "mean_nudge_001": -0.002804466668749228, + "mean_nudge_003": -0.008329451040481217, + "mean_nudge_01": -0.026790971111040562, + "bp_cosine_per_layer": [ + 0.6046093106269836, + 0.3773959279060364, + 0.1675240397453308, + 0.13364183902740479, + 0.12548640370368958, + 0.11966440826654434, + 0.11708953976631165, + 0.12762311100959778 + ], + "rho_per_layer": [ + 0.5598001480102539, + 0.35775649547576904, + 0.14680343866348267, + 0.103827565908432, + 0.12472978234291077, + 0.08794894069433212, + 0.12868158519268036, + 0.09175367653369904 + ], + "nudge_per_layer": [ + -0.17137765884399414, + -0.018192056566476822, + -0.005168645642697811, + -0.004143164958804846, + -0.0039602769538760185, + -0.0037884372286498547, + -0.003734107594937086, + -0.00396342109888792 + ], + "state_pred_error_per_layer": [ + 11751.603515625, + 2306.73095703125, + 1321.091796875, + 1033.674560546875, + 973.6993408203125, + 865.9056396484375, + 869.378173828125, + 839.1387329101562 + ], + "mean_state_pred_error": 2495.1528396606445 + }, + "credit_bridge": { + "test_acc": 0.5275, + "mean_bp_cosine": 0.33450845070183277, + "mean_rho": 0.39851769525557756, + "mean_nudge_001": -0.0025428086810279638, + "mean_nudge_003": -0.007617499912157655, + "mean_nudge_01": -0.025270385667681694, + "bp_cosine_per_layer": [ + 0.1268395036458969, + 0.30569249391555786, + 0.34143707156181335, + 0.3805205225944519, + 0.3833070397377014, + 0.38344305753707886, + 0.3742453455924988, + 0.3805825710296631 + ], + "rho_per_layer": [ + 0.10492167621850967, + 0.4008791148662567, + 0.42003583908081055, + 0.4331238567829132, + 0.4291571080684662, + 0.4853004217147827, + 0.4488537311553955, + 0.46586981415748596 + ], + "nudge_per_layer": [ + -0.02585173025727272, + -0.023091215640306473, + -0.0244273878633976, + -0.026221776381134987, + -0.026039035990834236, + -0.025849176570773125, + -0.025189466774463654, + -0.02549329586327076 + ], + "final_value_loss": 0.41436073665618894, + "final_term_loss": 0.08663651337623596, + "final_bridge_loss": 0.013127461233735085, + "final_tgrad_loss": 0.3145967625617981 + } + }, + "a1.0_L12_s42": { + "bp": { + "test_acc": 0.761, + "mean_bp_cosine": 0.8604618857304255, + "mean_rho": 0.9999715387821198, + "mean_nudge_001": -0.027060116563613217, + "mean_nudge_003": -0.07916912420963247, + "mean_nudge_01": -0.2410698818663756, + "bp_cosine_per_layer": [ + 0.9098777174949646, + 0.9046642780303955, + 0.8960509300231934, + 0.8827707171440125, + 0.8719829320907593, + 0.8605888485908508, + 0.8495617508888245, + 0.8414114117622375, + 0.8343594074249268, + 0.8291183114051819, + 0.8250235915184021, + 0.8201327323913574 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999990463256836, + 0.9999988675117493, + 0.9999977946281433, + 0.9999968409538269, + 0.9999942779541016, + 0.9999903440475464, + 0.9999786615371704, + 0.9999630451202393, + 0.9999446272850037, + 0.9999108910560608, + 0.9998850226402283 + ], + "nudge_per_layer": [ + -0.6227189302444458, + -0.5321269631385803, + -0.43762683868408203, + -0.34503036737442017, + -0.26150017976760864, + -0.1957385241985321, + -0.14543747901916504, + -0.10888919234275818, + -0.08308196067810059, + -0.06497863680124283, + -0.05229911208152771, + -0.043410398066043854 + ] + }, + "dfa": { + "test_acc": 0.6555, + "mean_bp_cosine": 0.07142843399196863, + "mean_rho": 0.08962296570340793, + "mean_nudge_001": -0.00027090053966579336, + "mean_nudge_003": -0.0007314661440129081, + "mean_nudge_01": -0.0026503523016193262, + "bp_cosine_per_layer": [ + 0.019931811839342117, + 0.08357247710227966, + 0.07596792280673981, + 0.07454836368560791, + 0.08405900746583939, + 0.09273561835289001, + 0.08532143384218216, + 0.014841631054878235, + 0.05702097713947296, + 0.11365848034620285, + 0.0635562390089035, + 0.09192724525928497 + ], + "rho_per_layer": [ + -0.021908380091190338, + 0.08644437789916992, + 0.133758544921875, + 0.11560394614934921, + 0.09019643068313599, + 0.10901004821062088, + 0.05401141196489334, + 0.06626297533512115, + 0.10668720304965973, + 0.11482831090688705, + 0.07995637506246567, + 0.14062434434890747 + ], + "nudge_per_layer": [ + 0.012093277648091316, + -0.00814887322485447, + -0.0036774289328604937, + -0.0036643892526626587, + -0.0034756590612232685, + -0.0045063551515340805, + -0.003735880134627223, + -0.00101565255317837, + -0.0033070247154682875, + -0.005390047561377287, + -0.0029281126335263252, + -0.004048082046210766 + ] + }, + "state_bridge": { + "test_acc": 0.612, + "mean_bp_cosine": 0.2312017778555552, + "mean_rho": 0.2218381396184365, + "mean_nudge_001": -0.0020883519706937173, + "mean_nudge_003": -0.0062129807386857765, + "mean_nudge_01": -0.02010280774751057, + "bp_cosine_per_layer": [ + 0.6137553453445435, + 0.458263099193573, + 0.30694735050201416, + 0.21984770894050598, + 0.18884725868701935, + 0.1519574671983719, + 0.14165323972702026, + 0.13691727817058563, + 0.1416233777999878, + 0.126474529504776, + 0.13544593751430511, + 0.15268874168395996 + ], + "rho_per_layer": [ + 0.5528259873390198, + 0.43722641468048096, + 0.3177984952926636, + 0.20145072042942047, + 0.17441785335540771, + 0.10548915714025497, + 0.16265320777893066, + 0.1351865828037262, + 0.16532285511493683, + 0.1285737156867981, + 0.14820542931556702, + 0.13290725648403168 + ], + "nudge_per_layer": [ + -0.16301177442073822, + -0.02157333306968212, + -0.011153988540172577, + -0.00765608623623848, + -0.006283854134380817, + -0.005166183691471815, + -0.0045799510553479195, + -0.004474613815546036, + -0.004547867923974991, + -0.003950329497456551, + -0.004098072648048401, + -0.004737637937068939 + ], + "state_pred_error_per_layer": [ + 9663.3720703125, + 2355.42919921875, + 1189.673095703125, + 946.2671508789062, + 890.0131225585938, + 836.83837890625, + 765.7700805664062, + 776.2135009765625, + 909.9769287109375, + 744.7386474609375, + 809.6233520507812, + 764.1907958984375 + ], + "mean_state_pred_error": 1721.0088602701824 + }, + "credit_bridge": { + "test_acc": 0.551, + "mean_bp_cosine": 0.24796992043654123, + "mean_rho": 0.34521655660743517, + "mean_nudge_001": -0.0019821600387028107, + "mean_nudge_003": -0.005940369796007872, + "mean_nudge_01": -0.01972930335129301, + "bp_cosine_per_layer": [ + 0.050826266407966614, + 0.1324397623538971, + 0.19395378232002258, + 0.22954219579696655, + 0.24835197627544403, + 0.26261672377586365, + 0.2866933345794678, + 0.3069983422756195, + 0.3148944675922394, + 0.31817084550857544, + 0.3155951499938965, + 0.31555619835853577 + ], + "rho_per_layer": [ + 0.024354537948966026, + 0.23902058601379395, + 0.29458120465278625, + 0.31519168615341187, + 0.3208061456680298, + 0.38384467363357544, + 0.38460177183151245, + 0.4478553831577301, + 0.41032421588897705, + 0.452781081199646, + 0.43433815240859985, + 0.434899240732193 + ], + "nudge_per_layer": [ + -0.018513288348913193, + -0.014132995158433914, + -0.016322217881679535, + -0.017585258930921555, + -0.018846090883016586, + -0.02027801051735878, + -0.021141095086932182, + -0.02164183184504509, + -0.02207053080201149, + -0.022233182564377785, + -0.02206714265048504, + -0.021919995546340942 + ], + "final_value_loss": 0.40481987361907956, + "final_term_loss": 0.14867231681346893, + "final_bridge_loss": 0.015895452450215817, + "final_tgrad_loss": 0.24025210301876068 + } + }, + "a1.0_L12_s123": { + "bp": { + "test_acc": 0.7615, + "mean_bp_cosine": 0.8364224582910538, + "mean_rho": 0.9999674806992213, + "mean_nudge_001": -0.021432781708426774, + "mean_nudge_003": -0.061891427962109447, + "mean_nudge_01": -0.18090539829184613, + "bp_cosine_per_layer": [ + 0.86488276720047, + 0.8622424006462097, + 0.8600971698760986, + 0.85722416639328, + 0.8523166179656982, + 0.8457985520362854, + 0.8359642028808594, + 0.828606367111206, + 0.8221874237060547, + 0.8125513792037964, + 0.80171799659729, + 0.7934804558753967 + ], + "rho_per_layer": [ + 0.9999992251396179, + 0.9999991655349731, + 0.9999990463256836, + 0.9999980330467224, + 0.9999971389770508, + 0.9999936819076538, + 0.9999881386756897, + 0.9999800324440002, + 0.9999632835388184, + 0.999937891960144, + 0.9999018311500549, + 0.9998522996902466 + ], + "nudge_per_layer": [ + -0.4491935074329376, + -0.38857996463775635, + -0.3270212411880493, + -0.26439201831817627, + -0.20410630106925964, + -0.15283547341823578, + -0.11351937055587769, + -0.08454076200723648, + -0.06403174996376038, + -0.04978282377123833, + -0.03986590355634689, + -0.032995663583278656 + ] + }, + "dfa": { + "test_acc": 0.6485, + "mean_bp_cosine": 0.05831230893575897, + "mean_rho": 0.0407225100013117, + "mean_nudge_001": -0.00021713114256272092, + "mean_nudge_003": -0.0006509826756276501, + "mean_nudge_01": -0.002172412224657213, + "bp_cosine_per_layer": [ + 0.003139778506010771, + 0.07545783370733261, + 0.07123857736587524, + 0.04737270250916481, + 0.07089244574308395, + 0.05843178555369377, + 0.10959646850824356, + 0.04730183631181717, + 0.05721074715256691, + 0.06935717165470123, + 0.04019004851579666, + 0.04955831170082092 + ], + "rho_per_layer": [ + -0.020620837807655334, + 0.0424807034432888, + 0.07906489074230194, + -0.014874707907438278, + 0.06078936904668808, + 0.006801994517445564, + 0.11016394942998886, + 0.07577681541442871, + 0.01940302737057209, + 0.0600065141916275, + 0.020656054839491844, + 0.04902234673500061 + ], + "nudge_per_layer": [ + 0.00014946935698390007, + -0.004455030895769596, + -0.0028790468350052834, + -0.0015581330517306924, + -0.0028997263871133327, + -0.0020245155319571495, + -0.003806713502854109, + -0.0014502943959087133, + -0.0017623959574848413, + -0.002352846320718527, + -0.001400630921125412, + -0.001629082253202796 + ] + }, + "state_bridge": { + "test_acc": 0.6055, + "mean_bp_cosine": 0.23132580270369849, + "mean_rho": 0.21027085681756338, + "mean_nudge_001": -0.002061755420678916, + "mean_nudge_003": -0.006128282761589314, + "mean_nudge_01": -0.019752548774704337, + "bp_cosine_per_layer": [ + 0.5538393259048462, + 0.4287089705467224, + 0.25277969241142273, + 0.2402075231075287, + 0.180599182844162, + 0.15653815865516663, + 0.1736883521080017, + 0.18825414776802063, + 0.1335570216178894, + 0.13271775841712952, + 0.15632027387619019, + 0.17869922518730164 + ], + "rho_per_layer": [ + 0.4586557149887085, + 0.4002187252044678, + 0.23149724304676056, + 0.21227607131004333, + 0.1842716634273529, + 0.16792945563793182, + 0.21390791237354279, + 0.19318881630897522, + 0.08300350606441498, + 0.10752588510513306, + 0.12254554033279419, + 0.14822974801063538 + ], + "nudge_per_layer": [ + -0.16128812730312347, + -0.02071414887905121, + -0.008381091989576817, + -0.007560182362794876, + -0.005691731348633766, + -0.0046913521364331245, + -0.005232630763202906, + -0.0054755983874201775, + -0.0038832086138427258, + -0.004123975522816181, + -0.004747895523905754, + -0.005240642465651035 + ], + "state_pred_error_per_layer": [ + 8762.341796875, + 2348.0966796875, + 1278.38525390625, + 1081.769287109375, + 948.214599609375, + 985.5714111328125, + 775.6072387695312, + 713.37109375, + 927.2667846679688, + 1123.047119140625, + 1035.65966796875, + 864.7014770507812 + ], + "mean_state_pred_error": 1737.002700805664 + }, + "credit_bridge": { + "test_acc": 0.4905, + "mean_bp_cosine": 0.14494075424348316, + "mean_rho": 0.18026241473853588, + "mean_nudge_001": -0.0010125784683623351, + "mean_nudge_003": -0.003034341447346378, + "mean_nudge_01": -0.010073745266709011, + "bp_cosine_per_layer": [ + 0.0054779257625341415, + 0.004163481295108795, + -0.01823507994413376, + 0.06908583641052246, + 0.09582538902759552, + 0.15172168612480164, + 0.18814444541931152, + 0.21233659982681274, + 0.2397850900888443, + 0.26321661472320557, + 0.2640886902809143, + 0.2636783719062805 + ], + "rho_per_layer": [ + 0.05151631310582161, + 0.03990761935710907, + 0.02668120339512825, + 0.08933386206626892, + 0.12927217781543732, + 0.1893344521522522, + 0.20202970504760742, + 0.27141058444976807, + 0.2724490761756897, + 0.2844354808330536, + 0.2797800898551941, + 0.32699841260910034 + ], + "nudge_per_layer": [ + -0.0015225817915052176, + -0.0009501088643446565, + 0.00033305209944956005, + -0.005592360161244869, + -0.00755771528929472, + -0.010863769799470901, + -0.012987833470106125, + -0.014405487105250359, + -0.015937766060233116, + -0.017140284180641174, + -0.017137283459305763, + -0.01712280511856079 + ], + "final_value_loss": 0.42473253202438355, + "final_term_loss": 0.10016471980810165, + "final_bridge_loss": 0.011516085395216941, + "final_tgrad_loss": 0.3130517265796661 + } + }, + "a1.0_L12_s456": { + "bp": { + "test_acc": 0.762, + "mean_bp_cosine": 0.8058839539686838, + "mean_rho": 0.999967540303866, + "mean_nudge_001": -0.023895990879585344, + "mean_nudge_003": -0.06970183023562034, + "mean_nudge_01": -0.21104640668878952, + "bp_cosine_per_layer": [ + 0.8338037729263306, + 0.8328856229782104, + 0.8300410509109497, + 0.823561429977417, + 0.8153207302093506, + 0.8093391060829163, + 0.8022103309631348, + 0.797042727470398, + 0.7909072041511536, + 0.7847579121589661, + 0.7778322100639343, + 0.7729053497314453 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.999998927116394, + 0.9999983906745911, + 0.9999978542327881, + 0.999996542930603, + 0.9999936819076538, + 0.9999876022338867, + 0.9999791383743286, + 0.9999581575393677, + 0.9999358057975769, + 0.9998983144760132, + 0.9998669624328613 + ], + "nudge_per_layer": [ + -0.5344969034194946, + -0.45930254459381104, + -0.3820700943470001, + -0.30436116456985474, + -0.2331882268190384, + -0.17455099523067474, + -0.12991222739219666, + -0.09728521853685379, + -0.07412658631801605, + -0.05795694515109062, + -0.04662308096885681, + -0.03868289291858673 + ] + }, + "dfa": { + "test_acc": 0.6705, + "mean_bp_cosine": 0.07614415294180314, + "mean_rho": 0.07346192157516877, + "mean_nudge_001": -0.0004569464314651365, + "mean_nudge_003": -0.0013685211645982538, + "mean_nudge_01": -0.004532526101684198, + "bp_cosine_per_layer": [ + 0.04563574492931366, + 0.07466404139995575, + 0.07062304764986038, + 0.07941032946109772, + 0.08478259295225143, + 0.1176375150680542, + 0.051365386694669724, + 0.07094398140907288, + 0.06898803263902664, + 0.07310269773006439, + 0.0635182335972786, + 0.11305823177099228 + ], + "rho_per_layer": [ + 0.026268895715475082, + 0.03733495995402336, + 0.07775422930717468, + 0.12396883964538574, + 0.05687103420495987, + 0.13703036308288574, + -0.0030320845544338226, + 0.08171480149030685, + 0.06336408108472824, + 0.09909991919994354, + 0.06059148907661438, + 0.12057653069496155 + ], + "nudge_per_layer": [ + -0.015672076493501663, + -0.0053095086477696896, + -0.0031822575256228447, + -0.003722358262166381, + -0.0036155935376882553, + -0.004913205746561289, + -0.0017889357404783368, + -0.002959918463602662, + -0.003063073381781578, + -0.003171245101839304, + -0.0024787387810647488, + -0.004513401538133621 + ] + }, + "state_bridge": { + "test_acc": 0.6015, + "mean_bp_cosine": 0.1852269663165013, + "mean_rho": 0.18596469921370348, + "mean_nudge_001": -0.001999816272776419, + "mean_nudge_003": -0.005956100358162075, + "mean_nudge_01": -0.01933680862809221, + "bp_cosine_per_layer": [ + 0.5561584234237671, + 0.39794063568115234, + 0.20452159643173218, + 0.14641982316970825, + 0.11315252631902695, + 0.12314423173666, + 0.11100500077009201, + 0.11256138980388641, + 0.12550771236419678, + 0.11898934841156006, + 0.11000233888626099, + 0.10332056879997253 + ], + "rho_per_layer": [ + 0.4663659632205963, + 0.38622361421585083, + 0.20298895239830017, + 0.1521472930908203, + 0.10572830587625504, + 0.14532539248466492, + 0.1235864907503128, + 0.12295880913734436, + 0.1263602077960968, + 0.1123446375131607, + 0.14707674086093903, + 0.1404699832201004 + ], + "nudge_per_layer": [ + -0.16852372884750366, + -0.020911922678351402, + -0.007518916856497526, + -0.005010381806641817, + -0.0037449360825121403, + -0.004001074004918337, + -0.0037657374050468206, + -0.0037060989998281, + -0.00406123511493206, + -0.003861584234982729, + -0.0035726726055145264, + -0.0033634149003773928 + ], + "state_pred_error_per_layer": [ + 16351.89453125, + 3139.08837890625, + 1824.6005859375, + 1391.949462890625, + 1295.1900634765625, + 1149.4605712890625, + 981.4422607421875, + 921.3729248046875, + 954.6389770507812, + 1032.970703125, + 1065.58984375, + 1272.3818359375 + ], + "mean_state_pred_error": 2615.048344930013 + }, + "credit_bridge": { + "test_acc": 0.5585, + "mean_bp_cosine": 0.3251700059821208, + "mean_rho": 0.4226210874815782, + "mean_nudge_001": -0.0023732566623948514, + "mean_nudge_003": -0.007109481530884902, + "mean_nudge_01": -0.02357900080581506, + "bp_cosine_per_layer": [ + 0.05994441360235214, + 0.19127817451953888, + 0.25874069333076477, + 0.31905949115753174, + 0.31442493200302124, + 0.3214789927005768, + 0.368133008480072, + 0.38988351821899414, + 0.4050426781177521, + 0.416469931602478, + 0.4253390431404114, + 0.4322451949119568 + ], + "rho_per_layer": [ + 0.1191493421792984, + 0.31643322110176086, + 0.4170604646205902, + 0.42330044507980347, + 0.4319503903388977, + 0.42732322216033936, + 0.46659332513809204, + 0.487338662147522, + 0.496512234210968, + 0.4787842035293579, + 0.5010949969291687, + 0.5059125423431396 + ], + "nudge_per_layer": [ + -0.015865826979279518, + -0.018151750788092613, + -0.021288521587848663, + -0.02352731302380562, + -0.023306310176849365, + -0.02329857647418976, + -0.025182321667671204, + -0.025520823895931244, + -0.026067661121487617, + -0.026535863056778908, + -0.027021951973438263, + -0.02718108892440796 + ], + "final_value_loss": 0.3557061047077179, + "final_term_loss": 0.06590610226392746, + "final_bridge_loss": 0.010093027733266353, + "final_tgrad_loss": 0.2797069767475128 + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L12_s123.json b/results/synth_ladder_v2_hi/synth_a0.5_L12_s123.json new file mode 100644 index 0000000..5ae584b --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L12_s123.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0668871035575866, + 0.5437644843578339, + 0.4442927023410797, + 0.40189131622314456, + 0.41018874361515045, + 0.3410574321269989, + 0.3484022264003754, + 0.3299962274551392, + 0.3777468213558197, + 0.320639072227478, + 0.3502114427804947, + 0.2625524127006531, + 0.31084647080898287, + 0.23638844475746154, + 0.23954274733066558, + 0.21965548858642578, + 0.23137761989831923, + 0.2215217474937439, + 0.21972281413078307, + 0.2046865596175194, + 0.17405090971589088, + 0.16184886281490327, + 0.19982717757225035, + 0.21438712718486785, + 0.18986032649278642, + 0.16079453411102296, + 0.12543020910024644, + 0.10698981108665466, + 0.1377583697795868, + 0.15657683781385423, + 0.11835481392145157, + 0.11930964469909668, + 0.1372688979268074, + 0.10084772405028343, + 0.08756917915344238, + 0.09215591390132905, + 0.10565964897871018, + 0.08364779654145241, + 0.06760566492080688, + 0.06659261006116866, + 0.05321097924113274, + 0.04292736679315567, + 0.038505215954780576, + 0.04860781878978014, + 0.03835035711228847, + 0.03284513468891382, + 0.02925829759836197, + 0.034927824586629866, + 0.02977181176543236, + 0.02587605638951063, + 0.021584136448800563, + 0.021009254217147826, + 0.035822143226861954, + 0.02755334359407425, + 0.022640997081622483, + 0.01857010641694069, + 0.016963605327904224, + 0.016223060864210128, + 0.015676903715729714, + 0.014825385958701372, + 0.014110816264152526, + 0.014133429580926895, + 0.013563485038280487, + 0.01332942191362381, + 0.012876193167269229, + 0.012466417776048183, + 0.012171600410342216, + 0.012017940378189087, + 0.011746616941690446, + 0.011764343333244325, + 0.011572992166876793, + 0.011454691462218761, + 0.011281873452663422, + 0.011190583446621894, + 0.011105955013632774, + 0.011065145464241505, + 0.011014660102501512, + 0.01097581763714552, + 0.01095222277250141, + 0.01094091155230999 + ], + "train_acc": [ + 0.6115, + 0.7903, + 0.8251, + 0.8409, + 0.8391, + 0.8641, + 0.8593, + 0.8679, + 0.8542, + 0.8751, + 0.8637, + 0.8989, + 0.877, + 0.9065, + 0.9038, + 0.9146, + 0.9084, + 0.9142, + 0.914, + 0.921, + 0.9315, + 0.9368, + 0.9221, + 0.921, + 0.9307, + 0.938, + 0.9533, + 0.9631, + 0.9481, + 0.9406, + 0.9552, + 0.9537, + 0.9495, + 0.9637, + 0.97, + 0.9687, + 0.9622, + 0.9706, + 0.9784, + 0.9788, + 0.9861, + 0.9911, + 0.9939, + 0.9886, + 0.9935, + 0.9961, + 0.998, + 0.9944, + 0.9963, + 0.998, + 0.9992, + 0.9989, + 0.992, + 0.9963, + 0.998, + 0.9995, + 0.9996, + 0.9998, + 0.9998, + 0.9999, + 0.9998, + 1.0, + 0.9999, + 1.0, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.775, + 0.776, + 0.8255, + 0.8235, + 0.8115, + 0.836, + 0.838, + 0.838, + 0.837, + 0.8235, + 0.827, + 0.8475, + 0.8465, + 0.8435, + 0.841, + 0.856, + 0.847, + 0.8495, + 0.85, + 0.856, + 0.8575, + 0.857, + 0.854, + 0.8415, + 0.859, + 0.851, + 0.8635, + 0.865, + 0.8625, + 0.851, + 0.868, + 0.8505, + 0.8565, + 0.87, + 0.866, + 0.861, + 0.852, + 0.868, + 0.869, + 0.8655, + 0.8675, + 0.869, + 0.8685, + 0.8635, + 0.8705, + 0.8675, + 0.869, + 0.867, + 0.872, + 0.873, + 0.8705, + 0.8715, + 0.864, + 0.8715, + 0.872, + 0.871, + 0.878, + 0.8745, + 0.872, + 0.874, + 0.8735, + 0.8715, + 0.872, + 0.8715, + 0.8725, + 0.8735, + 0.873, + 0.872, + 0.872, + 0.873, + 0.8735, + 0.872, + 0.8725, + 0.872, + 0.872, + 0.873, + 0.8725, + 0.873, + 0.873, + 0.873 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8060421943664551, + 0.7944625616073608, + 0.776944637298584, + 0.7588614821434021, + 0.7418972849845886, + 0.7322722673416138, + 0.724165678024292, + 0.7197043299674988, + 0.7152823209762573, + 0.7119243144989014, + 0.709496021270752, + 0.7078304886817932 + ], + "perturbation_rho": [ + 0.9999996423721313, + 0.9999984502792358, + 0.9999962449073792, + 0.999989926815033, + 0.9999754428863525, + 0.9999579191207886, + 0.999927818775177, + 0.999887228012085, + 0.9998751878738403, + 0.9997915029525757, + 0.9997637867927551, + 0.9997560381889343 + ], + "nudging": { + "0.001": [ + -0.04387564957141876, + -0.026459218934178352, + -0.01598835177719593, + -0.009950939565896988, + -0.0065530999563634396, + -0.004664362408220768, + -0.003570194821804762, + -0.0028879866003990173, + -0.0024394416250288486, + -0.0021331091411411762, + -0.0019131104927510023, + -0.0017530664335936308 + ], + "0.003": [ + -0.12082510441541672, + -0.07548783719539642, + -0.04654107615351677, + -0.029300624504685402, + -0.01941942237317562, + -0.01387093961238861, + -0.010638581588864326, + -0.008616363629698753, + -0.007284482475370169, + -0.006373265758156776, + -0.005718273110687733, + -0.005241651087999344 + ], + "0.01": [ + -0.2872876822948456, + -0.20931334793567657, + -0.13937950134277344, + -0.09144100546836853, + -0.06199805811047554, + -0.04483566805720329, + -0.03463221341371536, + -0.02817366272211075, + -0.023888790979981422, + -0.02094285935163498, + -0.01881779544055462, + -0.01726764440536499 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.142750821685791, + 1.124327583885193, + 0.7785231340408325, + 0.6528371575355529, + 0.597726934146881, + 0.5598292840957642, + 0.5507024248838425, + 0.5393614018440247, + 0.5861102363586426, + 0.5633430314064026, + 0.5583740697860717, + 0.5919369807243348, + 0.6456176485061645, + 0.557507578754425, + 0.6100466576099396, + 0.5981708965301513, + 0.6966950350761414, + 0.6483181215286254, + 0.6949886666774749, + 0.7073626656532288, + 0.7537654346466064, + 0.84040883102417, + 0.6919007718086243, + 0.7978002725124359, + 0.7179612370491028, + 0.799304240322113, + 0.8661868356734514, + 0.6795031730651856, + 0.6878745692253113, + 0.6902590084075928, + 0.8633141542434692, + 0.7126479680061341, + 0.7912728582382202, + 0.8799988972187043, + 0.8774635292053222, + 0.7583431783676148, + 0.7759649380683898, + 0.6964675615310669, + 0.7451448738098144, + 0.9347431049585342, + 0.6569768931627273, + 0.6217489993751049, + 0.6617763934135437, + 0.763850627553463, + 0.7051671092033386, + 0.6679003673553466, + 0.6873064106941223, + 0.721931100845337, + 0.7477014111042023, + 0.6456629550933838, + 0.6599196642875671, + 0.6208732713699341, + 0.6234532192230224, + 0.5699338432312012, + 0.6139316390037537, + 0.5759364881515503, + 0.5688060250282287, + 0.5778871156692504, + 0.5713616683959961, + 0.5509775221824647, + 0.5339077308654785, + 0.5171661471366882, + 0.5024198468208313, + 0.5114490198850632, + 0.4912056381225586, + 0.49547468848228454, + 0.4774726238250732, + 0.4827991735935211, + 0.47101506519317626, + 0.47335759959220886, + 0.47204044761657715, + 0.46472445521354677, + 0.4678656229496002, + 0.4620117915153503, + 0.45770361523628234, + 0.45486976613998414, + 0.4546703920841217, + 0.4531755482196808, + 0.4513186443388462, + 0.4506361876010895 + ], + "train_acc": [ + 0.2264, + 0.5937, + 0.7105, + 0.7583, + 0.775, + 0.7885, + 0.7948, + 0.803, + 0.7889, + 0.7989, + 0.8026, + 0.7968, + 0.7883, + 0.8152, + 0.7994, + 0.8119, + 0.7968, + 0.8073, + 0.7994, + 0.7931, + 0.7927, + 0.7855, + 0.8066, + 0.7951, + 0.8074, + 0.7894, + 0.7862, + 0.8163, + 0.8118, + 0.8146, + 0.7906, + 0.8097, + 0.8035, + 0.7874, + 0.7907, + 0.8091, + 0.8032, + 0.8171, + 0.8057, + 0.784, + 0.8211, + 0.8244, + 0.8214, + 0.8004, + 0.8099, + 0.8165, + 0.8113, + 0.8098, + 0.8046, + 0.8138, + 0.8158, + 0.8238, + 0.8252, + 0.8327, + 0.8298, + 0.8294, + 0.8263, + 0.8262, + 0.8303, + 0.8366, + 0.8356, + 0.842, + 0.8421, + 0.8435, + 0.8451, + 0.8433, + 0.8497, + 0.8496, + 0.8532, + 0.851, + 0.8511, + 0.8527, + 0.8529, + 0.8519, + 0.8545, + 0.854, + 0.8556, + 0.8556, + 0.8555, + 0.8553 + ], + "test_acc": [ + 0.4685, + 0.6425, + 0.7055, + 0.723, + 0.755, + 0.755, + 0.7485, + 0.71, + 0.734, + 0.746, + 0.706, + 0.685, + 0.7565, + 0.7435, + 0.7425, + 0.7695, + 0.7395, + 0.74, + 0.7145, + 0.696, + 0.7095, + 0.694, + 0.6885, + 0.7055, + 0.7615, + 0.7, + 0.7625, + 0.751, + 0.7555, + 0.7025, + 0.7275, + 0.757, + 0.6975, + 0.683, + 0.7535, + 0.721, + 0.7555, + 0.7335, + 0.7275, + 0.7405, + 0.7865, + 0.746, + 0.724, + 0.731, + 0.7445, + 0.7255, + 0.7325, + 0.723, + 0.772, + 0.752, + 0.7665, + 0.785, + 0.7755, + 0.7705, + 0.76, + 0.7715, + 0.7895, + 0.777, + 0.767, + 0.7965, + 0.7835, + 0.7975, + 0.7865, + 0.786, + 0.796, + 0.801, + 0.7965, + 0.791, + 0.7925, + 0.791, + 0.786, + 0.7975, + 0.7935, + 0.7895, + 0.796, + 0.7965, + 0.798, + 0.796, + 0.797, + 0.7975 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.004078918602317572, + 0.1059243381023407, + 0.07574640959501266, + 0.07308551669120789, + 0.066571444272995, + 0.056897446513175964, + 0.12165610492229462, + 0.06462406367063522, + 0.04925639182329178, + 0.04602370783686638, + 0.035759277641773224, + 0.06015833467245102 + ], + "perturbation_rho": [ + -0.011486321687698364, + 0.04376016557216644, + 0.037421341985464096, + 0.05220063030719757, + 0.09364941716194153, + -0.03169674053788185, + 0.15961039066314697, + 0.10634914040565491, + 0.03384825587272644, + 0.02390148863196373, + -0.010392685420811176, + 0.00882963091135025 + ], + "nudging": { + "0.001": [ + -0.0003049457154702395, + -0.0003453067038208246, + -0.00019223694107495248, + -0.00020254506671335548, + -0.00016044230142142624, + -0.00010334418038837612, + -0.00029247987549751997, + -0.00015202155918814242, + -9.743614646140486e-05, + -0.00010192080662818626, + -8.19721317384392e-05, + -0.0001297243870794773 + ], + "0.003": [ + -0.0008906631264835596, + -0.0010361261665821075, + -0.0005767023540101945, + -0.0006089159287512302, + -0.0004821037291549146, + -0.00030989840161055326, + -0.0008778797928243876, + -0.00045706197852268815, + -0.0002917651436291635, + -0.0003039806033484638, + -0.0002444116398692131, + -0.00038952555041760206 + ], + "0.01": [ + -0.0026711553800851107, + -0.003443576628342271, + -0.001918894238770008, + -0.0020233127288520336, + -0.0016027885721996427, + -0.0010300527792423964, + -0.002917288802564144, + -0.001525502186268568, + -0.0009703689720481634, + -0.0010098961647599936, + -0.0008095581433735788, + -0.0012933723628520966 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7463860042572021, + 1.1237696697235107, + 0.972771835899353, + 0.9426122094154358, + 0.8994912829399109, + 0.9408926801681519, + 0.9865427770614624, + 1.0485262629508971, + 1.0925080902099609, + 1.1362103001594543, + 1.0678862438201904, + 1.0652718430519104, + 1.0586652740478515, + 1.0178926465988158, + 1.0305222831726075, + 1.0413858165740968, + 1.0357634119033814, + 1.047720281791687, + 1.0609775308609009, + 1.0116510014533997, + 0.9950579191207886, + 0.9199824966430664, + 0.9665196490287781, + 0.9476463966369629, + 1.0014626719474793, + 0.9582755434036255, + 1.010899329662323, + 1.0397068269729615, + 1.0328380886077881, + 1.043629725265503, + 0.9458726802825927, + 0.9873936015129089, + 1.0067718154907226, + 0.9733795068740845, + 0.9494395099639893, + 0.9087101627349854, + 0.9260237079620361, + 0.9596985802650452, + 0.8670240854263306, + 0.9266280819892884, + 0.9033067417144776, + 0.8523105756759644, + 0.8422792108535767, + 0.8166048532485962, + 0.8156945413589477, + 0.8301033269882202, + 0.8141396549224853, + 0.8390941219329834, + 0.8281017392158508, + 0.8349929582595825, + 0.8482530313491822, + 0.8541515255928039, + 0.842770311498642, + 0.8406181728363037, + 0.8218491198539734, + 0.8218080397605896, + 0.8124953329086304, + 0.7943122324943542, + 0.7955346862792969, + 0.7875666446685791, + 0.7818890949249268, + 0.7744473322868347, + 0.7751531169891357, + 0.7724810953140259, + 0.7624368892669677, + 0.7628077686309814, + 0.7549171347618103, + 0.755369038105011, + 0.7542786574363709, + 0.7511461977005005, + 0.7510316205978393, + 0.7489814598083496, + 0.7467557451248169, + 0.7460188133239746, + 0.7445521638870239, + 0.7435068511009216, + 0.7426531793594361, + 0.7419929014205933, + 0.7417299631118774, + 0.7414803896903992 + ], + "train_acc": [ + 0.3799, + 0.5937, + 0.6617, + 0.6768, + 0.6897, + 0.6834, + 0.6646, + 0.6466, + 0.6432, + 0.6355, + 0.643, + 0.6389, + 0.6358, + 0.6479, + 0.6424, + 0.641, + 0.6359, + 0.6327, + 0.632, + 0.6475, + 0.6546, + 0.6719, + 0.6631, + 0.6691, + 0.6638, + 0.6735, + 0.6655, + 0.6522, + 0.6519, + 0.6562, + 0.6804, + 0.6703, + 0.6634, + 0.6783, + 0.6836, + 0.6906, + 0.6856, + 0.685, + 0.7038, + 0.693, + 0.6972, + 0.7082, + 0.7133, + 0.7162, + 0.7181, + 0.7105, + 0.7131, + 0.7086, + 0.7153, + 0.7128, + 0.7104, + 0.7091, + 0.7102, + 0.7122, + 0.7194, + 0.719, + 0.7198, + 0.7235, + 0.7189, + 0.7262, + 0.7256, + 0.7258, + 0.7319, + 0.7268, + 0.7345, + 0.7312, + 0.7347, + 0.7352, + 0.7339, + 0.736, + 0.7356, + 0.736, + 0.7385, + 0.7368, + 0.7372, + 0.7371, + 0.737, + 0.7382, + 0.738, + 0.7379 + ], + "test_acc": [ + 0.5265, + 0.6085, + 0.6455, + 0.635, + 0.656, + 0.616, + 0.6215, + 0.608, + 0.5975, + 0.6135, + 0.605, + 0.6015, + 0.5845, + 0.5955, + 0.601, + 0.6115, + 0.619, + 0.6165, + 0.609, + 0.626, + 0.6445, + 0.632, + 0.6355, + 0.6185, + 0.6355, + 0.602, + 0.614, + 0.6335, + 0.618, + 0.628, + 0.634, + 0.642, + 0.607, + 0.6585, + 0.6435, + 0.6575, + 0.608, + 0.654, + 0.6625, + 0.652, + 0.681, + 0.6795, + 0.6775, + 0.685, + 0.6635, + 0.6925, + 0.665, + 0.6675, + 0.663, + 0.6625, + 0.6655, + 0.6675, + 0.6725, + 0.674, + 0.684, + 0.685, + 0.6875, + 0.685, + 0.693, + 0.686, + 0.688, + 0.683, + 0.6925, + 0.679, + 0.6815, + 0.6875, + 0.69, + 0.6855, + 0.683, + 0.6885, + 0.6895, + 0.6905, + 0.6875, + 0.689, + 0.6915, + 0.692, + 0.6925, + 0.6915, + 0.6905, + 0.69 + ], + "state_pred_error": [ + 0.657575396156311, + 0.22584220933914184, + 0.18108190598487853, + 0.1738492854833603, + 0.1768016979932785, + 0.17527156100273134, + 0.1744111572265625, + 0.18089782931804657, + 0.1815103266239166, + 0.17203099308013917, + 0.16158259053230287, + 0.150070090007782, + 0.14713554129600526, + 0.1392310976266861, + 0.13433781069517137, + 0.12369427697658539, + 0.11368098001480102, + 0.10957575480937957, + 0.10401724026203156, + 0.097935398042202, + 0.09728261232376098, + 0.09723384432792663, + 0.08889269602298737, + 0.08045474321842194, + 0.0764869434595108, + 0.0754717215538025, + 0.07573794380426407, + 0.07702496689558029, + 0.07481489708423615, + 0.06833497145175933, + 0.06267784029245377, + 0.05740301186442375, + 0.05463098112940788, + 0.05097537848949432, + 0.04853306106328964, + 0.046815031588077545, + 0.04702129671573639, + 0.047897269797325136, + 0.04525828623175621, + 0.04126551170349121, + 0.038078772968053815, + 0.035508244448900224, + 0.033928532779216765, + 0.033214526349306106, + 0.032263154244422915, + 0.03165398389697075, + 0.03176654878854752, + 0.032726337200403216, + 0.03520564076304436, + 0.03746888961195946, + 0.039616973650455474, + 0.040450227236747745, + 0.03974002408981323, + 0.03915794268846512, + 0.038212089216709134, + 0.03644757592380047, + 0.034951094454526904, + 0.033642032438516614, + 0.032086009567976, + 0.031101924151182174, + 0.030201471465826035, + 0.029204100465774537, + 0.02867460669875145, + 0.027740669012069702, + 0.027074356430768966, + 0.026351269084215163, + 0.02568203446865082, + 0.024844326972961427, + 0.024070368832349778, + 0.023772034823894502, + 0.023003196692466737, + 0.02215852342545986, + 0.02170176804959774, + 0.021068523544073105, + 0.020733746546506882, + 0.020220248556137084, + 0.019796535715460778, + 0.019584159588813783, + 0.019099098661541938, + 0.018604568365216255 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7613614797592163, + 0.3896995782852173, + 0.1309610903263092, + 0.10979019105434418, + 0.09164053201675415, + 0.07316795736551285, + 0.09407100081443787, + 0.08964815735816956, + 0.08292470127344131, + 0.08648289740085602, + 0.0870373547077179, + 0.08205951005220413 + ], + "perturbation_rho": [ + 0.6734859943389893, + 0.37621644139289856, + 0.08932416141033173, + 0.11710754036903381, + 0.07942430675029755, + 0.058268360793590546, + 0.05698401480913162, + 0.12727776169776917, + 0.03869014233350754, + 0.06775026768445969, + 0.0798446387052536, + 0.05710796266794205 + ], + "nudging": { + "0.001": [ + -0.02036258764564991, + -0.0012726839631795883, + -0.00030185317154973745, + -0.00024410546757280827, + -0.00020778426551260054, + -0.00017662602476775646, + -0.00021787048899568617, + -0.00021810311591252685, + -0.00019943300867453218, + -0.00021332810865715146, + -0.0002083198050968349, + -0.00020046724239364266 + ], + "0.003": [ + -0.05963846668601036, + -0.0038126767612993717, + -0.0009049437940120697, + -0.000732341140974313, + -0.0006232722080312669, + -0.0005303305806592107, + -0.0006538627203553915, + -0.0006539188325405121, + -0.0005980591522529721, + -0.0006397926481440663, + -0.0006250399746932089, + -0.000601528212428093 + ], + "0.01": [ + -0.1828688532114029, + -0.012644743546843529, + -0.003011793363839388, + -0.0024378912057727575, + -0.0020753229036927223, + -0.0017659795703366399, + -0.0021767604630440474, + -0.0021774054039269686, + -0.0019914493896067142, + -0.0021301559172570705, + -0.0020812181755900383, + -0.0020023814868181944 + ] + }, + "state_pred_error_per_layer": [ + 12496.853515625, + 8106.66162109375, + 5059.9169921875, + 4050.405517578125, + 3454.0888671875, + 2936.005859375, + 2830.2294921875, + 2863.870361328125, + 3118.476806640625, + 3786.361083984375, + 3251.337890625, + 3255.708740234375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1431375211715697, + 1.1314113176345826, + 0.763494457435608, + 0.6545422078132629, + 0.5963865146636963, + 0.5926999958992004, + 0.5563723385810853, + 0.5273848016023636, + 0.526389640045166, + 0.5737923973083496, + 0.6184886278152466, + 0.540420817565918, + 0.6509309328079224, + 0.6382177831172943, + 0.7038152565479279, + 0.6197104157209397, + 0.6280380012512207, + 0.7637808742523193, + 0.7737348519325257, + 0.9252185022354126, + 0.8572391531944275, + 0.8700120922088623, + 0.9276481540679932, + 0.9125369520187377, + 0.9172161891937256, + 0.8759773926734924, + 0.9195978992462158, + 0.9266179433822632, + 0.9306347612380982, + 0.9355648864746093, + 1.1860807178497315, + 1.2574410260200501, + 0.9577581795692444, + 0.9231017108917237, + 0.9289527448654175, + 1.1865424547195436, + 1.267508578491211, + 1.2051992826461793, + 1.0714506145477294, + 1.0610662315368653, + 1.08882954788208, + 1.1172235593795776, + 1.0685178228378296, + 1.072965350151062, + 1.0879979553222656, + 1.091849722290039, + 1.0951012313842774, + 1.1118889781951904, + 1.1178365121841431, + 1.1614880767822267, + 1.1315129627227782, + 1.1100497497558595, + 1.0586509960174562, + 1.0336646169662476, + 0.9826500085830688, + 0.9442742486953736, + 0.9249188864707947, + 0.9147214357376099, + 0.9175932567596435, + 0.902301881980896, + 0.9019629783630371, + 0.9227725395202637, + 0.9098626622200012, + 0.9148895687103271, + 0.9403810447692871, + 0.9147419730186462, + 0.9180494606018066, + 0.9268005172729492, + 0.9152821050643921, + 0.9107012414932251, + 0.9089200870513916, + 0.9040866283416749, + 0.9004606851577759, + 0.8984116611480712, + 0.8967930128097534, + 0.8934282851934433, + 0.8917015773773194, + 0.8904676536560059, + 0.889515599822998, + 0.8890901028633118 + ], + "train_acc": [ + 0.2244, + 0.5835, + 0.7155, + 0.7573, + 0.78, + 0.7817, + 0.7882, + 0.8049, + 0.805, + 0.798, + 0.7902, + 0.811, + 0.7863, + 0.796, + 0.7855, + 0.8072, + 0.8079, + 0.7868, + 0.7864, + 0.7652, + 0.7689, + 0.7653, + 0.7554, + 0.7566, + 0.7448, + 0.7535, + 0.7354, + 0.7394, + 0.7249, + 0.7259, + 0.6872, + 0.6905, + 0.7291, + 0.7244, + 0.7165, + 0.6711, + 0.6454, + 0.6564, + 0.6834, + 0.6735, + 0.6685, + 0.6727, + 0.6801, + 0.6826, + 0.6789, + 0.6825, + 0.6789, + 0.6757, + 0.6757, + 0.6735, + 0.6784, + 0.6749, + 0.6853, + 0.6856, + 0.6876, + 0.694, + 0.699, + 0.6992, + 0.6983, + 0.6973, + 0.702, + 0.6927, + 0.695, + 0.6934, + 0.6853, + 0.695, + 0.6897, + 0.6934, + 0.6927, + 0.6948, + 0.693, + 0.695, + 0.6974, + 0.6947, + 0.6957, + 0.6963, + 0.6997, + 0.6972, + 0.698, + 0.6986 + ], + "test_acc": [ + 0.4745, + 0.6585, + 0.71, + 0.7365, + 0.713, + 0.7385, + 0.7485, + 0.7465, + 0.7115, + 0.7135, + 0.755, + 0.718, + 0.7445, + 0.705, + 0.7395, + 0.739, + 0.696, + 0.739, + 0.7015, + 0.654, + 0.693, + 0.6895, + 0.6715, + 0.696, + 0.6895, + 0.641, + 0.642, + 0.6835, + 0.6535, + 0.677, + 0.634, + 0.6605, + 0.67, + 0.651, + 0.579, + 0.5805, + 0.57, + 0.61, + 0.5835, + 0.612, + 0.5455, + 0.639, + 0.612, + 0.6275, + 0.6515, + 0.6425, + 0.6285, + 0.651, + 0.6015, + 0.647, + 0.619, + 0.6465, + 0.6315, + 0.651, + 0.6475, + 0.6345, + 0.655, + 0.649, + 0.65, + 0.653, + 0.652, + 0.6555, + 0.6455, + 0.651, + 0.6585, + 0.6535, + 0.6575, + 0.65, + 0.6545, + 0.659, + 0.6545, + 0.65, + 0.6545, + 0.6585, + 0.653, + 0.6555, + 0.6515, + 0.651, + 0.652, + 0.6545 + ], + "value_loss": [ + 2.9568321046829222, + 1.0785086713790895, + 0.90905224609375, + 0.8156556116104126, + 0.71209981174469, + 0.7162606690883636, + 0.6878525162696838, + 0.6334588691949844, + 0.6678785998344421, + 0.8333585778236389, + 0.9790375330209732, + 0.8892305318832397, + 1.190905132675171, + 1.22135962972641, + 1.4191310731887818, + 1.2301843813419342, + 1.309260043334961, + 1.786697961139679, + 1.8390044986248015, + 2.7407329641342164, + 2.683467747211456, + 2.4605039993286133, + 2.697446767044067, + 2.505884079360962, + 2.3811799823760986, + 2.1130632976531984, + 2.547091405200958, + 2.568806095790863, + 2.326700057220459, + 2.050758037567139, + 3.351647375488281, + 3.8653842737197874, + 2.4262299686431885, + 1.973457328939438, + 1.9173651649951935, + 2.7696605461120605, + 3.223868531227112, + 2.516205952453613, + 2.1309806928634645, + 1.581437483215332, + 1.520662855911255, + 1.7421501956939698, + 1.6392579578399658, + 1.7828631855010986, + 1.503568088912964, + 1.5523305910110474, + 1.513862213420868, + 1.4381744204521179, + 1.703464267539978, + 1.8939362186431885, + 1.997329638671875, + 2.3897830280303953, + 1.7983587005615234, + 1.697597998046875, + 1.9598307273864746, + 2.306221367645264, + 2.709978248977661, + 2.6091056289672854, + 2.1318489376068115, + 2.478940699005127, + 4.479023780822754, + 2.6361848222732545, + 2.3030937707901002, + 2.172142697906494, + 2.1629171989440916, + 2.1354505142211915, + 3.6189373970031737, + 1.9153299285888672, + 1.6933829580307007, + 1.5514454183578492, + 1.7198340145111084, + 2.304251728439331, + 2.3330616605758667, + 2.141467953872681, + 2.1230085525512696, + 1.957105325627327, + 1.2174413562774657, + 1.088514053273201, + 1.3677844764709473, + 1.470289986038208 + ], + "term_loss": [ + 1.7106032176971435, + 0.8254648140907288, + 0.7463485570907593, + 0.6676207568168641, + 0.5505435749053955, + 0.541679301738739, + 0.5368218964576721, + 0.4944875739812851, + 0.5313012260437012, + 0.688984687590599, + 0.824212459397316, + 0.7535633095741272, + 1.0329072504997254, + 1.0706197033405305, + 1.2603799612522126, + 1.077820935988426, + 1.1586309091567992, + 1.6123901631355286, + 1.6418114624261857, + 2.436177046394348, + 2.397401628804207, + 2.1149996490478515, + 2.31136040019989, + 2.1631346977233887, + 2.049055897331238, + 1.7832660831809044, + 2.158650917363167, + 2.1838888779640198, + 1.8579028195381164, + 1.675981715774536, + 2.8682561981201173, + 3.322650659561157, + 2.0634375164031984, + 1.6218495529174806, + 1.5564533473014832, + 2.2553051567077635, + 2.749121911621094, + 2.076441255569458, + 1.7535715727806092, + 1.2274940629959106, + 1.1482607242584228, + 1.3356118202209473, + 1.1993759344100952, + 1.2911961950302124, + 1.048892977809906, + 1.0074683206558228, + 1.0248507034778596, + 0.935506264257431, + 1.1044427654266358, + 1.1969995346069335, + 1.1418621253967285, + 1.3484027454376222, + 0.962894126367569, + 0.9484803367614746, + 0.9511542388916016, + 0.9807710059165955, + 0.9729905309677124, + 1.0154107706069946, + 0.8337604522705078, + 0.9689625096797944, + 1.7556117889404297, + 0.9268646779537201, + 0.828965087556839, + 0.6780174582958222, + 0.7625543830394745, + 0.6682373239994049, + 0.9152047227859497, + 0.7351679893016815, + 0.47258839864730834, + 0.5454990069389343, + 0.5863055065393448, + 0.40333252935409547, + 0.3903892815351486, + 0.3693857752799988, + 0.39749053382873534, + 0.3525045004069805, + 0.3847132333755493, + 0.3305401994973421, + 0.33507129402160646, + 0.35005189373493195 + ], + "bridge_loss": [ + 0.9669484859231743, + 0.05317885834872722, + 0.00808393329679966, + 0.008157965920865536, + 0.029252383983135222, + 0.03924694521427154, + 0.021582315093278886, + 0.014747861477732658, + 0.010850316934287549, + 0.01159995011985302, + 0.01137650200240314, + 0.008062006759643555, + 0.010978949210047722, + 0.010464786231517791, + 0.010793930877745151, + 0.014536779739707708, + 0.013218280214071274, + 0.01831962423026562, + 0.04002247373312712, + 0.12877036023139954, + 0.11417192211151123, + 0.17329340472221375, + 0.1982671790599823, + 0.1537047609090805, + 0.13700159553289412, + 0.14344184587001801, + 0.19639654465913772, + 0.18772757058143616, + 0.2604771111011505, + 0.16612488641738893, + 0.24183178367614747, + 0.29544510494470594, + 0.15411187861561776, + 0.14273896975517272, + 0.1461831522524357, + 0.2598205562591553, + 0.20287768486738206, + 0.17781711089611055, + 0.13225486822128296, + 0.1091677051782608, + 0.12344816446304321, + 0.15784135718345643, + 0.19993465332984925, + 0.2517854769706726, + 0.21548625774383545, + 0.303979873418808, + 0.24833559863567353, + 0.25959504103660586, + 0.3560759227275848, + 0.4449814043998718, + 0.6060321228027343, + 0.7924756161689759, + 0.5928340180397034, + 0.5072291620254517, + 0.7738087944030762, + 1.0943159332275392, + 1.5088457412719727, + 1.3652442758560182, + 1.0671269865989685, + 1.276467441558838, + 2.486809080886841, + 1.4710026905059814, + 1.2389037780284882, + 1.261445129776001, + 1.164626408290863, + 1.2384403867721558, + 2.4690226011276244, + 0.9487775525093078, + 0.9965210990428924, + 0.7810107170104981, + 0.9109019186019898, + 1.6800292533874512, + 1.7228944480895996, + 1.5527821187973023, + 1.5077555236816407, + 1.3873976001620292, + 0.6169261030197144, + 0.542320925283432, + 0.817931770324707, + 0.9054676934719086 + ], + "tgrad_loss": [ + 0.2792804120540619, + 0.19986500358581544, + 0.15461974563598632, + 0.13987688381671906, + 0.1323038545846939, + 0.13533442150354386, + 0.1294483060002327, + 0.12422343373596668, + 0.12572705571651457, + 0.1327739451289177, + 0.14344856899380684, + 0.12760521812438966, + 0.14701892898082733, + 0.1402751523733139, + 0.1479571692466736, + 0.13782665922790766, + 0.1374108523607254, + 0.15598817284107208, + 0.15717057017087938, + 0.17578555488586425, + 0.17189420654773713, + 0.17221092910766603, + 0.18781920006275177, + 0.1890446207523346, + 0.1951224928855896, + 0.1863553591489792, + 0.19204393486976623, + 0.19718966495990753, + 0.20832013266086577, + 0.20865144987106324, + 0.24155937967300414, + 0.2472884924173355, + 0.2086805598974228, + 0.2088688009262085, + 0.21472869415283202, + 0.25453484058380127, + 0.271868927192688, + 0.26194758088588715, + 0.24515422630310058, + 0.24477570347785949, + 0.24895398588180542, + 0.24869702105522157, + 0.23994735856056212, + 0.2398815236568451, + 0.2391888491630554, + 0.240882395029068, + 0.24067591972351074, + 0.2430731174468994, + 0.2429455770969391, + 0.25195528326034544, + 0.24943538155555725, + 0.2489046775341034, + 0.2426305419921875, + 0.24188849420547484, + 0.23486768898963928, + 0.23113440914154051, + 0.22814198708534242, + 0.22845054547786714, + 0.23096151385307312, + 0.23351073865890504, + 0.23660291147232054, + 0.23831744689941406, + 0.2352248964548111, + 0.23268011784553527, + 0.23573639130592347, + 0.22877280921936036, + 0.2347100558757782, + 0.23138438067436218, + 0.22427347674369813, + 0.22493569655418397, + 0.2226265817642212, + 0.22088994021415712, + 0.21977790536880493, + 0.21930006308555602, + 0.21776250076293946, + 0.21720322926640512, + 0.2158020221233368, + 0.21565292925834656, + 0.21478140382766725, + 0.2147704033613205 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.022733785212039948, + -0.008966443128883839, + -0.020323125645518303, + -0.018136776983737946, + -0.01592089980840683, + -0.019174236804246902, + -0.014491843990981579, + -0.016727179288864136, + -0.008660020306706429, + -0.007111798040568829, + 0.0011803526431322098, + 0.019812453538179398 + ], + "perturbation_rho": [ + -0.05155084282159805, + 0.03821132332086563, + 0.07940525561571121, + 0.014752240851521492, + 0.016678672283887863, + 0.04385560005903244, + 0.03276895359158516, + -0.0006132312119007111, + -0.024450641125440598, + -0.029637619853019714, + 0.058109357953071594, + 0.06492529809474945 + ], + "nudging": { + "0.001": [ + 0.0007101683877408504, + 2.878123996197246e-05, + 3.59775876859203e-05, + 4.22842385887634e-05, + 5.514687654795125e-05, + 6.889239011798054e-05, + 4.4554166379384696e-05, + 5.3767391364090145e-05, + 2.042827327386476e-05, + 1.283050369238481e-05, + -4.334753975854255e-05, + -0.00014430817100219429 + ], + "0.003": [ + 0.002175786066800356, + 8.923052519094199e-05, + 0.00010926096001639962, + 0.00012868153862655163, + 0.00016585344565100968, + 0.00020889895677100867, + 0.00013566638517659158, + 0.00016381990280933678, + 6.132574344519526e-05, + 4.1310246160719544e-05, + -0.0001288450148422271, + -0.00043151958379894495 + ], + "0.01": [ + 0.00777015183120966, + 0.00029987754533067346, + 0.00037500812322832644, + 0.00043640032527036965, + 0.0005594875547103584, + 0.0007026067469269037, + 0.00045700964983552694, + 0.000550219090655446, + 0.00020889028382953256, + 0.00013992507592774928, + -0.0004261335707269609, + -0.0014356517931446433 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L12_s42.json b/results/synth_ladder_v2_hi/synth_a0.5_L12_s42.json new file mode 100644 index 0000000..534cbe6 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L12_s42.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0289972447395326, + 0.5518267907142639, + 0.4511595572471619, + 0.39422388381958007, + 0.44242291359901426, + 0.35389120923280715, + 0.31342196378707887, + 0.3463186399459839, + 0.32175993151664734, + 0.2832035564661026, + 0.2801107416152954, + 0.2918631485939026, + 0.3457958580970764, + 0.3110818340301514, + 0.26716538116931915, + 0.2110436717748642, + 0.21322266802787782, + 0.23035920186042785, + 0.2469690625667572, + 0.20660339014530182, + 0.17914194725751878, + 0.16029981126785278, + 0.2650108504295349, + 0.23070593461990357, + 0.22895147225856782, + 0.1446519785642624, + 0.15114033766984938, + 0.13604806888103485, + 0.14886143884658815, + 0.14153230743408204, + 0.1639685553073883, + 0.1721979957818985, + 0.12600361688137054, + 0.09298437514305115, + 0.0910780445933342, + 0.0859093768119812, + 0.0917577600479126, + 0.11107840504646302, + 0.1042894508600235, + 0.0790501122713089, + 0.060757651767134664, + 0.052207192993164064, + 0.07682168252468109, + 0.08167480888366699, + 0.05967919422090054, + 0.042717813885211946, + 0.04176127468943596, + 0.03670722253918648, + 0.03259751065224409, + 0.030135507690906525, + 0.03625146338418126, + 0.02841401128768921, + 0.03439460081905127, + 0.026802394422888755, + 0.024497890919446944, + 0.023438648000359535, + 0.0227094176530838, + 0.020777325369045137, + 0.019944287514686583, + 0.020628850987553595, + 0.01877836397886276, + 0.019591398665308953, + 0.01804204930663109, + 0.017368639394640922, + 0.01685231066942215, + 0.016730269909650087, + 0.016215140321850778, + 0.016110457883775235, + 0.01567506283596158, + 0.01538568799868226, + 0.015168684274703264, + 0.015022477886080741, + 0.014880986557900905, + 0.014766420166194439, + 0.014667600397765636, + 0.014582521318644286, + 0.014523118747770786, + 0.014479038575291633, + 0.014449081733822823, + 0.01443173177242279 + ], + "train_acc": [ + 0.6277, + 0.7816, + 0.8214, + 0.8428, + 0.8261, + 0.857, + 0.8746, + 0.8661, + 0.8744, + 0.8865, + 0.8865, + 0.882, + 0.8687, + 0.878, + 0.8936, + 0.916, + 0.9192, + 0.908, + 0.9018, + 0.9187, + 0.9326, + 0.9371, + 0.9017, + 0.9109, + 0.9141, + 0.9478, + 0.9455, + 0.9496, + 0.9445, + 0.9454, + 0.9359, + 0.9367, + 0.951, + 0.9693, + 0.9695, + 0.9721, + 0.9683, + 0.9605, + 0.9637, + 0.9745, + 0.9842, + 0.9876, + 0.9748, + 0.9709, + 0.9832, + 0.9909, + 0.9922, + 0.9944, + 0.9957, + 0.9985, + 0.9954, + 0.9975, + 0.9927, + 0.9984, + 0.9985, + 0.999, + 0.9993, + 0.9997, + 0.9997, + 0.9995, + 0.9996, + 0.9995, + 0.9998, + 0.9999, + 0.9999, + 0.9998, + 0.9999, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.7515, + 0.8025, + 0.806, + 0.811, + 0.8295, + 0.834, + 0.8235, + 0.8265, + 0.836, + 0.837, + 0.8325, + 0.8185, + 0.8215, + 0.8335, + 0.8405, + 0.8485, + 0.8455, + 0.8475, + 0.8395, + 0.8535, + 0.838, + 0.8455, + 0.839, + 0.8415, + 0.8415, + 0.8625, + 0.861, + 0.8545, + 0.855, + 0.845, + 0.853, + 0.8455, + 0.8555, + 0.86, + 0.8545, + 0.861, + 0.8545, + 0.86, + 0.8525, + 0.856, + 0.8595, + 0.8595, + 0.854, + 0.858, + 0.854, + 0.8535, + 0.8555, + 0.861, + 0.8625, + 0.858, + 0.8545, + 0.861, + 0.864, + 0.8605, + 0.861, + 0.8605, + 0.8585, + 0.8595, + 0.862, + 0.8635, + 0.8615, + 0.863, + 0.859, + 0.8605, + 0.861, + 0.862, + 0.8605, + 0.862, + 0.8615, + 0.859, + 0.861, + 0.8595, + 0.8605, + 0.8595, + 0.8595, + 0.859, + 0.859, + 0.8585, + 0.8585, + 0.8585 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8657882213592529, + 0.8541754484176636, + 0.8436384201049805, + 0.832263708114624, + 0.8208613991737366, + 0.8122134208679199, + 0.8057717084884644, + 0.8017721176147461, + 0.7986597418785095, + 0.7967146635055542, + 0.7952107787132263, + 0.7936121225357056 + ], + "perturbation_rho": [ + 0.9999991655349731, + 0.9999977350234985, + 0.9999939203262329, + 0.9999861121177673, + 0.9999700784683228, + 0.9999415874481201, + 0.9999051094055176, + 0.9998413324356079, + 0.9998086094856262, + 0.9997647404670715, + 0.9996839165687561, + 0.9996654987335205 + ], + "nudging": { + "0.001": [ + -0.04849132150411606, + -0.02874898351728916, + -0.017109278589487076, + -0.010623453184962273, + -0.007099856156855822, + -0.00517381401732564, + -0.004027326591312885, + -0.003302204655483365, + -0.002826581709086895, + -0.0024977410212159157, + -0.0022658759262412786, + -0.002098134718835354 + ], + "0.003": [ + -0.13462388515472412, + -0.08245518803596497, + -0.049992166459560394, + -0.03135458379983902, + -0.021068472415208817, + -0.015398472547531128, + -0.012007322162389755, + -0.009856492280960083, + -0.008443145081400871, + -0.0074646552093327045, + -0.006774362176656723, + -0.00627471599727869 + ], + "0.01": [ + -0.3461707830429077, + -0.23528623580932617, + -0.151905819773674, + -0.0986800491809845, + -0.06758347898721695, + -0.04991145431995392, + -0.039162103086709976, + -0.032274406403303146, + -0.02771918475627899, + -0.024551689624786377, + -0.02231007255613804, + -0.020684588700532913 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.1235100923538206, + 1.1082965564727782, + 0.750099405670166, + 0.6328572737693786, + 0.5875409540176392, + 0.5631556386470795, + 0.5060072989463806, + 0.540234273815155, + 0.5666848608016968, + 0.5682762460708618, + 0.5639706572532653, + 0.5890132635116577, + 0.6135262609481812, + 0.602108911037445, + 0.6072693287372589, + 0.6348110971450805, + 0.7817256136894226, + 0.6661777521133423, + 0.6966238568305969, + 0.7440887294769287, + 0.7967543980598449, + 0.7141374285697937, + 0.7286955251693725, + 0.7677665306091308, + 0.9173848634719849, + 0.7543825769424438, + 0.7648948078155517, + 0.7503327812194824, + 0.7647949110984802, + 0.7902673944473266, + 0.9369182168960571, + 0.8630489279747009, + 0.7868163341522216, + 0.7187879699707032, + 0.7061111800193787, + 0.7407430360794067, + 0.6999222482681274, + 0.7179792369842529, + 0.7611988479614258, + 0.9336099584102631, + 0.7458975120544433, + 0.7050964839935303, + 0.7907829219818115, + 0.8120410600662231, + 0.8178721930742264, + 0.8078300096511841, + 0.7027412726402282, + 0.7329458427906036, + 0.738685355424881, + 0.7487446063995361, + 0.7514049421310425, + 0.730554404258728, + 0.7941344120979309, + 0.7334264843940735, + 0.6445084705352783, + 0.6251215059280395, + 0.6134120052337646, + 0.649115455532074, + 0.633389378452301, + 0.6228324326515198, + 0.611019660949707, + 0.6410484097003937, + 0.5912066791534424, + 0.5904429639816284, + 0.6285253910064698, + 0.5794477666854858, + 0.5771131004333496, + 0.5889648357391357, + 0.5780286474227905, + 0.5594178355693817, + 0.5606797921180725, + 0.5604514053821563, + 0.5562048003673553, + 0.5510331042289733, + 0.5497398493766784, + 0.545871854686737, + 0.5429510949134827, + 0.5423210851669311, + 0.5398131627082825, + 0.5393634226799011 + ], + "train_acc": [ + 0.2323, + 0.596, + 0.7208, + 0.7599, + 0.7788, + 0.7874, + 0.8057, + 0.8007, + 0.7918, + 0.7962, + 0.7997, + 0.8031, + 0.8048, + 0.8065, + 0.8051, + 0.8065, + 0.7841, + 0.8036, + 0.8097, + 0.7995, + 0.7896, + 0.8078, + 0.8071, + 0.8026, + 0.7855, + 0.8111, + 0.8127, + 0.8163, + 0.8174, + 0.8154, + 0.791, + 0.8028, + 0.8168, + 0.8281, + 0.8279, + 0.8255, + 0.8283, + 0.8251, + 0.8235, + 0.8042, + 0.8284, + 0.8306, + 0.8251, + 0.8193, + 0.8153, + 0.8206, + 0.8358, + 0.8319, + 0.8309, + 0.8326, + 0.8313, + 0.8342, + 0.8227, + 0.8297, + 0.8425, + 0.8437, + 0.8475, + 0.8429, + 0.8449, + 0.846, + 0.8498, + 0.8461, + 0.8488, + 0.8512, + 0.8447, + 0.8533, + 0.8547, + 0.8538, + 0.8497, + 0.8569, + 0.8574, + 0.8529, + 0.8559, + 0.8562, + 0.8583, + 0.8588, + 0.8603, + 0.8591, + 0.86, + 0.86 + ], + "test_acc": [ + 0.4615, + 0.655, + 0.702, + 0.7135, + 0.721, + 0.7235, + 0.7425, + 0.7335, + 0.7075, + 0.7205, + 0.7285, + 0.7125, + 0.737, + 0.756, + 0.72, + 0.708, + 0.72, + 0.6935, + 0.7225, + 0.7035, + 0.731, + 0.7365, + 0.757, + 0.6705, + 0.74, + 0.7185, + 0.7655, + 0.725, + 0.741, + 0.7335, + 0.728, + 0.6915, + 0.7585, + 0.7555, + 0.7625, + 0.755, + 0.7535, + 0.7325, + 0.7505, + 0.7705, + 0.7305, + 0.763, + 0.7435, + 0.7545, + 0.726, + 0.741, + 0.7665, + 0.756, + 0.7335, + 0.7705, + 0.7425, + 0.7435, + 0.7435, + 0.772, + 0.789, + 0.773, + 0.776, + 0.7705, + 0.776, + 0.782, + 0.784, + 0.783, + 0.779, + 0.78, + 0.7885, + 0.786, + 0.78, + 0.7735, + 0.789, + 0.7865, + 0.7915, + 0.7865, + 0.7925, + 0.7905, + 0.784, + 0.79, + 0.789, + 0.7905, + 0.79, + 0.791 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.023988625034689903, + 0.0961650088429451, + 0.10208466649055481, + 0.07022920250892639, + 0.09604307264089584, + 0.07800711691379547, + 0.08064866811037064, + 0.015484225004911423, + 0.04617477208375931, + 0.10530653595924377, + 0.06217034161090851, + 0.07844939827919006 + ], + "perturbation_rho": [ + -0.021668296307325363, + 0.13302525877952576, + 0.14676621556282043, + 0.11482817679643631, + 0.09230026602745056, + 0.15572097897529602, + 0.084853395819664, + 0.06741442531347275, + 0.09585727006196976, + 0.17402535676956177, + 0.1249062716960907, + 0.10308724641799927 + ], + "nudging": { + "0.001": [ + -0.0014991102507337928, + -0.0009640245698392391, + -0.0004538548528216779, + -0.00034582847729325294, + -0.00034230330493301153, + -0.0003880904405377805, + -0.00031353221856988966, + -0.00012767358566634357, + -0.0002463337150402367, + -0.0004554776242002845, + -0.00027469650376588106, + -0.00030673964647576213 + ], + "0.003": [ + -0.004409522749483585, + -0.002890376141294837, + -0.0013566706329584122, + -0.0010372062679380178, + -0.001026148907840252, + -0.001161768101155758, + -0.0009411850478500128, + -0.0003798047546297312, + -0.0007346655474975705, + -0.001363673829473555, + -0.0008243860211223364, + -0.0009191210265271366 + ], + "0.01": [ + -0.013704460114240646, + -0.009605048224329948, + -0.004514003172516823, + -0.00345102627761662, + -0.003412249032407999, + -0.0038682736922055483, + -0.0031317053362727165, + -0.0012646813411265612, + -0.002444072160869837, + -0.004538315813988447, + -0.0027466074097901583, + -0.0030584305059164762 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.807085013961792, + 1.102435264968872, + 0.8967913342475891, + 0.8658248983383179, + 1.0182812132835388, + 0.9767744832992554, + 0.9880819606781006, + 1.035093484020233, + 1.0461988681793213, + 1.0764453081130982, + 1.1296374977111816, + 1.1917438926696777, + 1.222821136856079, + 1.174761890888214, + 1.14142276802063, + 1.1630746793746949, + 1.0981647139549255, + 1.1113210584640503, + 1.151859906578064, + 1.1268991245269775, + 1.1279105222702026, + 1.1556508625030517, + 1.1305137939453125, + 1.185821006011963, + 1.138044129371643, + 1.1439549321651459, + 1.1212958415985108, + 1.0799880672454834, + 1.0542625444412232, + 1.0640178268432616, + 1.10920906085968, + 1.1122959064483642, + 1.0692581912994386, + 1.0431142856597901, + 1.0079946722984314, + 1.004625850868225, + 0.9657065452575684, + 0.987287603187561, + 0.9696861606597901, + 0.9506798803329468, + 0.9282126628875732, + 0.927169044971466, + 0.8895869630813599, + 0.9118406322479248, + 0.880739783000946, + 0.8995118801116944, + 0.9030367485046387, + 0.8806243282318115, + 0.859384224319458, + 0.8554368983268738, + 0.8580255534172058, + 0.8396073943138123, + 0.8226373916625976, + 0.8179270943164826, + 0.8061285870552063, + 0.8003266729354859, + 0.7872838403701782, + 0.7727557550430297, + 0.7704776877403259, + 0.7667377745628357, + 0.7585975839614868, + 0.7477805254936218, + 0.7369667429924012, + 0.7361846633911133, + 0.7324250010490417, + 0.7300120206832885, + 0.7282338066101074, + 0.7252779340744019, + 0.7199260646820068, + 0.7161426591873169, + 0.7162261745452881, + 0.7125815645217896, + 0.7121326784133911, + 0.712986146068573, + 0.7102373764991761, + 0.709166716003418, + 0.7090627272605896, + 0.7080635800361633, + 0.7075329236984252, + 0.7072855897903443 + ], + "train_acc": [ + 0.3632, + 0.6056, + 0.6822, + 0.7026, + 0.6763, + 0.6838, + 0.6698, + 0.6532, + 0.6384, + 0.6301, + 0.6145, + 0.5902, + 0.5922, + 0.6063, + 0.6007, + 0.6007, + 0.6167, + 0.6197, + 0.6073, + 0.6184, + 0.6022, + 0.5992, + 0.6109, + 0.5973, + 0.6053, + 0.6094, + 0.606, + 0.6251, + 0.6317, + 0.6342, + 0.6262, + 0.6251, + 0.6305, + 0.6374, + 0.6449, + 0.6433, + 0.6553, + 0.6504, + 0.6565, + 0.6661, + 0.6722, + 0.675, + 0.6841, + 0.6819, + 0.6916, + 0.689, + 0.6844, + 0.6898, + 0.697, + 0.6968, + 0.6992, + 0.7051, + 0.7069, + 0.7039, + 0.7086, + 0.7106, + 0.7106, + 0.7148, + 0.7182, + 0.7197, + 0.7222, + 0.7262, + 0.7283, + 0.7306, + 0.7298, + 0.7304, + 0.7295, + 0.7306, + 0.7326, + 0.7349, + 0.7313, + 0.7338, + 0.7356, + 0.7332, + 0.7336, + 0.7353, + 0.7341, + 0.7366, + 0.7364, + 0.7364 + ], + "test_acc": [ + 0.5135, + 0.618, + 0.6695, + 0.6515, + 0.6515, + 0.6315, + 0.6225, + 0.6055, + 0.5995, + 0.584, + 0.5585, + 0.557, + 0.551, + 0.5605, + 0.5265, + 0.599, + 0.558, + 0.551, + 0.563, + 0.5645, + 0.57, + 0.577, + 0.563, + 0.546, + 0.5685, + 0.571, + 0.588, + 0.5825, + 0.6095, + 0.585, + 0.5855, + 0.604, + 0.5945, + 0.587, + 0.5875, + 0.62, + 0.6, + 0.6235, + 0.627, + 0.64, + 0.633, + 0.641, + 0.6375, + 0.6475, + 0.6465, + 0.633, + 0.648, + 0.6575, + 0.654, + 0.639, + 0.6655, + 0.6525, + 0.6625, + 0.662, + 0.6645, + 0.666, + 0.6765, + 0.67, + 0.674, + 0.678, + 0.681, + 0.6715, + 0.674, + 0.6805, + 0.674, + 0.678, + 0.6785, + 0.684, + 0.6795, + 0.6855, + 0.6845, + 0.685, + 0.6815, + 0.682, + 0.684, + 0.681, + 0.68, + 0.6825, + 0.684, + 0.684 + ], + "state_pred_error": [ + 0.6512474334239959, + 0.23058344020843505, + 0.1896287111759186, + 0.18471159949302673, + 0.18485726273059844, + 0.1737810070514679, + 0.16258639628887175, + 0.16076858344078063, + 0.15332085819244384, + 0.14920532870292663, + 0.14722106504440308, + 0.14300990376472472, + 0.1492370625972748, + 0.1439142399072647, + 0.12816479614973067, + 0.1202324061870575, + 0.117945645570755, + 0.11019849457740784, + 0.10783304533958435, + 0.10931210429668427, + 0.10170301874876023, + 0.09073063535690308, + 0.08647769033908843, + 0.08548861846923828, + 0.08252622492313386, + 0.08297095057964325, + 0.08413988354206085, + 0.08291892770528793, + 0.08127011013031006, + 0.08014206212759017, + 0.07530246855020523, + 0.07383085484504699, + 0.07433314504027366, + 0.07500043790340423, + 0.06373311177492141, + 0.053063148951530456, + 0.04655604932308197, + 0.04248758298754692, + 0.039597957611083985, + 0.03774079847335816, + 0.036414392232894895, + 0.036177867931127546, + 0.03710191646814346, + 0.03799050847887993, + 0.03865900856852531, + 0.03986500010490417, + 0.04025968971848488, + 0.04023946278095245, + 0.03935071052908897, + 0.038617061150074, + 0.03697362271547318, + 0.03568208778500557, + 0.03376017547249794, + 0.03194519720077515, + 0.03046695657968521, + 0.028837302082777024, + 0.026821034044027327, + 0.025166314297914504, + 0.023858547830581667, + 0.022523800045251847, + 0.02142890711426735, + 0.02049182191491127, + 0.019461944046616553, + 0.018724638411402702, + 0.018098203578591345, + 0.017532397788763046, + 0.017125102549791337, + 0.016625906114280223, + 0.016127729009091853, + 0.0156772187769413, + 0.01534948223233223, + 0.01498309828042984, + 0.014769109533727169, + 0.014400660943984985, + 0.014128298926353455, + 0.013869472323358058, + 0.013623444560170174, + 0.013534102323651313, + 0.013178734815120698, + 0.012914137981832028 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7669721841812134, + 0.3159201741218567, + 0.12931227684020996, + 0.11285121738910675, + 0.11607236415147781, + 0.09898597002029419, + 0.08882047981023788, + 0.08661012351512909, + 0.08416090905666351, + 0.07891363650560379, + 0.08571723103523254, + 0.07797139883041382 + ], + "perturbation_rho": [ + 0.6671731472015381, + 0.26826971769332886, + 0.10340800136327744, + 0.06843797862529755, + 0.0669264942407608, + 0.08176875114440918, + 0.10683348774909973, + 0.06641782820224762, + 0.09755225479602814, + 0.04477599635720253, + 0.0847611278295517, + 0.05422855541110039 + ], + "nudging": { + "0.001": [ + -0.020674603059887886, + -0.0009852666407823563, + -0.00032257993007078767, + -0.00028019698220305145, + -0.00029603225993923843, + -0.0002484910364728421, + -0.00022453245765063912, + -0.0002270418481202796, + -0.0002228383964393288, + -0.00021279064822010696, + -0.00022745912428945303, + -0.00021358227240853012 + ], + "0.003": [ + -0.06080744415521622, + -0.0029529533348977566, + -0.000967606611084193, + -0.0008409440633840859, + -0.0008881675312295556, + -0.0007449040422216058, + -0.000672660768032074, + -0.0006811338244006038, + -0.000667730113491416, + -0.0006377690588124096, + -0.0006822676514275372, + -0.0006406885222531855 + ], + "0.01": [ + -0.18878120183944702, + -0.009807860478758812, + -0.003219514386728406, + -0.0027990485541522503, + -0.0029557342641055584, + -0.002479594200849533, + -0.0022394107654690742, + -0.0022681057453155518, + -0.0022236446384340525, + -0.0021239176858216524, + -0.002271223347634077, + -0.0021332399919629097 + ] + }, + "state_pred_error_per_layer": [ + 11168.2578125, + 8443.55078125, + 4301.74609375, + 3486.31884765625, + 3134.353515625, + 2733.8369140625, + 2666.431640625, + 2571.673095703125, + 2489.172119140625, + 2732.81298828125, + 3179.04296875, + 3116.75927734375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1315750801086426, + 1.1275678437232972, + 0.7608565049171447, + 0.6336094784736633, + 0.5893053354263306, + 0.5536110488414765, + 0.5473899070739746, + 0.5555015350341796, + 0.5377608227729798, + 0.5654601648330688, + 0.5768093711853027, + 0.5968125733375549, + 0.5762377287864685, + 0.6280837037563324, + 0.6525607712745667, + 0.6160441763401031, + 0.6452989727020264, + 0.6671710391998291, + 0.7498049283504487, + 0.7619616928100585, + 0.8783720811843873, + 0.8115640605926514, + 0.8540671677589416, + 0.9438815314292908, + 1.0194129499912261, + 1.3004956233024598, + 1.208273486328125, + 1.1028277763366698, + 0.9904912512779236, + 1.0831217368125916, + 1.6056551074981689, + 1.5679107995986938, + 1.3498116270065308, + 1.2021915550231934, + 1.233414642238617, + 1.173053926086426, + 1.244126808643341, + 1.2047833410263062, + 1.3103191875457765, + 1.450556330871582, + 1.338700449371338, + 1.394380598449707, + 1.3369567630767822, + 1.3830016635894775, + 1.4491120206832886, + 1.355772504043579, + 1.4613750009536743, + 1.3933008644104004, + 1.4618995168685913, + 1.4758007205963135, + 1.3685514781951904, + 1.3153245384216308, + 1.376934875679016, + 1.3746307342529296, + 1.379645304107666, + 1.3670798933029176, + 1.3901595281600951, + 1.4185121158599854, + 1.4470027433395385, + 1.5002961723327637, + 1.5068544860839843, + 1.5301587196350097, + 1.513092244720459, + 1.5387826145172119, + 1.5067788402557374, + 1.4915789882659911, + 1.4699815629959105, + 1.4490281288146973, + 1.4375888122558593, + 1.4150205673217773, + 1.400378854084015, + 1.3909439609527587, + 1.3824152030944825, + 1.3735420917510985, + 1.3697484756469727, + 1.366435227203369, + 1.3618904499053954, + 1.3581113803863525, + 1.356816044807434, + 1.3559203275680543 + ], + "train_acc": [ + 0.224, + 0.5908, + 0.7109, + 0.7607, + 0.7744, + 0.794, + 0.79, + 0.7914, + 0.8039, + 0.802, + 0.8029, + 0.801, + 0.8075, + 0.8013, + 0.7967, + 0.8075, + 0.8041, + 0.8037, + 0.7932, + 0.7959, + 0.7755, + 0.7864, + 0.78, + 0.7553, + 0.7388, + 0.7019, + 0.7005, + 0.7057, + 0.7206, + 0.698, + 0.6358, + 0.6414, + 0.6436, + 0.6583, + 0.6537, + 0.6534, + 0.6344, + 0.6334, + 0.6075, + 0.585, + 0.6124, + 0.5768, + 0.5856, + 0.5795, + 0.5786, + 0.5889, + 0.5765, + 0.5842, + 0.5754, + 0.5733, + 0.5886, + 0.5993, + 0.578, + 0.5823, + 0.5771, + 0.589, + 0.5874, + 0.5864, + 0.5841, + 0.581, + 0.5822, + 0.5828, + 0.5828, + 0.5829, + 0.585, + 0.5876, + 0.591, + 0.5893, + 0.5924, + 0.5971, + 0.5978, + 0.5993, + 0.5975, + 0.5989, + 0.6019, + 0.5996, + 0.6014, + 0.6027, + 0.6026, + 0.6024 + ], + "test_acc": [ + 0.4435, + 0.637, + 0.691, + 0.7055, + 0.742, + 0.723, + 0.724, + 0.698, + 0.71, + 0.7455, + 0.7285, + 0.727, + 0.7385, + 0.7515, + 0.734, + 0.736, + 0.7215, + 0.719, + 0.7625, + 0.697, + 0.724, + 0.7325, + 0.711, + 0.701, + 0.667, + 0.6085, + 0.6425, + 0.637, + 0.6435, + 0.488, + 0.5185, + 0.5225, + 0.5955, + 0.617, + 0.612, + 0.5595, + 0.554, + 0.5335, + 0.539, + 0.5405, + 0.4145, + 0.5155, + 0.524, + 0.4825, + 0.5755, + 0.477, + 0.5435, + 0.4805, + 0.4845, + 0.5665, + 0.5725, + 0.494, + 0.5165, + 0.55, + 0.538, + 0.5355, + 0.5435, + 0.5345, + 0.5575, + 0.561, + 0.556, + 0.563, + 0.564, + 0.56, + 0.562, + 0.572, + 0.568, + 0.557, + 0.564, + 0.574, + 0.5685, + 0.5775, + 0.563, + 0.568, + 0.5705, + 0.572, + 0.572, + 0.5725, + 0.572, + 0.571 + ], + "value_loss": [ + 2.9138871958732606, + 1.1022631580352784, + 0.9319236121177673, + 0.7978519012451172, + 0.7577287331581116, + 0.7042515501976013, + 0.6586682022094726, + 0.7588884521484375, + 0.7518065408706665, + 0.8810499990463256, + 0.9755400789260864, + 1.0526361764431, + 1.0445400088310242, + 1.252692174434662, + 1.3889376731872558, + 1.300380541419983, + 1.3794576427936553, + 1.4253910701751709, + 1.9810868307113647, + 2.194575175476074, + 3.0307659772872926, + 2.4067670707702638, + 2.5513597805023194, + 2.7336216793060304, + 3.053514086151123, + 4.7302221481323246, + 3.3925644401550294, + 2.775765018463135, + 2.221942966938019, + 2.2246411628723144, + 5.384357067489624, + 5.233831034374237, + 3.163105836868286, + 2.1542870338439943, + 2.1550992218017577, + 2.6656919672012327, + 2.002714876174927, + 1.74481948928833, + 1.8624648433685302, + 2.076787268447876, + 1.8710257823944092, + 1.958513571166992, + 1.649655185508728, + 1.6125932949066162, + 2.0081273155212402, + 1.4420139938354493, + 1.8238695256233215, + 1.6240278913497925, + 1.8388916667938233, + 1.5901467416763306, + 1.4791289331436157, + 1.3453978649139404, + 1.297918366909027, + 1.200528673171997, + 1.2604325717926026, + 1.2986903020858764, + 1.3409297351837157, + 1.3383622268676758, + 1.5519800048828125, + 1.4891740257263184, + 1.6088176250457764, + 1.7245799392700196, + 1.7291366215705872, + 1.5569227603912354, + 1.5849707220077516, + 1.453390936088562, + 1.4432776542663575, + 1.4676635822296142, + 1.273773190689087, + 1.1522198958158494, + 1.3450853576660156, + 1.1712487615585327, + 1.1006177734375, + 1.117146457862854, + 1.159826749610901, + 1.040153635787964, + 1.0537519412994385, + 0.9792304852485657, + 1.0188624217987061, + 0.95497522315979 + ], + "term_loss": [ + 1.6808870628356933, + 0.8418537575721741, + 0.7667020098686218, + 0.6550530954360962, + 0.6069779561758042, + 0.5468185155630112, + 0.4998374924182892, + 0.6111144859313965, + 0.6096799449920655, + 0.7287877419471741, + 0.8274648229598999, + 0.8995155854701996, + 0.9002441462039947, + 1.097049927520752, + 1.2271722087860106, + 1.1485843418121338, + 1.2233097215652466, + 1.26716976146698, + 1.7900210740089417, + 1.9460071144104003, + 2.6685218320846555, + 2.036626290512085, + 2.1439288049697875, + 2.35301021528244, + 2.6526825618743897, + 4.199914279556275, + 2.894145081329346, + 2.3209693365097044, + 1.8253290235519408, + 1.8232774297714234, + 4.733495523166656, + 4.460964757013321, + 2.59017871131897, + 1.7353513706207275, + 1.7227497034072876, + 2.170975755023956, + 1.5856938004493712, + 1.3557625965118407, + 1.4581338554382324, + 1.65160093460083, + 1.460218872833252, + 1.5324822853088378, + 1.2387194828033448, + 1.1904955023765564, + 1.5343577083587647, + 1.0203948043823243, + 1.3787709797382355, + 1.1686672458648681, + 1.3607313781142234, + 1.164192317056656, + 1.0531481260299682, + 0.9685713556289672, + 0.9191585310459137, + 0.8289684215545654, + 0.8956387975692749, + 0.9272360958099365, + 0.9794390370845795, + 0.9855687606811523, + 1.181628607749939, + 1.123434832572937, + 1.2307934044837952, + 1.335347871017456, + 1.3480947745800018, + 1.1828620002746582, + 1.2076996083259584, + 1.0852937175512314, + 1.0779944334030152, + 1.0861511331558227, + 0.9256630334854126, + 0.8190074906170368, + 0.9839356534004211, + 0.8315309607505799, + 0.7704235172271728, + 0.7783107600212097, + 0.8086720629692078, + 0.7087357486724853, + 0.7182173488616943, + 0.6559986435174942, + 0.6836358494758606, + 0.6288936994552612 + ], + "bridge_loss": [ + 0.9492729762485367, + 0.05790521508902311, + 0.008084059101343155, + 0.0038914968118071557, + 0.014953732180595397, + 0.026874115404486656, + 0.025175111523270607, + 0.013569228036701679, + 0.011279044309258461, + 0.015361159473657609, + 0.010007666802406312, + 0.010759075009822846, + 0.008863374817371369, + 0.010565215808153153, + 0.01431704029738903, + 0.01245639272481203, + 0.011864153837412596, + 0.013191274722665548, + 0.036286889004707334, + 0.08858205670118333, + 0.1876173447370529, + 0.2052448028087616, + 0.23761723659038544, + 0.19063645343780516, + 0.19986087894439697, + 0.2954687296628952, + 0.2650281882286072, + 0.22584694170951844, + 0.18357310107946395, + 0.17081516757011414, + 0.3614925577163696, + 0.48578131484985354, + 0.29585003600120546, + 0.16319083409309387, + 0.16577295184135438, + 0.23821018815040587, + 0.14544457584619522, + 0.11933779344558716, + 0.1195192194223404, + 0.12099922590255738, + 0.11734530322551727, + 0.1201287920832634, + 0.11132868221998214, + 0.12015857456922531, + 0.16084424114227294, + 0.12574590224027635, + 0.12926621383428574, + 0.15031628198623656, + 0.16125666260719299, + 0.10902463984489441, + 0.12337167377471923, + 0.0837235963344574, + 0.07390378758907318, + 0.06712040519714356, + 0.05870588574409485, + 0.07018440127372742, + 0.05867706568241119, + 0.047857114362716675, + 0.0606671004652977, + 0.05209314270019531, + 0.06518135804533959, + 0.07501878665685653, + 0.06833717626929284, + 0.06045493056178093, + 0.06650661500692368, + 0.060288525009155276, + 0.06200537823438644, + 0.07822481272220612, + 0.04460304388999939, + 0.03354956085383892, + 0.0633296797245741, + 0.04248417546153069, + 0.03512862289845944, + 0.04510229033231735, + 0.05826025112867356, + 0.03656574003100395, + 0.04282294084429741, + 0.03138661871179938, + 0.043345933312177655, + 0.0344168305516243 + ], + "tgrad_loss": [ + 0.2837271708488464, + 0.20250418248176574, + 0.1571375395655632, + 0.13890730676651, + 0.13579704699516296, + 0.13055892231464386, + 0.1336555983543396, + 0.13420473737716676, + 0.1308475558042526, + 0.13690110483169557, + 0.13806758637428285, + 0.14236151192188262, + 0.13543248913288117, + 0.14507703199386596, + 0.14744842977523803, + 0.1393398109436035, + 0.14428377581238747, + 0.14503003504276277, + 0.1547788742184639, + 0.1599859984397888, + 0.17462680044174195, + 0.16489596152305602, + 0.1698137484550476, + 0.1899749903678894, + 0.20097066857814788, + 0.2348391308784485, + 0.23339117636680604, + 0.22894872980117797, + 0.21304085222482683, + 0.2305485824584961, + 0.28936895632743836, + 0.28708498154878614, + 0.2770771013736725, + 0.2557448182106018, + 0.2665765688657761, + 0.2565060169696808, + 0.2715765025138855, + 0.2697190866470337, + 0.2848117718219757, + 0.3041871148586273, + 0.2934616066932678, + 0.3059024829864502, + 0.29960701389312744, + 0.30193921012878416, + 0.3129253786087036, + 0.29587329483032226, + 0.31583235063552856, + 0.305044357919693, + 0.31690361921787263, + 0.31692978138923644, + 0.3026091367721558, + 0.29310291533470156, + 0.30485604639053343, + 0.30443984775543215, + 0.30608788843154905, + 0.3012698002338409, + 0.302813631105423, + 0.3049363513946533, + 0.30968429160118105, + 0.3136460470676422, + 0.3128428608894348, + 0.31421328043937685, + 0.31270467071533203, + 0.31360582246780394, + 0.3107645062446594, + 0.30780868940353395, + 0.30327784061431884, + 0.30328763818740845, + 0.3035071188926697, + 0.29966285078525545, + 0.29782002868652346, + 0.29723363511562345, + 0.29506562762260435, + 0.29373341407775877, + 0.2928944456100464, + 0.29485214648246766, + 0.29271164841651914, + 0.29184522535800933, + 0.2918806325912476, + 0.2916646807193756 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.009321734309196472, + 0.04962325841188431, + 0.06880976259708405, + 0.07808464020490646, + 0.08887439966201782, + 0.0946938544511795, + 0.09941184520721436, + 0.09979166835546494, + 0.10197117179632187, + 0.10147081315517426, + 0.09914548695087433, + 0.0936545580625534 + ], + "perturbation_rho": [ + -0.0036096302792429924, + 0.0626683160662651, + 0.10237888991832733, + 0.12722331285476685, + 0.138666570186615, + 0.14094725251197815, + 0.1720128357410431, + 0.18820315599441528, + 0.1971924901008606, + 0.19901405274868011, + 0.18742212653160095, + 0.1956271380186081 + ], + "nudging": { + "0.001": [ + -0.000869398470968008, + -0.00042921488056890666, + -0.0005759936757385731, + -0.0006805005250498652, + -0.0007694564992561936, + -0.0008467672159895301, + -0.0008808936108835042, + -0.0009030184592120349, + -0.0009463174501433969, + -0.000948121421970427, + -0.0009286807617172599, + -0.000908168382011354 + ], + "0.003": [ + -0.00256392196752131, + -0.0012864901218563318, + -0.0017271814867854118, + -0.002043036511167884, + -0.0023080133832991123, + -0.002536242129281163, + -0.002642394509166479, + -0.00270812027156353, + -0.0028397280257195234, + -0.002845325041562319, + -0.0027879015542566776, + -0.0027260873466730118 + ], + "0.01": [ + -0.00799381174147129, + -0.0042757005430758, + -0.005744780879467726, + -0.006799482740461826, + -0.0076793828047811985, + -0.008442584425210953, + -0.008797119371592999, + -0.009013657458126545, + -0.009450232610106468, + -0.009471941739320755, + -0.009278533980250359, + -0.009069977328181267 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L12_s456.json b/results/synth_ladder_v2_hi/synth_a0.5_L12_s456.json new file mode 100644 index 0000000..2eac31c --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L12_s456.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0399647656440736, + 0.5801911403656006, + 0.44912500467300415, + 0.4777579921722412, + 0.39411258869171145, + 0.3850814968109131, + 0.366568944978714, + 0.3459391833782196, + 0.3640839920282364, + 0.2808071050643921, + 0.27807387437820436, + 0.28600655393600466, + 0.28525742359161377, + 0.41426767587661745, + 0.32584802840948107, + 0.2218840173482895, + 0.23068335400819778, + 0.20809108746051788, + 0.22863631756305694, + 0.20474828234910966, + 0.1990956850528717, + 0.2024397686958313, + 0.2252926200389862, + 0.18378393414020538, + 0.18460674629211427, + 0.20635630996227264, + 0.1624528563261032, + 0.14138628933429717, + 0.15325817773342132, + 0.1448709319114685, + 0.20757121787071228, + 0.14481499516963958, + 0.11939099235534668, + 0.11831074991226197, + 0.10753689811229705, + 0.14279772633314133, + 0.10776034088134766, + 0.1341373483777046, + 0.09477192969322204, + 0.10186409213542938, + 0.11290034632086754, + 0.07553712728023529, + 0.07299047479629517, + 0.07112597908973693, + 0.07655592976808548, + 0.06261439298391343, + 0.06049537926912308, + 0.04479087981581688, + 0.038241669833660126, + 0.03606927845478058, + 0.04739076436012983, + 0.03390505993962288, + 0.03161321499347687, + 0.030190881507098675, + 0.026108801245689393, + 0.032475268816947934, + 0.026346699427068233, + 0.022964472925662994, + 0.02266303038597107, + 0.021826831635832787, + 0.020797414591908456, + 0.02012179616689682, + 0.02016616339087486, + 0.019080601900815963, + 0.0190194882273674, + 0.019803267088532448, + 0.018120336823165415, + 0.01736899336576462, + 0.017093995988368988, + 0.017035954880714417, + 0.016762651598453523, + 0.016471507793664932, + 0.016212560105323792, + 0.016106035402417184, + 0.01601193640232086, + 0.015896790677309036, + 0.015815340642631053, + 0.015758654138445856, + 0.015722464257478714, + 0.01570532155185938 + ], + "train_acc": [ + 0.6193, + 0.7754, + 0.8227, + 0.8164, + 0.8453, + 0.8489, + 0.8571, + 0.8603, + 0.8547, + 0.8868, + 0.8888, + 0.8858, + 0.8865, + 0.8483, + 0.8728, + 0.9135, + 0.9089, + 0.9205, + 0.9081, + 0.9167, + 0.9215, + 0.9221, + 0.9121, + 0.9259, + 0.927, + 0.9208, + 0.9376, + 0.9462, + 0.9427, + 0.9467, + 0.9245, + 0.9457, + 0.9547, + 0.9557, + 0.9617, + 0.9532, + 0.9629, + 0.9514, + 0.9685, + 0.9634, + 0.9591, + 0.9769, + 0.9773, + 0.9791, + 0.9767, + 0.9812, + 0.9834, + 0.9908, + 0.9944, + 0.9957, + 0.9885, + 0.9968, + 0.9973, + 0.9967, + 0.9987, + 0.9955, + 0.998, + 0.9994, + 0.9993, + 0.9994, + 0.9995, + 0.9993, + 0.9994, + 0.9999, + 0.9998, + 0.9993, + 0.9997, + 0.9999, + 0.9999, + 0.9998, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.767, + 0.7795, + 0.807, + 0.8175, + 0.8155, + 0.828, + 0.8305, + 0.8315, + 0.817, + 0.848, + 0.843, + 0.843, + 0.842, + 0.82, + 0.8395, + 0.8475, + 0.85, + 0.8465, + 0.8455, + 0.8455, + 0.846, + 0.847, + 0.844, + 0.846, + 0.854, + 0.845, + 0.8535, + 0.857, + 0.8495, + 0.8515, + 0.85, + 0.857, + 0.862, + 0.8465, + 0.8665, + 0.848, + 0.861, + 0.8595, + 0.857, + 0.856, + 0.856, + 0.8595, + 0.861, + 0.8585, + 0.864, + 0.8635, + 0.8625, + 0.864, + 0.8675, + 0.869, + 0.871, + 0.8665, + 0.8685, + 0.8675, + 0.868, + 0.861, + 0.868, + 0.868, + 0.863, + 0.8705, + 0.8705, + 0.8655, + 0.868, + 0.8685, + 0.868, + 0.87, + 0.869, + 0.869, + 0.87, + 0.8685, + 0.868, + 0.869, + 0.869, + 0.869, + 0.869, + 0.869, + 0.8685, + 0.8685, + 0.869, + 0.869 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.802544355392456, + 0.7848162055015564, + 0.7700465321540833, + 0.7570744752883911, + 0.7440193891525269, + 0.733696699142456, + 0.7256457805633545, + 0.7199540734291077, + 0.7157886028289795, + 0.7124584913253784, + 0.7102035284042358, + 0.7086857557296753 + ], + "perturbation_rho": [ + 0.9999985694885254, + 0.9999974966049194, + 0.9999951720237732, + 0.9999867677688599, + 0.9999691843986511, + 0.9999383687973022, + 0.9999032020568848, + 0.9998719692230225, + 0.9998380541801453, + 0.9998047351837158, + 0.9996931552886963, + 0.9996466040611267 + ], + "nudging": { + "0.001": [ + -0.03132425993680954, + -0.019242331385612488, + -0.011778481304645538, + -0.007423160132020712, + -0.0049812826327979565, + -0.0036035804077982903, + -0.002788721350952983, + -0.002277323277667165, + -0.001938710454851389, + -0.001707348506897688, + -0.0015431708889082074, + -0.0014260823372751474 + ], + "0.003": [ + -0.0852988138794899, + -0.05447565019130707, + -0.03411520645022392, + -0.02178676798939705, + -0.01472880132496357, + -0.010699238628149033, + -0.008299889042973518, + -0.006788033060729504, + -0.005784356966614723, + -0.005097454413771629, + -0.004609576426446438, + -0.004260959103703499 + ], + "0.01": [ + -0.20057430863380432, + -0.1480334997177124, + -0.10051561146974564, + -0.0672251284122467, + -0.04664912819862366, + -0.03438428044319153, + -0.026901239529252052, + -0.02211749367415905, + -0.018912356346845627, + -0.01670587807893753, + -0.015132123604416847, + -0.01400449313223362 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.149601824569702, + 1.1820548335075378, + 0.8234183177947998, + 0.7200943376541138, + 0.6561116080284118, + 0.620822652053833, + 0.5853398329257965, + 0.5778777595520019, + 0.7235412719726563, + 0.6490978884458541, + 0.6030288267135621, + 0.6537958155632019, + 0.612600318145752, + 0.7587651762008667, + 0.6095341785430908, + 0.607348887681961, + 0.6443412380218506, + 0.7816055872917175, + 0.6487067770004272, + 0.5616429460525513, + 0.7008121586799622, + 0.9083496631622314, + 0.7033928192138672, + 0.8647868811607361, + 0.7038018920898438, + 0.8607533900737763, + 1.1982451632499695, + 0.716190754699707, + 0.796311668586731, + 0.7249050006866455, + 1.0628387544631959, + 0.9199559782981872, + 0.6391925012588501, + 0.7518097076416016, + 0.9904849645614624, + 0.8506406380176544, + 0.6844657245635987, + 0.7756393531799316, + 0.6564820529937744, + 0.6705869068145752, + 0.8701811204910278, + 0.6173303858757019, + 0.6615938651561737, + 0.7780586873054505, + 0.7907266628265381, + 0.7058374786376953, + 0.73820833568573, + 0.6771799244880676, + 0.6215859540939331, + 0.6903766424179077, + 0.5457969979286194, + 0.5275934984207153, + 0.5418724191665649, + 0.6481596652507782, + 0.5005363792419434, + 0.5815837169647217, + 0.6330155878543854, + 0.47478886585235597, + 0.6646243638038635, + 0.50522829580307, + 0.4747637662887573, + 0.5031630943536758, + 0.4689687178134918, + 0.45459979906082154, + 0.4733929946899414, + 0.4546206594467163, + 0.4687062328338623, + 0.44810478954315186, + 0.46362107830047605, + 0.45515496921539306, + 0.4470784990310669, + 0.44082560133934023, + 0.436901840877533, + 0.4296060552597046, + 0.42962351865768433, + 0.427029859828949, + 0.42571502952575685, + 0.42384919719696046, + 0.4223989706993103, + 0.42166884746551514 + ], + "train_acc": [ + 0.2223, + 0.5787, + 0.6929, + 0.7332, + 0.7588, + 0.7712, + 0.7889, + 0.785, + 0.7456, + 0.767, + 0.7725, + 0.7687, + 0.7774, + 0.736, + 0.78, + 0.7792, + 0.7658, + 0.7313, + 0.765, + 0.7913, + 0.7498, + 0.7208, + 0.7511, + 0.7212, + 0.7568, + 0.7148, + 0.6906, + 0.7532, + 0.7328, + 0.7448, + 0.6827, + 0.6978, + 0.7627, + 0.7378, + 0.7077, + 0.7215, + 0.7553, + 0.7385, + 0.7615, + 0.765, + 0.7164, + 0.7733, + 0.7629, + 0.7301, + 0.7281, + 0.7514, + 0.7471, + 0.7564, + 0.7725, + 0.7726, + 0.7939, + 0.8034, + 0.7971, + 0.7687, + 0.809, + 0.7824, + 0.774, + 0.818, + 0.7646, + 0.8096, + 0.8157, + 0.8114, + 0.8225, + 0.8258, + 0.8217, + 0.8254, + 0.819, + 0.8251, + 0.8233, + 0.8234, + 0.8285, + 0.8311, + 0.8341, + 0.8354, + 0.8332, + 0.8357, + 0.8338, + 0.8378, + 0.8381, + 0.8381 + ], + "test_acc": [ + 0.4755, + 0.659, + 0.6965, + 0.696, + 0.691, + 0.7085, + 0.7325, + 0.632, + 0.7105, + 0.702, + 0.6305, + 0.694, + 0.6055, + 0.7155, + 0.733, + 0.659, + 0.6925, + 0.705, + 0.685, + 0.7295, + 0.4795, + 0.653, + 0.6625, + 0.6745, + 0.6525, + 0.5535, + 0.6245, + 0.6075, + 0.667, + 0.5685, + 0.548, + 0.727, + 0.67, + 0.543, + 0.574, + 0.679, + 0.6475, + 0.674, + 0.545, + 0.5625, + 0.6385, + 0.5985, + 0.5905, + 0.6415, + 0.6215, + 0.545, + 0.6555, + 0.6855, + 0.6105, + 0.699, + 0.7005, + 0.6905, + 0.68, + 0.755, + 0.6995, + 0.6885, + 0.765, + 0.674, + 0.763, + 0.7675, + 0.729, + 0.7535, + 0.7645, + 0.7775, + 0.7695, + 0.7725, + 0.7805, + 0.7835, + 0.7825, + 0.794, + 0.7905, + 0.797, + 0.795, + 0.7925, + 0.7995, + 0.7975, + 0.801, + 0.7995, + 0.802, + 0.8 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.04262668639421463, + 0.2711353898048401, + 0.1898173838853836, + 0.1387583613395691, + 0.09531620889902115, + 0.1376194804906845, + 0.07653278112411499, + 0.08707999438047409, + 0.09030534327030182, + 0.10221391171216965, + 0.06503984332084656, + 0.09489849209785461 + ], + "perturbation_rho": [ + 0.0572824701666832, + 0.20349135994911194, + 0.20036441087722778, + 0.17148703336715698, + 0.0623050183057785, + 0.14095279574394226, + 0.05262026563286781, + 0.12087561190128326, + 0.10731191188097, + 0.061124786734580994, + 0.07995927333831787, + 0.10992658138275146 + ], + "nudging": { + "0.001": [ + -0.0009717136854305863, + -0.0008302950882352889, + -0.0005646379431709647, + -0.00043579499470070004, + -0.0003014454268850386, + -0.00036783237010240555, + -0.00023612093355040997, + -0.0002637406578287482, + -0.00028259685495868325, + -0.00030849844915792346, + -0.0002243968192487955, + -0.0002889384631998837 + ], + "0.003": [ + -0.002888135612010956, + -0.0024814684875309467, + -0.0016913014696910977, + -0.0013047860702499747, + -0.0009024770115502179, + -0.001099176937714219, + -0.0007079166825860739, + -0.000786340911872685, + -0.0008432960603386164, + -0.0009207193506881595, + -0.0006701031234115362, + -0.0008658755104988813 + ], + "0.01": [ + -0.009360449388623238, + -0.00823313370347023, + -0.005617598537355661, + -0.004333253484219313, + -0.0029935596976429224, + -0.0036506117321550846, + -0.002341690007597208, + -0.002613792195916176, + -0.0027945097535848618, + -0.003059752518311143, + -0.002222315641120076, + -0.002874229568988085 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.805193168258667, + 1.141331272315979, + 0.9508048683166503, + 0.9720903642654419, + 1.0046518413543701, + 0.9624762474060059, + 0.9729494636535645, + 1.0329874326705932, + 1.0622312829971314, + 1.0902450609207153, + 1.0945431290626526, + 1.069749507522583, + 1.1206140889167786, + 1.1198603658676147, + 1.1902899974822998, + 1.129691632080078, + 1.1558469427108764, + 1.1596178537368775, + 1.1152971502304077, + 1.064276761817932, + 1.0659262399673461, + 1.003252516078949, + 1.006612749671936, + 0.995271017742157, + 1.0372564929962158, + 1.038958420085907, + 0.9995165836334229, + 1.0195529424667358, + 1.0122160236358642, + 1.0052064245224, + 0.9874209686279297, + 0.9727250333786011, + 0.9502078426361084, + 0.9627310655593873, + 0.9769992012023926, + 0.957837372303009, + 0.9192021017074585, + 0.9082319145202636, + 0.8588509743690491, + 0.8644218370437622, + 0.9094936531066895, + 0.8525595251083374, + 0.8475208776473999, + 0.8696963483810425, + 0.8863502472877502, + 0.8889586301803589, + 0.87190883436203, + 0.881449456501007, + 0.8687530401229858, + 0.8472485889434814, + 0.8228015476226807, + 0.8475295688629151, + 0.80593205909729, + 0.826126581954956, + 0.803306018447876, + 0.7851613706588745, + 0.789908846282959, + 0.8011346731185913, + 0.7741047975540161, + 0.7727820636749267, + 0.7508127551078796, + 0.7668908029556274, + 0.7510881311416626, + 0.749227946472168, + 0.7397995502471924, + 0.7420588563919067, + 0.7414700748443603, + 0.7316560808181762, + 0.7311081711769104, + 0.7289228174209594, + 0.718748868560791, + 0.719284348487854, + 0.7172070171356201, + 0.715237936592102, + 0.7131600219726563, + 0.7131189462661743, + 0.7111798879623413, + 0.7104117455482483, + 0.7099139176368713, + 0.7095409453392029 + ], + "train_acc": [ + 0.3709, + 0.5803, + 0.6538, + 0.6647, + 0.6778, + 0.6794, + 0.6696, + 0.6516, + 0.6416, + 0.6217, + 0.6176, + 0.6296, + 0.6117, + 0.6034, + 0.5943, + 0.6069, + 0.6078, + 0.6125, + 0.6227, + 0.6395, + 0.6313, + 0.6501, + 0.6486, + 0.6505, + 0.6382, + 0.6416, + 0.6519, + 0.6507, + 0.6519, + 0.6583, + 0.664, + 0.6627, + 0.674, + 0.6597, + 0.6604, + 0.6646, + 0.6778, + 0.68, + 0.6945, + 0.6937, + 0.688, + 0.6978, + 0.7007, + 0.6932, + 0.6887, + 0.6921, + 0.692, + 0.6911, + 0.6934, + 0.7005, + 0.708, + 0.6977, + 0.7073, + 0.6989, + 0.7051, + 0.7132, + 0.7119, + 0.7087, + 0.7146, + 0.7158, + 0.7208, + 0.7171, + 0.718, + 0.7186, + 0.7237, + 0.7212, + 0.7217, + 0.7247, + 0.7269, + 0.7235, + 0.7261, + 0.7261, + 0.7309, + 0.7315, + 0.7304, + 0.7293, + 0.7312, + 0.7309, + 0.7309, + 0.7318 + ], + "test_acc": [ + 0.557, + 0.6055, + 0.6535, + 0.6415, + 0.664, + 0.6595, + 0.6375, + 0.6035, + 0.5975, + 0.595, + 0.601, + 0.5835, + 0.5835, + 0.5645, + 0.584, + 0.5695, + 0.5745, + 0.609, + 0.574, + 0.598, + 0.626, + 0.63, + 0.6245, + 0.621, + 0.6155, + 0.6145, + 0.634, + 0.633, + 0.6315, + 0.628, + 0.6495, + 0.6495, + 0.643, + 0.645, + 0.6315, + 0.658, + 0.6415, + 0.66, + 0.673, + 0.626, + 0.658, + 0.6685, + 0.6695, + 0.6535, + 0.6545, + 0.6515, + 0.652, + 0.665, + 0.67, + 0.673, + 0.634, + 0.676, + 0.6375, + 0.659, + 0.6855, + 0.672, + 0.6405, + 0.674, + 0.671, + 0.682, + 0.679, + 0.6815, + 0.678, + 0.682, + 0.7015, + 0.695, + 0.6895, + 0.6945, + 0.6905, + 0.701, + 0.6995, + 0.6985, + 0.697, + 0.7025, + 0.7035, + 0.701, + 0.701, + 0.703, + 0.701, + 0.702 + ], + "state_pred_error": [ + 0.6440004120349884, + 0.22280715556144715, + 0.19949485445022583, + 0.20333513226509095, + 0.1995665676832199, + 0.17360950779914855, + 0.1714025309562683, + 0.17567809512615204, + 0.1685861314535141, + 0.16071651792526245, + 0.1619973666191101, + 0.15727631628513336, + 0.14492446608543397, + 0.12553655084371568, + 0.1107056671500206, + 0.11173754686117172, + 0.09973258945941925, + 0.08481347136497498, + 0.07910840909481048, + 0.07374589838981628, + 0.061310838890075686, + 0.06086507865786552, + 0.06732999970912934, + 0.07213088345527649, + 0.0809302486538887, + 0.08693374264240265, + 0.07419926369190216, + 0.06476001297235488, + 0.059982232785224916, + 0.05517140857577324, + 0.054124026930332185, + 0.05320052717924118, + 0.052594351238012316, + 0.05146298713684082, + 0.051765013629198074, + 0.05068567814826965, + 0.04570020427107811, + 0.04117140547633171, + 0.03618445234298706, + 0.03204310758709907, + 0.030476485627889634, + 0.030838667666912078, + 0.03160947210788727, + 0.033142930656671524, + 0.03333787830770016, + 0.032523459002375604, + 0.0311232088804245, + 0.02853037500679493, + 0.02451359252333641, + 0.02123837867975235, + 0.018589539101719857, + 0.016551195853948594, + 0.015129762995243072, + 0.013792664562165737, + 0.012773465797305107, + 0.011814959405362606, + 0.011233214758336545, + 0.010517877446115017, + 0.009914308138936758, + 0.009384106412529946, + 0.008977115654200316, + 0.00859420112669468, + 0.008317897130548955, + 0.008036257766187192, + 0.0078045787990093235, + 0.007604624762386084, + 0.007382925689220428, + 0.007202555446326733, + 0.007032391829788685, + 0.006897161689400673, + 0.006739879739284515, + 0.00660956681072712, + 0.0065333484672009945, + 0.006379267732799053, + 0.006277855364978314, + 0.00618511489033699, + 0.006059934399276972, + 0.0059683645233511926, + 0.005828300928324461, + 0.0057282065466046335 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7615377902984619, + 0.3628881573677063, + 0.1397334486246109, + 0.13061293959617615, + 0.11024273186922073, + 0.09393852204084396, + 0.10003305226564407, + 0.10794281214475632, + 0.10362739115953445, + 0.10100233554840088, + 0.1030983105301857, + 0.12448301911354065 + ], + "perturbation_rho": [ + 0.7019654512405396, + 0.3051794767379761, + 0.12004730850458145, + 0.11974964290857315, + 0.1315283179283142, + 0.11543487757444382, + 0.08415813744068146, + 0.14185138046741486, + 0.12905646860599518, + 0.0691840872168541, + 0.12997986376285553, + 0.09520171582698822 + ], + "nudging": { + "0.001": [ + -0.020074496045708656, + -0.0011415289482101798, + -0.0003986226802226156, + -0.00038571454933844507, + -0.0003159685875289142, + -0.000282247900031507, + -0.0002976277028210461, + -0.0003108965465798974, + -0.00029459979850798845, + -0.0002931723720394075, + -0.00029093120247125626, + -0.00034520530607551336 + ], + "0.003": [ + -0.05917724594473839, + -0.0034206160344183445, + -0.0011960607953369617, + -0.0011569153284654021, + -0.0009477420244365931, + -0.0008460878161713481, + -0.0008919922402128577, + -0.0009325277060270309, + -0.0008838848443701863, + -0.0008802718948572874, + -0.0008727886597625911, + -0.0010357015999034047 + ], + "0.01": [ + -0.1852446049451828, + -0.011355580762028694, + -0.003981029614806175, + -0.0038526845164597034, + -0.0031567115802317858, + -0.0028176922351121902, + -0.0029711187817156315, + -0.0031051787082105875, + -0.0029434349853545427, + -0.002931142458692193, + -0.002905802335590124, + -0.0034490139223635197 + ] + }, + "state_pred_error_per_layer": [ + 8110.80078125, + 4497.13623046875, + 2448.651123046875, + 2213.206298828125, + 2038.592041015625, + 2361.478515625, + 2122.5341796875, + 2178.11474609375, + 2310.2265625, + 2081.50390625, + 2114.170654296875, + 2407.947998046875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.148776465988159, + 1.1814707509994506, + 0.8142018517971039, + 0.7088346358299256, + 0.6350752319335937, + 0.6011627590179444, + 0.5896312768936157, + 0.6038155675411224, + 0.6367639873504639, + 0.611630228805542, + 0.6156754608631134, + 0.5475868948936462, + 0.7217369768142701, + 0.6653201589584351, + 0.6549628901481629, + 0.5913608861923217, + 0.6288921371459961, + 0.6264215920448303, + 0.6552036820411682, + 0.7734859038352966, + 0.620717143535614, + 0.6559980722427368, + 0.7568615766525268, + 0.7035983097076416, + 0.7369053153991699, + 0.7277791313171387, + 0.7967849886417389, + 0.9040812728881836, + 1.0086228225708007, + 0.8652441547393799, + 0.8433989980697632, + 1.068234407043457, + 1.4739661707878113, + 1.8162412731170654, + 1.680437289237976, + 1.391745728302002, + 1.656255067062378, + 1.4110714862823486, + 1.1851400486946106, + 1.0099994808197021, + 1.028020666885376, + 1.008147621154785, + 1.0491145919799805, + 1.1494903202056885, + 1.1833931898117065, + 1.189606708717346, + 1.184402177619934, + 1.1652568649291992, + 1.1241227840423584, + 1.0456886117458344, + 1.0670725841522217, + 1.0937847711563111, + 1.0900941519737244, + 1.091909122467041, + 1.0541937410354614, + 1.0984298721313477, + 1.0692434198379517, + 1.0763300409317016, + 1.0832363823890685, + 1.0875951803207398, + 1.1035369068145753, + 1.1004417110443114, + 1.0955762950897217, + 1.1328410696029663, + 1.121702961540222, + 1.0941922254562377, + 1.105709262084961, + 1.0955168069839478, + 1.0915766580581665, + 1.0790838848114013, + 1.0844950397491455, + 1.073964795780182, + 1.0757515462875367, + 1.0671116413116455, + 1.0617354885101318, + 1.0602436627388, + 1.0596875606536866, + 1.0585092328071595, + 1.0569489337921143, + 1.0562909119606019 + ], + "train_acc": [ + 0.2285, + 0.5769, + 0.6984, + 0.7352, + 0.7623, + 0.7801, + 0.7797, + 0.7776, + 0.7734, + 0.7791, + 0.7788, + 0.7976, + 0.744, + 0.7694, + 0.7669, + 0.7867, + 0.7689, + 0.773, + 0.7709, + 0.7432, + 0.7765, + 0.7624, + 0.7403, + 0.7537, + 0.741, + 0.751, + 0.7441, + 0.7342, + 0.7249, + 0.7502, + 0.7602, + 0.7391, + 0.7015, + 0.6897, + 0.6865, + 0.7091, + 0.6805, + 0.686, + 0.6956, + 0.7113, + 0.7053, + 0.7082, + 0.6983, + 0.6802, + 0.6718, + 0.6675, + 0.6669, + 0.6705, + 0.6697, + 0.6817, + 0.6679, + 0.6617, + 0.6593, + 0.6606, + 0.6628, + 0.654, + 0.6602, + 0.6538, + 0.6552, + 0.6518, + 0.6501, + 0.6485, + 0.6555, + 0.642, + 0.6462, + 0.652, + 0.653, + 0.6516, + 0.6506, + 0.6531, + 0.6546, + 0.6555, + 0.6554, + 0.6555, + 0.6585, + 0.6578, + 0.6573, + 0.6583, + 0.6578, + 0.6575 + ], + "test_acc": [ + 0.4705, + 0.6455, + 0.697, + 0.7195, + 0.7395, + 0.7235, + 0.721, + 0.654, + 0.7045, + 0.733, + 0.733, + 0.7205, + 0.6075, + 0.6015, + 0.667, + 0.695, + 0.692, + 0.717, + 0.65, + 0.7155, + 0.721, + 0.7095, + 0.6685, + 0.6755, + 0.6915, + 0.65, + 0.6675, + 0.694, + 0.6315, + 0.704, + 0.6575, + 0.655, + 0.6615, + 0.6415, + 0.656, + 0.6295, + 0.597, + 0.619, + 0.652, + 0.629, + 0.6645, + 0.677, + 0.6305, + 0.594, + 0.6205, + 0.6565, + 0.614, + 0.578, + 0.6325, + 0.6345, + 0.617, + 0.604, + 0.6015, + 0.5935, + 0.595, + 0.5985, + 0.612, + 0.614, + 0.612, + 0.624, + 0.623, + 0.619, + 0.607, + 0.6145, + 0.6235, + 0.6355, + 0.624, + 0.625, + 0.6245, + 0.621, + 0.6325, + 0.6165, + 0.6335, + 0.6355, + 0.633, + 0.6335, + 0.636, + 0.635, + 0.637, + 0.6375 + ], + "value_loss": [ + 2.8110924012184144, + 1.0558870765686035, + 0.8168890055179596, + 0.7087526061058045, + 0.6747339898109436, + 0.7047410857200622, + 0.6946773962974548, + 0.7863340533733368, + 0.9412341720581054, + 0.831102158164978, + 0.8582201668739319, + 0.662950705909729, + 1.1160548944473268, + 0.9702559132099151, + 0.9050511346578598, + 0.7823492926597595, + 0.7541343150138855, + 0.7990150864124298, + 1.004567841720581, + 1.4750306210517883, + 0.9225585294723511, + 0.9900291267395019, + 1.4712504830360413, + 1.0571229331970216, + 1.0176424533843995, + 1.2388241514205933, + 1.5617137315750123, + 2.2647137912750246, + 2.398833445739746, + 2.148024677848816, + 2.2395449771881104, + 3.704381360244751, + 6.6345307513237, + 8.889485812377929, + 7.216513509845734, + 4.78957142868042, + 5.98610913848877, + 4.262736887645722, + 2.9974183382034303, + 2.16633946557045, + 2.0203945972442625, + 2.078467296600342, + 2.2245993151664734, + 2.3508366590499876, + 1.990233847808838, + 2.1123542598724363, + 1.7581531209945678, + 1.6216532674789428, + 1.6240478748321534, + 1.1111126909255982, + 1.1907436922073364, + 1.2514173234939576, + 1.0694399843215943, + 1.0288991886138916, + 0.924325085067749, + 0.9715163703918457, + 1.034997721195221, + 1.0296417493820191, + 0.9379981343746185, + 0.929289114189148, + 0.9188536177635193, + 0.8787575536727905, + 0.8616826787948608, + 0.9979259113311768, + 0.9289968961715698, + 0.8151037572860718, + 0.8430522988319397, + 0.7192770887374877, + 0.7140207627296448, + 0.7555822341918945, + 0.8249447187423706, + 0.7111081220149994, + 0.7195552299499511, + 0.696260218334198, + 0.6993004722595215, + 0.6393350621223449, + 0.6692558577537536, + 0.6552567146778107, + 0.6035549112319947, + 0.6376882638454437 + ], + "term_loss": [ + 1.6429537870407105, + 0.7799642414569855, + 0.6450700888633728, + 0.544001949596405, + 0.5029326514720917, + 0.5384751222610473, + 0.5338305097579956, + 0.6271685851097107, + 0.7759458763122559, + 0.670561255645752, + 0.6930260807037354, + 0.5142842155456543, + 0.9223114760398865, + 0.7909464566707611, + 0.7283711557388306, + 0.6134422359228134, + 0.5745167485713959, + 0.6179891448736191, + 0.8072999868392944, + 1.1685954872608184, + 0.6874509717941284, + 0.6915433479309082, + 1.0379761940956116, + 0.7678791676044464, + 0.7365385051727295, + 0.888452003288269, + 1.1689853934288026, + 1.8738205919265747, + 1.9812078285217285, + 1.755995346546173, + 1.9156217575073242, + 3.2754078594207763, + 5.931076295042038, + 7.799770739746093, + 6.220347383117676, + 4.235098806762696, + 5.208815985870362, + 3.6477620443344114, + 2.481362159538269, + 1.721485794878006, + 1.6364931385040282, + 1.7316909828186036, + 1.7622679103374481, + 1.8701237350463866, + 1.5614522430419921, + 1.6687043725967408, + 1.3664477088928222, + 1.2542131168365478, + 1.2503349880218506, + 0.7934518660068512, + 0.8526655314445496, + 0.8882325883865356, + 0.7314094313621521, + 0.7021425265312194, + 0.6122970679283142, + 0.6549327205717563, + 0.7135983491659165, + 0.707961343383789, + 0.618238576579094, + 0.6056517326354981, + 0.5986014746427536, + 0.5598198036670685, + 0.5442600372314453, + 0.6618821332931518, + 0.5999844347953797, + 0.5050875579357147, + 0.5238150319099426, + 0.4168266535282135, + 0.4121341013431549, + 0.44742312049865723, + 0.508048579788208, + 0.41021962761878966, + 0.41673866806030274, + 0.39615153601169584, + 0.3979441471099853, + 0.3492745657533407, + 0.3673823845863342, + 0.3611060200572014, + 0.31359378118515013, + 0.3444120800256729 + ], + "bridge_loss": [ + 0.8798169805285463, + 0.06988263263404369, + 0.007221714366972446, + 0.009977325683832168, + 0.026867762994766235, + 0.02428093141168356, + 0.017750029611587524, + 0.01041710512638092, + 0.008498724353313445, + 0.007494112598896026, + 0.009115628288686275, + 0.006687443786859512, + 0.009187254488468171, + 0.0071553698055446145, + 0.0083095718793571, + 0.0106832455098629, + 0.009414582189917564, + 0.011997878777980805, + 0.025829354831576348, + 0.1085723452091217, + 0.06851940405368805, + 0.1190645812034607, + 0.23382153396606445, + 0.09718898033499718, + 0.08073521366119385, + 0.15449185333251952, + 0.19037553939819335, + 0.17207214410305025, + 0.1772028945326805, + 0.18125318269729615, + 0.12484188132286071, + 0.20437312326431276, + 0.44104156914949416, + 0.8135768440246582, + 0.7194256249904633, + 0.3012491428375244, + 0.4917928521633148, + 0.3458102744579315, + 0.2624234221935272, + 0.2108467219054699, + 0.14520962963104248, + 0.1109061488866806, + 0.22237445271611214, + 0.22470301866531373, + 0.16589241380691527, + 0.17665138913393022, + 0.12355085052251816, + 0.10024731488227845, + 0.1102370167851448, + 0.0632073667794466, + 0.07717509996891021, + 0.09432626271247864, + 0.07223957173526287, + 0.05831001040935516, + 0.04691112922430039, + 0.04399191717505455, + 0.054682890085875985, + 0.05131758269071579, + 0.04948833506703377, + 0.05090191900730133, + 0.04628677634000778, + 0.04592856809794903, + 0.04618706555068493, + 0.05831435605287552, + 0.05219041556119919, + 0.038912322914600374, + 0.04784802967309952, + 0.029901893815398217, + 0.03067267468571663, + 0.039136952781677246, + 0.047098509496450426, + 0.03316549341678619, + 0.034926051980257035, + 0.03337522785365581, + 0.036731080013513565, + 0.026030787551403044, + 0.037166545414924625, + 0.029469560922682287, + 0.02593328186273575, + 0.029638116455078124 + ], + "tgrad_loss": [ + 0.28832164726257326, + 0.2060401952266693, + 0.16459719829559327, + 0.15477333117723466, + 0.14493357677459717, + 0.14198503303527832, + 0.14309685859680177, + 0.14874836663007737, + 0.15678957319259643, + 0.15304679074287414, + 0.15607846132516862, + 0.14197904839515685, + 0.18455617270469665, + 0.17215408868789672, + 0.16837040560245514, + 0.15822381327152252, + 0.17020298886299134, + 0.16902806978225707, + 0.17143850438594818, + 0.19786279382705688, + 0.16658815627098084, + 0.1794211902618408, + 0.19945275497436524, + 0.19205478763580322, + 0.20036873846054076, + 0.19588031902313233, + 0.20235279903411865, + 0.21882107915878296, + 0.24042275769710542, + 0.21077616119384765, + 0.19908131561279296, + 0.22460036993026733, + 0.26241290621757507, + 0.2761381866455078, + 0.27674061311483383, + 0.25322344913482664, + 0.28550028896331786, + 0.26916457452774045, + 0.25363275275230407, + 0.23400697290897368, + 0.2386918211221695, + 0.23587018747329713, + 0.2399569533109665, + 0.2560098692417145, + 0.26288919100761415, + 0.266998498249054, + 0.2681545648574829, + 0.26719284348487854, + 0.2634758550167084, + 0.2544534649372101, + 0.2609030704975128, + 0.26885847454071043, + 0.26579098694324493, + 0.2684466419219971, + 0.2651168885231018, + 0.2725917413234711, + 0.26671648054122926, + 0.2703628271102905, + 0.27027122049331664, + 0.27273546109199526, + 0.27396536240577696, + 0.27300917959213256, + 0.2712355743408203, + 0.2777294144630432, + 0.27682205362319945, + 0.27110387902259825, + 0.2713892430782318, + 0.2725485424041748, + 0.27121399002075197, + 0.2690221670150757, + 0.2697976267337799, + 0.2677230007648468, + 0.2678905071258545, + 0.26673345193862913, + 0.26462524137496946, + 0.2640297092437744, + 0.26470692901611326, + 0.2646811327219009, + 0.2640278464794159, + 0.2636380691766739 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.0012992812553420663, + 0.028360359370708466, + 0.07222752273082733, + 0.06384990364313126, + 0.0745362713932991, + 0.10235601663589478, + 0.11958298832178116, + 0.12767711281776428, + 0.12978672981262207, + 0.13033980131149292, + 0.131376713514328, + 0.13925974071025848 + ], + "perturbation_rho": [ + -0.036700520664453506, + 0.08258875459432602, + 0.18529893457889557, + 0.1350553333759308, + 0.14971259236335754, + 0.23370781540870667, + 0.15428856015205383, + 0.2475280910730362, + 0.20684200525283813, + 0.26022571325302124, + 0.23770767450332642, + 0.24039392173290253 + ], + "nudging": { + "0.001": [ + 1.9588624127209187e-05, + -0.00022895228175912052, + -0.0007079594652168453, + -0.0005056310910731554, + -0.0005876067443750799, + -0.0007552369497716427, + -0.0008725673542357981, + -0.0009411656064912677, + -0.0009967443766072392, + -0.0010289904894307256, + -0.001046083401888609, + -0.001075628912076354 + ], + "0.003": [ + 7.772856042720377e-05, + -0.0006833757506683469, + -0.002122018486261368, + -0.001515379874035716, + -0.001759801642037928, + -0.002262262161821127, + -0.002616232493892312, + -0.0028189788572490215, + -0.002985659521073103, + -0.003085652831941843, + -0.0031352993100881577, + -0.003224627347663045 + ], + "0.01": [ + 0.0004691533395089209, + -0.002260619541630149, + -0.007056917063891888, + -0.005040735937654972, + -0.005857650190591812, + -0.007526098750531673, + -0.008702869527041912, + -0.009377602487802505, + -0.009931675158441067, + -0.01026402972638607, + -0.010433407500386238, + -0.010728873312473297 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L2_s123.json b/results/synth_ladder_v2_hi/synth_a0.5_L2_s123.json new file mode 100644 index 0000000..f6a54ab --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L2_s123.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.8134757766723633, + 0.9264522449493409, + 0.5520310824871063, + 0.4102143557548523, + 0.3579074279308319, + 0.318011970949173, + 0.30238913650512694, + 0.2825048192024231, + 0.27405023584365845, + 0.2710430831432343, + 0.2594404198884964, + 0.2341841076850891, + 0.2375671992301941, + 0.22861384831666948, + 0.21102480673789978, + 0.2138878378510475, + 0.20143119230270387, + 0.21637656970024108, + 0.19791898612976075, + 0.2010431251525879, + 0.1995568153619766, + 0.18589567379951477, + 0.18345476458072663, + 0.17632593874931335, + 0.16185988569259643, + 0.16167333889007568, + 0.17501846678256988, + 0.16296407165527343, + 0.1489872475385666, + 0.14913332681655883, + 0.14884000272750855, + 0.14476664385795593, + 0.14326060855388642, + 0.13225111142992974, + 0.12688777947425842, + 0.12592163169384002, + 0.12174792432785034, + 0.12096801409721375, + 0.11985228304862976, + 0.11514121813774109, + 0.1118896684885025, + 0.11161191877126694, + 0.10568768167495728, + 0.10417118835449218, + 0.10223673396110534, + 0.09966703229546547, + 0.09637608439922332, + 0.09464550490379334, + 0.09507670216560364, + 0.0932104425907135, + 0.09320190250873565, + 0.08970492560863495, + 0.0869272301197052, + 0.08439444209337235, + 0.08397750174999237, + 0.08251788482666016, + 0.08170321741104127, + 0.08105333895683288, + 0.07938651487827302, + 0.07741225541234016, + 0.07588316562175751, + 0.07549352577328682, + 0.07457819412350655, + 0.07359826315939426, + 0.0727104668855667, + 0.07231093420982361, + 0.07182440527677536, + 0.0712629911661148, + 0.07068480265140534, + 0.07020738124847412, + 0.06981901693344116, + 0.06955654413104058, + 0.06925340088009835, + 0.0689685908973217, + 0.06875414711236953, + 0.06860008796453476, + 0.06846473612785339, + 0.06837011733651162, + 0.06830710372775793, + 0.06827167451381683 + ], + "train_acc": [ + 0.3965, + 0.7393, + 0.8506, + 0.8812, + 0.8823, + 0.8914, + 0.8952, + 0.8966, + 0.9002, + 0.8984, + 0.9022, + 0.9147, + 0.9091, + 0.9149, + 0.926, + 0.9208, + 0.9255, + 0.9218, + 0.9277, + 0.9246, + 0.9251, + 0.9335, + 0.932, + 0.9386, + 0.9446, + 0.9436, + 0.9356, + 0.9407, + 0.9506, + 0.9491, + 0.9448, + 0.95, + 0.9517, + 0.9562, + 0.9606, + 0.9603, + 0.9601, + 0.9621, + 0.9626, + 0.9648, + 0.9683, + 0.9658, + 0.9701, + 0.9708, + 0.9721, + 0.9739, + 0.9756, + 0.9763, + 0.9752, + 0.977, + 0.9741, + 0.978, + 0.9797, + 0.9818, + 0.9827, + 0.9829, + 0.9834, + 0.9831, + 0.9832, + 0.9843, + 0.9868, + 0.9873, + 0.9874, + 0.9881, + 0.9882, + 0.9881, + 0.9887, + 0.9896, + 0.9896, + 0.9896, + 0.9897, + 0.9902, + 0.9903, + 0.9903, + 0.9905, + 0.9909, + 0.9909, + 0.991, + 0.9911, + 0.9911 + ], + "test_acc": [ + 0.6275, + 0.8135, + 0.8475, + 0.8675, + 0.864, + 0.8715, + 0.8725, + 0.875, + 0.879, + 0.8785, + 0.8755, + 0.8875, + 0.8715, + 0.8865, + 0.8865, + 0.889, + 0.887, + 0.8815, + 0.8845, + 0.8855, + 0.8885, + 0.8845, + 0.885, + 0.8855, + 0.89, + 0.882, + 0.885, + 0.8935, + 0.89, + 0.8875, + 0.891, + 0.8875, + 0.888, + 0.8935, + 0.8905, + 0.8965, + 0.888, + 0.888, + 0.8935, + 0.89, + 0.887, + 0.888, + 0.888, + 0.892, + 0.89, + 0.888, + 0.892, + 0.89, + 0.8935, + 0.892, + 0.888, + 0.8885, + 0.8915, + 0.897, + 0.894, + 0.892, + 0.8945, + 0.8945, + 0.8935, + 0.893, + 0.8945, + 0.896, + 0.8945, + 0.895, + 0.897, + 0.894, + 0.8975, + 0.894, + 0.8945, + 0.8935, + 0.893, + 0.895, + 0.896, + 0.8955, + 0.895, + 0.8955, + 0.8955, + 0.895, + 0.895, + 0.895 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8870643973350525, + 0.8695865869522095 + ], + "perturbation_rho": [ + 0.9999991059303284, + 0.9999968409538269 + ], + "nudging": { + "0.001": [ + -0.027860965579748154, + -0.011582823470234871 + ], + "0.003": [ + -0.07713194191455841, + -0.03366940841078758 + ], + "0.01": [ + -0.1920192688703537, + -0.10025370121002197 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2277308601379393, + 1.6089211181640626, + 1.0115381980895997, + 0.6971575919151306, + 0.5460078211784363, + 0.4641047782897949, + 0.42421296977996825, + 0.4004480885982513, + 0.3980832378387451, + 0.40035034217834475, + 0.4053838936328888, + 0.4165379599571228, + 0.41093469638824465, + 0.4381900384902954, + 0.40459541647434233, + 0.4161624723672867, + 0.4243528455734253, + 0.4472506643295288, + 0.4197193340301514, + 0.4405568720817566, + 0.4483852259159088, + 0.4182058423995972, + 0.46347024388313296, + 0.4317498147010803, + 0.4455674554824829, + 0.468244349861145, + 0.5031647268295288, + 0.48595187821388247, + 0.420454656124115, + 0.4349890894889831, + 0.4568765145778656, + 0.4257242699623108, + 0.4918008323669434, + 0.4292266354560852, + 0.4412042767524719, + 0.44511404564380647, + 0.4060916609764099, + 0.42281134433746337, + 0.45205292596817015, + 0.4296050157546997, + 0.46153125472068784, + 0.4331648801326752, + 0.4328668572425842, + 0.4199811037063599, + 0.40794372041225435, + 0.40181673164367676, + 0.390487536406517, + 0.4007012459754944, + 0.3911929183483124, + 0.39021644287109375, + 0.3868677257537842, + 0.38623606929779053, + 0.3859286364555359, + 0.37683377466201784, + 0.37579740810394285, + 0.36816846113204954, + 0.38835712060928346, + 0.3590394494056702, + 0.3600341588020325, + 0.3655199574947357, + 0.35341513319015505, + 0.35888077273368835, + 0.3514525812149048, + 0.34960040357112887, + 0.3468650718688965, + 0.34670376050472257, + 0.34839404121637346, + 0.3450363240242004, + 0.34819836664199827, + 0.3415450521469116, + 0.3402742134094238, + 0.3409415246963501, + 0.33930211052894593, + 0.3378286985516548, + 0.336081723356247, + 0.33632210760116577, + 0.3354383348464966, + 0.33510682430267336, + 0.33467428114414216, + 0.3344334460377693 + ], + "train_acc": [ + 0.1851, + 0.4619, + 0.667, + 0.7593, + 0.8055, + 0.8235, + 0.8372, + 0.8475, + 0.8481, + 0.8464, + 0.8516, + 0.8462, + 0.8502, + 0.8408, + 0.8569, + 0.8511, + 0.8507, + 0.845, + 0.8533, + 0.8491, + 0.8504, + 0.8561, + 0.8458, + 0.8526, + 0.8442, + 0.837, + 0.8328, + 0.8409, + 0.8521, + 0.8489, + 0.8443, + 0.852, + 0.8386, + 0.8507, + 0.8496, + 0.8493, + 0.8601, + 0.8535, + 0.8468, + 0.8539, + 0.8447, + 0.8467, + 0.8532, + 0.8539, + 0.857, + 0.8613, + 0.8621, + 0.8575, + 0.8576, + 0.8617, + 0.8614, + 0.8608, + 0.8634, + 0.862, + 0.8663, + 0.8653, + 0.8609, + 0.8653, + 0.871, + 0.8647, + 0.8717, + 0.8682, + 0.8698, + 0.8719, + 0.8716, + 0.8717, + 0.8727, + 0.8707, + 0.8708, + 0.8733, + 0.8724, + 0.8706, + 0.875, + 0.8729, + 0.8735, + 0.8754, + 0.8737, + 0.8758, + 0.8757, + 0.8752 + ], + "test_acc": [ + 0.327, + 0.5655, + 0.6935, + 0.763, + 0.79, + 0.802, + 0.816, + 0.816, + 0.8205, + 0.8155, + 0.808, + 0.808, + 0.806, + 0.81, + 0.826, + 0.8225, + 0.7905, + 0.818, + 0.8115, + 0.8055, + 0.81, + 0.809, + 0.803, + 0.8035, + 0.8065, + 0.7965, + 0.782, + 0.814, + 0.8025, + 0.813, + 0.818, + 0.8045, + 0.797, + 0.8185, + 0.821, + 0.808, + 0.8125, + 0.8105, + 0.8065, + 0.8165, + 0.7885, + 0.7975, + 0.793, + 0.816, + 0.8205, + 0.834, + 0.8385, + 0.8095, + 0.815, + 0.8125, + 0.821, + 0.8245, + 0.816, + 0.8215, + 0.826, + 0.8205, + 0.8265, + 0.835, + 0.82, + 0.8325, + 0.8355, + 0.837, + 0.835, + 0.835, + 0.836, + 0.831, + 0.835, + 0.8385, + 0.8365, + 0.843, + 0.837, + 0.8345, + 0.837, + 0.841, + 0.8385, + 0.841, + 0.839, + 0.84, + 0.84, + 0.8405 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.05535196140408516, + 0.11400651931762695 + ], + "perturbation_rho": [ + 0.07898944616317749, + 0.06743785738945007 + ], + "nudging": { + "0.001": [ + -0.0015921953599900007, + -0.0004352356481831521 + ], + "0.003": [ + -0.004735918715596199, + -0.0013046588283032179 + ], + "0.01": [ + -0.015302825719118118, + -0.004326905123889446 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0606787532806394, + 1.1567006985664368, + 0.6476440377235413, + 0.46067230157852174, + 0.4016605010986328, + 0.3913002317428589, + 0.3918870966911316, + 0.39221469788551333, + 0.38962100603580474, + 0.39011064352989194, + 0.3833303677558899, + 0.39151409659385683, + 0.383689892745018, + 0.3887174612045288, + 0.39423247394561767, + 0.3862614650726318, + 0.3907231846809387, + 0.3773960693836212, + 0.3979664779663086, + 0.4017488422870636, + 0.3948758713722229, + 0.4106588708877563, + 0.43649713220596315, + 0.41689020500183105, + 0.46598345975875854, + 0.42229409980773924, + 0.4376958209991455, + 0.4556465253829956, + 0.43013258485794065, + 0.4284559500694275, + 0.41865804080963137, + 0.42352541952133177, + 0.4187520936965942, + 0.4412714430809021, + 0.4290276056289673, + 0.43953913819789886, + 0.4115768392086029, + 0.416507855796814, + 0.4253982139587402, + 0.4240591028213501, + 0.4231268990516663, + 0.4098381155014038, + 0.4129206636428833, + 0.4102262992143631, + 0.4049965745925903, + 0.41237741203308104, + 0.4174180850028992, + 0.4078349845647812, + 0.40372915534973147, + 0.4217507261276245, + 0.39810289478302, + 0.4005114579439163, + 0.4004998396396637, + 0.3945280794143677, + 0.3943117833137512, + 0.39065166521072386, + 0.394280153131485, + 0.3958699932575226, + 0.38747738513946534, + 0.39019425966739657, + 0.3880472351312637, + 0.38656279892921447, + 0.3849751262664795, + 0.3862720604419708, + 0.38301447155475615, + 0.3807786055088043, + 0.38096148087978365, + 0.3796463566303253, + 0.37803510179519656, + 0.37694546613693236, + 0.3765466928482056, + 0.37544756646156313, + 0.37575010981559753, + 0.3745943290710449, + 0.37441092958450317, + 0.37395868825912476, + 0.3735989002227783, + 0.37321364402770996, + 0.3729501468658447, + 0.3728492456436157 + ], + "train_acc": [ + 0.266, + 0.6291, + 0.783, + 0.8371, + 0.8528, + 0.8519, + 0.8521, + 0.8492, + 0.8514, + 0.8543, + 0.8537, + 0.8506, + 0.8546, + 0.8501, + 0.8505, + 0.8562, + 0.8552, + 0.8552, + 0.847, + 0.8483, + 0.8517, + 0.8447, + 0.836, + 0.8429, + 0.8252, + 0.8384, + 0.832, + 0.8295, + 0.8331, + 0.8389, + 0.8421, + 0.8405, + 0.8377, + 0.8343, + 0.8382, + 0.833, + 0.8436, + 0.8422, + 0.8403, + 0.8412, + 0.8388, + 0.8428, + 0.8441, + 0.8439, + 0.8453, + 0.8456, + 0.8418, + 0.8458, + 0.8488, + 0.8419, + 0.8495, + 0.8502, + 0.8498, + 0.8521, + 0.8518, + 0.8521, + 0.8511, + 0.8513, + 0.8534, + 0.8523, + 0.8537, + 0.8544, + 0.8558, + 0.8543, + 0.8564, + 0.8578, + 0.8557, + 0.8573, + 0.8582, + 0.8566, + 0.8587, + 0.859, + 0.8584, + 0.8585, + 0.8596, + 0.8596, + 0.8602, + 0.8601, + 0.86, + 0.8601 + ], + "test_acc": [ + 0.4795, + 0.7045, + 0.7885, + 0.817, + 0.8265, + 0.821, + 0.817, + 0.8225, + 0.8195, + 0.8245, + 0.8125, + 0.818, + 0.826, + 0.828, + 0.8185, + 0.811, + 0.8165, + 0.814, + 0.8045, + 0.811, + 0.8025, + 0.8025, + 0.801, + 0.7825, + 0.807, + 0.806, + 0.7985, + 0.795, + 0.7975, + 0.8035, + 0.798, + 0.816, + 0.8095, + 0.8005, + 0.803, + 0.8065, + 0.803, + 0.803, + 0.81, + 0.8105, + 0.8155, + 0.803, + 0.815, + 0.8185, + 0.8135, + 0.8195, + 0.819, + 0.816, + 0.819, + 0.8155, + 0.8295, + 0.8125, + 0.8125, + 0.816, + 0.8255, + 0.815, + 0.826, + 0.825, + 0.8165, + 0.8255, + 0.8265, + 0.826, + 0.829, + 0.827, + 0.8265, + 0.829, + 0.8305, + 0.8275, + 0.8285, + 0.827, + 0.823, + 0.8295, + 0.8295, + 0.827, + 0.828, + 0.829, + 0.8285, + 0.829, + 0.83, + 0.8305 + ], + "state_pred_error": [ + 0.8031414375305176, + 0.35727285192012787, + 0.20822873120307922, + 0.17016679759025574, + 0.15798014035224914, + 0.1421566589951515, + 0.12269669504165649, + 0.1036052488565445, + 0.08826953535079957, + 0.07445642170906067, + 0.06234971261024475, + 0.05339485208392143, + 0.045877391409873965, + 0.0403602089881897, + 0.03642171306014061, + 0.03317514306306839, + 0.03129510297775268, + 0.028174708819389344, + 0.02580746712088585, + 0.02427465500831604, + 0.023034810265898705, + 0.022062225687503816, + 0.022103151264786722, + 0.020669510221481325, + 0.020476308749616146, + 0.019967139992117883, + 0.019168919190764428, + 0.018457811444997786, + 0.018327979081869124, + 0.01801105038076639, + 0.01739282046556473, + 0.016778514325618745, + 0.015847790563106538, + 0.0158354807138443, + 0.01575601952970028, + 0.014686103010177613, + 0.014878038236498832, + 0.01409349731504917, + 0.014016203632950783, + 0.0138145767390728, + 0.013226337088644504, + 0.013212937781214714, + 0.012958681486546993, + 0.013233311638236047, + 0.012328391301631927, + 0.012101875373721123, + 0.011980755272507668, + 0.011779027014970779, + 0.011585621590912342, + 0.011263450093567372, + 0.011011741843819619, + 0.011311796459555625, + 0.010854876567423344, + 0.010849458143115043, + 0.011040620262175798, + 0.010131367165595293, + 0.0099437257707119, + 0.010218308821320533, + 0.009720495526492595, + 0.01009982328414917, + 0.009624038696289063, + 0.009806264831125736, + 0.009349493139982224, + 0.009056915233284234, + 0.008922270947694778, + 0.008910164754092693, + 0.008901315172761678, + 0.008582982118427753, + 0.008406809172034263, + 0.00853000564724207, + 0.008742392796278, + 0.00837141503021121, + 0.008199263268709183, + 0.008339552146196366, + 0.00796095138937235, + 0.007939809998869896, + 0.007585817550122738, + 0.0076191362425684925, + 0.008353407859802247, + 0.00735080057233572 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8879689574241638, + 0.43028849363327026 + ], + "perturbation_rho": [ + 0.7560213804244995, + 0.38433945178985596 + ], + "nudging": { + "0.001": [ + -0.02204158343374729, + -0.0024646292440593243 + ], + "0.003": [ + -0.0634373351931572, + -0.007362409494817257 + ], + "0.01": [ + -0.18288554251194, + -0.02417319267988205 + ] + }, + "state_pred_error_per_layer": [ + 1696.6031494140625, + 278.31060791015625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2291323978424074, + 1.6088748979568481, + 1.0196145711898803, + 0.7028882287025452, + 0.5439308270454407, + 0.46666228404045107, + 0.4218287401199341, + 0.39928707320690154, + 0.3870831217050552, + 0.39015878410339355, + 0.4016779498100281, + 0.4121299880504608, + 0.3897958308696747, + 0.40895366220474244, + 0.41575607891082766, + 0.4268762981414795, + 0.424427557182312, + 0.4411251617431641, + 0.4447257128238678, + 0.4506887272834778, + 0.4911063948631287, + 0.5097891534805298, + 0.5217780744075775, + 0.5186571026802063, + 0.5549187143325806, + 0.5775168406486512, + 0.6109977385520935, + 0.6179571244239808, + 0.588416787147522, + 0.591089683008194, + 0.5984664674758912, + 0.6150432247161866, + 0.6514943526268006, + 0.6930927798271179, + 0.6797385078430176, + 0.7172976000785828, + 0.7486782361745834, + 0.7203411834716796, + 0.7663027370452881, + 0.716061837387085, + 0.7416047885894775, + 0.7384530964851379, + 0.7653874188423156, + 0.759270369720459, + 0.779615391254425, + 0.795836368560791, + 0.8164382888793945, + 0.8216145399093628, + 0.8497391104698181, + 0.8565743488311768, + 0.8682084201812744, + 0.8817925959587097, + 0.8865997703552246, + 0.9067432309150696, + 0.912219108581543, + 0.9159337846755982, + 0.9211236267089844, + 0.9347142765045166, + 0.9267299753189087, + 0.9395195854187012, + 0.9390426496505737, + 0.9382089434623718, + 0.9440257927894592, + 0.9453169227600098, + 0.9499050285339355, + 0.9569249134063721, + 0.9552145975112915, + 0.9529026988983155, + 0.9567554153442382, + 0.9556082971572876, + 0.9563019279479981, + 0.9571789653778077, + 0.9569482453346252, + 0.957211256980896, + 0.9569433841705323, + 0.9578723815917969, + 0.9576466073989868, + 0.9571835817337037, + 0.957071294593811, + 0.9570294202804566 + ], + "train_acc": [ + 0.1861, + 0.4691, + 0.6611, + 0.7602, + 0.8045, + 0.8242, + 0.8421, + 0.8477, + 0.8527, + 0.8563, + 0.852, + 0.8492, + 0.8551, + 0.853, + 0.85, + 0.8472, + 0.8486, + 0.8498, + 0.8454, + 0.8425, + 0.8351, + 0.8246, + 0.82, + 0.8229, + 0.8095, + 0.8061, + 0.7985, + 0.7995, + 0.8095, + 0.8076, + 0.7982, + 0.7964, + 0.782, + 0.7683, + 0.7696, + 0.7501, + 0.7418, + 0.7483, + 0.736, + 0.742, + 0.7375, + 0.7364, + 0.727, + 0.729, + 0.7205, + 0.7165, + 0.7103, + 0.7074, + 0.703, + 0.6976, + 0.6981, + 0.6932, + 0.6898, + 0.6861, + 0.6848, + 0.6826, + 0.6805, + 0.6789, + 0.6796, + 0.6767, + 0.6791, + 0.6804, + 0.676, + 0.6738, + 0.6705, + 0.6731, + 0.6752, + 0.6735, + 0.6737, + 0.6727, + 0.6723, + 0.674, + 0.6734, + 0.6735, + 0.673, + 0.673, + 0.672, + 0.6725, + 0.6736, + 0.6736 + ], + "test_acc": [ + 0.324, + 0.5505, + 0.701, + 0.7625, + 0.7905, + 0.8045, + 0.81, + 0.823, + 0.814, + 0.82, + 0.8095, + 0.811, + 0.818, + 0.8155, + 0.8065, + 0.822, + 0.8185, + 0.8125, + 0.809, + 0.7835, + 0.792, + 0.778, + 0.792, + 0.7685, + 0.7625, + 0.755, + 0.756, + 0.766, + 0.751, + 0.748, + 0.7385, + 0.741, + 0.7315, + 0.7215, + 0.7095, + 0.695, + 0.688, + 0.684, + 0.685, + 0.6905, + 0.6945, + 0.6885, + 0.688, + 0.674, + 0.6685, + 0.675, + 0.67, + 0.6655, + 0.657, + 0.656, + 0.6585, + 0.658, + 0.6605, + 0.6525, + 0.657, + 0.643, + 0.6475, + 0.647, + 0.649, + 0.642, + 0.6455, + 0.6405, + 0.6465, + 0.646, + 0.6375, + 0.641, + 0.6385, + 0.6335, + 0.6385, + 0.6355, + 0.64, + 0.6365, + 0.6355, + 0.6355, + 0.6345, + 0.635, + 0.635, + 0.635, + 0.6345, + 0.634 + ], + "value_loss": [ + 2.8833280738830567, + 0.7847226623535156, + 0.6052224683761597, + 0.5364442230701446, + 0.4866952224731445, + 0.4644027402877808, + 0.4624986822128296, + 0.4973188815355301, + 0.5199405098438263, + 0.5218789057254791, + 0.5600632459640503, + 0.6151528795719147, + 0.5766617219448089, + 0.6344908997654914, + 0.6626247673034668, + 0.6810169264793396, + 0.7056573510169983, + 0.7149781924247741, + 0.7052933280229569, + 0.7567739087104798, + 0.8160911297798157, + 0.8792114803314209, + 0.8207113800048829, + 0.8191835897922516, + 0.8597163372039794, + 0.8457223380088806, + 0.9193719961166382, + 0.850219428062439, + 0.856592936706543, + 0.7682788232326507, + 0.730324414896965, + 0.6971390293121338, + 0.6743249478340149, + 0.7776916447639466, + 0.6412680940628052, + 0.6544103482246398, + 0.7206561564207077, + 0.5922124248504639, + 0.6333092123031616, + 0.5453343061447143, + 0.6317949431419373, + 0.5274795674324035, + 0.5396580792427063, + 0.5128086106300354, + 0.5516833471298218, + 0.5616566513061524, + 0.5372079795360565, + 0.5528788970947266, + 0.6155030704498291, + 0.5729360949516297, + 0.5764620405197144, + 0.5704575545310974, + 0.5842877408981323, + 0.5995055549621582, + 0.6123614057540894, + 0.5957472767353058, + 0.5835577243804931, + 0.6090386015415191, + 0.5883770040035248, + 0.5994154201507569, + 0.6209961592674256, + 0.5821904572486878, + 0.5925648178815842, + 0.5761626353263855, + 0.5682975249290466, + 0.5920660761833191, + 0.5835506136417389, + 0.5641262327194214, + 0.5669574682235717, + 0.567772633266449, + 0.5559127983093262, + 0.5391036891937255, + 0.5507662886142731, + 0.53783765001297, + 0.5338259760856628, + 0.5350430037975311, + 0.5220288526058197, + 0.5302294264793396, + 0.5155424662590027, + 0.5198581983566284 + ], + "term_loss": [ + 1.6454794772148131, + 0.3263517658233643, + 0.3324782820701599, + 0.3084365834712982, + 0.2733846814155579, + 0.2562745343327522, + 0.2620648564338684, + 0.30091398467719555, + 0.3289512038171291, + 0.3290699499607086, + 0.36417594809532167, + 0.4142481907606125, + 0.3883945213317871, + 0.4393215751647949, + 0.46501498188972473, + 0.47925249347686766, + 0.5046797016382217, + 0.5087765357494354, + 0.4967124795019627, + 0.5429100960731507, + 0.5926241361141205, + 0.6447086326599121, + 0.579509374666214, + 0.5835422896981239, + 0.6090982981204986, + 0.5876830438613891, + 0.6432878967761994, + 0.5675156433582306, + 0.5771616685867309, + 0.49196799931526186, + 0.45263598628044127, + 0.42308012866973876, + 0.3907915468931198, + 0.4852942128777504, + 0.35577588975429536, + 0.35834191608428956, + 0.4150521718651056, + 0.29623276604413984, + 0.32230763597488404, + 0.2524558412909508, + 0.3255671339035034, + 0.22805521211624147, + 0.22856105840206145, + 0.20706634080410002, + 0.23393898310661315, + 0.2354411078929901, + 0.20956240813434124, + 0.22007010972499846, + 0.27335089936256407, + 0.23113303844928743, + 0.2274341112136841, + 0.21985646319389343, + 0.23131886804103852, + 0.24329911168664695, + 0.24918984038829803, + 0.23453153626918793, + 0.2230271029472351, + 0.24042806271016598, + 0.2237975647866726, + 0.23123242053985596, + 0.25471574842333794, + 0.21881105394363404, + 0.22694692747592926, + 0.21005943071842192, + 0.1994040913105011, + 0.22424529371261598, + 0.217019234085083, + 0.20118717231750488, + 0.2016641976118088, + 0.2034522614955902, + 0.19620529432296752, + 0.18044703192710876, + 0.19134235957562923, + 0.1797063545227051, + 0.1764101204633713, + 0.1779283276796341, + 0.16668891739845276, + 0.1740751401245594, + 0.161777489733696, + 0.1660363396883011 + ], + "bridge_loss": [ + 0.9377871763861156, + 0.14766500053405762, + 0.02877580658942461, + 0.009598655062913894, + 0.016668824788928033, + 0.02121675037741661, + 0.020100663328170777, + 0.017548368653655052, + 0.015006689450144767, + 0.01513301545009017, + 0.014232833042740822, + 0.013891240073740482, + 0.011406736245751382, + 0.012642510639876127, + 0.01458835108205676, + 0.013680042466521262, + 0.015419781844317913, + 0.017810679003596307, + 0.019589692229777574, + 0.024900535257905723, + 0.02252660002708435, + 0.02607555223107338, + 0.027234175610542297, + 0.024702777102589606, + 0.027225637090206145, + 0.029620801931619645, + 0.03768093141317368, + 0.046393069380521776, + 0.05361589749455452, + 0.04968858813345432, + 0.04719689604640007, + 0.04035842423439026, + 0.033826103353500364, + 0.030835032051801683, + 0.026682524013519286, + 0.024017449873685835, + 0.024913296768814326, + 0.02244833298623562, + 0.024258126384019852, + 0.01988215004503727, + 0.025355869579315186, + 0.019808240255713462, + 0.022530729496479034, + 0.020299413734674452, + 0.024030086208879947, + 0.028282125863432886, + 0.02460381360054016, + 0.029118296933174134, + 0.03094438911676407, + 0.028381625938415526, + 0.03409786782264709, + 0.03280818447470665, + 0.033095910048484806, + 0.03300321333706379, + 0.038769859731197356, + 0.03602361143529415, + 0.03425909789800644, + 0.039217023247480394, + 0.03850839220881462, + 0.038296847838163374, + 0.03764004505872726, + 0.03555820371508598, + 0.036610432869195936, + 0.0361909857749939, + 0.03747819612622261, + 0.03717733380794525, + 0.035828465853631496, + 0.03396679884195328, + 0.034303515052795414, + 0.033811005836725236, + 0.02981514204442501, + 0.029429450476169586, + 0.030180443140864373, + 0.02941783722639084, + 0.028960870635509492, + 0.028137443059682847, + 0.02695192684829235, + 0.028193890061974525, + 0.02632337526679039, + 0.026915473002195357 + ], + "tgrad_loss": [ + 0.30006144156455994, + 0.3107058983325958, + 0.2439683804512024, + 0.21840898594856262, + 0.1966417160987854, + 0.186911457157135, + 0.18033316440582275, + 0.1788565274655819, + 0.17598261984586716, + 0.17767594091892241, + 0.1816544674873352, + 0.18701344912052154, + 0.17686045913696288, + 0.18252681477069854, + 0.18302143425941467, + 0.188084393119812, + 0.18555786571502686, + 0.18839098315238953, + 0.18899115829467775, + 0.18896327831745147, + 0.20094039404392242, + 0.20842729425430298, + 0.21396782894134522, + 0.21093851894140245, + 0.2233924026966095, + 0.22841848783493043, + 0.238403165769577, + 0.2363107090950012, + 0.2258153675556183, + 0.2266222387313843, + 0.23049153771400452, + 0.2337004735469818, + 0.24970730090141297, + 0.26156239709854123, + 0.2588096812725067, + 0.27205098791122434, + 0.28069068645238876, + 0.27353132772445676, + 0.28674344885349273, + 0.2729963088989258, + 0.28087194566726686, + 0.27961610980033874, + 0.2885662919044495, + 0.28544285264015196, + 0.2937142786502838, + 0.2979334186553955, + 0.30304175670146943, + 0.3036904903411865, + 0.31120778708457947, + 0.3134214277267456, + 0.3149300651550293, + 0.31779290962219237, + 0.319872961807251, + 0.32320322750806807, + 0.324401708316803, + 0.32519212522506713, + 0.32627151918411257, + 0.3293935173988342, + 0.32607104771137235, + 0.32988615398406984, + 0.32864036498069765, + 0.327821196937561, + 0.3290074566841126, + 0.32991221575737, + 0.3314152413368225, + 0.33064344997406003, + 0.3307029154062271, + 0.32897226009368896, + 0.3309897524833679, + 0.33050937223434446, + 0.3298923659324646, + 0.32922720794677734, + 0.3292434865236282, + 0.3287134552001953, + 0.32845498433113096, + 0.32897723731994627, + 0.3283880082130432, + 0.3279603928089142, + 0.32744160184860227, + 0.32690638537406924 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.11650891602039337, + 0.31434422731399536 + ], + "perturbation_rho": [ + 0.23759987950325012, + 0.5255968570709229 + ], + "nudging": { + "0.001": [ + -0.006046381313353777, + -0.002862941939383745 + ], + "0.003": [ + -0.018019597977399826, + -0.008575741201639175 + ], + "0.01": [ + -0.05865050479769707, + -0.028432408347725868 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L2_s42.json b/results/synth_ladder_v2_hi/synth_a0.5_L2_s42.json new file mode 100644 index 0000000..1a9a155 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L2_s42.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.838883076095581, + 0.9228713939666748, + 0.5369283601760865, + 0.40869176201820373, + 0.35351916384696963, + 0.3149320938587189, + 0.29885801305770876, + 0.28874192085266115, + 0.27495671865940097, + 0.25859400782585146, + 0.2618196714401245, + 0.23570404744148254, + 0.23764698023796083, + 0.22304832377433778, + 0.22278955578804016, + 0.21679949054718017, + 0.2098624146461487, + 0.22450098567008972, + 0.20582314471006394, + 0.19091342453956603, + 0.20230956523418425, + 0.19248483119010926, + 0.18207436051368714, + 0.17455288028717042, + 0.1746367334008217, + 0.16596168351173402, + 0.1632581250101328, + 0.15257979717254638, + 0.16552851646244526, + 0.14555678157806395, + 0.14922121838331223, + 0.14138047268390655, + 0.14168458592295646, + 0.1322138198852539, + 0.14060876342654227, + 0.12736148176193238, + 0.12787616213560105, + 0.1222807457447052, + 0.12329775819778442, + 0.11754269520044326, + 0.11509358530044556, + 0.11533700299263, + 0.11486885561943054, + 0.11302210004329681, + 0.10378158293962479, + 0.10055346679091454, + 0.09701502611041068, + 0.09453871037364006, + 0.09318371058702468, + 0.09154418442249299, + 0.09060858163833618, + 0.09153713397979736, + 0.09077880887985229, + 0.088396619617939, + 0.08532250515222549, + 0.08318007454872131, + 0.08344659991264343, + 0.08225398402810097, + 0.07986635602712631, + 0.0784351842880249, + 0.07738790756464005, + 0.07704619092941284, + 0.07655080541372299, + 0.07576740589141846, + 0.07471019058227539, + 0.07399410808086396, + 0.07352103772759437, + 0.07262729846835136, + 0.07196982672214508, + 0.07155210624933243, + 0.07116250815391541, + 0.0708568405330181, + 0.07056542416810989, + 0.0702718249976635, + 0.07004092693328857, + 0.06988665665090084, + 0.06974752879142761, + 0.06964604835510253, + 0.06959020309448243, + 0.06955153443813324 + ], + "train_acc": [ + 0.3784, + 0.7515, + 0.8523, + 0.8765, + 0.8855, + 0.8965, + 0.8923, + 0.8925, + 0.8988, + 0.9032, + 0.8988, + 0.9143, + 0.9105, + 0.9173, + 0.9156, + 0.9185, + 0.9199, + 0.9103, + 0.9237, + 0.9303, + 0.9244, + 0.9259, + 0.9334, + 0.937, + 0.9364, + 0.9408, + 0.9403, + 0.9477, + 0.9368, + 0.9522, + 0.9467, + 0.9517, + 0.9516, + 0.9582, + 0.9506, + 0.9601, + 0.9585, + 0.9614, + 0.9597, + 0.9636, + 0.9653, + 0.9646, + 0.963, + 0.9651, + 0.9713, + 0.9737, + 0.9769, + 0.9776, + 0.9782, + 0.9795, + 0.9796, + 0.9782, + 0.9778, + 0.979, + 0.9821, + 0.9832, + 0.9823, + 0.9834, + 0.986, + 0.9868, + 0.9869, + 0.9865, + 0.9863, + 0.9871, + 0.9871, + 0.9887, + 0.9888, + 0.9896, + 0.9905, + 0.9898, + 0.9901, + 0.9902, + 0.9901, + 0.9903, + 0.9905, + 0.9907, + 0.9906, + 0.9906, + 0.9907, + 0.9907 + ], + "test_acc": [ + 0.624, + 0.7945, + 0.8405, + 0.8615, + 0.864, + 0.867, + 0.8645, + 0.8595, + 0.8565, + 0.8585, + 0.8625, + 0.872, + 0.87, + 0.8735, + 0.8735, + 0.879, + 0.8725, + 0.8635, + 0.8725, + 0.8785, + 0.875, + 0.8775, + 0.8735, + 0.8815, + 0.8775, + 0.874, + 0.883, + 0.8805, + 0.873, + 0.8815, + 0.8765, + 0.88, + 0.8785, + 0.877, + 0.8795, + 0.879, + 0.8785, + 0.882, + 0.8855, + 0.883, + 0.884, + 0.8845, + 0.8805, + 0.884, + 0.882, + 0.8845, + 0.881, + 0.8845, + 0.882, + 0.883, + 0.883, + 0.887, + 0.8835, + 0.8845, + 0.8825, + 0.8825, + 0.888, + 0.8845, + 0.886, + 0.884, + 0.885, + 0.882, + 0.8825, + 0.8805, + 0.882, + 0.8825, + 0.885, + 0.8855, + 0.8835, + 0.8865, + 0.886, + 0.8845, + 0.885, + 0.885, + 0.885, + 0.8845, + 0.885, + 0.8845, + 0.8845, + 0.8845 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9165740013122559, + 0.911247193813324 + ], + "perturbation_rho": [ + 0.9999988079071045, + 0.9999961853027344 + ], + "nudging": { + "0.001": [ + -0.031085949391126633, + -0.012861143797636032 + ], + "0.003": [ + -0.08586536347866058, + -0.037327297031879425 + ], + "0.01": [ + -0.21485117077827454, + -0.11073540896177292 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2755904403686524, + 1.6745083744049072, + 1.051408309841156, + 0.7111780145645141, + 0.5445409080028534, + 0.45879194836616516, + 0.41605077290534975, + 0.3957563140869141, + 0.389960843372345, + 0.39417654418945314, + 0.40389546192884446, + 0.3980479574203491, + 0.4083562989473343, + 0.4132358487606049, + 0.4187182967185974, + 0.4203802880525589, + 0.4387013870239258, + 0.44252231817245485, + 0.42820124464035036, + 0.42269960770606996, + 0.4413509990692139, + 0.43839888401031496, + 0.43627189745903017, + 0.44073323020935057, + 0.454564675951004, + 0.4474758553981781, + 0.4394855237007141, + 0.42114640197753905, + 0.4659817192912102, + 0.4296913712501526, + 0.46042858691215516, + 0.4541965922832489, + 0.450060701084137, + 0.4527084307670593, + 0.42569710931777954, + 0.43842885856628416, + 0.44364037351608276, + 0.4300214008808136, + 0.43460112380981447, + 0.4649988492846489, + 0.42098810606002807, + 0.44036443765163424, + 0.4068041382312775, + 0.40084986300468445, + 0.41328212876319886, + 0.4015606360435486, + 0.3978891236066818, + 0.38384996640682223, + 0.3901183885335922, + 0.3906126615524292, + 0.3949475336074829, + 0.39353401985168457, + 0.3902185819149017, + 0.37436509132385254, + 0.3824869274377823, + 0.3752282187461853, + 0.37405086925029757, + 0.36902116994857787, + 0.3608111560344696, + 0.3636643335342407, + 0.3624928609967232, + 0.35216776008605954, + 0.3643767790794373, + 0.35711028456687927, + 0.35238478226661685, + 0.3484013397693634, + 0.3534255467891693, + 0.348143867456913, + 0.3460024874687195, + 0.3450613434791565, + 0.3417489238739014, + 0.34155446233749387, + 0.3391765214204788, + 0.3387234467029572, + 0.3374306505203247, + 0.3369725195646286, + 0.3359765763282776, + 0.3355955307006836, + 0.33527027835845946, + 0.33505802783966065 + ], + "train_acc": [ + 0.1665, + 0.4478, + 0.6483, + 0.7502, + 0.8014, + 0.8266, + 0.8438, + 0.8473, + 0.8477, + 0.8517, + 0.8501, + 0.8535, + 0.8499, + 0.8495, + 0.8522, + 0.8513, + 0.8458, + 0.8451, + 0.851, + 0.8505, + 0.8496, + 0.847, + 0.8494, + 0.8488, + 0.8426, + 0.8479, + 0.8514, + 0.852, + 0.8439, + 0.8499, + 0.8395, + 0.8447, + 0.8463, + 0.845, + 0.8544, + 0.8501, + 0.8467, + 0.8505, + 0.8497, + 0.84, + 0.8514, + 0.8481, + 0.8557, + 0.8585, + 0.8563, + 0.8562, + 0.8607, + 0.8612, + 0.8577, + 0.8597, + 0.8584, + 0.8559, + 0.8588, + 0.8641, + 0.86, + 0.8622, + 0.8628, + 0.862, + 0.8658, + 0.8662, + 0.8701, + 0.8703, + 0.8654, + 0.8655, + 0.8704, + 0.8694, + 0.8693, + 0.8692, + 0.8702, + 0.8704, + 0.8721, + 0.8719, + 0.875, + 0.8726, + 0.8731, + 0.8743, + 0.8737, + 0.8737, + 0.8739, + 0.8742 + ], + "test_acc": [ + 0.291, + 0.555, + 0.6845, + 0.7495, + 0.7785, + 0.7975, + 0.8, + 0.803, + 0.802, + 0.8, + 0.798, + 0.801, + 0.809, + 0.7975, + 0.8, + 0.8045, + 0.787, + 0.805, + 0.7945, + 0.8025, + 0.7985, + 0.7985, + 0.793, + 0.7855, + 0.795, + 0.7945, + 0.8085, + 0.801, + 0.788, + 0.7925, + 0.784, + 0.8085, + 0.801, + 0.783, + 0.799, + 0.7995, + 0.812, + 0.801, + 0.781, + 0.7775, + 0.801, + 0.8085, + 0.8085, + 0.8015, + 0.8015, + 0.8015, + 0.806, + 0.805, + 0.81, + 0.804, + 0.7985, + 0.803, + 0.8185, + 0.8125, + 0.81, + 0.808, + 0.812, + 0.8115, + 0.8165, + 0.813, + 0.8155, + 0.8165, + 0.814, + 0.82, + 0.8245, + 0.819, + 0.816, + 0.816, + 0.822, + 0.8165, + 0.819, + 0.817, + 0.815, + 0.819, + 0.8215, + 0.82, + 0.819, + 0.8175, + 0.8185, + 0.8185 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.008949288167059422, + 0.035725876688957214 + ], + "perturbation_rho": [ + -0.042064815759658813, + 0.02075618878006935 + ], + "nudging": { + "0.001": [ + 0.00033832876943051815, + -0.00013122413656674325 + ], + "0.003": [ + 0.0010789502412080765, + -0.00039280677447095513 + ], + "0.01": [ + 0.004335631616413593, + -0.0013084581587463617 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0824829721450806, + 1.1837396372795106, + 0.6673484756469726, + 0.46784576473236084, + 0.39523904933929443, + 0.38305578269958496, + 0.3820614227294922, + 0.37770698080062864, + 0.3784868881225586, + 0.37788698201179505, + 0.3775497382640839, + 0.3720602925300598, + 0.3787012303352356, + 0.3716680085659027, + 0.3765100636959076, + 0.37162504646778105, + 0.3775796483516693, + 0.3912089412689209, + 0.387017729139328, + 0.4038709951400757, + 0.40551300468444823, + 0.3929386008262634, + 0.396329621219635, + 0.4018239990234375, + 0.4215829294204712, + 0.41799877495765686, + 0.400916418671608, + 0.4175464694023132, + 0.4196605001449585, + 0.4193920916557312, + 0.4106157903432846, + 0.4156774042248726, + 0.4019841181755066, + 0.42924740953445434, + 0.3962015940189362, + 0.39606657152175906, + 0.4141406083583832, + 0.38865602951049805, + 0.38985962376594546, + 0.3957322010993958, + 0.3951152558326721, + 0.3955321859359741, + 0.38211313061714175, + 0.3885132269382477, + 0.38207339782714844, + 0.3849307601928711, + 0.3814076686859131, + 0.3850557041168213, + 0.38029749584197997, + 0.3717133730888367, + 0.372594402885437, + 0.36705199470520017, + 0.3703877753973007, + 0.3687688379049301, + 0.36827292232513426, + 0.36861963114738466, + 0.37049537568092344, + 0.3622209189414978, + 0.3624863251686096, + 0.36258873243331907, + 0.3604560327529907, + 0.3598629186630249, + 0.3558103786945343, + 0.35572401695251465, + 0.355719638299942, + 0.35422387681007383, + 0.35251914834976195, + 0.3532273498058319, + 0.35069880657196045, + 0.35031716957092285, + 0.35007772364616396, + 0.348374769115448, + 0.3486006237268448, + 0.34740313987731936, + 0.34712638473510743, + 0.3469550308704376, + 0.3464403437614441, + 0.34619485507011416, + 0.34601595051288603, + 0.3458989464759827 + ], + "train_acc": [ + 0.2525, + 0.6165, + 0.7765, + 0.8288, + 0.8516, + 0.8542, + 0.8548, + 0.8578, + 0.8525, + 0.8583, + 0.86, + 0.8615, + 0.8544, + 0.8571, + 0.855, + 0.8575, + 0.855, + 0.8501, + 0.8497, + 0.8444, + 0.8439, + 0.847, + 0.8461, + 0.8469, + 0.8394, + 0.8386, + 0.8468, + 0.8443, + 0.8435, + 0.8421, + 0.8452, + 0.8418, + 0.8473, + 0.8383, + 0.8475, + 0.8508, + 0.845, + 0.8518, + 0.8531, + 0.8483, + 0.8518, + 0.8501, + 0.8565, + 0.8506, + 0.854, + 0.8562, + 0.8542, + 0.8513, + 0.8526, + 0.8579, + 0.8569, + 0.8608, + 0.8564, + 0.8592, + 0.86, + 0.8594, + 0.8585, + 0.8609, + 0.8615, + 0.8614, + 0.8597, + 0.861, + 0.8636, + 0.8645, + 0.8643, + 0.8661, + 0.8645, + 0.8628, + 0.865, + 0.8676, + 0.8665, + 0.8651, + 0.8654, + 0.8665, + 0.866, + 0.8674, + 0.8664, + 0.8674, + 0.8668, + 0.8667 + ], + "test_acc": [ + 0.4625, + 0.687, + 0.7785, + 0.809, + 0.818, + 0.8145, + 0.816, + 0.8135, + 0.816, + 0.8225, + 0.8045, + 0.816, + 0.809, + 0.7965, + 0.818, + 0.802, + 0.8055, + 0.806, + 0.801, + 0.7785, + 0.7905, + 0.786, + 0.796, + 0.7845, + 0.7915, + 0.793, + 0.781, + 0.789, + 0.797, + 0.7885, + 0.794, + 0.7775, + 0.7755, + 0.8045, + 0.809, + 0.7795, + 0.8005, + 0.8025, + 0.805, + 0.793, + 0.806, + 0.8155, + 0.7985, + 0.81, + 0.8055, + 0.807, + 0.8065, + 0.8025, + 0.8065, + 0.8015, + 0.815, + 0.808, + 0.821, + 0.8065, + 0.8095, + 0.8065, + 0.813, + 0.812, + 0.8115, + 0.813, + 0.812, + 0.812, + 0.812, + 0.8125, + 0.815, + 0.8105, + 0.811, + 0.8145, + 0.8105, + 0.812, + 0.811, + 0.809, + 0.813, + 0.8125, + 0.8115, + 0.8115, + 0.8135, + 0.8125, + 0.812, + 0.8125 + ], + "state_pred_error": [ + 0.8001734064102173, + 0.35873693199157713, + 0.20844954159259796, + 0.16903454799652098, + 0.1555667249441147, + 0.14051846435070037, + 0.1219131733417511, + 0.10268338766098023, + 0.08544955713748932, + 0.0714530954003334, + 0.05912637507915497, + 0.051166046524047853, + 0.046080123180150985, + 0.039346986520290374, + 0.03611734768152237, + 0.0322635617017746, + 0.030359485450387, + 0.03046627066731453, + 0.026333281344175338, + 0.024863469672203063, + 0.023385335299372673, + 0.022591026341915132, + 0.02149942193031311, + 0.02068497442305088, + 0.020433403274416923, + 0.019626461285352708, + 0.018830640947818757, + 0.018304855170845985, + 0.017805312702059747, + 0.01717169118821621, + 0.016883350095152856, + 0.016305500897765158, + 0.015936558076739313, + 0.01556376437842846, + 0.015504471227526665, + 0.014957618600130082, + 0.014713572627305984, + 0.014142402538657188, + 0.013960958057641982, + 0.013590541940927505, + 0.013389594730734825, + 0.01309183569997549, + 0.012976301842927933, + 0.012886276030540466, + 0.012688130004703998, + 0.012546944618225097, + 0.012055124607682228, + 0.01186397502720356, + 0.01177666329741478, + 0.011594580093026162, + 0.011158815479278564, + 0.011128936088085175, + 0.011975047792494297, + 0.011167761707305908, + 0.011209322269260883, + 0.010609170261025428, + 0.010340626280009747, + 0.010262261213362217, + 0.010345043289661408, + 0.009869915609061718, + 0.009639052687585354, + 0.0098008942425251, + 0.009379881481826306, + 0.009180352842807769, + 0.009155150799453258, + 0.009056310991942882, + 0.009078112874925137, + 0.008794386529922486, + 0.009374980270862579, + 0.00883906733840704, + 0.00854088044166565, + 0.008424869784712791, + 0.008193799455463887, + 0.008154722370207309, + 0.008421275785565376, + 0.008421709784865379, + 0.007775320902466774, + 0.007672330512851476, + 0.007632624515891075, + 0.007539259477704763 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8927175402641296, + 0.4237706661224365 + ], + "perturbation_rho": [ + 0.8139950037002563, + 0.41992679238319397 + ], + "nudging": { + "0.001": [ + -0.025281934067606926, + -0.002599178347736597 + ], + "0.003": [ + -0.0727418065071106, + -0.007764648646116257 + ], + "0.01": [ + -0.20875152945518494, + -0.02549745701253414 + ] + }, + "state_pred_error_per_layer": [ + 1690.90478515625, + 278.7707214355469 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2748748617172243, + 1.6707266681671142, + 1.0525237585067748, + 0.7069919948577881, + 0.5450144615650176, + 0.45492432718276976, + 0.41742202892303465, + 0.3915238172531128, + 0.39175787649154664, + 0.402530827999115, + 0.3909166872024536, + 0.4053274774312973, + 0.4120564586639404, + 0.4225111320972443, + 0.41647812595367434, + 0.4272260865688324, + 0.4241933352470398, + 0.436232319188118, + 0.4387337839603424, + 0.48842136354446414, + 0.4558315635681152, + 0.496497424864769, + 0.5087396056175232, + 0.5397198664665223, + 0.5651827428102494, + 0.5744139050483703, + 0.6307690343141555, + 0.6128013428688049, + 0.60693001537323, + 0.6117362999916076, + 0.6191363915443421, + 0.6438410203933715, + 0.6246722332954406, + 0.6266048515319824, + 0.7066175966262818, + 0.6940338945388794, + 0.7162334120035172, + 0.6737902103900909, + 0.6885660154342651, + 0.7021305454254151, + 0.7599561199188233, + 0.7359864574432373, + 0.7280522350311279, + 0.7489439949035644, + 0.7662384524345398, + 0.7572000256061554, + 0.793046563911438, + 0.8030659034729004, + 0.8452127780914307, + 0.8339548164367676, + 0.8519316087722778, + 0.8606153854370118, + 0.8828687825202942, + 0.8765805198669434, + 0.8856307614326477, + 0.8939145570755005, + 0.9057541777610779, + 0.9066044025421143, + 0.9265142164230347, + 0.9460746621131897, + 0.9285282844543457, + 0.9477956159591675, + 0.9402782894134522, + 0.9547298575401306, + 0.9442226867675781, + 0.9431581373214721, + 0.9486260055541992, + 0.9491145337104797, + 0.9437961555480957, + 0.9449379459381103, + 0.9478061424255371, + 0.9438842529296875, + 0.9436823980331421, + 0.9449532516479492, + 0.9425712206840515, + 0.9426206575393676, + 0.9418610684394837, + 0.9410846166610718, + 0.9404826469421387, + 0.9403811920166015 + ], + "train_acc": [ + 0.1647, + 0.4464, + 0.6456, + 0.7527, + 0.799, + 0.8277, + 0.8397, + 0.8494, + 0.8508, + 0.8487, + 0.854, + 0.8527, + 0.8524, + 0.8481, + 0.852, + 0.8512, + 0.8519, + 0.8467, + 0.8483, + 0.8324, + 0.8415, + 0.8269, + 0.8204, + 0.8121, + 0.7989, + 0.7968, + 0.779, + 0.7808, + 0.7806, + 0.7763, + 0.7698, + 0.7613, + 0.772, + 0.7673, + 0.7448, + 0.7523, + 0.7421, + 0.7509, + 0.7413, + 0.7353, + 0.723, + 0.7235, + 0.7278, + 0.7207, + 0.7179, + 0.7164, + 0.707, + 0.7045, + 0.6896, + 0.6959, + 0.6871, + 0.6856, + 0.6808, + 0.6836, + 0.6847, + 0.6802, + 0.6752, + 0.6736, + 0.6755, + 0.6695, + 0.6699, + 0.6663, + 0.6683, + 0.6646, + 0.6638, + 0.6659, + 0.6658, + 0.6623, + 0.6667, + 0.6675, + 0.6626, + 0.6646, + 0.6644, + 0.6634, + 0.6665, + 0.6678, + 0.6671, + 0.6661, + 0.6671, + 0.6662 + ], + "test_acc": [ + 0.296, + 0.559, + 0.678, + 0.75, + 0.779, + 0.785, + 0.8035, + 0.8045, + 0.8035, + 0.803, + 0.8035, + 0.7935, + 0.8035, + 0.8075, + 0.7975, + 0.803, + 0.8045, + 0.7895, + 0.7895, + 0.7865, + 0.777, + 0.783, + 0.7405, + 0.746, + 0.7595, + 0.7225, + 0.7535, + 0.7385, + 0.7125, + 0.72, + 0.7055, + 0.72, + 0.715, + 0.6885, + 0.6685, + 0.682, + 0.7085, + 0.691, + 0.7045, + 0.6865, + 0.67, + 0.6955, + 0.694, + 0.6645, + 0.697, + 0.6845, + 0.674, + 0.648, + 0.661, + 0.6545, + 0.6685, + 0.6485, + 0.66, + 0.6625, + 0.657, + 0.6355, + 0.653, + 0.6455, + 0.6315, + 0.649, + 0.6295, + 0.635, + 0.64, + 0.6355, + 0.633, + 0.639, + 0.637, + 0.644, + 0.636, + 0.636, + 0.6355, + 0.6365, + 0.6395, + 0.639, + 0.6385, + 0.6365, + 0.635, + 0.638, + 0.6375, + 0.6365 + ], + "value_loss": [ + 2.9257629440307618, + 0.7867631932258606, + 0.6331243370056152, + 0.5934987301826478, + 0.5538255891799927, + 0.5144483612060546, + 0.5357967885971069, + 0.5191175822257995, + 0.5425653838157654, + 0.5752897667884826, + 0.5554038842201233, + 0.5964856115818024, + 0.6071936506271363, + 0.615453130531311, + 0.6215356389522553, + 0.640991295337677, + 0.6377853952407837, + 0.6480764210224151, + 0.6319464739322662, + 0.7916026724815368, + 0.6787179851531983, + 0.7052958431005478, + 0.7116784429550171, + 0.7465570999145508, + 0.7610727603912354, + 0.7122495373725891, + 0.7205907410621643, + 0.657422287940979, + 0.5804553174972534, + 0.5339653887748719, + 0.5028113806247712, + 0.5306310165405274, + 0.5148042221546173, + 0.4575808104991913, + 0.5487925732135772, + 0.520268959236145, + 0.5565902183890342, + 0.4398930975198746, + 0.428002223110199, + 0.46429021530151365, + 0.5170863667488098, + 0.49451336669921875, + 0.44284208660125735, + 0.4522279070854187, + 0.4726058319091797, + 0.4598690043926239, + 0.49018758878707885, + 0.49822337799072264, + 0.5199945873260498, + 0.5039699987411499, + 0.502354536151886, + 0.506885662651062, + 0.5282695870876313, + 0.5126925681591034, + 0.5460992843151092, + 0.54484206199646, + 0.5474184717178344, + 0.531292943572998, + 0.5684735743522644, + 0.580509339427948, + 0.5237845591068268, + 0.5362084387779236, + 0.5471626996994019, + 0.5834163922786713, + 0.5274406147003173, + 0.5316431431770324, + 0.5337949501037598, + 0.5416967335224152, + 0.5303698273181915, + 0.5200471870422363, + 0.517787770652771, + 0.5033083886146545, + 0.5138760683059692, + 0.4955048748970032, + 0.5053999238967896, + 0.4936981360912323, + 0.4910477494955063, + 0.511811295413971, + 0.5135351393938065, + 0.48061015357971193 + ], + "term_loss": [ + 1.6786233594894409, + 0.3261142881393433, + 0.35359204120635984, + 0.36565287389755247, + 0.3406023171067238, + 0.30883846073150634, + 0.33299512271881104, + 0.3214617775917053, + 0.3527043153762817, + 0.3891282879829407, + 0.3804077454328537, + 0.41708505935668944, + 0.4277315420150757, + 0.4346309417724609, + 0.44325669355392455, + 0.45943074939250944, + 0.4560778746962547, + 0.46359605444073676, + 0.44748154599666595, + 0.5874906051158905, + 0.4832541675567627, + 0.49596090741157534, + 0.49860577583312987, + 0.5199280709385872, + 0.5220767303347588, + 0.47179154951572416, + 0.4561684895634651, + 0.396670174407959, + 0.3203327759504318, + 0.2695784947603941, + 0.23113118069171906, + 0.26142542295455934, + 0.24953778635263443, + 0.1960149597465992, + 0.25626748807430266, + 0.23220936818122864, + 0.25846885913610457, + 0.15887275909483434, + 0.14909111514091491, + 0.17712726273536683, + 0.2125454505801201, + 0.19927165834903718, + 0.15077278842926026, + 0.15682997941970825, + 0.17086780786514283, + 0.1594958031475544, + 0.17793601125180722, + 0.18321620383262635, + 0.18637006669044495, + 0.18034391679763795, + 0.17549167909622193, + 0.17889143224954604, + 0.19318077889084817, + 0.1766836573123932, + 0.20506124428510666, + 0.2066309697151184, + 0.2060998435020447, + 0.19079111275672914, + 0.21746273097991944, + 0.22661366835832597, + 0.18412061611413955, + 0.18906878393888474, + 0.20128634595870973, + 0.22696166688501834, + 0.18461333600878715, + 0.184559454703331, + 0.1873170636177063, + 0.19381926721930504, + 0.1840388169169426, + 0.1760092082500458, + 0.1739466248512268, + 0.16277697925567627, + 0.1703468280673027, + 0.1561721340417862, + 0.162870410490036, + 0.15363481096029283, + 0.1529178817510605, + 0.16665865235328675, + 0.16918066250383854, + 0.14492559936642646 + ], + "bridge_loss": [ + 0.9221068814527592, + 0.13852903740406036, + 0.027906007751822472, + 0.007166545861959458, + 0.014753102254867553, + 0.026205083185434342, + 0.029608502185344696, + 0.031953351217508315, + 0.02295173071026802, + 0.01737342191487551, + 0.012457077103853225, + 0.012833337373286485, + 0.013563652062416076, + 0.015525699077546596, + 0.015380015002191067, + 0.01761208213567734, + 0.018523025204241275, + 0.019238843723386526, + 0.020741728362441064, + 0.026043444299697877, + 0.026606431709229945, + 0.026109171213954688, + 0.02512398416996002, + 0.02966944384723902, + 0.03190348414927721, + 0.03136296460032463, + 0.0352400288939476, + 0.03681477851495147, + 0.03777945480048656, + 0.03949151403903961, + 0.042446378648281095, + 0.03484680913388729, + 0.03507048722356558, + 0.03070030620098114, + 0.037034362864494325, + 0.03802529795318842, + 0.03755567114502192, + 0.03274250242859125, + 0.025108824491500856, + 0.02743995731472969, + 0.030794216075539588, + 0.027399995332956315, + 0.025184972828626633, + 0.021072593542933463, + 0.023606113910675047, + 0.023853830067813397, + 0.02481825648620725, + 0.025949978299438955, + 0.031083991938829422, + 0.02635702279806137, + 0.023137952852249146, + 0.0238148014575243, + 0.024979108849167823, + 0.02769171332716942, + 0.03249237573444843, + 0.026965303349494932, + 0.027073483538627624, + 0.026444199299812315, + 0.0334527153134346, + 0.031996575450897215, + 0.022713612192869187, + 0.02537522009909153, + 0.026704606008529662, + 0.03316631828993559, + 0.022604483069479465, + 0.027801525264978408, + 0.026084369909763337, + 0.027263763999938965, + 0.028293249532580375, + 0.02589754301905632, + 0.024716552674770357, + 0.023096822041273116, + 0.02594154703617096, + 0.021842101486027242, + 0.026323819369077683, + 0.023422936725616454, + 0.02182629337310791, + 0.029627591571211816, + 0.028926070278510452, + 0.020528473022580148 + ], + "tgrad_loss": [ + 0.3250327301979065, + 0.32211986951828003, + 0.25162628445625307, + 0.22067930517196654, + 0.19847016725540162, + 0.17940481848716736, + 0.17319316334724427, + 0.16570244748592378, + 0.1669093354701996, + 0.1687880607366562, + 0.16253906288146971, + 0.1665672171831131, + 0.16589845621585847, + 0.16529648394584656, + 0.16289891986846924, + 0.16394846611022948, + 0.1631844938635826, + 0.16524152487516403, + 0.16372319452762604, + 0.17806861238479615, + 0.16885738246440887, + 0.18322576223015785, + 0.1879486857175827, + 0.1969595804452896, + 0.20709255154132844, + 0.20909501893520355, + 0.22918222160339355, + 0.2239373251914978, + 0.22234308688640594, + 0.22489537620544434, + 0.2292338173866272, + 0.23435878076553346, + 0.2301959456205368, + 0.230865545129776, + 0.2554907244682312, + 0.25003429362773893, + 0.2605656830072403, + 0.24827783651351928, + 0.2538022830486298, + 0.2597229935646057, + 0.2737467042684555, + 0.267841713476181, + 0.2668843271255493, + 0.2743253367424011, + 0.27813191254138947, + 0.27651937108039853, + 0.2874333247303963, + 0.2890572003364563, + 0.30254052896499634, + 0.29726906032562256, + 0.3037249053001404, + 0.3041794305801392, + 0.3101097016096115, + 0.3083171933889389, + 0.3085456686496735, + 0.3112457883834839, + 0.31424513998031617, + 0.3140576331615448, + 0.317558126449585, + 0.3218990971326828, + 0.316950329208374, + 0.32176443276405337, + 0.31917174434661866, + 0.32328840069770814, + 0.3202227909088135, + 0.31928216705322265, + 0.3203935170173645, + 0.3206137029647827, + 0.31803776168823245, + 0.318140433883667, + 0.31912459449768066, + 0.3174345845222473, + 0.3175876950263977, + 0.3174906392097473, + 0.3162056918144226, + 0.3166403913497925, + 0.3163035747528076, + 0.3155250496149063, + 0.315428409576416, + 0.31515607919692995 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.12511783838272095, + 0.3428286910057068 + ], + "perturbation_rho": [ + 0.21235734224319458, + 0.40894150733947754 + ], + "nudging": { + "0.001": [ + -0.006335020065307617, + -0.0028843185864388943 + ], + "0.003": [ + -0.01891140267252922, + -0.008641792461276054 + ], + "0.01": [ + -0.061930932104587555, + -0.028679829090833664 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L2_s456.json b/results/synth_ladder_v2_hi/synth_a0.5_L2_s456.json new file mode 100644 index 0000000..789fd7e --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L2_s456.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.8481016555786134, + 0.9383245440483093, + 0.5530562189102173, + 0.4207325527191162, + 0.3648026519775391, + 0.33118328647613526, + 0.30579332513809204, + 0.2921482180595398, + 0.27799103627204896, + 0.2656113090753555, + 0.24957744574546814, + 0.24830586805343627, + 0.23826434144973754, + 0.2328869005203247, + 0.23377245817184447, + 0.21636449333429336, + 0.20429278337955475, + 0.20855472791194915, + 0.19823554830551146, + 0.2091533320426941, + 0.20433888306617737, + 0.19799854063987732, + 0.19555453977584838, + 0.20201841781139374, + 0.17265325379371643, + 0.17817161355018615, + 0.1800253779888153, + 0.17401057000160217, + 0.15778406052589417, + 0.15227047762870788, + 0.15033258476257325, + 0.1582992364168167, + 0.14341525144577028, + 0.14620398755073546, + 0.13611152563095094, + 0.13021500449180604, + 0.13004287123680114, + 0.12128764119148254, + 0.12444672923088074, + 0.12398484301567078, + 0.11453234956264496, + 0.11252437950372696, + 0.10943108355998993, + 0.10496705238819122, + 0.10266255812644959, + 0.10154881967306137, + 0.10175266758203506, + 0.09900797365903855, + 0.09833709491491317, + 0.09685812762379646, + 0.09284526603221893, + 0.09493725802898408, + 0.09160899226665496, + 0.08873112607002258, + 0.08736398074626922, + 0.08597083683013916, + 0.08495140401124954, + 0.0827208865404129, + 0.08080789630413056, + 0.08073672647476196, + 0.0794020817041397, + 0.07836829566955567, + 0.07724489649534226, + 0.07661290149688721, + 0.07624617738723755, + 0.07564639663696289, + 0.07505405854582786, + 0.07433921251296997, + 0.07382495956420898, + 0.07335682852268219, + 0.07298146123290061, + 0.07261739144325256, + 0.07231389728188514, + 0.07207126158475875, + 0.07183933544158935, + 0.07167200578451156, + 0.07155075296163559, + 0.07146113570928574, + 0.07139736030101776, + 0.07136157937049865 + ], + "train_acc": [ + 0.3796, + 0.7381, + 0.8485, + 0.8707, + 0.8806, + 0.8876, + 0.8931, + 0.8978, + 0.8991, + 0.9028, + 0.9094, + 0.9066, + 0.9114, + 0.9114, + 0.9111, + 0.9206, + 0.9236, + 0.9233, + 0.9259, + 0.9229, + 0.9238, + 0.9253, + 0.924, + 0.9242, + 0.9379, + 0.9344, + 0.9337, + 0.9342, + 0.9451, + 0.948, + 0.9497, + 0.9444, + 0.9519, + 0.9511, + 0.9554, + 0.9589, + 0.9581, + 0.9646, + 0.9596, + 0.9603, + 0.9675, + 0.9677, + 0.9698, + 0.9716, + 0.9738, + 0.9756, + 0.9729, + 0.9748, + 0.9753, + 0.9762, + 0.9779, + 0.9784, + 0.9783, + 0.981, + 0.9822, + 0.9824, + 0.9817, + 0.9852, + 0.9859, + 0.9858, + 0.9865, + 0.9864, + 0.9874, + 0.9876, + 0.9883, + 0.989, + 0.9884, + 0.9892, + 0.9895, + 0.9905, + 0.9903, + 0.9907, + 0.9908, + 0.9912, + 0.9913, + 0.9917, + 0.9917, + 0.9919, + 0.9919, + 0.9919 + ], + "test_acc": [ + 0.6245, + 0.792, + 0.833, + 0.848, + 0.855, + 0.85, + 0.8595, + 0.86, + 0.86, + 0.8615, + 0.862, + 0.8655, + 0.86, + 0.8685, + 0.8695, + 0.866, + 0.87, + 0.863, + 0.8685, + 0.864, + 0.8715, + 0.866, + 0.8675, + 0.8615, + 0.8705, + 0.867, + 0.8665, + 0.873, + 0.876, + 0.873, + 0.874, + 0.8655, + 0.8695, + 0.8665, + 0.869, + 0.872, + 0.8735, + 0.872, + 0.87, + 0.8685, + 0.8725, + 0.874, + 0.875, + 0.875, + 0.874, + 0.8765, + 0.876, + 0.8775, + 0.8775, + 0.875, + 0.8745, + 0.8755, + 0.8735, + 0.8765, + 0.878, + 0.8785, + 0.874, + 0.876, + 0.875, + 0.8785, + 0.8775, + 0.8765, + 0.878, + 0.877, + 0.877, + 0.876, + 0.876, + 0.874, + 0.874, + 0.8755, + 0.876, + 0.876, + 0.876, + 0.8765, + 0.8755, + 0.876, + 0.875, + 0.875, + 0.875, + 0.875 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8992727398872375, + 0.8809841871261597 + ], + "perturbation_rho": [ + 0.999998927116394, + 0.9999969005584717 + ], + "nudging": { + "0.001": [ + -0.034776899963617325, + -0.014410343021154404 + ], + "0.003": [ + -0.09730946272611618, + -0.04205682873725891 + ], + "0.01": [ + -0.2502431571483612, + -0.12689679861068726 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2870552124023438, + 1.6535948223114014, + 1.0296381690979004, + 0.7126224917411804, + 0.5591352634429931, + 0.4811658450603485, + 0.4388775806427002, + 0.4253014211177826, + 0.4193685954093933, + 0.4093106484889984, + 0.41880208411216735, + 0.42850149631500245, + 0.428736455821991, + 0.43955466747283933, + 0.4433642386198044, + 0.44784595458507537, + 0.435849981212616, + 0.47222038536071775, + 0.4397192087173462, + 0.45586099319458007, + 0.46415687026977537, + 0.48371028423309326, + 0.451132914352417, + 0.47991643798351286, + 0.45130317702293393, + 0.480626265335083, + 0.46450931119918826, + 0.4824261344909668, + 0.4816949737071991, + 0.48009960498809817, + 0.5074262315750122, + 0.4895252437353134, + 0.4705415657997131, + 0.4835156498908997, + 0.47929900856018065, + 0.4537247060775757, + 0.471054771232605, + 0.48902023096084596, + 0.49175932846069337, + 0.5241551312446594, + 0.451823796248436, + 0.43896633648872374, + 0.4653335520744324, + 0.4502745701789856, + 0.4341614744186401, + 0.46303419842720034, + 0.44793482451438904, + 0.44024938931465146, + 0.4392324646472931, + 0.43231110212504864, + 0.41355489072799684, + 0.453599790096283, + 0.4247152150630951, + 0.4223084320545197, + 0.42320016803741456, + 0.4448660778999329, + 0.4123545353651047, + 0.4022479995727539, + 0.412995005607605, + 0.40325671529769896, + 0.39850479309558867, + 0.3982270024299622, + 0.39613970642089846, + 0.38792987279891966, + 0.3912136312961578, + 0.38957534875869754, + 0.38518679401874545, + 0.37867675232887266, + 0.3806942042350769, + 0.3797240556240082, + 0.37711212148666384, + 0.3763957218170166, + 0.3759556182384491, + 0.37444110627174376, + 0.37315322313308713, + 0.3726344390392303, + 0.37197003917694094, + 0.37117694425582887, + 0.3707807907104492, + 0.37058883180618285 + ], + "train_acc": [ + 0.1553, + 0.4555, + 0.6508, + 0.7471, + 0.7963, + 0.8138, + 0.8276, + 0.8342, + 0.8353, + 0.8425, + 0.8412, + 0.842, + 0.8405, + 0.8401, + 0.8417, + 0.8395, + 0.8456, + 0.8309, + 0.8454, + 0.8409, + 0.8372, + 0.8369, + 0.8441, + 0.8365, + 0.8411, + 0.8366, + 0.8391, + 0.8356, + 0.8369, + 0.8348, + 0.8271, + 0.834, + 0.8399, + 0.8353, + 0.8389, + 0.8421, + 0.8418, + 0.8384, + 0.8358, + 0.83, + 0.8435, + 0.8456, + 0.8404, + 0.8454, + 0.8476, + 0.8414, + 0.8448, + 0.8462, + 0.8459, + 0.8498, + 0.8517, + 0.8429, + 0.8496, + 0.8487, + 0.8517, + 0.8471, + 0.8535, + 0.8553, + 0.8542, + 0.8567, + 0.8577, + 0.8566, + 0.8585, + 0.8587, + 0.8593, + 0.8596, + 0.862, + 0.8632, + 0.86, + 0.861, + 0.8631, + 0.8617, + 0.8635, + 0.8641, + 0.8646, + 0.8644, + 0.8636, + 0.865, + 0.8652, + 0.8653 + ], + "test_acc": [ + 0.292, + 0.56, + 0.691, + 0.739, + 0.776, + 0.7805, + 0.8045, + 0.799, + 0.8065, + 0.8065, + 0.8085, + 0.8025, + 0.8075, + 0.794, + 0.8075, + 0.8135, + 0.802, + 0.7955, + 0.8005, + 0.801, + 0.79, + 0.7845, + 0.798, + 0.798, + 0.7875, + 0.791, + 0.7895, + 0.796, + 0.7865, + 0.777, + 0.8005, + 0.7835, + 0.788, + 0.7905, + 0.806, + 0.8025, + 0.785, + 0.789, + 0.781, + 0.798, + 0.804, + 0.799, + 0.801, + 0.8115, + 0.8015, + 0.797, + 0.81, + 0.797, + 0.808, + 0.796, + 0.7955, + 0.8085, + 0.8125, + 0.807, + 0.8, + 0.808, + 0.811, + 0.811, + 0.812, + 0.808, + 0.8125, + 0.812, + 0.8135, + 0.8135, + 0.8125, + 0.816, + 0.8145, + 0.813, + 0.817, + 0.8135, + 0.816, + 0.8165, + 0.817, + 0.815, + 0.8155, + 0.8175, + 0.815, + 0.8155, + 0.816, + 0.816 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.017043430358171463, + 0.0684005469083786 + ], + "perturbation_rho": [ + -0.039058439433574677, + 0.11359640955924988 + ], + "nudging": { + "0.001": [ + -0.0006350737530738115, + -0.0003296324284747243 + ], + "0.003": [ + -0.0018682447262108326, + -0.0009874338284134865 + ], + "0.01": [ + -0.005804130807518959, + -0.0032830811105668545 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.085509059524536, + 1.1997124633789062, + 0.7052989973068238, + 0.4944884951114655, + 0.42731611585617063, + 0.40364177112579347, + 0.40250489449501037, + 0.39572899947166446, + 0.3938576333761215, + 0.3945821855545044, + 0.3956324628829956, + 0.39204095797538757, + 0.38553655610084536, + 0.39142296171188357, + 0.38895199718475343, + 0.3898035387039185, + 0.3947607610702515, + 0.3965999175071716, + 0.40212894287109374, + 0.40160218105316164, + 0.4069850404262543, + 0.41640855975151064, + 0.4233110466003418, + 0.44071909160614015, + 0.4416384401321411, + 0.44119831857681274, + 0.43994840660095214, + 0.44008309478759766, + 0.43364879651069643, + 0.43739947289228437, + 0.4283482677459717, + 0.4456914433956146, + 0.4563638810157776, + 0.4303118309020996, + 0.4327080216407776, + 0.42274960250854493, + 0.4333017177581787, + 0.4467815902233124, + 0.4313963102340698, + 0.4363329181671143, + 0.4287542325496674, + 0.43090186014175413, + 0.4246362741470337, + 0.4307769187927246, + 0.4269701943397522, + 0.4238660922050476, + 0.4403623225688934, + 0.4208802846908569, + 0.42905401678085325, + 0.4272002784252167, + 0.4219598471641541, + 0.420378928565979, + 0.42290292086601255, + 0.42269562950134276, + 0.43232801451683045, + 0.42110945229530333, + 0.4163690044403076, + 0.41736082611083986, + 0.42144253940582277, + 0.41818094477653506, + 0.41234604358673094, + 0.41562650147676466, + 0.41009650206565856, + 0.40981764011383054, + 0.41089948043823243, + 0.40907523860931394, + 0.4101927646636963, + 0.40733580865859986, + 0.40593432711362837, + 0.4065796292304993, + 0.4045049686193466, + 0.4033273178577423, + 0.4033346746444702, + 0.40280530282258986, + 0.40217347147464755, + 0.40183706488609316, + 0.40159110057353975, + 0.4014276859283447, + 0.4012072265625, + 0.4011442585945129 + ], + "train_acc": [ + 0.2521, + 0.5991, + 0.755, + 0.8222, + 0.8411, + 0.84, + 0.8422, + 0.8464, + 0.8469, + 0.8473, + 0.8491, + 0.8489, + 0.8501, + 0.8519, + 0.8481, + 0.8513, + 0.8456, + 0.8504, + 0.8409, + 0.8404, + 0.8442, + 0.8367, + 0.8395, + 0.8318, + 0.8321, + 0.8325, + 0.8338, + 0.8322, + 0.8372, + 0.8354, + 0.8394, + 0.8302, + 0.8256, + 0.8384, + 0.8364, + 0.8386, + 0.8358, + 0.8351, + 0.8371, + 0.8371, + 0.8389, + 0.8385, + 0.84, + 0.8378, + 0.8431, + 0.8455, + 0.8375, + 0.8435, + 0.8435, + 0.841, + 0.8446, + 0.843, + 0.8406, + 0.8426, + 0.8414, + 0.8449, + 0.8453, + 0.8452, + 0.8436, + 0.8447, + 0.8475, + 0.8473, + 0.8463, + 0.8479, + 0.8491, + 0.8491, + 0.8477, + 0.8484, + 0.8494, + 0.8499, + 0.8498, + 0.8509, + 0.8502, + 0.8514, + 0.8519, + 0.8517, + 0.8518, + 0.8512, + 0.8514, + 0.8515 + ], + "test_acc": [ + 0.49, + 0.6875, + 0.7605, + 0.804, + 0.805, + 0.802, + 0.8065, + 0.806, + 0.8055, + 0.808, + 0.8085, + 0.8055, + 0.8105, + 0.804, + 0.807, + 0.8155, + 0.8115, + 0.812, + 0.7955, + 0.8025, + 0.8, + 0.8115, + 0.8055, + 0.805, + 0.796, + 0.7895, + 0.7965, + 0.7935, + 0.7905, + 0.7845, + 0.799, + 0.7695, + 0.7965, + 0.7995, + 0.7985, + 0.7955, + 0.799, + 0.79, + 0.787, + 0.788, + 0.792, + 0.7935, + 0.7915, + 0.7995, + 0.797, + 0.7935, + 0.7995, + 0.799, + 0.7975, + 0.8025, + 0.8005, + 0.8015, + 0.7955, + 0.7985, + 0.808, + 0.8025, + 0.802, + 0.8045, + 0.8015, + 0.8035, + 0.7955, + 0.8025, + 0.8085, + 0.8055, + 0.805, + 0.8045, + 0.8035, + 0.8065, + 0.8035, + 0.8075, + 0.807, + 0.807, + 0.806, + 0.8065, + 0.806, + 0.8065, + 0.8075, + 0.807, + 0.8075, + 0.807 + ], + "state_pred_error": [ + 0.8011611330986023, + 0.3609474738121033, + 0.21311738922595977, + 0.17308431911468505, + 0.15645604510307312, + 0.13793717213869094, + 0.11612963346242905, + 0.09631521614789963, + 0.07912670748233795, + 0.06581646353006362, + 0.055194634342193606, + 0.046884950709342954, + 0.04106640879511833, + 0.03793207856416702, + 0.03359296218752861, + 0.03188889281153679, + 0.029081323546171187, + 0.02699935197234154, + 0.025859476828575135, + 0.024149730026721956, + 0.023846294847130776, + 0.022766227704286577, + 0.02158056313097477, + 0.020458749863505363, + 0.019927274003624915, + 0.019538553309440612, + 0.0188307683467865, + 0.01786738821566105, + 0.01805778686106205, + 0.017307938440144062, + 0.01650934716016054, + 0.01636997167468071, + 0.016149957418441774, + 0.015640711134672164, + 0.015530829256772995, + 0.015072985544800759, + 0.014928080968558789, + 0.014236513023078441, + 0.013992103570699691, + 0.013805941741168498, + 0.013859274068474769, + 0.013517734362185, + 0.013017747814953327, + 0.012777870306372643, + 0.012784181451797485, + 0.012523168560862542, + 0.012562317198514939, + 0.01242608730494976, + 0.012103212547302246, + 0.013212937520444393, + 0.011627227926254272, + 0.011481619267165661, + 0.011224271242320538, + 0.011096839188039304, + 0.01085965276658535, + 0.01071037351489067, + 0.010505712181329728, + 0.010282582534849644, + 0.010697883084416389, + 0.011361672592163086, + 0.010023625978827477, + 0.009966823917627335, + 0.010207099059224128, + 0.009507107688486576, + 0.009546992440521717, + 0.009390620791912078, + 0.009162344363331795, + 0.00911178617477417, + 0.009029264736175538, + 0.009068329860270024, + 0.008832447521388532, + 0.008576158338785172, + 0.008559903579950333, + 0.008348167736828328, + 0.008216162344813347, + 0.008780301743745804, + 0.008052194035053252, + 0.00799637444615364, + 0.007933191792666912, + 0.0086071118183434 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8896123766899109, + 0.46193015575408936 + ], + "perturbation_rho": [ + 0.8089620471000671, + 0.3910723328590393 + ], + "nudging": { + "0.001": [ + -0.02786075323820114, + -0.003570881672203541 + ], + "0.003": [ + -0.08058245480060577, + -0.010666092857718468 + ], + "0.01": [ + -0.23563425242900848, + -0.03502008318901062 + ] + }, + "state_pred_error_per_layer": [ + 1470.6129150390625, + 266.84222412109375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2876405261993407, + 1.6589315502166748, + 1.032972918510437, + 0.7166166153907776, + 0.5627004514217376, + 0.48185237402915954, + 0.4412262492656708, + 0.42024023895263674, + 0.4159124126434326, + 0.41783777375221254, + 0.43015226793289185, + 0.41944336700439455, + 0.4336165071964264, + 0.431957585144043, + 0.4321355306863785, + 0.443198069190979, + 0.4393294587135315, + 0.45416013383865356, + 0.48345874342918393, + 0.5023631313323974, + 0.5149450803756714, + 0.5199348605155945, + 0.539059090423584, + 0.5481982292175293, + 0.5818891710281372, + 0.5882292882919311, + 0.5962150434494019, + 0.6086743747711182, + 0.6369373207092285, + 0.65568203125, + 0.6485560325622559, + 0.6509528552055359, + 0.6618397993087769, + 0.6784751142501831, + 0.6892412689208984, + 0.6599728857994079, + 0.6764159112930298, + 0.7006567495346069, + 0.7071641028404236, + 0.6960477909088135, + 0.6928154678344727, + 0.7350670424461365, + 0.7627396492004395, + 0.7707545019149781, + 0.737790333366394, + 0.7868994663238525, + 0.7634784624099732, + 0.7762238646507263, + 0.8018951994895935, + 0.7849565597534179, + 0.8176450714111329, + 0.8360422663688659, + 0.8193753229141235, + 0.8155689338684082, + 0.8275344564437866, + 0.837344129371643, + 0.8366100923538208, + 0.8482813408851624, + 0.8508966381072998, + 0.8566178089141846, + 0.8539601694107055, + 0.8565668355941772, + 0.8545724077224731, + 0.8627288048744202, + 0.8558533429145813, + 0.8527083917617798, + 0.8515555647850037, + 0.8542263612747193, + 0.8479507312774658, + 0.8465972842216491, + 0.8489613071441651, + 0.8499880193710327, + 0.846294707107544, + 0.8456767027854919, + 0.845595064163208, + 0.8452041431427002, + 0.8436063968658447, + 0.8431942218780517, + 0.8428546760559082, + 0.8426003468513489 + ], + "train_acc": [ + 0.1549, + 0.4565, + 0.6491, + 0.7495, + 0.7914, + 0.8171, + 0.8312, + 0.8359, + 0.8383, + 0.8393, + 0.836, + 0.845, + 0.8405, + 0.8425, + 0.847, + 0.8429, + 0.844, + 0.8405, + 0.834, + 0.8242, + 0.8215, + 0.8184, + 0.8131, + 0.8131, + 0.8035, + 0.7999, + 0.7919, + 0.7925, + 0.7806, + 0.7764, + 0.7749, + 0.7707, + 0.7607, + 0.7559, + 0.7527, + 0.7565, + 0.7486, + 0.7427, + 0.7405, + 0.7469, + 0.7427, + 0.7273, + 0.7239, + 0.7253, + 0.7276, + 0.7123, + 0.7175, + 0.7178, + 0.7059, + 0.712, + 0.7045, + 0.6954, + 0.704, + 0.7011, + 0.6979, + 0.6962, + 0.6944, + 0.6863, + 0.693, + 0.6882, + 0.6881, + 0.6873, + 0.6891, + 0.6867, + 0.6883, + 0.6876, + 0.6863, + 0.6879, + 0.6895, + 0.6914, + 0.6879, + 0.6912, + 0.6914, + 0.691, + 0.6902, + 0.69, + 0.691, + 0.6912, + 0.6911, + 0.6911 + ], + "test_acc": [ + 0.2915, + 0.5615, + 0.6735, + 0.74, + 0.766, + 0.786, + 0.7965, + 0.798, + 0.803, + 0.811, + 0.804, + 0.8, + 0.8035, + 0.805, + 0.802, + 0.813, + 0.801, + 0.8045, + 0.7865, + 0.781, + 0.7965, + 0.7855, + 0.776, + 0.7705, + 0.757, + 0.763, + 0.7455, + 0.7345, + 0.7365, + 0.7225, + 0.724, + 0.7285, + 0.6945, + 0.703, + 0.7045, + 0.707, + 0.6745, + 0.698, + 0.7005, + 0.7015, + 0.6935, + 0.6745, + 0.6835, + 0.6915, + 0.6855, + 0.6795, + 0.669, + 0.657, + 0.68, + 0.6605, + 0.6665, + 0.66, + 0.6615, + 0.646, + 0.663, + 0.6575, + 0.659, + 0.655, + 0.652, + 0.6565, + 0.662, + 0.657, + 0.657, + 0.658, + 0.6535, + 0.659, + 0.657, + 0.653, + 0.6525, + 0.656, + 0.6535, + 0.657, + 0.6565, + 0.6585, + 0.6575, + 0.658, + 0.658, + 0.659, + 0.66, + 0.6605 + ], + "value_loss": [ + 3.201891397190094, + 0.779361897277832, + 0.626858753490448, + 0.6105666812896728, + 0.5514641007423401, + 0.517792618727684, + 0.5215819624900818, + 0.5292677600860596, + 0.552981759929657, + 0.5698205958366394, + 0.5810090668201446, + 0.5961851135253906, + 0.6149938448905945, + 0.6305486402511596, + 0.6387381959915162, + 0.6182627209663392, + 0.6587734882354737, + 0.6572166347026825, + 0.7393287518978119, + 0.7575859657287598, + 0.7096261032104492, + 0.7378914642333985, + 0.7248077880859375, + 0.7350102340698242, + 0.7564734949111939, + 0.6695011586904526, + 0.644234440612793, + 0.5980740191459656, + 0.5971753816604615, + 0.5931948877334595, + 0.5637484560966491, + 0.5179620209217072, + 0.49389802017211915, + 0.5098487597942353, + 0.4865056258678436, + 0.4405415944099426, + 0.4353645149230957, + 0.4501692766189575, + 0.45002960472106934, + 0.422652059841156, + 0.4055860691070557, + 0.4549039573431015, + 0.46190376739501954, + 0.471636429977417, + 0.4265621903419495, + 0.4594758994102478, + 0.42435137259960176, + 0.44350295667648315, + 0.46465742254257203, + 0.44208196215629575, + 0.4832916920661926, + 0.5232693849563599, + 0.4623278817176819, + 0.4547371855735779, + 0.4594089942932129, + 0.46912296028137207, + 0.47726550636291504, + 0.4601418377876282, + 0.46802607822418213, + 0.4529942394256592, + 0.4592748096942902, + 0.47371763911247255, + 0.4452900604248047, + 0.4446146511077881, + 0.4409138162612915, + 0.45059286756515504, + 0.42469289593696596, + 0.4136852811336517, + 0.4327469911813736, + 0.4167798330545425, + 0.4059099773406982, + 0.4036043640613556, + 0.4098508264541626, + 0.4066617407798767, + 0.39713848648071287, + 0.40763027248382566, + 0.3894461953163147, + 0.3812183334350586, + 0.38804075756073, + 0.3851433990240097 + ], + "term_loss": [ + 1.8095692808151245, + 0.3307587965011597, + 0.3579055207252502, + 0.38751730251312255, + 0.3419568935394287, + 0.31203726736307147, + 0.31745839205980303, + 0.33440028057098387, + 0.3659660063266754, + 0.3876699714303017, + 0.39679462888240813, + 0.4184996568202972, + 0.43375586037635805, + 0.44975857195854185, + 0.45838220162391663, + 0.435672639131546, + 0.4776378852844238, + 0.4704463632583618, + 0.5460535125732422, + 0.5489175643920898, + 0.49749358978271485, + 0.5227905928611756, + 0.4984749317169189, + 0.5076854391098022, + 0.5196511005163192, + 0.4271921033501625, + 0.39845617814064027, + 0.3495673320531845, + 0.3406120599746704, + 0.3369556130170822, + 0.3124081336021423, + 0.26228452085256576, + 0.23591850142478943, + 0.24258239690363406, + 0.21891801595687865, + 0.18692822000980377, + 0.17564877446889876, + 0.1858476457595825, + 0.18565895201563834, + 0.16571398117542266, + 0.1499946511030197, + 0.18262819264009594, + 0.18550563032627107, + 0.19401416344642639, + 0.15707174652814865, + 0.17475576095581055, + 0.1460891138225794, + 0.16268992478847505, + 0.17513533658981323, + 0.15897264647483825, + 0.1887047908782959, + 0.21617013705968857, + 0.16718865274786948, + 0.16259072281122208, + 0.16479001131057738, + 0.16972213253974913, + 0.17816825335025788, + 0.160431849360466, + 0.1674132004737854, + 0.1533277048110962, + 0.15940114099383354, + 0.16802982873916625, + 0.14754837176799773, + 0.14664715819358826, + 0.14326468232870102, + 0.15353368443846702, + 0.13146308953166008, + 0.12186262704730035, + 0.13736094230413437, + 0.12571639954447747, + 0.1161090140581131, + 0.1144715744972229, + 0.12061160337924957, + 0.11733541253209114, + 0.11001659770011901, + 0.11899287624359131, + 0.10357448959499597, + 0.09714262957572938, + 0.1018681374579668, + 0.10070284021273256 + ], + "bridge_loss": [ + 1.0979772183747263, + 0.14488070307970047, + 0.032327918493747713, + 0.01006056183576584, + 0.01405837194621563, + 0.02506896505355835, + 0.029270013190805914, + 0.024456803676486016, + 0.01778325879126787, + 0.011628757537901402, + 0.010623802649974824, + 0.01033981561884284, + 0.010671415086835622, + 0.012105880802869796, + 0.015091647936403751, + 0.014290212792158127, + 0.017276279383152723, + 0.01755652065873146, + 0.01865756440013647, + 0.025649653977155684, + 0.025815965831279753, + 0.026902742621302603, + 0.03349096584320068, + 0.03358717203140259, + 0.03484274614453316, + 0.036431199651956556, + 0.03821594860553741, + 0.03984641134142876, + 0.0399793375492096, + 0.035500000548362734, + 0.0335044051527977, + 0.03535626398921013, + 0.034901417164504525, + 0.03535908999443054, + 0.03244625160694122, + 0.0270990745306015, + 0.028194128577411173, + 0.025620638090372086, + 0.02424610341191292, + 0.02160915930122137, + 0.01955409088283777, + 0.02624212960600853, + 0.022223139250278474, + 0.023016857573390007, + 0.0221236746609211, + 0.023469938251376152, + 0.022684386810660363, + 0.02442432513833046, + 0.02541698269248009, + 0.024323033849895, + 0.02966375322341919, + 0.03533650541305542, + 0.028947667813301086, + 0.02696481726169586, + 0.027019736531376837, + 0.029223014229536055, + 0.02940545443892479, + 0.026615454608201982, + 0.02830494921207428, + 0.025745924377441408, + 0.027217651453614235, + 0.03207499958276749, + 0.024836220550537108, + 0.023358790194988252, + 0.024930324649065732, + 0.024928521275520324, + 0.022257217685878277, + 0.01982123215943575, + 0.025022566971182825, + 0.021975069151818752, + 0.01949193856716156, + 0.018918460190296173, + 0.02019774815738201, + 0.020446433125436307, + 0.01855314065515995, + 0.02024043953716755, + 0.017883623769879342, + 0.01658413535952568, + 0.019047247916460036, + 0.01744421122968197 + ], + "tgrad_loss": [ + 0.294344884967804, + 0.30372239556312564, + 0.23662530732154846, + 0.2129888197660446, + 0.19544884057044984, + 0.18068639143705367, + 0.17485355710983277, + 0.17041067209243774, + 0.16923249213695526, + 0.1705218675136566, + 0.17359062929153443, + 0.16734564185142517, + 0.17056657358407976, + 0.16868418793678283, + 0.16526433700919152, + 0.1682998752593994, + 0.1638593245267868, + 0.16921375732421876, + 0.17461767234802247, + 0.18301874628067016, + 0.18631654744148254, + 0.18819813222885132, + 0.19284189145565034, + 0.19373762021064758, + 0.20197965245246888, + 0.20587785987854004, + 0.2075623162984848, + 0.20866027362346648, + 0.21658398847579957, + 0.22073927323818207, + 0.21783591961860657, + 0.22032123794555664, + 0.2230780988931656, + 0.2319072772026062, + 0.2351413604259491, + 0.22651429884433746, + 0.23152161231040955, + 0.238700989484787, + 0.24012455048561096, + 0.23532891595363617, + 0.23603732614517212, + 0.24603363862037658, + 0.2541750002861023, + 0.2546054096698761, + 0.24736676750183106, + 0.26125019659996035, + 0.2555778726577759, + 0.2563887059211731, + 0.264105103969574, + 0.25878628327846526, + 0.26492314825057983, + 0.27176274490356445, + 0.26619156007766726, + 0.26518164477348327, + 0.26759924521446227, + 0.27017781343460084, + 0.26969179601669313, + 0.2730945366859436, + 0.2723079304218292, + 0.2739206102371216, + 0.2726560173988342, + 0.2736128067970276, + 0.27290546894073486, + 0.27460870208740235, + 0.272718811917305, + 0.2721306644439697, + 0.270972588634491, + 0.2720014189720154, + 0.2703634834766388, + 0.2690883653879166, + 0.27030902328491213, + 0.2702143274307251, + 0.26904147510528564, + 0.2688798934936523, + 0.26856874713897705, + 0.2683969561100006, + 0.26798808333873747, + 0.26749156715869904, + 0.2671253750085831, + 0.26699634662866595 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.15452352166175842, + 0.31575465202331543 + ], + "perturbation_rho": [ + 0.26963475346565247, + 0.4633495509624481 + ], + "nudging": { + "0.001": [ + -0.007989507168531418, + -0.002687511034309864 + ], + "0.003": [ + -0.02384537272155285, + -0.008051736280322075 + ], + "0.01": [ + -0.07802344858646393, + -0.026711856946349144 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L4_s123.json b/results/synth_ladder_v2_hi/synth_a0.5_L4_s123.json new file mode 100644 index 0000000..24023da --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L4_s123.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.4834706062316894, + 0.5430349823951721, + 0.38668747143745424, + 0.34510154552459715, + 0.33817491273880007, + 0.2920334846019745, + 0.2970120040655136, + 0.2641972427368164, + 0.2674439710021019, + 0.2409529842853546, + 0.2405674941301346, + 0.2373046693444252, + 0.2162545440196991, + 0.24015355696678162, + 0.21905847864151, + 0.21977773468494416, + 0.17934191759824752, + 0.16521801726818083, + 0.1855501010656357, + 0.16433925240039826, + 0.18235039415359497, + 0.20661087665557862, + 0.19766983861923218, + 0.15200146064758302, + 0.14539728266000748, + 0.12806377177238465, + 0.13287909836769105, + 0.14254976189136506, + 0.1169908158659935, + 0.10335765879154206, + 0.0976445425748825, + 0.1269135407447815, + 0.10905979499816895, + 0.1036293788909912, + 0.08703284446001053, + 0.07714519078731537, + 0.0854867350578308, + 0.07759437730312348, + 0.08323309755325317, + 0.06878422734737397, + 0.06057573595643043, + 0.056178426837921146, + 0.0535672729074955, + 0.05012710075974464, + 0.0464719173014164, + 0.044800338208675385, + 0.05190476224422455, + 0.04983877096027136, + 0.041653870904445646, + 0.039705309933424, + 0.036863119888305665, + 0.042920396673679355, + 0.03639051071405411, + 0.03289378116130829, + 0.035526476675271985, + 0.033458709704875945, + 0.029977919310331346, + 0.028593969064950944, + 0.02730948829650879, + 0.02754064207971096, + 0.026273250000178813, + 0.02554192252755165, + 0.025177255961298942, + 0.024420051104575395, + 0.023936483108997344, + 0.023976508555561302, + 0.023393685922026633, + 0.023062897664308548, + 0.02284297253638506, + 0.0225670176923275, + 0.02237149138152599, + 0.022162008368223907, + 0.021948657459020613, + 0.021801631617546082, + 0.021714019361883403, + 0.021613608975708486, + 0.02154767996519804, + 0.021490249353647232, + 0.02145659771114588, + 0.02143701379299164 + ], + "train_acc": [ + 0.5114, + 0.8219, + 0.8579, + 0.8666, + 0.8671, + 0.8848, + 0.8822, + 0.8982, + 0.8949, + 0.909, + 0.907, + 0.9076, + 0.9125, + 0.9065, + 0.9148, + 0.9142, + 0.9331, + 0.9382, + 0.9255, + 0.9384, + 0.9247, + 0.9212, + 0.9216, + 0.9426, + 0.947, + 0.9543, + 0.9517, + 0.9467, + 0.9569, + 0.9688, + 0.9707, + 0.9526, + 0.9639, + 0.9648, + 0.9728, + 0.9806, + 0.972, + 0.9773, + 0.9745, + 0.9815, + 0.9875, + 0.9885, + 0.99, + 0.9916, + 0.9942, + 0.994, + 0.9899, + 0.9906, + 0.9953, + 0.9956, + 0.9971, + 0.9926, + 0.9971, + 0.9978, + 0.9966, + 0.9971, + 0.999, + 0.9988, + 0.9994, + 0.9989, + 0.9998, + 0.9998, + 0.9998, + 1.0, + 0.9999, + 0.9999, + 1.0, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.7605, + 0.85, + 0.859, + 0.865, + 0.8715, + 0.87, + 0.857, + 0.8675, + 0.8675, + 0.8715, + 0.88, + 0.8645, + 0.868, + 0.868, + 0.8735, + 0.874, + 0.8685, + 0.8815, + 0.8755, + 0.8785, + 0.8785, + 0.872, + 0.871, + 0.88, + 0.8785, + 0.879, + 0.8755, + 0.875, + 0.8835, + 0.8805, + 0.877, + 0.8715, + 0.883, + 0.8785, + 0.881, + 0.8775, + 0.8845, + 0.8835, + 0.875, + 0.8825, + 0.885, + 0.881, + 0.878, + 0.8825, + 0.8825, + 0.883, + 0.881, + 0.881, + 0.88, + 0.8845, + 0.883, + 0.88, + 0.884, + 0.8805, + 0.883, + 0.88, + 0.8775, + 0.8815, + 0.881, + 0.88, + 0.8815, + 0.8795, + 0.881, + 0.88, + 0.8795, + 0.8785, + 0.8805, + 0.8795, + 0.883, + 0.884, + 0.8825, + 0.881, + 0.8815, + 0.8815, + 0.8825, + 0.8825, + 0.883, + 0.883, + 0.882, + 0.882 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.817541241645813, + 0.7992762923240662, + 0.7803024053573608, + 0.749271035194397 + ], + "perturbation_rho": [ + 0.9999992847442627, + 0.9999971389770508, + 0.9999915361404419, + 0.9999540448188782 + ], + "nudging": { + "0.001": [ + -0.039698582142591476, + -0.021919304504990578, + -0.010462507605552673, + -0.004785426892340183 + ], + "0.003": [ + -0.10896631330251694, + -0.06271065026521683, + -0.030694259330630302, + -0.014211377128958702 + ], + "0.01": [ + -0.25995129346847534, + -0.17589232325553894, + -0.09449617564678192, + -0.04570754989981651 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2335582107543943, + 1.4812821199417114, + 0.8872520751953125, + 0.6475240196228027, + 0.5359860889434814, + 0.46958555698394777, + 0.45785905749797823, + 0.4420524597644806, + 0.46240528092384336, + 0.438674670791626, + 0.4997645055770874, + 0.4712224443435669, + 0.48766630415916445, + 0.4953000538825989, + 0.4773715334892273, + 0.5531020860195159, + 0.47040989060401917, + 0.4952229196548462, + 0.6815311771392822, + 0.5375438184738159, + 0.569130647277832, + 0.5825253881454467, + 0.6240433019638062, + 0.5191664490699768, + 0.5594121186256409, + 0.5025074581623077, + 0.568897618484497, + 0.797276012134552, + 0.6494657384395599, + 0.5863183005809784, + 0.5042545314788819, + 0.6360464210510254, + 0.5303603213310242, + 0.6333333390235901, + 0.5571413533687591, + 0.521467384147644, + 0.6245811168670654, + 0.4870353964805603, + 0.5776216228485107, + 0.6220016703605652, + 0.663741721868515, + 0.6662271121025085, + 0.6002572847366333, + 0.6127229302406311, + 0.5246655365228653, + 0.4890981090545654, + 0.5078178949356079, + 0.45640108737945556, + 0.5856611510276795, + 0.5142886983633042, + 0.49405618019104003, + 0.5483347434997559, + 0.5194024101734162, + 0.5156882713317871, + 0.48824515991210937, + 0.46362982807159425, + 0.48169746732711793, + 0.4621458419799805, + 0.48525344228744505, + 0.4669917287349701, + 0.43736272325515746, + 0.4267999319076538, + 0.447295890045166, + 0.44295010929107664, + 0.42769963054656984, + 0.43936410925388336, + 0.42555498695373534, + 0.4199682415962219, + 0.4203143095970154, + 0.4061591213226318, + 0.4136860329627991, + 0.4161090198516846, + 0.4061859919548035, + 0.4035600830078125, + 0.40434388854503633, + 0.40137048931121827, + 0.40382256450653076, + 0.39942702045440676, + 0.3986932475566864, + 0.39767972602844237 + ], + "train_acc": [ + 0.1852, + 0.484, + 0.6814, + 0.7576, + 0.8008, + 0.8232, + 0.8259, + 0.8299, + 0.8242, + 0.8325, + 0.815, + 0.8246, + 0.8193, + 0.8158, + 0.8202, + 0.8012, + 0.8253, + 0.8114, + 0.7706, + 0.8045, + 0.7946, + 0.7887, + 0.7805, + 0.8032, + 0.7913, + 0.8114, + 0.7894, + 0.7385, + 0.7662, + 0.7862, + 0.8128, + 0.764, + 0.8006, + 0.7743, + 0.7941, + 0.8065, + 0.7786, + 0.8154, + 0.7877, + 0.775, + 0.7658, + 0.765, + 0.7887, + 0.7835, + 0.806, + 0.8177, + 0.8082, + 0.8231, + 0.7853, + 0.8043, + 0.8151, + 0.797, + 0.8023, + 0.8106, + 0.8192, + 0.8253, + 0.8167, + 0.822, + 0.8158, + 0.8208, + 0.8345, + 0.8374, + 0.8289, + 0.8276, + 0.8334, + 0.8309, + 0.8372, + 0.8371, + 0.8392, + 0.8448, + 0.8397, + 0.8405, + 0.8417, + 0.8454, + 0.8438, + 0.8444, + 0.844, + 0.8454, + 0.8473, + 0.8469 + ], + "test_acc": [ + 0.329, + 0.6095, + 0.7115, + 0.77, + 0.7765, + 0.797, + 0.7935, + 0.77, + 0.793, + 0.7595, + 0.7995, + 0.781, + 0.744, + 0.7505, + 0.7555, + 0.7825, + 0.779, + 0.6505, + 0.7605, + 0.684, + 0.754, + 0.654, + 0.7145, + 0.7395, + 0.7465, + 0.7285, + 0.626, + 0.6385, + 0.728, + 0.7255, + 0.659, + 0.7475, + 0.6745, + 0.668, + 0.7795, + 0.749, + 0.7725, + 0.7285, + 0.6635, + 0.6505, + 0.727, + 0.675, + 0.6695, + 0.746, + 0.743, + 0.702, + 0.7945, + 0.667, + 0.7215, + 0.7375, + 0.71, + 0.7465, + 0.744, + 0.704, + 0.7515, + 0.744, + 0.7415, + 0.7765, + 0.775, + 0.782, + 0.795, + 0.792, + 0.795, + 0.7705, + 0.7955, + 0.7975, + 0.787, + 0.778, + 0.796, + 0.8075, + 0.793, + 0.806, + 0.8035, + 0.8055, + 0.8085, + 0.799, + 0.803, + 0.8065, + 0.804, + 0.8045 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.027901431545615196, + 0.2837410271167755, + 0.17885790765285492, + 0.12107238173484802 + ], + "perturbation_rho": [ + -0.007988158613443375, + 0.25683730840682983, + 0.21096175909042358, + 0.1645408272743225 + ], + "nudging": { + "0.001": [ + 0.00047835364239290357, + -0.0009741741232573986, + -0.0005935455556027591, + -0.00044419028563424945 + ], + "0.003": [ + 0.0014678429579362273, + -0.002917262725532055, + -0.0017763640498742461, + -0.0013300562277436256 + ], + "0.01": [ + 0.005267709027975798, + -0.009674372151494026, + -0.005893784575164318, + -0.0044119693338871 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8521444786071777, + 0.8489539235115051, + 0.49778255472183225, + 0.44921045970916745, + 0.4791688131332397, + 0.5339837857246399, + 0.6159221937656403, + 0.6920900274276733, + 0.7395291107177734, + 0.7648588424682617, + 0.7390518695831299, + 0.7285711270332337, + 0.756377292728424, + 0.7920883464813232, + 0.7511230406761169, + 0.7427966569900513, + 0.7848520866394043, + 0.7643903920173645, + 0.747663676071167, + 0.7614839931488037, + 0.7973562688827515, + 0.805117155122757, + 0.8282611333847046, + 0.8117145735740662, + 0.77988141746521, + 0.7727121877670288, + 0.7857501653671265, + 0.7532362991333008, + 0.7174396375656128, + 0.6707095355987549, + 0.6616346151351928, + 0.6730950567245484, + 0.6997067294597625, + 0.6670414597511292, + 0.7028018656730652, + 0.6884466652870178, + 0.6903644677162171, + 0.6862619149208069, + 0.6891118244171143, + 0.6871656932830811, + 0.7013169605255127, + 0.6584716122150421, + 0.6772907896995545, + 0.6789146376609803, + 0.6993297848701477, + 0.6749252514839172, + 0.6679595365524292, + 0.6602012983322143, + 0.6643224500656127, + 0.6685716100692749, + 0.6538269229888916, + 0.6759916665077209, + 0.6566515842437745, + 0.6645777332305908, + 0.6630637623786926, + 0.6612954006195069, + 0.6419784454345703, + 0.649862062215805, + 0.6516496278762818, + 0.6557377228736877, + 0.6478088115215301, + 0.6365815505981446, + 0.6575287200927734, + 0.6443278756141663, + 0.6441601477622986, + 0.647724620437622, + 0.6438550380706787, + 0.6339428859710693, + 0.635849730682373, + 0.6402260863304138, + 0.6340386274337768, + 0.635369322013855, + 0.6311982594490051, + 0.6316978254318237, + 0.6306024626731872, + 0.6300158632278442, + 0.6289655219078064, + 0.6281617763519287, + 0.6276290187835694, + 0.6273329115867615 + ], + "train_acc": [ + 0.3353, + 0.6866, + 0.8142, + 0.8275, + 0.8164, + 0.8031, + 0.7812, + 0.7662, + 0.7541, + 0.7442, + 0.7411, + 0.7383, + 0.7284, + 0.7118, + 0.7334, + 0.7317, + 0.7181, + 0.73, + 0.7275, + 0.727, + 0.7215, + 0.7129, + 0.7122, + 0.719, + 0.7334, + 0.7359, + 0.7363, + 0.7488, + 0.7578, + 0.7726, + 0.7687, + 0.7618, + 0.7597, + 0.7667, + 0.7523, + 0.7602, + 0.763, + 0.7613, + 0.7607, + 0.759, + 0.7594, + 0.7722, + 0.7641, + 0.7591, + 0.7553, + 0.7664, + 0.7625, + 0.7675, + 0.7694, + 0.7625, + 0.7663, + 0.7654, + 0.767, + 0.7656, + 0.7673, + 0.7678, + 0.7709, + 0.7701, + 0.769, + 0.7704, + 0.7723, + 0.778, + 0.7657, + 0.7699, + 0.7732, + 0.7689, + 0.7764, + 0.7744, + 0.7746, + 0.7734, + 0.7761, + 0.7759, + 0.7764, + 0.7775, + 0.7782, + 0.7754, + 0.7773, + 0.7776, + 0.7789, + 0.7788 + ], + "test_acc": [ + 0.5775, + 0.7495, + 0.7955, + 0.793, + 0.779, + 0.7605, + 0.7395, + 0.73, + 0.7225, + 0.712, + 0.7185, + 0.724, + 0.702, + 0.707, + 0.702, + 0.7015, + 0.709, + 0.7075, + 0.7135, + 0.707, + 0.711, + 0.712, + 0.693, + 0.701, + 0.701, + 0.7115, + 0.7185, + 0.734, + 0.7445, + 0.7265, + 0.733, + 0.7365, + 0.724, + 0.7235, + 0.7295, + 0.721, + 0.7345, + 0.7035, + 0.724, + 0.7195, + 0.7045, + 0.715, + 0.721, + 0.7245, + 0.7245, + 0.733, + 0.7365, + 0.719, + 0.731, + 0.719, + 0.715, + 0.7195, + 0.7295, + 0.7165, + 0.7325, + 0.722, + 0.7225, + 0.724, + 0.725, + 0.7315, + 0.7305, + 0.731, + 0.721, + 0.7255, + 0.732, + 0.727, + 0.736, + 0.7325, + 0.7405, + 0.7305, + 0.7335, + 0.7335, + 0.735, + 0.7355, + 0.7325, + 0.733, + 0.7355, + 0.734, + 0.7345, + 0.7345 + ], + "state_pred_error": [ + 0.7540362793922424, + 0.2618380335569382, + 0.17575423958301545, + 0.158187340092659, + 0.15769709210395813, + 0.16296500368118286, + 0.16990506443977357, + 0.1747624362707138, + 0.18139113659858705, + 0.17765859956741334, + 0.1602109962463379, + 0.14175251982212067, + 0.12335596957206726, + 0.10387119936943054, + 0.08755449919700622, + 0.07622657419443131, + 0.07090357104539871, + 0.06943184436559677, + 0.07135494997501374, + 0.07029388542175292, + 0.06737940437793731, + 0.06583633923530578, + 0.06345893771648407, + 0.05942388106584549, + 0.06105950610637665, + 0.06514391770958901, + 0.06618037341833115, + 0.06543034576177598, + 0.0635401979148388, + 0.06032257821559906, + 0.05693511110544205, + 0.05423654878139496, + 0.049708415055274964, + 0.046185979115962984, + 0.04225068616271019, + 0.0371412379860878, + 0.03288117943108082, + 0.028753877902030944, + 0.02540679348707199, + 0.022826728397607802, + 0.020825295001268385, + 0.01934205988943577, + 0.017717279280722142, + 0.016153786206245423, + 0.01561382452249527, + 0.013925037890672684, + 0.012696143777668477, + 0.011785201603174209, + 0.010956936873495578, + 0.010217144775390624, + 0.009551341994851827, + 0.009032958608865738, + 0.008615280666947365, + 0.008203100349009037, + 0.007876600304245949, + 0.008993487451970577, + 0.007320681408047676, + 0.007038792558014393, + 0.006822358392179012, + 0.006652445471286773, + 0.0065686072878539566, + 0.006301340243220329, + 0.006194311405718326, + 0.006011598140001297, + 0.005876070992648602, + 0.005961736746132374, + 0.0057346595384180545, + 0.005598231753706932, + 0.005515987113118172, + 0.005370079948008061, + 0.005283707259595394, + 0.005166467700898647, + 0.0051793598145246506, + 0.004988818861544132, + 0.004967996621131897, + 0.004830757288634777, + 0.004682945563271642, + 0.004599864952266216, + 0.004583264472708106, + 0.004458400094695389 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8108769655227661, + 0.3922353684902191, + 0.15907782316207886, + 0.149577796459198 + ], + "perturbation_rho": [ + 0.6536975502967834, + 0.33696871995925903, + 0.15431806445121765, + 0.1703358292579651 + ], + "nudging": { + "0.001": [ + -0.02259242907166481, + -0.0016305823810398579, + -0.0006174352020025253, + -0.0005583323654718697 + ], + "0.003": [ + -0.06632187962532043, + -0.004884002730250359, + -0.0018520723097026348, + -0.0016746381297707558 + ], + "0.01": [ + -0.2048409879207611, + -0.01618226245045662, + -0.006159749813377857, + -0.005569745786488056 + ] + }, + "state_pred_error_per_layer": [ + 3474.9130859375, + 1348.3646240234375, + 1462.0654296875, + 924.672607421875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.238513381195068, + 1.478446886062622, + 0.8984584705352783, + 0.6479596544265747, + 0.5321606098175049, + 0.46738452167510985, + 0.45212909936904905, + 0.4412958154678345, + 0.4428103973388672, + 0.45779245624542236, + 0.5129776763916015, + 0.48493399066925047, + 0.4955709422111511, + 0.5551924660682678, + 0.4973321964263916, + 0.5596337683677673, + 0.5621023122787475, + 0.5936956991195679, + 0.506741700553894, + 0.5527004140377044, + 0.5299466539382934, + 0.5636592745780945, + 0.5512495688438416, + 0.6911539608955384, + 0.7126970441818238, + 0.757884527015686, + 0.7561026565551758, + 0.8022804564714432, + 0.756680935382843, + 0.7413855548858642, + 0.7616110191345214, + 0.8522287889480591, + 0.90401587972641, + 0.8410554805755616, + 0.8393038982391358, + 0.8351445549964904, + 0.8266246129989624, + 0.8432566371917725, + 0.8550898251533509, + 0.8253010906219482, + 0.8000944749832153, + 0.7725691860198974, + 0.7631549596786499, + 0.7787857055664062, + 0.766472288608551, + 0.7898382484436035, + 0.8000267809867859, + 0.7795157686710358, + 0.784522922706604, + 0.7961834842681885, + 0.788183743095398, + 0.8009099166870117, + 0.7960924263954162, + 0.803066586303711, + 0.8122837594032287, + 0.7979355515480041, + 0.796984415435791, + 0.8062079792022705, + 0.8164349870204926, + 0.8265008636474609, + 0.8436849462509155, + 0.8493386405944824, + 0.8505276624202728, + 0.8448130174636841, + 0.8579680969238281, + 0.8611232654571533, + 0.8577412282943726, + 0.8524883877754211, + 0.8455306541442871, + 0.8488166980743408, + 0.8484283323287964, + 0.8408801859378815, + 0.8399367668151856, + 0.836677680015564, + 0.8344884692192077, + 0.834986524772644, + 0.8330111223220825, + 0.831924938583374, + 0.8312370910644531, + 0.830715307712555 + ], + "train_acc": [ + 0.1882, + 0.4923, + 0.6703, + 0.7584, + 0.8033, + 0.8246, + 0.8287, + 0.8365, + 0.8324, + 0.8263, + 0.8083, + 0.8171, + 0.8156, + 0.7956, + 0.8162, + 0.7952, + 0.7916, + 0.7863, + 0.8148, + 0.7992, + 0.813, + 0.8006, + 0.807, + 0.7772, + 0.768, + 0.7701, + 0.7688, + 0.7684, + 0.7655, + 0.7659, + 0.7579, + 0.737, + 0.7298, + 0.7463, + 0.7444, + 0.7461, + 0.7425, + 0.7347, + 0.7221, + 0.7309, + 0.7318, + 0.7317, + 0.7296, + 0.7252, + 0.7239, + 0.7159, + 0.7167, + 0.7169, + 0.7148, + 0.7099, + 0.7175, + 0.7085, + 0.7141, + 0.7089, + 0.7032, + 0.7083, + 0.7078, + 0.7084, + 0.7, + 0.7029, + 0.699, + 0.6951, + 0.6969, + 0.7002, + 0.695, + 0.6961, + 0.6957, + 0.6967, + 0.6991, + 0.6987, + 0.6988, + 0.6979, + 0.6988, + 0.7004, + 0.7003, + 0.7004, + 0.7006, + 0.7006, + 0.6997, + 0.7005 + ], + "test_acc": [ + 0.323, + 0.5955, + 0.715, + 0.766, + 0.7775, + 0.7915, + 0.7825, + 0.7865, + 0.785, + 0.7675, + 0.7915, + 0.747, + 0.7365, + 0.735, + 0.764, + 0.734, + 0.698, + 0.7815, + 0.7405, + 0.7365, + 0.7935, + 0.7415, + 0.716, + 0.7395, + 0.7405, + 0.738, + 0.7435, + 0.74, + 0.7195, + 0.729, + 0.717, + 0.663, + 0.7105, + 0.706, + 0.704, + 0.717, + 0.681, + 0.6935, + 0.722, + 0.6965, + 0.7145, + 0.706, + 0.7015, + 0.689, + 0.6965, + 0.693, + 0.705, + 0.6995, + 0.7, + 0.6905, + 0.6875, + 0.6795, + 0.6915, + 0.6805, + 0.6915, + 0.674, + 0.6855, + 0.673, + 0.669, + 0.665, + 0.6705, + 0.6655, + 0.67, + 0.666, + 0.6695, + 0.671, + 0.6665, + 0.667, + 0.668, + 0.664, + 0.6675, + 0.6705, + 0.668, + 0.668, + 0.67, + 0.665, + 0.6695, + 0.6695, + 0.6675, + 0.668 + ], + "value_loss": [ + 2.8863564193725586, + 0.9040914880752563, + 0.7810646405220032, + 0.6981226700782776, + 0.6097434432029724, + 0.6142956817626953, + 0.5842859931945801, + 0.517870895576477, + 0.5182754273414611, + 0.6007693460464477, + 0.680942530632019, + 0.5966949496269226, + 0.6465810567855835, + 0.7795912544250488, + 0.6385285264253616, + 0.7629974831581116, + 0.7991079656600952, + 0.8916878988265992, + 0.6929094882965088, + 0.7491918589115143, + 0.7855519455432892, + 0.8720088466644287, + 0.8952933601379395, + 1.208518335723877, + 1.2596970233917237, + 1.3889865486145019, + 1.3504928841590882, + 1.76775849237442, + 1.5157122314453124, + 1.3177562489509582, + 1.1500543141365052, + 1.3385095929145814, + 1.4191001964569092, + 1.2026564547538758, + 1.1336268447875977, + 1.130702359199524, + 1.011481032371521, + 1.033429777431488, + 0.9805498022079467, + 0.8623548080444335, + 0.7880003303527832, + 0.7476288684844971, + 0.6462140014648438, + 0.6593039730072021, + 0.5621418162345886, + 0.6217806543350219, + 0.6747557874679565, + 0.6232282665967941, + 0.6294091362953186, + 0.6572539217948914, + 0.5706359854221345, + 0.5169425714492798, + 0.5537946958541871, + 0.5706222624778747, + 0.5587895211219788, + 0.5054799375534058, + 0.5031447858333588, + 0.5232256004333496, + 0.5240278210163116, + 0.5081352228164673, + 0.5495406572341919, + 0.6334876583099365, + 0.5355876060128212, + 0.5040627335548401, + 0.55469250831604, + 0.5250602727890015, + 0.5236522147178649, + 0.5053264931678771, + 0.4896225148200989, + 0.4833145246982574, + 0.48712017555236814, + 0.48232889132499696, + 0.4699660972595215, + 0.48501924810409547, + 0.4632767639636993, + 0.4829914659500122, + 0.46285762519836426, + 0.4791563155412674, + 0.46995122051239013, + 0.4729928963661194 + ], + "term_loss": [ + 1.6036672487258912, + 0.4866477812767029, + 0.5500622243881226, + 0.5111940277099609, + 0.4329673198699951, + 0.4469112928390503, + 0.41419190340042117, + 0.3552157738447189, + 0.3613631259679794, + 0.43681443691253663, + 0.49862520866394044, + 0.42397409868240354, + 0.46771746263504027, + 0.5842745771408081, + 0.4544785821020603, + 0.5597044972896575, + 0.5882236742973328, + 0.6682760814666748, + 0.4957572563171387, + 0.5435506319046021, + 0.5837905749320984, + 0.6493298694610595, + 0.6785561132907867, + 0.93956556224823, + 0.9792157770156861, + 1.0973765476226807, + 1.0527679742336273, + 1.4304333041667938, + 1.1945446773529054, + 1.0108222512960434, + 0.845477667427063, + 1.021408819437027, + 1.070293742442131, + 0.8828932909011841, + 0.8144708358764648, + 0.8031732571125031, + 0.6978397472381592, + 0.7110097882270813, + 0.6671629565238952, + 0.5662335210800171, + 0.4992787841796875, + 0.459820813703537, + 0.36139142322540285, + 0.37380871934890747, + 0.27486766773462296, + 0.31456750046014786, + 0.35646585421562194, + 0.30645070412158965, + 0.3155028410434723, + 0.35171530480384827, + 0.262723495388031, + 0.2240681984901428, + 0.2624427561759949, + 0.2767317503809929, + 0.2615759829521179, + 0.21678510558605193, + 0.213090805208683, + 0.22851175367832183, + 0.22521133567094803, + 0.20825024695396424, + 0.23806381833553314, + 0.30820584111213684, + 0.22358069960772992, + 0.19847816874980925, + 0.23981675534248353, + 0.21385586824417113, + 0.21096881765127182, + 0.19432116413116454, + 0.18428481633663177, + 0.1760320121526718, + 0.17917428448200226, + 0.17456265774965285, + 0.16240413327217101, + 0.17174850260019303, + 0.15498115499019624, + 0.16968325634002684, + 0.1520833549261093, + 0.16171157859563828, + 0.15455809693336486, + 0.15622255086898804 + ], + "bridge_loss": [ + 0.9791954847954563, + 0.12670794755816459, + 0.017565081167966127, + 0.007164146476984024, + 0.017620862129330634, + 0.02251181682050228, + 0.026151837778091432, + 0.01914508735835552, + 0.010432719926536084, + 0.010145348550379277, + 0.011001840087771416, + 0.009505402293801308, + 0.008902425718307495, + 0.011087563878297806, + 0.009357659213244916, + 0.011638822643458844, + 0.014301572993397713, + 0.013270902928709983, + 0.01884037252739072, + 0.01476599485501647, + 0.017172387784719467, + 0.026732139322161674, + 0.02380416285097599, + 0.03586443645805121, + 0.04554584881961345, + 0.051492015558481215, + 0.0620356507062912, + 0.10263055491447448, + 0.08920669302195311, + 0.06797399497032165, + 0.05848033113479614, + 0.04522013221681118, + 0.06130107210278511, + 0.053479281087219714, + 0.05635778515636921, + 0.06460995850861073, + 0.05289331116974354, + 0.05607377367392182, + 0.04042225465476513, + 0.030378661921620368, + 0.025389883720874785, + 0.027952989809960128, + 0.025545942783355712, + 0.021930139112472533, + 0.02298613493666053, + 0.03622410003766417, + 0.0450515654027462, + 0.04776753831878305, + 0.043910300672054293, + 0.03366219551563263, + 0.03776019195318222, + 0.018074785171449184, + 0.017864137798547744, + 0.017495711874961854, + 0.017257797373831273, + 0.012870814455673098, + 0.013426685670018196, + 0.01694126845598221, + 0.01702145220786333, + 0.016847654724121093, + 0.023266981953382494, + 0.035923548865318296, + 0.022870525400713087, + 0.018457241381704806, + 0.02394478079676628, + 0.020566632018983365, + 0.022281900307536125, + 0.021731911043822764, + 0.018568690180778502, + 0.019266699397563935, + 0.019932482597231866, + 0.02130942338705063, + 0.021624688065052033, + 0.028506877756118775, + 0.02428789115548134, + 0.029018885892629624, + 0.02777098114490509, + 0.03438006125688553, + 0.03253316249623895, + 0.034451057982444765 + ], + "tgrad_loss": [ + 0.30349363470077517, + 0.29073575751781466, + 0.21343733773231507, + 0.17976449966430663, + 0.15915526002645491, + 0.1448725718975067, + 0.14394225373268127, + 0.14351004109382628, + 0.1464795805335045, + 0.15380956373214721, + 0.17131548562049867, + 0.16321545238494872, + 0.1699611658334732, + 0.18422911157608032, + 0.17469229288101196, + 0.19165415947437286, + 0.1965827165365219, + 0.21014091815948485, + 0.17831186084747314, + 0.19087522847652436, + 0.1845889872074127, + 0.1959468394756317, + 0.19293308794498443, + 0.23308833079338073, + 0.234935409450531, + 0.24011796731948853, + 0.2356892698287964, + 0.2346946145772934, + 0.23196086978912353, + 0.23896000286340713, + 0.246096316075325, + 0.271880633354187, + 0.28750537996292114, + 0.2662838943958282, + 0.2627982192516327, + 0.2629191486597061, + 0.26074797649383546, + 0.2663462108612061, + 0.2729646023273468, + 0.2657426230430603, + 0.26333165884017945, + 0.259855065202713, + 0.25927663507461546, + 0.26356511487960815, + 0.2642880185127258, + 0.2709890515089035, + 0.27323836481571195, + 0.2690100230574608, + 0.2699959950447082, + 0.2718764228820801, + 0.2701522953510284, + 0.27479958691596984, + 0.27348780364990233, + 0.2763948000907898, + 0.27995573606491087, + 0.2758240224838257, + 0.2766272976398468, + 0.27777257800102234, + 0.28179502913951876, + 0.2830373200416565, + 0.2882098621368408, + 0.28935827159881594, + 0.28913638255596164, + 0.2871273239135742, + 0.2909309693336487, + 0.2906377738952637, + 0.29040149817466737, + 0.2892734199285507, + 0.28676901168823243, + 0.28801581645011903, + 0.28801341381073, + 0.28645680844783783, + 0.2859372780799866, + 0.2847638677597046, + 0.2840077176332474, + 0.28428932056427003, + 0.2830032865524292, + 0.2830646735906601, + 0.2828599617004395, + 0.28231928570270537 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.05806349962949753, + 0.19388319551944733, + 0.1997416615486145, + 0.19820059835910797 + ], + "perturbation_rho": [ + 0.05481833964586258, + 0.3572811782360077, + 0.4186326265335083, + 0.3411045968532562 + ], + "nudging": { + "0.001": [ + -0.0029148743487894535, + -0.0016693011857569218, + -0.0016626573633402586, + -0.0016281461575999856 + ], + "0.003": [ + -0.008709331974387169, + -0.005001912824809551, + -0.004982108250260353, + -0.004877123050391674 + ], + "0.01": [ + -0.0286177359521389, + -0.01660466194152832, + -0.01654389500617981, + -0.016194619238376617 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L4_s42.json b/results/synth_ladder_v2_hi/synth_a0.5_L4_s42.json new file mode 100644 index 0000000..0727c71 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L4_s42.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.5250055702209473, + 0.5507197608947754, + 0.3841320207595825, + 0.35932164669036865, + 0.31933714962005616, + 0.3227846714496613, + 0.3028541946411133, + 0.29807121329307557, + 0.27894931735992434, + 0.30708285484313963, + 0.2654671094417572, + 0.2526435827255249, + 0.22071890375614167, + 0.20774164290428163, + 0.2417035475730896, + 0.239601744556427, + 0.2061288031578064, + 0.20110705008506774, + 0.19673097145557403, + 0.17361064953804017, + 0.16336524235010147, + 0.1541515984773636, + 0.17720441585183144, + 0.15197478637695314, + 0.1717322502374649, + 0.15199407002925872, + 0.13259448325634002, + 0.14251351101398468, + 0.11849438445568085, + 0.12607571827173233, + 0.11433437283039093, + 0.10952981774806976, + 0.10948647691607476, + 0.09781867054402828, + 0.08961167633533478, + 0.10128397414684295, + 0.09377768075466156, + 0.086143566852808, + 0.07471307250261307, + 0.06912044876217842, + 0.06486728579998016, + 0.06798115438222885, + 0.06793259272575379, + 0.06783070080280304, + 0.06020965424776077, + 0.05598097594976425, + 0.0566912874341011, + 0.04851433913707733, + 0.05244531365633011, + 0.04565400942564011, + 0.04321225633025169, + 0.04449230827391148, + 0.039462119901180266, + 0.040013881278038024, + 0.03971400515437126, + 0.0358551750421524, + 0.03401491985321045, + 0.034367064037919046, + 0.032305684411525724, + 0.03139898471236229, + 0.030498171234130858, + 0.029822335571050643, + 0.029149569642543793, + 0.0281656219124794, + 0.028202341210842134, + 0.027365115937590598, + 0.026671420013904573, + 0.027203523302078248, + 0.026499097537994384, + 0.026119756138324738, + 0.025678298735618593, + 0.025355695700645445, + 0.025052896262705324, + 0.024881752938032152, + 0.024743154951930045, + 0.02462823152542114, + 0.024543652564287186, + 0.02447993883341551, + 0.024439664232730866, + 0.024415402659773825 + ], + "train_acc": [ + 0.498, + 0.8183, + 0.8589, + 0.8608, + 0.8736, + 0.8748, + 0.8796, + 0.8843, + 0.8915, + 0.88, + 0.8949, + 0.902, + 0.9137, + 0.9217, + 0.9068, + 0.9048, + 0.92, + 0.9225, + 0.9271, + 0.9331, + 0.9391, + 0.9439, + 0.9306, + 0.9439, + 0.9334, + 0.9419, + 0.9511, + 0.9454, + 0.9596, + 0.955, + 0.9606, + 0.9634, + 0.9623, + 0.9662, + 0.9726, + 0.9664, + 0.9714, + 0.9752, + 0.9799, + 0.9834, + 0.9869, + 0.9828, + 0.9825, + 0.9829, + 0.9881, + 0.9878, + 0.9892, + 0.9925, + 0.9894, + 0.9932, + 0.9943, + 0.9938, + 0.9963, + 0.9954, + 0.9952, + 0.9971, + 0.9978, + 0.9979, + 0.9989, + 0.9989, + 0.9986, + 0.999, + 0.999, + 0.9995, + 0.9993, + 0.9996, + 0.9998, + 0.9995, + 0.9996, + 0.9997, + 0.9997, + 0.9998, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999 + ], + "test_acc": [ + 0.763, + 0.8435, + 0.857, + 0.85, + 0.8625, + 0.8615, + 0.8655, + 0.8555, + 0.856, + 0.8635, + 0.864, + 0.8715, + 0.878, + 0.869, + 0.8615, + 0.8775, + 0.8695, + 0.869, + 0.8755, + 0.8725, + 0.875, + 0.872, + 0.8785, + 0.8775, + 0.8685, + 0.8775, + 0.8795, + 0.878, + 0.8825, + 0.876, + 0.882, + 0.8805, + 0.89, + 0.885, + 0.885, + 0.8795, + 0.8845, + 0.8835, + 0.881, + 0.8765, + 0.879, + 0.8815, + 0.8825, + 0.8835, + 0.877, + 0.8835, + 0.88, + 0.884, + 0.879, + 0.8825, + 0.881, + 0.879, + 0.8835, + 0.8815, + 0.8815, + 0.8825, + 0.8835, + 0.8815, + 0.8815, + 0.8835, + 0.8815, + 0.8835, + 0.8815, + 0.883, + 0.885, + 0.884, + 0.883, + 0.8815, + 0.883, + 0.8825, + 0.882, + 0.8825, + 0.8815, + 0.8825, + 0.8825, + 0.883, + 0.8825, + 0.883, + 0.883, + 0.883 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8572149276733398, + 0.8503379821777344, + 0.8309497833251953, + 0.8099952340126038 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999980330467224, + 0.999992311000824, + 0.9999608993530273 + ], + "nudging": { + "0.001": [ + -0.042521148920059204, + -0.023217972368001938, + -0.011091032065451145, + -0.005212459247559309 + ], + "0.003": [ + -0.1181650310754776, + -0.06687315553426743, + -0.032639797776937485, + -0.015497863292694092 + ], + "0.01": [ + -0.29344552755355835, + -0.19200363755226135, + -0.10158533602952957, + -0.050049468874931335 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.261956468582153, + 1.4311306690216063, + 0.818257098197937, + 0.5983575573444366, + 0.500597601890564, + 0.45219913649559024, + 0.4174496747016907, + 0.409495729637146, + 0.4188644021987915, + 0.45328485565185545, + 0.42861666593551634, + 0.46300609769821166, + 0.4457720745563507, + 0.45008082075119016, + 0.4816469186782837, + 0.491936355304718, + 0.4805133812904358, + 0.5310946586608887, + 0.5184094581604004, + 0.5349128709316253, + 0.503399237036705, + 0.5629850885391235, + 0.6070423364162445, + 0.5541394971847534, + 0.5405849707126618, + 0.5269447027683258, + 0.5041178157329559, + 0.5237154272437096, + 0.4906633505821228, + 0.6188776139259339, + 0.5532598972320557, + 0.5653144476890564, + 0.5119002490878105, + 0.5062383512377739, + 0.5014870280742645, + 0.5912513525962829, + 0.6307907728433609, + 0.5102149733304977, + 0.5199897046327591, + 0.5104138412237167, + 0.504832841014862, + 0.5849459474563599, + 0.5909522429466247, + 0.6081267190933227, + 0.5230989686727524, + 0.5009066128730774, + 0.4870625690460205, + 0.5026308774948121, + 0.513473293876648, + 0.48188849410749973, + 0.45255061175823214, + 0.46306118438243865, + 0.481172536277771, + 0.4813159273266792, + 0.4563068170785904, + 0.4633492294549942, + 0.45527973327636717, + 0.4800791665077209, + 0.4427429686546326, + 0.43737694044113157, + 0.45122047100067136, + 0.4516987937927246, + 0.4359778087615967, + 0.43745238494873045, + 0.4318913806915283, + 0.4248273630142212, + 0.41580243453979493, + 0.4173020489692688, + 0.41921982488632203, + 0.4114777256965637, + 0.4125749154686928, + 0.4053273830771446, + 0.4055808573246002, + 0.40145073013305665, + 0.4026311701536179, + 0.4003137221336365, + 0.3996645420074463, + 0.3981458621025085, + 0.3979306438922882, + 0.3975636598587036 + ], + "train_acc": [ + 0.1709, + 0.5147, + 0.692, + 0.7731, + 0.808, + 0.8242, + 0.8375, + 0.8453, + 0.8442, + 0.8349, + 0.8443, + 0.835, + 0.8441, + 0.8444, + 0.8351, + 0.8365, + 0.8411, + 0.8326, + 0.8345, + 0.8285, + 0.8374, + 0.8265, + 0.8206, + 0.8325, + 0.8334, + 0.8373, + 0.846, + 0.8393, + 0.8428, + 0.8205, + 0.8357, + 0.8299, + 0.8419, + 0.8418, + 0.8454, + 0.8266, + 0.8236, + 0.8434, + 0.8437, + 0.8446, + 0.8477, + 0.8375, + 0.8298, + 0.8288, + 0.842, + 0.848, + 0.8548, + 0.8496, + 0.8494, + 0.8506, + 0.8598, + 0.8581, + 0.8553, + 0.8512, + 0.8594, + 0.8581, + 0.8586, + 0.8553, + 0.8628, + 0.8646, + 0.8613, + 0.863, + 0.8651, + 0.8621, + 0.8631, + 0.864, + 0.871, + 0.8671, + 0.8717, + 0.8696, + 0.8701, + 0.8722, + 0.8724, + 0.8723, + 0.8715, + 0.8733, + 0.8733, + 0.8743, + 0.8735, + 0.8741 + ], + "test_acc": [ + 0.325, + 0.622, + 0.7225, + 0.764, + 0.783, + 0.8075, + 0.8055, + 0.8055, + 0.797, + 0.8075, + 0.7835, + 0.799, + 0.7925, + 0.793, + 0.8, + 0.8055, + 0.785, + 0.7905, + 0.79, + 0.791, + 0.7925, + 0.758, + 0.7805, + 0.783, + 0.8055, + 0.7965, + 0.787, + 0.804, + 0.7835, + 0.7975, + 0.7785, + 0.771, + 0.798, + 0.801, + 0.768, + 0.792, + 0.7705, + 0.791, + 0.81, + 0.7995, + 0.7865, + 0.7915, + 0.769, + 0.806, + 0.795, + 0.806, + 0.812, + 0.805, + 0.813, + 0.806, + 0.8075, + 0.8085, + 0.808, + 0.8185, + 0.8025, + 0.8185, + 0.8175, + 0.8155, + 0.8175, + 0.8095, + 0.817, + 0.818, + 0.817, + 0.823, + 0.818, + 0.828, + 0.823, + 0.82, + 0.8205, + 0.824, + 0.8235, + 0.824, + 0.8235, + 0.8245, + 0.8235, + 0.8265, + 0.827, + 0.8255, + 0.825, + 0.825 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0060789515264332294, + 0.09873200953006744, + 0.10723873972892761, + 0.1101943776011467 + ], + "perturbation_rho": [ + -0.012974856421351433, + 0.14552229642868042, + 0.08513970673084259, + 0.06377018243074417 + ], + "nudging": { + "0.001": [ + -0.00029901170637458563, + -0.0006812716601416469, + -0.0004231537168379873, + -0.0004066851979587227 + ], + "0.003": [ + -0.0008656850550323725, + -0.0020401428919285536, + -0.0012693263124674559, + -0.001218506833538413 + ], + "0.01": [ + -0.0025177751667797565, + -0.006775799673050642, + -0.004219442140311003, + -0.00405311631038785 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.90833014793396, + 0.8779405179977418, + 0.5064040044784546, + 0.4657335244178772, + 0.4902631205320358, + 0.5776193201065063, + 0.649845489025116, + 0.6730898847579956, + 0.6785502085208893, + 0.6754426885128021, + 0.6688244145870209, + 0.6485107803106308, + 0.6637302653312683, + 0.6521788113594055, + 0.6718272481918335, + 0.6910618996620178, + 0.7287369018554688, + 0.7307573244094848, + 0.7283793703079223, + 0.79008408908844, + 0.8179881494522094, + 0.8709803493499756, + 0.8228100231170654, + 0.8579356725692749, + 0.8632372360229492, + 0.8647078338623047, + 0.8247142519950866, + 0.8100111122131348, + 0.827653882598877, + 0.7867350393295288, + 0.7713617871284485, + 0.7540933326721191, + 0.7635929446220397, + 0.731565843629837, + 0.7520291829109191, + 0.7454802143096924, + 0.7568781739234924, + 0.7290890070438385, + 0.7567377836227417, + 0.7685284609794617, + 0.7458412083625794, + 0.739471393108368, + 0.7550339795112609, + 0.7631093349456787, + 0.7788069766998291, + 0.7642952583789825, + 0.7572312101840973, + 0.7669681239128113, + 0.7663568916320801, + 0.7649306897163392, + 0.7452942167282105, + 0.7477542019367218, + 0.7388495827674866, + 0.7364303831100464, + 0.7253182221412658, + 0.7264514459609985, + 0.7120715827941895, + 0.711595621585846, + 0.7125990421295166, + 0.6964491970062255, + 0.690447259426117, + 0.686346722984314, + 0.6837696258544922, + 0.6897882652282715, + 0.6716403135299682, + 0.6684516845226288, + 0.658786863708496, + 0.6592671649932861, + 0.6566618491172791, + 0.6524367179870606, + 0.6484959433555603, + 0.6476131733894348, + 0.645097210597992, + 0.6444143989562988, + 0.6423414867401123, + 0.6404327310562133, + 0.6396769283294678, + 0.6387527324676514, + 0.6382552500724793, + 0.6379588050365448 + ], + "train_acc": [ + 0.317, + 0.6744, + 0.8113, + 0.8207, + 0.8166, + 0.7937, + 0.7738, + 0.7632, + 0.7617, + 0.7675, + 0.765, + 0.77, + 0.7642, + 0.7658, + 0.757, + 0.7525, + 0.7407, + 0.7439, + 0.7443, + 0.7262, + 0.7243, + 0.7127, + 0.728, + 0.7172, + 0.718, + 0.7182, + 0.7229, + 0.7304, + 0.7319, + 0.7341, + 0.7352, + 0.7414, + 0.738, + 0.7511, + 0.7459, + 0.7455, + 0.7481, + 0.7508, + 0.7422, + 0.7329, + 0.7467, + 0.7435, + 0.7391, + 0.7351, + 0.726, + 0.7289, + 0.7301, + 0.7278, + 0.7306, + 0.7293, + 0.7336, + 0.7358, + 0.7371, + 0.7395, + 0.7396, + 0.7388, + 0.7481, + 0.7457, + 0.7429, + 0.7528, + 0.7515, + 0.7537, + 0.7543, + 0.7518, + 0.7571, + 0.7615, + 0.7636, + 0.7662, + 0.7652, + 0.7643, + 0.766, + 0.7669, + 0.7664, + 0.7673, + 0.7688, + 0.7679, + 0.7679, + 0.7685, + 0.769, + 0.7687 + ], + "test_acc": [ + 0.5575, + 0.739, + 0.8005, + 0.8015, + 0.783, + 0.7665, + 0.747, + 0.7405, + 0.7335, + 0.7295, + 0.742, + 0.7355, + 0.7425, + 0.7325, + 0.719, + 0.7025, + 0.704, + 0.7005, + 0.692, + 0.704, + 0.6875, + 0.695, + 0.6645, + 0.684, + 0.677, + 0.697, + 0.7095, + 0.6875, + 0.7055, + 0.714, + 0.717, + 0.698, + 0.7235, + 0.7255, + 0.698, + 0.71, + 0.7215, + 0.7175, + 0.6895, + 0.7005, + 0.6965, + 0.7165, + 0.703, + 0.6825, + 0.696, + 0.709, + 0.6885, + 0.703, + 0.6925, + 0.714, + 0.705, + 0.704, + 0.7125, + 0.7125, + 0.7055, + 0.7165, + 0.72, + 0.7105, + 0.695, + 0.718, + 0.711, + 0.71, + 0.713, + 0.714, + 0.7155, + 0.72, + 0.7215, + 0.7195, + 0.718, + 0.721, + 0.724, + 0.7225, + 0.7285, + 0.724, + 0.7185, + 0.721, + 0.722, + 0.72, + 0.718, + 0.7175 + ], + "state_pred_error": [ + 0.7602040468215943, + 0.2622531470775604, + 0.17849978141784667, + 0.1614789155960083, + 0.16503283252716064, + 0.17506846377849578, + 0.17919811906814576, + 0.17643984322547912, + 0.174144562625885, + 0.16553328351974486, + 0.15643454706668855, + 0.14659336729049682, + 0.136305808365345, + 0.123571908390522, + 0.1111008218050003, + 0.10061488182544709, + 0.09224651036262513, + 0.08541531358957291, + 0.07722941876649857, + 0.07062110755443574, + 0.06594702410697938, + 0.0628838957965374, + 0.060209538972377775, + 0.05664124082326889, + 0.05358169343471527, + 0.050588799649477004, + 0.047043840610980985, + 0.043419835364818575, + 0.040251914036273956, + 0.03733443737626076, + 0.03289287920594215, + 0.030201040321588515, + 0.028524299293756484, + 0.027144377875328064, + 0.026436590403318406, + 0.02564192984700203, + 0.02490743891596794, + 0.02470569230914116, + 0.02470841442346573, + 0.02410018715262413, + 0.023862673461437226, + 0.024583475697040558, + 0.02422580669671297, + 0.024175903251767158, + 0.024176146936416627, + 0.024424808049201965, + 0.023978449884057045, + 0.023637285515666007, + 0.023030763539671897, + 0.022442915526032448, + 0.021631024262309076, + 0.02109491000175476, + 0.02076397671699524, + 0.01964172987639904, + 0.019197289264202118, + 0.01844798127412796, + 0.018010758863389494, + 0.017326503592729567, + 0.016925657695531844, + 0.01668251698166132, + 0.016097314363718033, + 0.015790151277184486, + 0.015420251709222793, + 0.015212734445929528, + 0.015064427372813225, + 0.014315600739419461, + 0.014239497092366219, + 0.01392769330739975, + 0.013602190324664115, + 0.013257772579789162, + 0.013332617598772049, + 0.012796076652407647, + 0.012833661264181137, + 0.012363243766129017, + 0.01199699844121933, + 0.011854414081573486, + 0.011675881730020047, + 0.011419792121648788, + 0.011595408976078034, + 0.011023352561891079 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.81822270154953, + 0.44441917538642883, + 0.15419423580169678, + 0.14087578654289246 + ], + "perturbation_rho": [ + 0.7556701302528381, + 0.42722654342651367, + 0.13306331634521484, + 0.10285839438438416 + ], + "nudging": { + "0.001": [ + -0.022801965475082397, + -0.0018839023541659117, + -0.0004756013513542712, + -0.0004290228243917227 + ], + "0.003": [ + -0.06668633222579956, + -0.005640539340674877, + -0.0014254236593842506, + -0.0012861560098826885 + ], + "0.01": [ + -0.2031538337469101, + -0.01867133006453514, + -0.004740326199680567, + -0.00427617784589529 + ] + }, + "state_pred_error_per_layer": [ + 6433.45703125, + 2426.59619140625, + 1950.234130859375, + 1929.63232421875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.262130627822876, + 1.4312172101974487, + 0.818198119354248, + 0.589842716884613, + 0.49746571922302246, + 0.44104833211898803, + 0.4330927776813507, + 0.4132209104537964, + 0.4186548101425171, + 0.4405179395675659, + 0.43852746906280515, + 0.47328574361801146, + 0.5121363965034484, + 0.4439137755632401, + 0.4516206186294556, + 0.45784061965942385, + 0.5997123807907104, + 0.48465886812210085, + 0.6097313745498657, + 0.5907854682922363, + 0.5859235813617706, + 0.590377276802063, + 0.625524351978302, + 0.7122808382987976, + 0.6915377367019653, + 0.7904257673263549, + 0.8108633769989013, + 0.8236039951324463, + 0.849212548828125, + 0.724233080291748, + 0.7623365852355957, + 0.7959084012508393, + 0.7782834875106811, + 0.8130025611877442, + 0.8162316653251648, + 0.8279668930053711, + 0.759434295463562, + 0.8115165338516236, + 0.8311242639541626, + 0.8506224093437195, + 0.8758153738975525, + 0.9087218969345093, + 0.9493237188339233, + 0.9206383923530579, + 0.9653225570678711, + 1.0096012796401979, + 0.9753759350776673, + 0.9789245065689087, + 1.0101529162406921, + 1.0138245718002319, + 1.0072479097366334, + 0.9653099195480347, + 0.968689307975769, + 0.9597694366455078, + 0.9519970666885376, + 0.9325507595062256, + 0.9163512690544129, + 0.9141956408500671, + 0.900567813205719, + 0.9053131622314453, + 0.8990885392189026, + 0.88783081741333, + 0.8858179836273193, + 0.891084521484375, + 0.8845443550109864, + 0.8778420943260193, + 0.8832936000823974, + 0.8880286014556885, + 0.8798037006378174, + 0.8909469594955445, + 0.8816548425674439, + 0.8780255848884583, + 0.8818641589641572, + 0.8773575880050659, + 0.876659261894226, + 0.8753621809005737, + 0.8751238561630249, + 0.8746530110836029, + 0.8737541898727417, + 0.8735915374755859 + ], + "train_acc": [ + 0.1742, + 0.5142, + 0.696, + 0.7751, + 0.8086, + 0.8296, + 0.8316, + 0.8419, + 0.8428, + 0.836, + 0.8431, + 0.8345, + 0.8294, + 0.849, + 0.8483, + 0.8465, + 0.8266, + 0.8466, + 0.8239, + 0.8237, + 0.8236, + 0.8235, + 0.8125, + 0.8013, + 0.7991, + 0.7778, + 0.7777, + 0.7636, + 0.7595, + 0.7692, + 0.7558, + 0.7432, + 0.7414, + 0.7234, + 0.72, + 0.7211, + 0.7351, + 0.7224, + 0.7159, + 0.7168, + 0.709, + 0.7059, + 0.6956, + 0.703, + 0.6912, + 0.6837, + 0.6921, + 0.6868, + 0.6771, + 0.6761, + 0.6757, + 0.6829, + 0.6764, + 0.6743, + 0.6757, + 0.6818, + 0.6796, + 0.6813, + 0.6852, + 0.6819, + 0.6807, + 0.6857, + 0.6895, + 0.684, + 0.6886, + 0.6874, + 0.686, + 0.6841, + 0.6864, + 0.6836, + 0.6887, + 0.687, + 0.6865, + 0.6878, + 0.6895, + 0.6872, + 0.6875, + 0.6882, + 0.6877, + 0.6878 + ], + "test_acc": [ + 0.318, + 0.624, + 0.7205, + 0.758, + 0.791, + 0.8005, + 0.8045, + 0.802, + 0.809, + 0.799, + 0.7845, + 0.7945, + 0.8075, + 0.7995, + 0.8025, + 0.8045, + 0.795, + 0.801, + 0.793, + 0.7855, + 0.7965, + 0.7685, + 0.751, + 0.763, + 0.77, + 0.749, + 0.7495, + 0.717, + 0.727, + 0.727, + 0.7105, + 0.7045, + 0.723, + 0.691, + 0.6775, + 0.6825, + 0.691, + 0.672, + 0.69, + 0.6865, + 0.683, + 0.6695, + 0.663, + 0.656, + 0.638, + 0.6515, + 0.662, + 0.638, + 0.6275, + 0.6255, + 0.6435, + 0.645, + 0.641, + 0.6485, + 0.642, + 0.6545, + 0.6475, + 0.651, + 0.6355, + 0.6495, + 0.645, + 0.6555, + 0.6505, + 0.6585, + 0.6655, + 0.6595, + 0.6545, + 0.656, + 0.6575, + 0.6515, + 0.661, + 0.6555, + 0.657, + 0.659, + 0.6645, + 0.659, + 0.6605, + 0.6615, + 0.663, + 0.662 + ], + "value_loss": [ + 2.836528095149994, + 0.816120489692688, + 0.7672985095977783, + 0.6673721037864685, + 0.6218352233886719, + 0.5661839260101318, + 0.5949610354423523, + 0.5516304483413697, + 0.5791759598731995, + 0.6596351661682129, + 0.6578461580753326, + 0.7922459089279175, + 0.9037014740467072, + 0.7193802554607391, + 0.7673241809844971, + 0.7787123111724854, + 1.3601861742019654, + 0.9313673071861267, + 1.474704369354248, + 1.3335748901367188, + 1.270239903330803, + 1.269356042098999, + 1.4781879760742187, + 1.7342560359954835, + 1.3972830940246581, + 1.6526852645874024, + 1.6395666912078857, + 1.56644215965271, + 1.5341948862075805, + 0.9233963856697083, + 1.0111778057098388, + 0.9221102019548416, + 0.7878839856147766, + 0.7374455715179443, + 0.8913812401771546, + 0.8214996140480042, + 0.6318444541931152, + 0.6830074096679688, + 0.6844325854301453, + 0.7359561821460724, + 0.7201960114479065, + 0.9737900894165039, + 0.9896724973022938, + 0.7746155975341796, + 0.8274507285118103, + 0.9665608058929444, + 0.8868430158615113, + 0.7537654181957245, + 0.8216570307731629, + 0.9841215091705322, + 0.769625757598877, + 0.7049013290405274, + 0.6331182146072387, + 0.573897342300415, + 0.6105682130813599, + 0.5479789059877396, + 0.5798083689689636, + 0.536684540271759, + 0.5124590743064881, + 0.5254100856781005, + 0.4978441138267517, + 0.471036555147171, + 0.4788544952392578, + 0.4990608347892761, + 0.4809326467514038, + 0.46791065502166745, + 0.457541916513443, + 0.49322594323158264, + 0.4535485433578491, + 0.4952109790802002, + 0.46238712191581727, + 0.47982813143730163, + 0.4530548775434494, + 0.4594691922664642, + 0.4442018630981445, + 0.44861485176086424, + 0.46499351823329926, + 0.424641322183609, + 0.4401831715106964, + 0.4397273305892944 + ], + "term_loss": [ + 1.6414134392738342, + 0.4443137921333313, + 0.559983926486969, + 0.49769357573986056, + 0.4615332902908325, + 0.4038254972457886, + 0.42386618661880493, + 0.39851482734680177, + 0.43347569313049317, + 0.5093920680999756, + 0.51156728348732, + 0.6394623676300049, + 0.7410367949008941, + 0.5717715268313884, + 0.6199797077178955, + 0.6282519329071045, + 1.1741165599822998, + 0.7754406516075134, + 1.2814094917297363, + 1.1448762008666993, + 1.078112751597166, + 1.0786702735185623, + 1.2648520378112793, + 1.4924066591262817, + 1.1564546440124512, + 1.3825412983894347, + 1.3632638927459717, + 1.273400711774826, + 1.2350535747528075, + 0.6543076923370361, + 0.743414258146286, + 0.6539574896752834, + 0.5301746461391449, + 0.47235264806747435, + 0.6108167475700378, + 0.5428714781761169, + 0.36918434228897096, + 0.4127294704437256, + 0.4095069869041443, + 0.4532541881084442, + 0.42979537315368654, + 0.657108716583252, + 0.6661989997468889, + 0.48077965931892397, + 0.5223898464202881, + 0.6413800700187683, + 0.5746263883352279, + 0.45323983748555186, + 0.5107939560890198, + 0.6490193854093551, + 0.45889209270477294, + 0.3982938908576965, + 0.3374675412416458, + 0.2782774634361267, + 0.3107684251785278, + 0.25898139514923096, + 0.2855128740787506, + 0.25347770825624466, + 0.23208063430786133, + 0.2410294221639633, + 0.2160837390065193, + 0.19500134890079499, + 0.20165469875335693, + 0.21840870115756988, + 0.20449393968582152, + 0.19281733981966973, + 0.18233885293602944, + 0.20709821685552596, + 0.1764617787361145, + 0.20976627004146575, + 0.18346078137159347, + 0.19315808384418487, + 0.174583125397563, + 0.18013888797163963, + 0.16657554160356522, + 0.16982417922019957, + 0.17727276504337788, + 0.15045344903618096, + 0.16139265533685684, + 0.15641304728984834 + ], + "bridge_loss": [ + 0.900298724684713, + 0.10897476739883423, + 0.013502670300006866, + 0.007317591543495655, + 0.013260967975854873, + 0.026125178402662277, + 0.03503929834663868, + 0.02188970936536789, + 0.013026782926917077, + 0.011307439970970154, + 0.010092764848843217, + 0.010237911105155945, + 0.013995288537442684, + 0.012832430324703456, + 0.012492080415040255, + 0.014081171977519989, + 0.02573243781030178, + 0.01742579458653927, + 0.02827236390709877, + 0.029418908831477165, + 0.030862452240288257, + 0.029623181630671024, + 0.0410612174987793, + 0.05416689481958747, + 0.05351105071902275, + 0.06370576785802841, + 0.07011887242197991, + 0.08096941623687744, + 0.07904928328990936, + 0.06591862261295318, + 0.05198305888175964, + 0.04291395637691021, + 0.03001920160204172, + 0.026808916348218918, + 0.041261438471078875, + 0.037955932024121286, + 0.03391407470107079, + 0.029103711080551146, + 0.02739130940437317, + 0.033617016315460206, + 0.03501213674545288, + 0.05587814524173736, + 0.05730794131085277, + 0.03438319742679596, + 0.039327720046043395, + 0.05050214891731739, + 0.04590215096473694, + 0.03501346428096294, + 0.03831291145086289, + 0.06274814118742943, + 0.03908389060497284, + 0.041417847597599027, + 0.02885300542116165, + 0.028863998132944105, + 0.03592278670668602, + 0.029343222188949584, + 0.036601207423210144, + 0.026603504705429076, + 0.026558925279974936, + 0.02896751680970192, + 0.02652877620458603, + 0.023973076324164868, + 0.026193797969818116, + 0.029547524043917656, + 0.0260269956946373, + 0.02558014368414879, + 0.025181468015909196, + 0.03461530534923077, + 0.027815614938735963, + 0.03386597931981087, + 0.02894253313243389, + 0.03772374717593193, + 0.028875116419792176, + 0.030721370708942413, + 0.029193979501724244, + 0.030907452699542044, + 0.03893886293917894, + 0.025970697021484374, + 0.030952987808734178, + 0.03557699205875397 + ], + "tgrad_loss": [ + 0.29481595182418824, + 0.2628319282531738, + 0.19381191189289093, + 0.1623609337568283, + 0.14704096510410308, + 0.1362332438468933, + 0.13605555095672608, + 0.13122591376304626, + 0.13267348070144652, + 0.13893566043376923, + 0.13618611092567443, + 0.14254561347961425, + 0.14866939194202422, + 0.13477630219459533, + 0.13485239193439483, + 0.1363792091369629, + 0.16033716580867768, + 0.13850085837841034, + 0.16502252187728883, + 0.15927977619171144, + 0.1612646919131279, + 0.161062579369545, + 0.1722747184753418, + 0.187682466506958, + 0.18731740918159484, + 0.20643819508552552, + 0.2061839234828949, + 0.2120720314979553, + 0.2200920252084732, + 0.20317007291316985, + 0.21578048248291015, + 0.2252387508034706, + 0.2276901375055313, + 0.23828400321006774, + 0.23930306017398834, + 0.24067220277786255, + 0.22874603548049927, + 0.24117423267364502, + 0.24753428769111632, + 0.24908498060703277, + 0.25538849935531616, + 0.2608032299041748, + 0.26616555204987524, + 0.25945273523330686, + 0.26573316116333007, + 0.2746785915374756, + 0.26631446256637575, + 0.26551211733818053, + 0.27255016849040986, + 0.2723539809703827, + 0.2716497754096985, + 0.2651895927429199, + 0.266797674536705, + 0.2667558801651001, + 0.2638769968032837, + 0.25965428969860077, + 0.2576942884683609, + 0.25660332770347594, + 0.2538195102930069, + 0.2554131515979767, + 0.2552316018819809, + 0.25206212692260743, + 0.25100599851608274, + 0.2511046103000641, + 0.2504117116451263, + 0.2495131744623184, + 0.2500215957164764, + 0.2515124215364456, + 0.24927114658355712, + 0.2515787253379822, + 0.24998380770683287, + 0.24894629969596863, + 0.24959663410186766, + 0.24860893502235412, + 0.2484323462486267, + 0.2478832187652588, + 0.24878188691139222, + 0.24821717635989188, + 0.24783752670288087, + 0.24773729231357575 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.08037468791007996, + 0.24492917954921722, + 0.2708122730255127, + 0.26078444719314575 + ], + "perturbation_rho": [ + 0.14874565601348877, + 0.4311285614967346, + 0.48388832807540894, + 0.44747647643089294 + ], + "nudging": { + "0.001": [ + -0.003998343367129564, + -0.0020397088956087828, + -0.0019317157566547394, + -0.001842876197770238 + ], + "0.003": [ + -0.011952575296163559, + -0.006111519411206245, + -0.005789835937321186, + -0.005522121675312519 + ], + "0.01": [ + -0.03933826461434364, + -0.020281529054045677, + -0.01922188699245453, + -0.018336530774831772 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L4_s456.json b/results/synth_ladder_v2_hi/synth_a0.5_L4_s456.json new file mode 100644 index 0000000..533ce8d --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L4_s456.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.4960858375549317, + 0.5346975540161133, + 0.38716840896606447, + 0.35499444410800934, + 0.30661033401489257, + 0.30922529895305634, + 0.27481330077648164, + 0.269934020614624, + 0.29978428807258606, + 0.25284944949150084, + 0.25780958070755006, + 0.23303727264404298, + 0.24132988526821136, + 0.20776223244667053, + 0.1969887863755226, + 0.1761551865696907, + 0.16374456174373628, + 0.18347106391191484, + 0.1597210103750229, + 0.1635675217628479, + 0.17662811236381531, + 0.15870836329460145, + 0.1737984106183052, + 0.13217050411701203, + 0.1460229372382164, + 0.12168637955188752, + 0.1280234918475151, + 0.12693974618911744, + 0.11462656342983246, + 0.1029154019355774, + 0.13926502933502197, + 0.10933776559829712, + 0.09320529713630676, + 0.09527391186952591, + 0.079886494910717, + 0.07977066860198975, + 0.07166484508514405, + 0.07007486948370933, + 0.06268392709493636, + 0.06896026997566224, + 0.06800698767900466, + 0.05527717870473862, + 0.06054863209873438, + 0.04793440787792206, + 0.054939467120170594, + 0.043425172302126884, + 0.04000619463920593, + 0.04502314983308315, + 0.03696476737260818, + 0.042237274646759033, + 0.043874549174308775, + 0.038109699201583865, + 0.03395200428068638, + 0.029588924580812453, + 0.028190810793638228, + 0.02734000713825226, + 0.028795221200585364, + 0.02614459018409252, + 0.02498855213224888, + 0.02417927698493004, + 0.024668072617053987, + 0.023915421676635743, + 0.023400312945246696, + 0.02246341987848282, + 0.022365201508998872, + 0.021897871212661266, + 0.021433941733837128, + 0.02118105274736881, + 0.020932374608516692, + 0.02072743790745735, + 0.020465456957370044, + 0.020281540298461916, + 0.02012429815530777, + 0.0200213955193758, + 0.01993154845237732, + 0.019858657205104827, + 0.019795786088705063, + 0.019747656816244127, + 0.01971831915974617, + 0.019699555786699057 + ], + "train_acc": [ + 0.5077, + 0.8231, + 0.8605, + 0.8665, + 0.8838, + 0.8805, + 0.891, + 0.8918, + 0.8816, + 0.9026, + 0.8988, + 0.9096, + 0.9022, + 0.919, + 0.9242, + 0.9348, + 0.9395, + 0.9298, + 0.9397, + 0.9393, + 0.9299, + 0.9363, + 0.9316, + 0.9518, + 0.9452, + 0.9571, + 0.9536, + 0.9555, + 0.9601, + 0.9645, + 0.9455, + 0.9596, + 0.969, + 0.9686, + 0.9778, + 0.9762, + 0.9809, + 0.9817, + 0.9867, + 0.9815, + 0.982, + 0.9885, + 0.9851, + 0.9931, + 0.9872, + 0.9941, + 0.9973, + 0.9923, + 0.9964, + 0.9936, + 0.9927, + 0.9951, + 0.9969, + 0.9991, + 0.9995, + 0.9994, + 0.9984, + 0.9996, + 0.9996, + 0.9997, + 0.9994, + 1.0, + 0.9999, + 1.0, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.75, + 0.8525, + 0.866, + 0.8635, + 0.8695, + 0.871, + 0.8765, + 0.8645, + 0.8605, + 0.8785, + 0.8745, + 0.8675, + 0.8715, + 0.8745, + 0.871, + 0.881, + 0.883, + 0.8775, + 0.8775, + 0.88, + 0.8765, + 0.879, + 0.876, + 0.8835, + 0.8815, + 0.8775, + 0.878, + 0.8845, + 0.8815, + 0.8815, + 0.876, + 0.8855, + 0.8835, + 0.8875, + 0.8875, + 0.884, + 0.8805, + 0.8825, + 0.8835, + 0.885, + 0.886, + 0.883, + 0.8845, + 0.8885, + 0.8935, + 0.8865, + 0.8865, + 0.882, + 0.886, + 0.889, + 0.884, + 0.8855, + 0.887, + 0.886, + 0.885, + 0.8875, + 0.885, + 0.885, + 0.889, + 0.8885, + 0.8875, + 0.8875, + 0.89, + 0.8875, + 0.887, + 0.8835, + 0.887, + 0.8865, + 0.887, + 0.888, + 0.8875, + 0.887, + 0.8855, + 0.886, + 0.886, + 0.8855, + 0.8855, + 0.8855, + 0.8855, + 0.8855 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.792909562587738, + 0.7804109454154968, + 0.7618845105171204, + 0.7463140487670898 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999976754188538, + 0.9999912977218628, + 0.9999581575393677 + ], + "nudging": { + "0.001": [ + -0.03518236428499222, + -0.019823763519525528, + -0.009707804769277573, + -0.004611268639564514 + ], + "0.003": [ + -0.09652796387672424, + -0.05666226148605347, + -0.028457924723625183, + -0.013685199432075024 + ], + "0.01": [ + -0.2336917370557785, + -0.1588592678308487, + -0.0874030739068985, + -0.04391264170408249 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2411655475616454, + 1.4526173705101013, + 0.8525485153198242, + 0.6137924177646636, + 0.5145371016025543, + 0.446749422454834, + 0.4214886118412018, + 0.4195548385620117, + 0.4367940719604492, + 0.4271266968727112, + 0.4506368330955505, + 0.431544850730896, + 0.47056838960647585, + 0.4950884919166565, + 0.46457617955207825, + 0.44138867642879487, + 0.46890158281326294, + 0.5305374766528607, + 0.473049675154686, + 0.5022008052349091, + 0.5181013618469238, + 0.5725814378738403, + 0.6426745875835419, + 0.5557390186309814, + 0.5579349591135979, + 0.5740194640159607, + 0.5308336600065231, + 0.5652545422554016, + 0.5799481949329376, + 0.5444272952079773, + 0.6203189346969128, + 0.5797858777523041, + 0.5540922529220581, + 0.6830843738555908, + 0.615204192352295, + 0.5617164747238159, + 0.5623749876022339, + 0.6315483769670129, + 0.5285355776786804, + 0.5771580843925476, + 0.5868863337516784, + 0.5256145215988159, + 0.5623120756149292, + 0.5721551623344422, + 0.5184764307022095, + 0.5232071911811829, + 0.5361109107017518, + 0.5600172671496868, + 0.4889044641494751, + 0.5039423065185547, + 0.48181177968978883, + 0.5018940591812133, + 0.5007769202709198, + 0.48498369932174684, + 0.49861330699920653, + 0.50194164686203, + 0.5412097283363342, + 0.4756260334253311, + 0.45754834973812103, + 0.44795829181671143, + 0.4544060218811035, + 0.44153900299072263, + 0.45146822926998137, + 0.4521883423805237, + 0.4729661870479584, + 0.4337798559188843, + 0.43757696523666384, + 0.42876729426383975, + 0.4239328568458557, + 0.42891270719766617, + 0.4150575352668762, + 0.41506909675598147, + 0.41555006608963013, + 0.41147264165878294, + 0.4131491298675537, + 0.41100745553970336, + 0.40833550534248353, + 0.4068710644721985, + 0.4059945067882538, + 0.40573364531993866 + ], + "train_acc": [ + 0.186, + 0.5098, + 0.6861, + 0.7694, + 0.803, + 0.8305, + 0.8387, + 0.8401, + 0.8367, + 0.8391, + 0.836, + 0.8406, + 0.8345, + 0.8287, + 0.837, + 0.8435, + 0.8413, + 0.8283, + 0.8436, + 0.8394, + 0.8373, + 0.822, + 0.8238, + 0.8295, + 0.8343, + 0.8312, + 0.8379, + 0.8308, + 0.83, + 0.8388, + 0.8251, + 0.836, + 0.8379, + 0.8196, + 0.8331, + 0.8437, + 0.8403, + 0.8265, + 0.8473, + 0.8364, + 0.8374, + 0.8477, + 0.8394, + 0.8473, + 0.8507, + 0.8521, + 0.8455, + 0.8448, + 0.8579, + 0.8505, + 0.8592, + 0.8549, + 0.8576, + 0.8598, + 0.8569, + 0.8518, + 0.8476, + 0.8597, + 0.8621, + 0.8677, + 0.8657, + 0.8661, + 0.8651, + 0.8658, + 0.8604, + 0.8685, + 0.8672, + 0.8697, + 0.8726, + 0.8692, + 0.8725, + 0.8752, + 0.8726, + 0.8731, + 0.8738, + 0.8747, + 0.874, + 0.8756, + 0.8752, + 0.8756 + ], + "test_acc": [ + 0.355, + 0.613, + 0.726, + 0.765, + 0.7915, + 0.7945, + 0.796, + 0.8035, + 0.7775, + 0.7815, + 0.7895, + 0.779, + 0.768, + 0.7545, + 0.7975, + 0.8, + 0.781, + 0.7915, + 0.799, + 0.783, + 0.7645, + 0.775, + 0.792, + 0.783, + 0.786, + 0.7715, + 0.7735, + 0.772, + 0.7965, + 0.756, + 0.761, + 0.801, + 0.735, + 0.7755, + 0.7805, + 0.794, + 0.7575, + 0.7605, + 0.7725, + 0.783, + 0.793, + 0.786, + 0.794, + 0.788, + 0.7975, + 0.784, + 0.7785, + 0.8035, + 0.8, + 0.808, + 0.797, + 0.799, + 0.795, + 0.793, + 0.806, + 0.7975, + 0.8075, + 0.793, + 0.8045, + 0.8165, + 0.809, + 0.816, + 0.815, + 0.81, + 0.808, + 0.8165, + 0.809, + 0.8195, + 0.8135, + 0.812, + 0.817, + 0.8165, + 0.816, + 0.8175, + 0.814, + 0.8165, + 0.817, + 0.817, + 0.8175, + 0.817 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.010789386928081512, + 0.08449429273605347, + 0.10027095675468445, + 0.1133105605840683 + ], + "perturbation_rho": [ + -0.022197294980287552, + 0.02167895808815956, + 0.18905602395534515, + 0.18277563154697418 + ], + "nudging": { + "0.001": [ + -8.850065933074802e-05, + -0.0005693648708984256, + -0.00039813597686588764, + -0.00038892755401320755 + ], + "0.003": [ + -0.000241757370531559, + -0.0017084539867937565, + -0.00119449058547616, + -0.0011681977193802595 + ], + "0.01": [ + -0.0005262043559923768, + -0.005684657022356987, + -0.003974507562816143, + -0.0038818921893835068 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8605559646606444, + 0.8181579312324524, + 0.4888786570072174, + 0.46094297194480893, + 0.5146874758720398, + 0.5756171208381653, + 0.6119997030258179, + 0.631787965297699, + 0.6700198846817017, + 0.7132655641555786, + 0.7236264010429382, + 0.7378828598022461, + 0.7261418657302856, + 0.727296348953247, + 0.7321721215248108, + 0.736586001586914, + 0.7621609721183776, + 0.763503788948059, + 0.7666075186729431, + 0.7711701553344726, + 0.7736121963500977, + 0.7452512830734253, + 0.7567199333190918, + 0.7540113342285156, + 0.7480614219665528, + 0.735906481552124, + 0.7370582301139832, + 0.6966712136268616, + 0.6802552005767822, + 0.6610010339736938, + 0.6873619891166687, + 0.6534000772476196, + 0.6929481398582459, + 0.6387723390579224, + 0.6156042585372925, + 0.6434125867843627, + 0.6252378331184387, + 0.6347130266189576, + 0.6249235614776611, + 0.6330950705289841, + 0.5946530082702637, + 0.6063001970291138, + 0.622239726114273, + 0.6078498930931091, + 0.5940731934547424, + 0.5847301836967468, + 0.5914536945343017, + 0.5992654499053955, + 0.5896003244400024, + 0.5899710475921631, + 0.5955881645202636, + 0.5772649069786072, + 0.579361309337616, + 0.5728494137763978, + 0.5764807563781739, + 0.5744461917877197, + 0.5702900684833526, + 0.577054048538208, + 0.5672821633338928, + 0.5654981985330582, + 0.5666977419853211, + 0.5643723483085632, + 0.5685850902557373, + 0.5597343187332153, + 0.5564246373176575, + 0.5545753452301025, + 0.5560362690925598, + 0.5581320198059082, + 0.547701037311554, + 0.5481671844482422, + 0.5475796377182007, + 0.5468229295730591, + 0.5432382588863373, + 0.5421132974624634, + 0.541416937828064, + 0.5409614672660827, + 0.5399176012039184, + 0.5391464573860169, + 0.5387552119731903, + 0.5384695112228394 + ], + "train_acc": [ + 0.3368, + 0.698, + 0.8163, + 0.8254, + 0.8097, + 0.7944, + 0.7835, + 0.7788, + 0.7649, + 0.7552, + 0.7385, + 0.7349, + 0.7359, + 0.7379, + 0.7343, + 0.7369, + 0.7296, + 0.7292, + 0.7336, + 0.7291, + 0.7343, + 0.7384, + 0.7402, + 0.7364, + 0.7392, + 0.7441, + 0.7439, + 0.7548, + 0.7638, + 0.77, + 0.7606, + 0.7728, + 0.7621, + 0.7791, + 0.7881, + 0.7784, + 0.7809, + 0.7789, + 0.7816, + 0.7812, + 0.7897, + 0.7883, + 0.7816, + 0.7874, + 0.7903, + 0.7956, + 0.791, + 0.788, + 0.7929, + 0.7935, + 0.7895, + 0.7969, + 0.7941, + 0.7975, + 0.7985, + 0.7961, + 0.8005, + 0.7976, + 0.8006, + 0.7995, + 0.7997, + 0.8015, + 0.8009, + 0.8023, + 0.8038, + 0.8063, + 0.8055, + 0.8068, + 0.8086, + 0.8086, + 0.8099, + 0.8084, + 0.812, + 0.8089, + 0.8106, + 0.8101, + 0.8105, + 0.813, + 0.8116, + 0.8115 + ], + "test_acc": [ + 0.5775, + 0.758, + 0.8025, + 0.7935, + 0.784, + 0.77, + 0.7645, + 0.749, + 0.7345, + 0.7205, + 0.7075, + 0.712, + 0.7105, + 0.716, + 0.7255, + 0.706, + 0.693, + 0.6855, + 0.716, + 0.719, + 0.716, + 0.7045, + 0.7215, + 0.705, + 0.7195, + 0.6925, + 0.7125, + 0.711, + 0.7125, + 0.7145, + 0.747, + 0.7325, + 0.7205, + 0.7515, + 0.7295, + 0.7535, + 0.7225, + 0.7535, + 0.739, + 0.7455, + 0.7515, + 0.7435, + 0.749, + 0.7635, + 0.755, + 0.7415, + 0.755, + 0.752, + 0.7465, + 0.7605, + 0.759, + 0.745, + 0.7625, + 0.748, + 0.7625, + 0.7665, + 0.7555, + 0.754, + 0.767, + 0.759, + 0.76, + 0.761, + 0.7705, + 0.765, + 0.7645, + 0.76, + 0.765, + 0.773, + 0.7705, + 0.7675, + 0.771, + 0.769, + 0.7705, + 0.764, + 0.767, + 0.766, + 0.7675, + 0.768, + 0.7675, + 0.7675 + ], + "state_pred_error": [ + 0.7528388725280761, + 0.2578148658514023, + 0.16944917948246002, + 0.15115742516517638, + 0.14653776726722717, + 0.1493137075185776, + 0.15279092507362366, + 0.1516626188278198, + 0.14644639718532562, + 0.1432818317890167, + 0.1341671544909477, + 0.12109726746082305, + 0.10874035103321075, + 0.09516428833007813, + 0.08291223795413971, + 0.0741053925871849, + 0.06677378851175308, + 0.05990288783311844, + 0.05339719951748848, + 0.047321006536483766, + 0.04257492316961289, + 0.039824042534828186, + 0.03776356348991394, + 0.03543094688653946, + 0.03290540891289711, + 0.030680635172128677, + 0.029502621805667876, + 0.028691610008478165, + 0.028108215525746345, + 0.02795259121656418, + 0.02805232812166214, + 0.028190095496177674, + 0.02814672722220421, + 0.028008159649372102, + 0.027467489010095596, + 0.02668677789568901, + 0.026043729621171952, + 0.025943757286667823, + 0.024753411382436752, + 0.024162132585048676, + 0.023421377569437025, + 0.022592406967282295, + 0.021806583201885225, + 0.020894898462295534, + 0.021760780826210975, + 0.01970126095712185, + 0.018973005139827727, + 0.018254657858610152, + 0.01774941844791174, + 0.017085333578288554, + 0.01667745073735714, + 0.015917856815457345, + 0.015461402994394302, + 0.015105176398158074, + 0.014731700393557548, + 0.014277263483405113, + 0.014336085096001625, + 0.013835087125003339, + 0.013015667875111103, + 0.012977058197557926, + 0.012411148184537887, + 0.012218371331691742, + 0.011917488634586334, + 0.011587343527376651, + 0.011386518168449402, + 0.010996050210297108, + 0.011000375728309154, + 0.01093198662251234, + 0.010665439885854722, + 0.010713081985712051, + 0.010309466387331486, + 0.009999687269330025, + 0.00984979961514473, + 0.00978974297195673, + 0.009679957465827465, + 0.009439942936599255, + 0.009190370073914527, + 0.009009707018733024, + 0.008934175878763198, + 0.008844223669171333 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8223247528076172, + 0.5256583094596863, + 0.17289233207702637, + 0.1550998091697693 + ], + "perturbation_rho": [ + 0.7023045420646667, + 0.4341009259223938, + 0.10907860845327377, + 0.14972183108329773 + ], + "nudging": { + "0.001": [ + -0.02259308099746704, + -0.0022590490989387035, + -0.0004881378263235092, + -0.00040942247142083943 + ], + "0.003": [ + -0.06565646827220917, + -0.00675535574555397, + -0.0014629701618105173, + -0.0012272088788449764 + ], + "0.01": [ + -0.19577056169509888, + -0.022263746708631516, + -0.004863455425947905, + -0.0040816450491547585 + ] + }, + "state_pred_error_per_layer": [ + 6500.04248046875, + 2179.638671875, + 1695.392333984375, + 1466.414306640625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2343986097335815, + 1.453624027633667, + 0.8504115339279175, + 0.615304591178894, + 0.5090120125770569, + 0.45330931091308596, + 0.43282444887161253, + 0.43574942698478697, + 0.4284877701282501, + 0.43351908864974975, + 0.4202498661994934, + 0.4424209837436676, + 0.4577544458389282, + 0.492310822057724, + 0.48694960260391235, + 0.48417129316329954, + 0.4986941133260727, + 0.4728296154022217, + 0.5724463475704193, + 0.5595875578403473, + 0.532526982831955, + 0.5746327924728394, + 0.7126660821914673, + 0.7370420686721801, + 0.7313992212295533, + 0.7004754811286926, + 0.6956765615463257, + 0.7959447092533112, + 0.7934829597473144, + 0.856204462814331, + 0.8262276921272278, + 0.9044902267456054, + 0.8700028440475464, + 0.9274394365310669, + 0.9137028537750244, + 0.8890384769439698, + 1.0017674032211303, + 0.9142154163360595, + 0.9766313817024231, + 0.9468437704086303, + 0.9564611262321472, + 0.9481983922958374, + 0.985984567451477, + 0.9648167610168457, + 0.9928602050304413, + 0.9667063350677491, + 1.0476517265319825, + 1.0296577951431274, + 1.0196615926742554, + 0.9884319522857666, + 0.9943711001396179, + 0.996761853981018, + 0.9902983669281006, + 1.0116610792160035, + 0.9913013689041138, + 1.0162655168533326, + 0.9909055713653564, + 0.9940459415435791, + 0.9812287101745606, + 0.990528486442566, + 0.9934272569656372, + 0.9935013324737548, + 0.9953188559532166, + 0.9872588449478149, + 0.9923500513076782, + 0.9922672483444214, + 0.9931164207458496, + 0.985268419933319, + 0.9802879577636718, + 0.9865230370521545, + 0.9794404148101806, + 0.9768617332458496, + 0.9763567300796508, + 0.9761575534820557, + 0.974729040145874, + 0.972526121520996, + 0.9724656517028809, + 0.9720203231811524, + 0.9705313505172729, + 0.9701843170166016 + ], + "train_acc": [ + 0.1851, + 0.501, + 0.6924, + 0.7691, + 0.8101, + 0.8278, + 0.835, + 0.8321, + 0.838, + 0.8381, + 0.8452, + 0.8374, + 0.8368, + 0.8319, + 0.8298, + 0.8348, + 0.8353, + 0.8419, + 0.8244, + 0.8207, + 0.8248, + 0.8189, + 0.7836, + 0.7768, + 0.7709, + 0.7698, + 0.7677, + 0.7396, + 0.7351, + 0.7219, + 0.7224, + 0.7057, + 0.7025, + 0.6881, + 0.6911, + 0.6874, + 0.6617, + 0.6805, + 0.6654, + 0.67, + 0.6657, + 0.6666, + 0.6567, + 0.6515, + 0.6552, + 0.6553, + 0.6316, + 0.6448, + 0.6405, + 0.6466, + 0.6417, + 0.6463, + 0.643, + 0.6361, + 0.6427, + 0.6356, + 0.6455, + 0.645, + 0.6491, + 0.6414, + 0.642, + 0.6422, + 0.6438, + 0.6421, + 0.6378, + 0.6408, + 0.6401, + 0.6414, + 0.6434, + 0.6414, + 0.6442, + 0.6453, + 0.6441, + 0.646, + 0.6456, + 0.6434, + 0.645, + 0.6472, + 0.647, + 0.646 + ], + "test_acc": [ + 0.3695, + 0.6125, + 0.732, + 0.772, + 0.7855, + 0.7905, + 0.787, + 0.7925, + 0.798, + 0.802, + 0.7885, + 0.7805, + 0.7755, + 0.7785, + 0.779, + 0.7655, + 0.787, + 0.791, + 0.767, + 0.7695, + 0.767, + 0.707, + 0.7315, + 0.727, + 0.727, + 0.743, + 0.664, + 0.644, + 0.649, + 0.679, + 0.6495, + 0.651, + 0.6245, + 0.6465, + 0.6635, + 0.5545, + 0.6445, + 0.629, + 0.6125, + 0.6, + 0.6175, + 0.6225, + 0.59, + 0.5935, + 0.622, + 0.609, + 0.5955, + 0.5945, + 0.605, + 0.6335, + 0.5985, + 0.618, + 0.6125, + 0.615, + 0.612, + 0.626, + 0.6145, + 0.6215, + 0.622, + 0.614, + 0.6205, + 0.6205, + 0.619, + 0.6145, + 0.617, + 0.616, + 0.612, + 0.624, + 0.614, + 0.6145, + 0.6135, + 0.6175, + 0.6185, + 0.617, + 0.621, + 0.6165, + 0.6175, + 0.6165, + 0.615, + 0.617 + ], + "value_loss": [ + 3.023894792175293, + 0.8986896438598633, + 0.7798821739196777, + 0.6909401836395264, + 0.5764653768539428, + 0.5349095309972763, + 0.5056781127929687, + 0.5260066257476806, + 0.5290905786275863, + 0.5714910756111145, + 0.593832552909851, + 0.6378607465744018, + 0.7068720542907715, + 0.812154634809494, + 0.8033107622146607, + 0.8015370043754577, + 0.9214076406240463, + 0.7881726276397705, + 1.2114888192653657, + 1.0848007547855376, + 0.8881485988616943, + 1.0654814292907715, + 1.5107799823760986, + 1.4600254564762116, + 1.2796008218765258, + 1.135435813999176, + 0.9691264488220215, + 1.1726920662879945, + 1.129703632736206, + 1.1240834852218629, + 1.0206818098068238, + 1.0843358610153198, + 0.8683985090255737, + 0.9091012100219726, + 0.8982777906417847, + 0.740005069732666, + 0.9086256595611573, + 0.7258960815429687, + 0.8782961148262024, + 0.6398888462066651, + 0.7080119153976441, + 0.6535386414527893, + 0.6868848449230194, + 0.6373141875267029, + 0.6819823276519775, + 0.6544397377014161, + 0.8417046590805054, + 0.6846742402076721, + 0.6666352437019348, + 0.5878526174545288, + 0.5703939646720886, + 0.6319679483890533, + 0.5580304244041443, + 0.5517775423049927, + 0.5550727502822876, + 0.5422627649307251, + 0.526749885725975, + 0.5252036747217178, + 0.4967438272476196, + 0.5272078440189362, + 0.5113776790618897, + 0.5110072200298309, + 0.5037453308582306, + 0.501118311882019, + 0.48052791557312013, + 0.491667214345932, + 0.4838150468826294, + 0.4674044004917145, + 0.4652326403617859, + 0.45715550484657286, + 0.47330021438598635, + 0.45846579232215884, + 0.4664739728450775, + 0.4596080785751343, + 0.44709101357460024, + 0.5086768847942352, + 0.44456540699005126, + 0.4510745820999146, + 0.4489506968975067, + 0.4424677228450775 + ], + "term_loss": [ + 1.7427010470867157, + 0.48208142280578614, + 0.5679618017196655, + 0.5195615575790405, + 0.41694380503892897, + 0.37342323462963106, + 0.3461394340753555, + 0.3736634975910187, + 0.38409003803730013, + 0.424897181892395, + 0.4506664439201355, + 0.4885968829154968, + 0.5525542941093445, + 0.6469054134488106, + 0.6400146143913269, + 0.6403206890821457, + 0.7548702710151672, + 0.6292312892913818, + 1.030323140335083, + 0.8977560731410981, + 0.7063375649988651, + 0.8753381670951843, + 1.2645243648529052, + 1.2143967106819153, + 1.0314008697509767, + 0.8851956583857536, + 0.7202553007125855, + 0.8874784625053406, + 0.8458867080688477, + 0.8219177357673645, + 0.7048627055644989, + 0.7606868861675262, + 0.554924451828003, + 0.5762491623401642, + 0.5633525419235229, + 0.4294536910057068, + 0.5648997817039489, + 0.4093684819459915, + 0.5367715572834015, + 0.31539287347793576, + 0.3760087685585022, + 0.3255245527982712, + 0.35008056272268295, + 0.30248967091441153, + 0.3320766371250153, + 0.3127023727416992, + 0.46781888790130616, + 0.32705182971954344, + 0.3015207302093506, + 0.23376340117454528, + 0.2302341274499893, + 0.28476220836639404, + 0.21570249412059783, + 0.2140086658477783, + 0.2207069280743599, + 0.2051979726791382, + 0.19757021386027337, + 0.19944336045682431, + 0.1797251489162445, + 0.19338219695091247, + 0.1890155040860176, + 0.19045120375156402, + 0.17334317658543585, + 0.17656912994384766, + 0.15950183691978453, + 0.1694078619301319, + 0.16317301561832429, + 0.1491153277337551, + 0.14835610117912293, + 0.1391140363395214, + 0.15004074268341064, + 0.14137677636146545, + 0.14710547543764113, + 0.14120989878177642, + 0.13093972239494323, + 0.17345181898772716, + 0.12735800666809083, + 0.12920580761432648, + 0.12803946260213853, + 0.12383701201379299 + ], + "bridge_loss": [ + 0.9911150374100427, + 0.14225238285660743, + 0.01897906306087971, + 0.008157095196843147, + 0.016066196286678314, + 0.026334887421131135, + 0.025152397060394287, + 0.013772669732570648, + 0.009419957700371743, + 0.009206166239082813, + 0.009388158424198628, + 0.01007876497283578, + 0.010257267847657204, + 0.013791960202157498, + 0.015348700781166553, + 0.012856689554452896, + 0.018292034401744605, + 0.017754782377555966, + 0.020485600554943084, + 0.024397531032562255, + 0.022133925661444665, + 0.024291416144371032, + 0.04369710162878036, + 0.03945274412930012, + 0.040382358980178834, + 0.04041987403035164, + 0.035525544452667236, + 0.045289935863018035, + 0.04489333842992783, + 0.04701487867832184, + 0.06372669532299041, + 0.053910273158550265, + 0.04901574258804321, + 0.049852415746450426, + 0.05743934147357941, + 0.03363188169002533, + 0.04151349928379059, + 0.03473072373867035, + 0.05004978265017271, + 0.037063263088464735, + 0.03867579575777054, + 0.03736003184020519, + 0.03446328945159912, + 0.038409869611263275, + 0.04414601467847824, + 0.04355271501541138, + 0.058919631719589236, + 0.04385834427475929, + 0.05479392580688, + 0.0494567804440856, + 0.03416308156847954, + 0.04137864155471325, + 0.037130875611305236, + 0.02873442330956459, + 0.03029374772310257, + 0.02444745374917984, + 0.02370999895334244, + 0.022537667311728002, + 0.018014887282252312, + 0.03064262791275978, + 0.0187765949845314, + 0.017979868005216122, + 0.02728003891259432, + 0.02337435365319252, + 0.018309101203083992, + 0.020601727521419526, + 0.019028106117248537, + 0.01750932685434818, + 0.01801943519115448, + 0.017622895017266275, + 0.025175228443741798, + 0.019320746524631977, + 0.022181396812200545, + 0.021180605521798134, + 0.019371255433559418, + 0.03914435167312622, + 0.02086639016866684, + 0.025725779765844344, + 0.025558402460813524, + 0.02319883658438921 + ], + "tgrad_loss": [ + 0.29007866830825807, + 0.2743558446407318, + 0.19294130930900574, + 0.16322152862548828, + 0.14345537494421004, + 0.1351514089345932, + 0.13438627982139587, + 0.13857046403884887, + 0.13558058288097383, + 0.13738772497177124, + 0.13377795510292054, + 0.13918509731292725, + 0.1440604922056198, + 0.15145726749897004, + 0.14794744772911073, + 0.14835962448120119, + 0.14824533681869506, + 0.14118656301498414, + 0.16068009790182114, + 0.16264715282917022, + 0.15967711250782013, + 0.16585184245109558, + 0.2025585355758667, + 0.20617600531578065, + 0.20781758627891542, + 0.20982027254104615, + 0.21334560272693634, + 0.2399236711025238, + 0.23892358722686768, + 0.2551508683681488, + 0.252092413854599, + 0.2697386896133423, + 0.26445830760002137, + 0.28299963884353635, + 0.27748590664863587, + 0.27691949067115784, + 0.30221237459182737, + 0.2817968795776367, + 0.2914747746706009, + 0.2874327032566071, + 0.2933273449897766, + 0.2906540577888489, + 0.3023409938812256, + 0.29641464624404906, + 0.3057596742391586, + 0.2981846487045288, + 0.3149661375999451, + 0.31376406354904174, + 0.31032058653831485, + 0.3046324390411377, + 0.30599675626754763, + 0.3058270953178406, + 0.3051970504760742, + 0.30903445119857786, + 0.3040720769882202, + 0.3126173446655273, + 0.3054696724653244, + 0.3032226475715637, + 0.29900379276275635, + 0.3031830202102661, + 0.3035855787754059, + 0.3025761491298676, + 0.3031221126079559, + 0.30117482986450195, + 0.3027169793128967, + 0.3016576295852661, + 0.3016139295578003, + 0.30077974333763124, + 0.2988571047782898, + 0.30041857199668887, + 0.29808423919677735, + 0.297768265581131, + 0.29718710403442383, + 0.29721757326126097, + 0.29678003549575804, + 0.29608071341514586, + 0.2963410082817078, + 0.29614299502372743, + 0.29535283389091493, + 0.29543187527656556 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0613640733063221, + 0.23986753821372986, + 0.24101567268371582, + 0.25395530462265015 + ], + "perturbation_rho": [ + 0.07897584140300751, + 0.3258228003978729, + 0.35056060552597046, + 0.3584677577018738 + ], + "nudging": { + "0.001": [ + -0.0019706960301846266, + -0.0017678625881671906, + -0.0016834724228829145, + -0.0017289909301325679 + ], + "0.003": [ + -0.005873056128621101, + -0.0052978526800870895, + -0.005045462399721146, + -0.005181802436709404 + ], + "0.01": [ + -0.019116222858428955, + -0.01759088784456253, + -0.016751645132899284, + -0.017206376418471336 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L8_s123.json b/results/synth_ladder_v2_hi/synth_a0.5_L8_s123.json new file mode 100644 index 0000000..c42babb --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L8_s123.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.1690437764167785, + 0.526579748916626, + 0.4612072874069214, + 0.40229701833724973, + 0.3932571681022644, + 0.37171179904937746, + 0.37635504052639007, + 0.34792573761940004, + 0.33135794601440427, + 0.35720210390090945, + 0.2971177682876587, + 0.3144925072669983, + 0.2908399796247482, + 0.2602632574081421, + 0.3234870526790619, + 0.24370513725280762, + 0.25297106668949126, + 0.23075523381233215, + 0.23605980478525163, + 0.1943365602493286, + 0.23846449284553528, + 0.24400404317379, + 0.17749837155342102, + 0.18690768659114837, + 0.16863750772476196, + 0.20593492636680602, + 0.18994918286800386, + 0.16939699206352235, + 0.16769693479537964, + 0.12983431510925292, + 0.12260556392669678, + 0.15693657582998274, + 0.12875397876501082, + 0.13655461661815643, + 0.12720586278438567, + 0.11327027233839035, + 0.09552236033678055, + 0.0885159835100174, + 0.1007383291721344, + 0.11100154314041137, + 0.0981293179988861, + 0.0829784469485283, + 0.08495590468645096, + 0.06667495827674866, + 0.07823006441593171, + 0.07924402866363525, + 0.059052948009967805, + 0.06082535365819931, + 0.05081702738404274, + 0.046299984288215634, + 0.04768944467306137, + 0.04482775348424912, + 0.041376980124413966, + 0.03780490176081657, + 0.03604337072968483, + 0.03766505457162857, + 0.036802976721525195, + 0.03326233586370945, + 0.03231097190827131, + 0.030569579753279685, + 0.02986507187783718, + 0.028971056300401688, + 0.0288686943218112, + 0.02757761981189251, + 0.026668703991174696, + 0.026556660920381545, + 0.02589243197739124, + 0.025469816410541534, + 0.025155014288425447, + 0.024874832066893577, + 0.024470695948600768, + 0.024159772795438766, + 0.02393993109166622, + 0.023741512601077555, + 0.023583258251845835, + 0.023436618757247923, + 0.023351033651828765, + 0.02327720703482628, + 0.023227938520908355, + 0.0232003643065691 + ], + "train_acc": [ + 0.5941, + 0.8016, + 0.8207, + 0.8431, + 0.8474, + 0.8526, + 0.8539, + 0.8625, + 0.8701, + 0.8566, + 0.8817, + 0.8785, + 0.8863, + 0.9006, + 0.8764, + 0.9076, + 0.8996, + 0.9098, + 0.908, + 0.9244, + 0.9092, + 0.9053, + 0.9308, + 0.9258, + 0.9361, + 0.9215, + 0.9249, + 0.9344, + 0.9364, + 0.9568, + 0.9558, + 0.9416, + 0.9524, + 0.9504, + 0.9534, + 0.9615, + 0.9714, + 0.9737, + 0.965, + 0.9609, + 0.9671, + 0.9744, + 0.9736, + 0.9826, + 0.9761, + 0.9756, + 0.9869, + 0.986, + 0.9917, + 0.9946, + 0.9915, + 0.9935, + 0.9948, + 0.9972, + 0.9978, + 0.9967, + 0.9969, + 0.998, + 0.9984, + 0.9994, + 0.9991, + 0.9996, + 0.9995, + 0.9992, + 0.9997, + 0.9997, + 0.9997, + 0.9997, + 0.9996, + 0.9999, + 0.9998, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999 + ], + "test_acc": [ + 0.8045, + 0.826, + 0.825, + 0.845, + 0.8415, + 0.8465, + 0.8505, + 0.843, + 0.845, + 0.852, + 0.8615, + 0.84, + 0.852, + 0.858, + 0.8395, + 0.855, + 0.857, + 0.8625, + 0.865, + 0.865, + 0.8535, + 0.856, + 0.875, + 0.8655, + 0.8605, + 0.8615, + 0.8535, + 0.8615, + 0.8625, + 0.869, + 0.8635, + 0.858, + 0.8685, + 0.865, + 0.8665, + 0.863, + 0.868, + 0.859, + 0.8665, + 0.867, + 0.865, + 0.86, + 0.8655, + 0.8715, + 0.86, + 0.866, + 0.8655, + 0.865, + 0.8635, + 0.8655, + 0.868, + 0.8635, + 0.8635, + 0.8645, + 0.8665, + 0.869, + 0.866, + 0.8675, + 0.8655, + 0.866, + 0.8655, + 0.866, + 0.867, + 0.868, + 0.8675, + 0.867, + 0.8685, + 0.868, + 0.868, + 0.868, + 0.8675, + 0.867, + 0.8665, + 0.868, + 0.867, + 0.868, + 0.868, + 0.8675, + 0.868, + 0.868 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8442516326904297, + 0.8351782560348511, + 0.8238041400909424, + 0.811212420463562, + 0.800036609172821, + 0.789252519607544, + 0.7798817157745361, + 0.7730016708374023 + ], + "perturbation_rho": [ + 0.9999992251396179, + 0.9999983906745911, + 0.9999960660934448, + 0.99998939037323, + 0.9999715685844421, + 0.9999511241912842, + 0.9999076128005981, + 0.9998621940612793 + ], + "nudging": { + "0.001": [ + -0.04046643525362015, + -0.024846579879522324, + -0.014939611777663231, + -0.009067585691809654, + -0.00585249625146389, + -0.004124765284359455, + -0.0031854582484811544, + -0.0026463749818503857 + ], + "0.003": [ + -0.11249453574419022, + -0.07127158343791962, + -0.04364899545907974, + -0.026772987097501755, + -0.01737922430038452, + -0.012286147102713585, + -0.009504282847046852, + -0.007903642021119595 + ], + "0.01": [ + -0.281266987323761, + -0.2009655237197876, + -0.1321270614862442, + -0.08429376780986786, + -0.05586903542280197, + -0.039932381361722946, + -0.031076554208993912, + -0.025931723415851593 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.269032752609253, + 1.3050836851119996, + 0.8196908255577088, + 0.6588153503417968, + 0.5856991597175598, + 0.5283262263298034, + 0.5579123854637146, + 0.537654877281189, + 0.5828713527679443, + 0.6058343980789185, + 0.5558601338386535, + 0.5963786434173584, + 0.6240195028305053, + 0.6347664480209351, + 0.6456235321044922, + 0.6269678426742553, + 0.680553484249115, + 0.7317787364006042, + 0.794128333234787, + 0.6699356523513794, + 0.7476618877410889, + 0.8156976552963257, + 0.8354362937927247, + 0.7994426628112793, + 0.8500595897674561, + 0.9119489772796631, + 0.8346799810171127, + 0.8067910364151001, + 0.8339261085391044, + 0.7884325521469117, + 0.9549632612228394, + 0.875113792848587, + 0.7741540772438049, + 0.7001222875595092, + 0.7371560405731201, + 0.8241119850158691, + 0.7078411004543305, + 0.6887535285949707, + 0.7490071479797363, + 0.8013861232757569, + 0.7634008598327636, + 0.7581863780975342, + 0.6919024399757385, + 0.7027303151130676, + 0.6885574837267399, + 0.6507348452329635, + 0.6334816108703614, + 0.7169007764339447, + 0.6046502321720123, + 0.6008657840728759, + 0.7073253668785096, + 0.5771534276008606, + 0.620348064994812, + 0.5736126258850097, + 0.571743147277832, + 0.5836609784126282, + 0.5414934496879578, + 0.5247059268951416, + 0.529977638244629, + 0.5427842017531395, + 0.4983853917121887, + 0.5128863627433777, + 0.5041354479789734, + 0.5157700657367706, + 0.4914438611984253, + 0.4841920606136322, + 0.4769712302207947, + 0.4743790678024292, + 0.46768182845115663, + 0.4689002415180206, + 0.46644191064834595, + 0.4690598597049713, + 0.4642826473712921, + 0.46037765583992, + 0.45840771598815916, + 0.4571617786407471, + 0.45624103908538816, + 0.45523289976119996, + 0.45433819589614866, + 0.45354745016098025 + ], + "train_acc": [ + 0.1781, + 0.5294, + 0.6941, + 0.7522, + 0.7802, + 0.8039, + 0.7927, + 0.8033, + 0.7925, + 0.7912, + 0.8084, + 0.7955, + 0.7969, + 0.8011, + 0.798, + 0.8034, + 0.7941, + 0.7909, + 0.7855, + 0.8019, + 0.7902, + 0.7846, + 0.7813, + 0.787, + 0.7701, + 0.7786, + 0.7873, + 0.7865, + 0.7839, + 0.7916, + 0.7679, + 0.776, + 0.7934, + 0.8069, + 0.7998, + 0.7868, + 0.8001, + 0.8046, + 0.7948, + 0.7903, + 0.7909, + 0.7912, + 0.8001, + 0.8016, + 0.8037, + 0.8076, + 0.8143, + 0.7984, + 0.8156, + 0.8164, + 0.8, + 0.8198, + 0.8087, + 0.8181, + 0.8181, + 0.8174, + 0.8239, + 0.8221, + 0.8247, + 0.8211, + 0.8325, + 0.8307, + 0.8328, + 0.8272, + 0.8349, + 0.8344, + 0.836, + 0.8351, + 0.8394, + 0.8372, + 0.8397, + 0.8376, + 0.8392, + 0.8407, + 0.8395, + 0.8389, + 0.8404, + 0.8409, + 0.8412, + 0.841 + ], + "test_acc": [ + 0.376, + 0.6365, + 0.7185, + 0.747, + 0.7765, + 0.7345, + 0.76, + 0.7695, + 0.7125, + 0.7515, + 0.779, + 0.754, + 0.7795, + 0.7235, + 0.7565, + 0.756, + 0.7435, + 0.757, + 0.7585, + 0.7165, + 0.7445, + 0.7265, + 0.717, + 0.737, + 0.6785, + 0.731, + 0.7275, + 0.726, + 0.77, + 0.7255, + 0.7295, + 0.752, + 0.747, + 0.7735, + 0.732, + 0.7185, + 0.747, + 0.756, + 0.7365, + 0.737, + 0.734, + 0.761, + 0.7685, + 0.7725, + 0.74, + 0.782, + 0.773, + 0.776, + 0.7855, + 0.7195, + 0.7775, + 0.7715, + 0.7815, + 0.7905, + 0.7755, + 0.792, + 0.798, + 0.7885, + 0.7895, + 0.7885, + 0.794, + 0.794, + 0.797, + 0.793, + 0.806, + 0.8065, + 0.799, + 0.798, + 0.8025, + 0.801, + 0.8015, + 0.8095, + 0.808, + 0.8065, + 0.8, + 0.804, + 0.8015, + 0.8015, + 0.802, + 0.8 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.02832707017660141, + 0.13987571001052856, + 0.07857642322778702, + 0.061437755823135376, + 0.0877213403582573, + 0.09552451223134995, + 0.07042402029037476, + 0.08406771719455719 + ], + "perturbation_rho": [ + 0.034647777676582336, + 0.1467832326889038, + 0.036387018859386444, + 0.061308689415454865, + 0.1038040965795517, + 0.09023141860961914, + 0.03672575205564499, + 0.08190295100212097 + ], + "nudging": { + "0.001": [ + 0.0011414524633437395, + -0.0005393982864916325, + -0.00023700599558651447, + -0.00016539759235456586, + -0.00020502961706370115, + -0.0002788097772281617, + -0.00019945131498388946, + -0.0002334596065338701 + ], + "0.003": [ + 0.003470724681392312, + -0.0016172737814486027, + -0.0007110200822353363, + -0.0004955856129527092, + -0.0006145928637124598, + -0.0008353168377652764, + -0.0005977450637146831, + -0.0006998619646765292 + ], + "0.01": [ + 0.012113340198993683, + -0.00537356361746788, + -0.0023620566353201866, + -0.001645779935643077, + -0.002037967788055539, + -0.0027765799313783646, + -0.001988787204027176, + -0.002327942755073309 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7007782346725464, + 0.8164017862319947, + 0.6423392364501953, + 0.7302445079803467, + 0.823608984375, + 0.9137458106994629, + 0.9564488334655762, + 0.9002143922328949, + 0.8733619658470154, + 0.8754102369308472, + 0.911200912475586, + 0.9395248275756836, + 0.9669746287345886, + 0.9382185889244079, + 0.901768593788147, + 0.9082238527297973, + 0.915930258178711, + 0.9233985857009888, + 0.8726478023529053, + 0.8490028512954712, + 0.8677912174224853, + 0.905773146533966, + 0.9145678676605224, + 0.8721040974617005, + 0.817108702468872, + 0.8035082785606384, + 0.740993898010254, + 0.7614496314525604, + 0.7472923977851867, + 0.746871427154541, + 0.7268754315376281, + 0.7289572984695435, + 0.7670538501739502, + 0.7607598701477051, + 0.7636146975517273, + 0.7497062658309936, + 0.7167949647426605, + 0.7196091802597046, + 0.718072020149231, + 0.7154478120803833, + 0.7283960567474366, + 0.7365614126205444, + 0.726603537940979, + 0.7100282831192016, + 0.694857945728302, + 0.6909708969116211, + 0.7026924235343933, + 0.723259468460083, + 0.7301779090881347, + 0.7366840793609619, + 0.7489474256515503, + 0.7501752611160278, + 0.7374589855194091, + 0.726950154876709, + 0.7204151838302613, + 0.7631172191619873, + 0.719224785232544, + 0.6950305696487427, + 0.6910476376533509, + 0.6889386486053467, + 0.6827648526191712, + 0.6788733221054077, + 0.6739130449295044, + 0.6725200511932373, + 0.673500218963623, + 0.6744556049346924, + 0.6729164401054383, + 0.6747148495674133, + 0.6735565113067628, + 0.6700731378555298, + 0.6690107128620147, + 0.6688071804046631, + 0.6681381563186646, + 0.6684000648498535, + 0.6678468257904052, + 0.6672025471687317, + 0.666564640045166, + 0.6660951887130737, + 0.666175397491455, + 0.6660839390754699 + ], + "train_acc": [ + 0.3802, + 0.6878, + 0.7608, + 0.7495, + 0.7293, + 0.6969, + 0.6768, + 0.6867, + 0.6862, + 0.6815, + 0.6774, + 0.6691, + 0.6534, + 0.6688, + 0.6753, + 0.6818, + 0.6749, + 0.6772, + 0.6934, + 0.694, + 0.6881, + 0.6835, + 0.6787, + 0.6872, + 0.7081, + 0.7135, + 0.7349, + 0.7261, + 0.7292, + 0.7292, + 0.7298, + 0.7329, + 0.7202, + 0.7235, + 0.7237, + 0.7284, + 0.7367, + 0.7329, + 0.7328, + 0.7355, + 0.7306, + 0.7288, + 0.731, + 0.7444, + 0.7426, + 0.7406, + 0.7403, + 0.7323, + 0.7344, + 0.7309, + 0.7275, + 0.7286, + 0.7301, + 0.7334, + 0.7389, + 0.7237, + 0.734, + 0.7472, + 0.7479, + 0.7468, + 0.7487, + 0.7464, + 0.7523, + 0.7524, + 0.7528, + 0.753, + 0.7511, + 0.7528, + 0.7546, + 0.7523, + 0.7553, + 0.7583, + 0.7551, + 0.7559, + 0.7534, + 0.7548, + 0.7541, + 0.7561, + 0.7552, + 0.7551 + ], + "test_acc": [ + 0.608, + 0.7325, + 0.725, + 0.7065, + 0.6975, + 0.671, + 0.6655, + 0.671, + 0.641, + 0.651, + 0.638, + 0.623, + 0.617, + 0.6505, + 0.633, + 0.6655, + 0.647, + 0.648, + 0.66, + 0.6445, + 0.656, + 0.6565, + 0.656, + 0.6785, + 0.6985, + 0.7075, + 0.7025, + 0.7125, + 0.711, + 0.715, + 0.71, + 0.71, + 0.706, + 0.6895, + 0.703, + 0.7085, + 0.7065, + 0.706, + 0.703, + 0.707, + 0.6915, + 0.7005, + 0.702, + 0.6995, + 0.7135, + 0.71, + 0.6905, + 0.7045, + 0.699, + 0.692, + 0.6975, + 0.687, + 0.707, + 0.7, + 0.688, + 0.7115, + 0.7185, + 0.722, + 0.72, + 0.707, + 0.7295, + 0.725, + 0.725, + 0.724, + 0.722, + 0.7175, + 0.7195, + 0.715, + 0.719, + 0.7185, + 0.719, + 0.716, + 0.7165, + 0.7175, + 0.716, + 0.7175, + 0.7175, + 0.7155, + 0.718, + 0.718 + ], + "state_pred_error": [ + 0.6709408867359161, + 0.18942265737056732, + 0.14080595693588258, + 0.1511134099006653, + 0.17209407310485839, + 0.1766144100666046, + 0.17131005449295045, + 0.16910524086952208, + 0.1503032527923584, + 0.14637641661167144, + 0.1414107642650604, + 0.12289449031352997, + 0.0937490943312645, + 0.07194982548952103, + 0.06582723281383514, + 0.0680177249968052, + 0.0612314338862896, + 0.05455904011726379, + 0.05373732958436012, + 0.05378581196665764, + 0.052673121321201326, + 0.04773973789215088, + 0.04812903320789337, + 0.05376589905619621, + 0.05221608868837357, + 0.0511037185549736, + 0.04819248498678207, + 0.04678433921933174, + 0.047127060896158215, + 0.04397982689738274, + 0.04087346328496933, + 0.04046012075543404, + 0.04122381027340889, + 0.04241861761212349, + 0.042094694751501086, + 0.0412453974545002, + 0.038724960923194884, + 0.03562711297273636, + 0.03296822139620781, + 0.0325114149659872, + 0.03283161758184433, + 0.035513292720913886, + 0.035710234045982364, + 0.03682430787086487, + 0.033476365625858304, + 0.03093737213909626, + 0.027777787262201308, + 0.02414869005382061, + 0.020448731756210328, + 0.017831652319431304, + 0.015582082697749139, + 0.014428501343727113, + 0.012960297419130802, + 0.012180000832676887, + 0.011530775272846221, + 0.010874310192465783, + 0.010527618415653705, + 0.010202822449803353, + 0.00984742543399334, + 0.009536775915324688, + 0.009180539272725581, + 0.008970437014102935, + 0.008827724769711495, + 0.008530926664918661, + 0.008309092213958503, + 0.008101929514110089, + 0.008094769676029682, + 0.007767554499208927, + 0.007610894358158112, + 0.007408130565285683, + 0.007262326770275831, + 0.007150135292857886, + 0.007085654979944229, + 0.0073706810601055625, + 0.006943213131278754, + 0.0066695098660886284, + 0.006669323475658894, + 0.006493967983126641, + 0.006413866003602743, + 0.006445458614826202 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8429861068725586, + 0.3551006317138672, + 0.246289923787117, + 0.21019335091114044, + 0.17309927940368652, + 0.14295682311058044, + 0.15966862440109253, + 0.13815715909004211 + ], + "perturbation_rho": [ + 0.7732758522033691, + 0.2933464050292969, + 0.24295836687088013, + 0.22880345582962036, + 0.1602117419242859, + 0.11042392998933792, + 0.18763291835784912, + 0.14856110513210297 + ], + "nudging": { + "0.001": [ + -0.017513541504740715, + -0.0010910499840974808, + -0.000708599342033267, + -0.0005966786993667483, + -0.00047664318117313087, + -0.0004276464751455933, + -0.0004729896318167448, + -0.0004151453322265297 + ], + "0.003": [ + -0.05139407142996788, + -0.003268325934186578, + -0.0021239686757326126, + -0.0017886366695165634, + -0.0014290767721831799, + -0.0012818754184991121, + -0.0014177404809743166, + -0.0012440300779417157 + ], + "0.01": [ + -0.15847395360469818, + -0.010836342349648476, + -0.007060050964355469, + -0.005947217810899019, + -0.004753550048917532, + -0.004264200571924448, + -0.004713424481451511, + -0.0041376142762601376 + ] + }, + "state_pred_error_per_layer": [ + 3389.93017578125, + 4477.634765625, + 1038.2586669921875, + 911.949951171875, + 702.6972045898438, + 659.9431762695312, + 824.164794921875, + 821.9293212890625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2660294412612916, + 1.3016457880973815, + 0.8186747265815735, + 0.6697447069168091, + 0.5803643805503845, + 0.5512525676727295, + 0.549796287727356, + 0.5450847043991088, + 0.5275615032196045, + 0.5319187931060791, + 0.5584789258956909, + 0.6303564451217651, + 0.6530141715049743, + 0.647641095161438, + 0.6535977718353272, + 0.6668755978107452, + 0.6444538109302521, + 0.7376987361907958, + 0.8571814809799194, + 0.8484122044563294, + 0.7817753293991089, + 0.8637002775192261, + 0.8521189229011535, + 0.8361198561668396, + 0.806985737991333, + 0.7815130719184875, + 0.802376530122757, + 0.8485978384971619, + 0.8367114802360535, + 0.8168601245880127, + 0.7851902055740356, + 0.7358182970046997, + 0.8997399300575256, + 0.9225360271453857, + 0.8570411529541015, + 0.8411993549346923, + 0.9375005828857422, + 0.8463716927528382, + 0.862580227470398, + 1.0098564163208008, + 0.9812262915611267, + 0.8729387621879577, + 0.8571597898483276, + 0.9974828210830688, + 0.8864622016906738, + 1.0887743062019348, + 1.0035358074188232, + 0.9521108211517334, + 0.9903197944641113, + 1.036623720550537, + 1.0008409860610963, + 1.0380868854522705, + 1.1012060861587525, + 1.0651326690673828, + 1.1333419822692872, + 1.0603330505371094, + 1.0721593137741088, + 1.0658496725082398, + 1.0947151290893555, + 1.099305485343933, + 1.0801114864349366, + 1.0791620138168334, + 1.0618044708251952, + 1.0570447917938233, + 1.0758753734588622, + 1.0394710207939148, + 1.029822176551819, + 1.041756462097168, + 1.0217557413101197, + 1.0205562198638916, + 1.0147280132293701, + 1.0095306674957276, + 1.001978309726715, + 0.9974158168792725, + 0.9953814093589782, + 0.9926533555030823, + 0.9918749931335449, + 0.9889670114517212, + 0.9879606288909912, + 0.9873974003791809 + ], + "train_acc": [ + 0.1797, + 0.5356, + 0.6972, + 0.7485, + 0.7819, + 0.7901, + 0.7974, + 0.8001, + 0.8077, + 0.8076, + 0.8072, + 0.79, + 0.7937, + 0.7962, + 0.7957, + 0.8015, + 0.8017, + 0.7861, + 0.7668, + 0.7721, + 0.7765, + 0.7621, + 0.7721, + 0.7745, + 0.7768, + 0.7865, + 0.7782, + 0.7703, + 0.7686, + 0.7611, + 0.752, + 0.7558, + 0.7123, + 0.6954, + 0.7044, + 0.7167, + 0.6963, + 0.7005, + 0.6968, + 0.6591, + 0.6589, + 0.6849, + 0.6881, + 0.6512, + 0.6785, + 0.6251, + 0.6467, + 0.6578, + 0.6456, + 0.6288, + 0.6419, + 0.6188, + 0.6092, + 0.6176, + 0.6027, + 0.6198, + 0.6133, + 0.6127, + 0.6121, + 0.6075, + 0.6127, + 0.6089, + 0.6184, + 0.6212, + 0.6156, + 0.6286, + 0.6251, + 0.626, + 0.6275, + 0.6322, + 0.6357, + 0.6335, + 0.6347, + 0.6367, + 0.6371, + 0.6398, + 0.6414, + 0.6418, + 0.6432, + 0.6433 + ], + "test_acc": [ + 0.3745, + 0.6335, + 0.7105, + 0.7265, + 0.7415, + 0.763, + 0.7755, + 0.7625, + 0.769, + 0.769, + 0.748, + 0.7415, + 0.728, + 0.75, + 0.739, + 0.7405, + 0.733, + 0.706, + 0.7025, + 0.737, + 0.715, + 0.7405, + 0.7475, + 0.722, + 0.7435, + 0.7475, + 0.7205, + 0.7215, + 0.713, + 0.687, + 0.7035, + 0.685, + 0.6305, + 0.6265, + 0.6465, + 0.594, + 0.613, + 0.624, + 0.583, + 0.568, + 0.6055, + 0.5875, + 0.572, + 0.636, + 0.5545, + 0.508, + 0.585, + 0.5945, + 0.5505, + 0.5855, + 0.563, + 0.534, + 0.55, + 0.5745, + 0.5905, + 0.567, + 0.587, + 0.532, + 0.554, + 0.5735, + 0.5795, + 0.5895, + 0.58, + 0.5915, + 0.601, + 0.599, + 0.6035, + 0.588, + 0.6105, + 0.6085, + 0.6065, + 0.6115, + 0.6185, + 0.6245, + 0.619, + 0.62, + 0.6225, + 0.617, + 0.618, + 0.6185 + ], + "value_loss": [ + 3.06523074798584, + 1.0051734189987183, + 0.9336865198135376, + 0.8656800090789795, + 0.7873764232635498, + 0.781440449142456, + 0.7908254833221435, + 0.8565213081359864, + 0.8310571252822876, + 0.8515260807037354, + 0.9407390365600586, + 1.1463200833320617, + 1.3171742897033691, + 1.262915803527832, + 1.386610294342041, + 1.402245961523056, + 1.353079345226288, + 1.6632261469364167, + 2.160128380584717, + 2.152520423412323, + 2.048775052833557, + 2.179873471832275, + 2.0917932035446167, + 2.110498323726654, + 2.0249694913864134, + 1.9754539145469665, + 2.0863923776626585, + 2.2604428833007812, + 1.882617956161499, + 1.6480644565582276, + 1.4238870953798295, + 1.0796037145614623, + 1.2265830523490906, + 1.1315664192199708, + 0.8243012958526611, + 1.5025688316345214, + 1.2351813243865968, + 1.0440775310993196, + 0.8022228635787964, + 0.9494114886283874, + 1.6274977996826172, + 0.7025753731250763, + 0.6086838336467743, + 0.85253525390625, + 0.5798639675140381, + 0.9239351823806763, + 0.7397382484912872, + 0.5377552442789078, + 0.5661793855428696, + 0.591952879333496, + 0.5815083159923553, + 0.5666080118179321, + 0.6167471637010574, + 0.5116942359924317, + 0.6500419594287873, + 0.5058183356523513, + 0.5127271728992462, + 0.5146393095970154, + 0.513179197883606, + 0.5277192692756653, + 0.5301190893173218, + 0.4902091938018799, + 0.4643077433586121, + 0.46406279153823854, + 0.47324425945281984, + 0.4390524193763733, + 0.43308766808509824, + 0.4483348261833191, + 0.45758007364273073, + 0.4258517781257629, + 0.40843180713653565, + 0.39923065466880797, + 0.3923787565469742, + 0.39694422893524167, + 0.388149334526062, + 0.3989525201797485, + 0.3880426513195038, + 0.38228393292427065, + 0.3847649987220764, + 0.3728706964492798 + ], + "term_loss": [ + 1.759378063583374, + 0.6950865835666656, + 0.7524722458839417, + 0.7025897565841674, + 0.630735333108902, + 0.6144626032829285, + 0.6203483947753906, + 0.6912198863983154, + 0.6812775425195694, + 0.7021899845123291, + 0.7890356311798096, + 0.9806006479740143, + 1.1520600126743317, + 1.0969103591918945, + 1.218403604888916, + 1.234606753462553, + 1.1846878055810928, + 1.4810678904533385, + 1.9551898319244385, + 1.9328652121543883, + 1.8252225715637207, + 1.9255873363494873, + 1.8419472370386123, + 1.8514944805145264, + 1.7480499786376953, + 1.7230984504699707, + 1.7801577151060104, + 1.9261333221912385, + 1.5824289985656739, + 1.3395356185913085, + 1.1190976068019867, + 0.8095712727546692, + 0.9129751841545105, + 0.8099967944145202, + 0.5449157089233398, + 1.1429317752838135, + 0.8717972569465637, + 0.7612683668017387, + 0.5363850374221801, + 0.6509348512649537, + 1.2403230022907257, + 0.44119430227279666, + 0.36985179181098937, + 0.5657508541107178, + 0.3316444114685059, + 0.6092286487579346, + 0.45416003305912017, + 0.2803884910583496, + 0.30142446330189704, + 0.32512425956726076, + 0.31511888599395754, + 0.2933908362150192, + 0.3304207047402859, + 0.23888909721374513, + 0.3518457849144936, + 0.2321460828304291, + 0.23690145794153214, + 0.24031942974328996, + 0.234180108833313, + 0.2491055172920227, + 0.2518234708428383, + 0.21771380550265312, + 0.19746038370132446, + 0.19613629539012908, + 0.20217996973991395, + 0.17647680728435516, + 0.1724887050151825, + 0.18513125069141387, + 0.19194528245925904, + 0.16750827902555465, + 0.15352465214729308, + 0.1455474760055542, + 0.1407638990163803, + 0.14426077477931976, + 0.13678922175168992, + 0.1451073505997658, + 0.13600888509750367, + 0.1320053924381733, + 0.13196719620227815, + 0.12118487646579743 + ], + "bridge_loss": [ + 1.0057456545681402, + 0.07984932231307029, + 0.006921142427995801, + 0.0070113932192325595, + 0.014598682332038879, + 0.028220770037174225, + 0.03126658735275269, + 0.026600006234645843, + 0.015867197705805303, + 0.015546117241680622, + 0.012967191728949546, + 0.015010805013775826, + 0.01505515177845955, + 0.016979839408397673, + 0.017059055781364442, + 0.021047090664505958, + 0.023958049084246157, + 0.022573659014701843, + 0.029818001449108122, + 0.044388598722219466, + 0.05576009316444397, + 0.07712252329587936, + 0.07596050485372544, + 0.089072286555171, + 0.1078504252910614, + 0.08938403369188308, + 0.13860380922555923, + 0.16278210570812227, + 0.12334684269428253, + 0.12987734815478325, + 0.1283024751573801, + 0.09875854194164276, + 0.1132021647453308, + 0.114243505692482, + 0.07930920803546905, + 0.16031358633041382, + 0.1483750568330288, + 0.07615681183040142, + 0.05947322273850441, + 0.06707281012535095, + 0.1555256877541542, + 0.04927767667770386, + 0.027832713788747788, + 0.05109234853982925, + 0.03510485389232636, + 0.06433321557044983, + 0.0509399315007031, + 0.029501312471553683, + 0.029298018515110016, + 0.022007736629247664, + 0.026509742373228073, + 0.02547568997144699, + 0.028158922368288042, + 0.01945364822745323, + 0.032367846205830574, + 0.021171480375528337, + 0.02125774438381195, + 0.021097413665056228, + 0.02262683149129152, + 0.021077597737312315, + 0.022499435234069824, + 0.017363783645629884, + 0.01511413771212101, + 0.016478369894623757, + 0.018426007288694382, + 0.01539817702770233, + 0.015168809753656387, + 0.017221828517317773, + 0.022410498839616776, + 0.015976610014587642, + 0.013848819640278816, + 0.012749422067403794, + 0.012547081257402897, + 0.014398891832679511, + 0.013543046182394028, + 0.01616565254330635, + 0.015339582663774491, + 0.014028705531358718, + 0.016140032187104227, + 0.015310661105066539 + ], + "tgrad_loss": [ + 0.30010702733993533, + 0.23023750939369203, + 0.17429312868118285, + 0.15607886154651643, + 0.14204240217208863, + 0.1387570774078369, + 0.13921050038337707, + 0.13870142607688904, + 0.13391238613128661, + 0.13378998804092407, + 0.13873620960712432, + 0.15070862843990326, + 0.1500591349840164, + 0.14902560558319092, + 0.15114763839244844, + 0.1465921157836914, + 0.14443349993228913, + 0.15958458815813065, + 0.17512055349349975, + 0.17526660327911378, + 0.16779239134788512, + 0.1771635971069336, + 0.17388546850681305, + 0.16993154878616332, + 0.16906907887458802, + 0.16297144203186034, + 0.16763084147572518, + 0.17152745275497436, + 0.17684210817813872, + 0.17865150032043456, + 0.17648701427578925, + 0.17127388672828675, + 0.20040569903850555, + 0.2073261212348938, + 0.20007638354301452, + 0.1993234664916992, + 0.21500900251865387, + 0.206652339220047, + 0.20636459765434265, + 0.23140381593704223, + 0.2316491063594818, + 0.21210338969230652, + 0.21099932672977448, + 0.23569203791618348, + 0.21311470336914062, + 0.25037331929206846, + 0.23463827657699585, + 0.2278654456615448, + 0.23545689868927003, + 0.2448208836555481, + 0.2398796889066696, + 0.2477414860725403, + 0.25816753516197205, + 0.2533514893531799, + 0.26582832283973695, + 0.2525007682800293, + 0.2545679742336273, + 0.25322246961593625, + 0.25637225708961486, + 0.25753615407943725, + 0.25579618854522707, + 0.25513160409927366, + 0.2517332214355469, + 0.25144813041687014, + 0.2526382836341858, + 0.2471774356842041, + 0.24543014860153198, + 0.24598174903392792, + 0.2432242931842804, + 0.24236688857078553, + 0.24105833854675293, + 0.24093375723361968, + 0.23906777582168579, + 0.23828456206321716, + 0.23781706585884094, + 0.23767951769828796, + 0.2366941836833954, + 0.23624983654022216, + 0.23665776674747466, + 0.23637515988349914 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.024487923830747604, + 0.1551763117313385, + 0.17440856993198395, + 0.18776318430900574, + 0.163284569978714, + 0.17855775356292725, + 0.162883460521698, + 0.17358574271202087 + ], + "perturbation_rho": [ + 0.024775028228759766, + 0.25605684518814087, + 0.2314496785402298, + 0.2697882056236267, + 0.24329833686351776, + 0.3152206242084503, + 0.23843368887901306, + 0.2751646637916565 + ], + "nudging": { + "0.001": [ + -0.0010546729899942875, + -0.0011491177137941122, + -0.001177083933725953, + -0.0012467143824324012, + -0.0011091993656009436, + -0.0011924341088160872, + -0.0011279901955276728, + -0.0011755195446312428 + ], + "0.003": [ + -0.0031479522585868835, + -0.0034450858365744352, + -0.00352866156026721, + -0.0037402876187115908, + -0.0033245475497096777, + -0.0035774726420640945, + -0.0033813398331403732, + -0.0035263618919998407 + ], + "0.01": [ + -0.010280786082148552, + -0.011451397091150284, + -0.01173271145671606, + -0.012431012466549873, + -0.01105603575706482, + -0.011893808841705322, + -0.011241357773542404, + -0.011722835712134838 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L8_s42.json b/results/synth_ladder_v2_hi/synth_a0.5_L8_s42.json new file mode 100644 index 0000000..75ed461 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L8_s42.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.1754807784080505, + 0.5181709585666656, + 0.4592852454185486, + 0.48108175311088563, + 0.36512076749801636, + 0.34354006390571595, + 0.3322723610162735, + 0.297065003323555, + 0.3262266932606697, + 0.28987626616954804, + 0.30052861709594725, + 0.30294343957901, + 0.33569810996055605, + 0.2807107723712921, + 0.24509782445430756, + 0.22368610286712645, + 0.2224589084148407, + 0.22678682289123536, + 0.23643300566673278, + 0.261921722304821, + 0.18664481525421142, + 0.2196642207145691, + 0.17971987835168837, + 0.15603925316333772, + 0.14970590219497681, + 0.21505068674087524, + 0.20973155901432036, + 0.18755916361808778, + 0.15954147424697876, + 0.1524156427383423, + 0.1794239527463913, + 0.14108568379878997, + 0.13159887236356735, + 0.11600628448724747, + 0.1008336604475975, + 0.09575988247394562, + 0.09875326882600784, + 0.09757538337707519, + 0.0814407280921936, + 0.1022400197148323, + 0.09087320072650909, + 0.08520868092179298, + 0.06907072774618864, + 0.05944656895399093, + 0.06366101975440978, + 0.07264506211280823, + 0.08344530180692673, + 0.06239017713665962, + 0.05024316610693932, + 0.044702837443351746, + 0.045005498057976365, + 0.03973149275779724, + 0.04285087337195873, + 0.03791879476606846, + 0.0346739610761404, + 0.03288826472461224, + 0.031093527680635454, + 0.03032451833486557, + 0.03242490175962448, + 0.030104601883888246, + 0.028860807363316417, + 0.027365653735399245, + 0.027397248911857606, + 0.026892173463106156, + 0.025769270791113377, + 0.02494896683692932, + 0.02501359928548336, + 0.024235507121682168, + 0.023822496247291564, + 0.02354036187529564, + 0.023214907813072203, + 0.023110688921809196, + 0.022794095242023468, + 0.022592110830545426, + 0.0224503764398396, + 0.02231179800629616, + 0.02221992956995964, + 0.02214076687693596, + 0.022098414012789728, + 0.022070704632252455 + ], + "train_acc": [ + 0.5833, + 0.7995, + 0.8206, + 0.8106, + 0.8579, + 0.8631, + 0.8703, + 0.8866, + 0.8694, + 0.8846, + 0.8829, + 0.882, + 0.8702, + 0.888, + 0.9044, + 0.9149, + 0.9147, + 0.9108, + 0.9112, + 0.8992, + 0.9269, + 0.9152, + 0.9309, + 0.9441, + 0.9445, + 0.9223, + 0.919, + 0.93, + 0.9399, + 0.943, + 0.9314, + 0.949, + 0.953, + 0.9601, + 0.966, + 0.9715, + 0.9683, + 0.9679, + 0.9768, + 0.9662, + 0.9716, + 0.9727, + 0.9824, + 0.9876, + 0.985, + 0.9808, + 0.973, + 0.9843, + 0.9903, + 0.9935, + 0.9935, + 0.9959, + 0.9938, + 0.9957, + 0.9974, + 0.9976, + 0.9983, + 0.9982, + 0.9974, + 0.9979, + 0.9984, + 0.9988, + 0.9984, + 0.999, + 0.9987, + 0.9991, + 0.9991, + 0.9994, + 0.9993, + 0.9993, + 0.9996, + 0.9993, + 0.9995, + 0.9994, + 0.9994, + 0.9995, + 0.9996, + 0.9996, + 0.9995, + 0.9995 + ], + "test_acc": [ + 0.7705, + 0.82, + 0.8285, + 0.8205, + 0.823, + 0.824, + 0.8385, + 0.845, + 0.8365, + 0.846, + 0.838, + 0.8475, + 0.833, + 0.8455, + 0.833, + 0.8555, + 0.8565, + 0.8535, + 0.8545, + 0.849, + 0.8605, + 0.853, + 0.86, + 0.862, + 0.869, + 0.867, + 0.856, + 0.862, + 0.8655, + 0.8665, + 0.8545, + 0.86, + 0.862, + 0.8595, + 0.8675, + 0.863, + 0.8745, + 0.8655, + 0.867, + 0.872, + 0.873, + 0.875, + 0.871, + 0.8765, + 0.875, + 0.874, + 0.86, + 0.8715, + 0.87, + 0.8705, + 0.872, + 0.873, + 0.8755, + 0.8685, + 0.871, + 0.8735, + 0.87, + 0.872, + 0.874, + 0.871, + 0.8715, + 0.8725, + 0.873, + 0.871, + 0.871, + 0.872, + 0.8705, + 0.8715, + 0.873, + 0.871, + 0.8695, + 0.8695, + 0.87, + 0.8715, + 0.87, + 0.87, + 0.8715, + 0.8715, + 0.8715, + 0.8715 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8294941186904907, + 0.823101282119751, + 0.815970778465271, + 0.8095235824584961, + 0.8066394329071045, + 0.8012610673904419, + 0.7956615686416626, + 0.7900899648666382 + ], + "perturbation_rho": [ + 0.999998927116394, + 0.999997615814209, + 0.9999938011169434, + 0.9999845027923584, + 0.9999604225158691, + 0.9999330043792725, + 0.999873697757721, + 0.999819278717041 + ], + "nudging": { + "0.001": [ + -0.035539593547582626, + -0.021562810987234116, + -0.012927833944559097, + -0.007899895310401917, + -0.005169217474758625, + -0.0036920299753546715, + -0.0028583952225744724, + -0.002364233136177063 + ], + "0.003": [ + -0.0985700860619545, + -0.0616692453622818, + -0.037691134959459305, + -0.023295730352401733, + -0.015336824581027031, + -0.01098954863846302, + -0.008523097261786461, + -0.007056646980345249 + ], + "0.01": [ + -0.2528620958328247, + -0.17482446134090424, + -0.11384513974189758, + -0.07313278317451477, + -0.04917728155851364, + -0.03563641011714935, + -0.02781001478433609, + -0.02310660108923912 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.1838191192626955, + 1.202098671722412, + 0.7546534229278564, + 0.6286930981874466, + 0.5413522202730179, + 0.5016274568080902, + 0.4973876078605652, + 0.5006243084907531, + 0.491056324505806, + 0.5162841996192932, + 0.503458097076416, + 0.5122841632843017, + 0.6047590888977051, + 0.5742595722198486, + 0.6101696805477143, + 0.5846948350906372, + 0.6041797488331795, + 0.5839841031074524, + 0.6028947599411011, + 0.6573390657663345, + 0.6277515439033509, + 0.7153009181976319, + 0.6114065330982208, + 0.7203419920444488, + 0.704536079788208, + 0.7316081617355347, + 0.7904250410079956, + 0.7298012476921082, + 0.9584419759750367, + 0.7364888837814331, + 0.7200859572410584, + 0.7152903346061706, + 0.7418321360588074, + 0.6785042297184467, + 0.7197946992874146, + 0.7295546224594116, + 0.7811001716613769, + 0.7459795353889466, + 0.7168794848442077, + 0.8068981638908386, + 0.6808593973636627, + 0.6812150555133819, + 0.6748936148405075, + 0.7090878666877747, + 0.6815416418075562, + 0.7244775035858154, + 0.7989970844268799, + 0.7369783718109131, + 0.6676865758895874, + 0.6741015150070191, + 0.6873524452403188, + 0.6283843026161194, + 0.6744810340195895, + 0.6269000155448914, + 0.7053837902069092, + 0.647765721988678, + 0.6138295706748962, + 0.6056019225120545, + 0.6158565293312073, + 0.6043323511123657, + 0.6008664073240012, + 0.5667676944732666, + 0.5763443781375885, + 0.5698577795982361, + 0.5726742564201355, + 0.5617806459903717, + 0.5556433219909668, + 0.5606436388015748, + 0.5541526489257812, + 0.5531132131576538, + 0.5459820462226868, + 0.5402892316818237, + 0.5384351867675782, + 0.5412482352614403, + 0.5334744161128998, + 0.5311016474723816, + 0.5313176528930664, + 0.5276195110797882, + 0.526644831725955, + 0.5260294675350189 + ], + "train_acc": [ + 0.2066, + 0.5772, + 0.7178, + 0.7667, + 0.7971, + 0.8116, + 0.8113, + 0.8184, + 0.8219, + 0.8197, + 0.8231, + 0.8219, + 0.8026, + 0.814, + 0.8081, + 0.8205, + 0.8152, + 0.8241, + 0.8169, + 0.8076, + 0.8168, + 0.8118, + 0.8261, + 0.8074, + 0.8136, + 0.811, + 0.8037, + 0.8151, + 0.7895, + 0.8177, + 0.8222, + 0.819, + 0.8215, + 0.8305, + 0.8227, + 0.8213, + 0.8166, + 0.8222, + 0.8271, + 0.814, + 0.8341, + 0.8325, + 0.8348, + 0.8234, + 0.8302, + 0.825, + 0.818, + 0.8222, + 0.8356, + 0.8346, + 0.8324, + 0.8422, + 0.8386, + 0.8419, + 0.8283, + 0.8399, + 0.8478, + 0.8481, + 0.8417, + 0.848, + 0.8489, + 0.8569, + 0.8523, + 0.8537, + 0.8533, + 0.8548, + 0.8574, + 0.8564, + 0.8571, + 0.8579, + 0.8587, + 0.8613, + 0.8608, + 0.8598, + 0.8623, + 0.8616, + 0.8606, + 0.8618, + 0.8622, + 0.8617 + ], + "test_acc": [ + 0.4245, + 0.633, + 0.7, + 0.7355, + 0.7595, + 0.771, + 0.781, + 0.776, + 0.7695, + 0.7775, + 0.785, + 0.7285, + 0.7645, + 0.7665, + 0.7315, + 0.7645, + 0.742, + 0.767, + 0.7485, + 0.772, + 0.7575, + 0.769, + 0.739, + 0.715, + 0.723, + 0.721, + 0.755, + 0.685, + 0.7375, + 0.747, + 0.7845, + 0.7575, + 0.788, + 0.7475, + 0.7465, + 0.734, + 0.786, + 0.7485, + 0.7305, + 0.7745, + 0.7775, + 0.779, + 0.756, + 0.7395, + 0.784, + 0.7605, + 0.7665, + 0.7785, + 0.77, + 0.7655, + 0.7925, + 0.7745, + 0.7755, + 0.7855, + 0.764, + 0.785, + 0.777, + 0.769, + 0.783, + 0.792, + 0.7985, + 0.807, + 0.803, + 0.803, + 0.8035, + 0.8065, + 0.7965, + 0.7995, + 0.8065, + 0.811, + 0.8015, + 0.8015, + 0.8035, + 0.8, + 0.8, + 0.8045, + 0.8025, + 0.806, + 0.8045, + 0.804 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.029147807508707047, + 0.09590217471122742, + 0.0916377604007721, + 0.10714393854141235, + 0.10661958158016205, + 0.05731643736362457, + 0.06447312980890274, + 0.05185993015766144 + ], + "perturbation_rho": [ + -0.08288859575986862, + 0.14039787650108337, + 0.1433517336845398, + 0.1548803746700287, + 0.09298646450042725, + 0.08800182491540909, + 0.09949750453233719, + 0.02763376198709011 + ], + "nudging": { + "0.001": [ + 0.0017877263016998768, + -0.000630493275821209, + -0.00031784665770828724, + -0.00033820740645751357, + -0.0003272043541073799, + -0.00018869461200665683, + -0.0002295648882864043, + -0.00016335875261574984 + ], + "0.003": [ + 0.005449830554425716, + -0.001886849058791995, + -0.0009509308729320765, + -0.0010138512589037418, + -0.0009805148001760244, + -0.0005645205965265632, + -0.0006858182605355978, + -0.00048740144120529294 + ], + "0.01": [ + 0.019184602424502373, + -0.0062692309729754925, + -0.0031640869565308094, + -0.0033698435872793198, + -0.003262510057538748, + -0.0018756084609776735, + -0.0022803605534136295, + -0.0016227040905505419 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7473140567779541, + 0.9251619996070862, + 0.7068822136878967, + 0.6734603995323181, + 0.7457750282287597, + 0.8054894256591797, + 0.8525734433174134, + 0.8588375370025635, + 0.8834347763061523, + 0.8960849166870117, + 0.9051341072082519, + 0.9054860986709595, + 0.9049023498535156, + 0.9338330560684204, + 0.8942585109710693, + 0.866205068397522, + 0.8675411263465881, + 0.8408319032192231, + 0.8157361579895019, + 0.8383380194664002, + 0.7929928570747375, + 0.8159124660491943, + 0.8006898342132568, + 0.7805020513534546, + 0.7467561506271362, + 0.7769838253021241, + 0.740959705066681, + 0.7387035996437072, + 0.7201678607463836, + 0.7209407108306884, + 0.7474315497398376, + 0.7333630378723145, + 0.7624125885009766, + 0.7098405016899109, + 0.7155334932327271, + 0.7373080111503602, + 0.6897648265838623, + 0.7116705716133118, + 0.6977139730453491, + 0.689065051651001, + 0.7276701536178589, + 0.726329208946228, + 0.7151447709083557, + 0.7019258667945861, + 0.7494557568073272, + 0.7007609943389893, + 0.7020422275543213, + 0.6922769821166992, + 0.6776938212394714, + 0.6798969288825989, + 0.6656915367126465, + 0.6746529310703278, + 0.6393669857978821, + 0.6383698108673096, + 0.6358671523094177, + 0.6303783107280732, + 0.6350876825332642, + 0.6365802597522736, + 0.6297786211013794, + 0.6428515602111816, + 0.6437168377876282, + 0.6237785207748413, + 0.6191892197608948, + 0.6191086200714111, + 0.6186483777046203, + 0.6168421429157257, + 0.6117486687660217, + 0.6113159837722778, + 0.6117036319255829, + 0.607511134815216, + 0.6095974473953247, + 0.6053294305801391, + 0.6047506375312806, + 0.6027808818817139, + 0.6011299852371216, + 0.6004490308761596, + 0.5999058860778809, + 0.5991122978210449, + 0.598829758644104, + 0.598610949087143 + ], + "train_acc": [ + 0.364, + 0.6574, + 0.7329, + 0.753, + 0.7398, + 0.7248, + 0.7084, + 0.698, + 0.6894, + 0.6845, + 0.6805, + 0.6781, + 0.6804, + 0.6737, + 0.6854, + 0.6889, + 0.6907, + 0.6997, + 0.7082, + 0.7014, + 0.7176, + 0.7145, + 0.7188, + 0.7206, + 0.7318, + 0.7271, + 0.7373, + 0.735, + 0.7415, + 0.7401, + 0.744, + 0.7405, + 0.7346, + 0.7542, + 0.746, + 0.739, + 0.7483, + 0.751, + 0.7539, + 0.748, + 0.7431, + 0.744, + 0.7449, + 0.7473, + 0.7364, + 0.7478, + 0.7439, + 0.7468, + 0.7538, + 0.7511, + 0.7531, + 0.7538, + 0.7664, + 0.7687, + 0.7632, + 0.7699, + 0.7701, + 0.7688, + 0.7692, + 0.765, + 0.7657, + 0.77, + 0.7734, + 0.7728, + 0.7735, + 0.7713, + 0.7752, + 0.777, + 0.7762, + 0.7752, + 0.7746, + 0.7782, + 0.7776, + 0.7801, + 0.7778, + 0.7788, + 0.7778, + 0.7797, + 0.7787, + 0.7793 + ], + "test_acc": [ + 0.557, + 0.6835, + 0.712, + 0.7145, + 0.693, + 0.687, + 0.6815, + 0.674, + 0.672, + 0.661, + 0.6595, + 0.661, + 0.6535, + 0.6555, + 0.66, + 0.6525, + 0.6575, + 0.6745, + 0.662, + 0.665, + 0.6775, + 0.6725, + 0.6565, + 0.685, + 0.6865, + 0.6955, + 0.6925, + 0.6985, + 0.6935, + 0.674, + 0.7045, + 0.6865, + 0.7, + 0.7075, + 0.679, + 0.706, + 0.7085, + 0.7025, + 0.718, + 0.7025, + 0.7085, + 0.6865, + 0.709, + 0.681, + 0.713, + 0.7125, + 0.714, + 0.7035, + 0.7085, + 0.7075, + 0.7005, + 0.722, + 0.725, + 0.7115, + 0.7165, + 0.728, + 0.7245, + 0.7215, + 0.7265, + 0.7275, + 0.7165, + 0.727, + 0.731, + 0.7285, + 0.7265, + 0.7245, + 0.7275, + 0.7215, + 0.724, + 0.7265, + 0.7285, + 0.723, + 0.7275, + 0.7275, + 0.7275, + 0.728, + 0.729, + 0.7285, + 0.727, + 0.7265 + ], + "state_pred_error": [ + 0.6621009309768677, + 0.18949966685771943, + 0.1467816726922989, + 0.15708787188529968, + 0.17524181332588196, + 0.19041815445423127, + 0.19469740133285524, + 0.19334899117946625, + 0.18909891850948335, + 0.1834290199995041, + 0.1776910136461258, + 0.1693726092338562, + 0.1593346801996231, + 0.15057109451293946, + 0.13607191491127013, + 0.12221740016937256, + 0.11063073590993881, + 0.10139462573528289, + 0.09178647582530976, + 0.08364639749526978, + 0.0763305801987648, + 0.07042970400452614, + 0.06602095465660095, + 0.06487999885678292, + 0.06271354095935822, + 0.061520341455936434, + 0.059059248542785645, + 0.056564629304409024, + 0.05402934091091156, + 0.05196828144788742, + 0.050360298389196395, + 0.0480489935874939, + 0.04519245035648346, + 0.04349969825744629, + 0.04201801525950432, + 0.04072046799659729, + 0.03955439219474793, + 0.03672264353334904, + 0.03492691957950592, + 0.03289650791883469, + 0.03177874554991722, + 0.030649135023355485, + 0.02864566181600094, + 0.02688669348657131, + 0.025244250574707985, + 0.023715209478139876, + 0.021778766030073164, + 0.020335312649607657, + 0.019033752544224264, + 0.018155685628950594, + 0.017363225120306015, + 0.016726057812571526, + 0.01624702921509743, + 0.015930817434191703, + 0.015584588533639908, + 0.015295122048258782, + 0.015127958336472512, + 0.014801454600691795, + 0.014687491267919541, + 0.014063061302900314, + 0.01438164930343628, + 0.01355879987180233, + 0.01320074545443058, + 0.012842133796215058, + 0.01253392604291439, + 0.01236460832208395, + 0.011886253049969674, + 0.011621960616111756, + 0.011426134213805198, + 0.011017198014259339, + 0.010708265140652656, + 0.01054772773683071, + 0.01050231020450592, + 0.010149630855768919, + 0.009902083823084832, + 0.009754141983389855, + 0.009604894667863845, + 0.00941408416479826, + 0.009380772784352303, + 0.009179592244327068 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8188973069190979, + 0.4508240222930908, + 0.20906424522399902, + 0.16529136896133423, + 0.1612900048494339, + 0.1292058229446411, + 0.14780420064926147, + 0.1308501958847046 + ], + "perturbation_rho": [ + 0.7345798015594482, + 0.40806666016578674, + 0.18922817707061768, + 0.1360217034816742, + 0.11187596619129181, + 0.1472519189119339, + 0.12442155927419662, + 0.11949814856052399 + ], + "nudging": { + "0.001": [ + -0.021930836141109467, + -0.0014364664675667882, + -0.0005421066889539361, + -0.0004351946117822081, + -0.00039058327092789114, + -0.0003250233712606132, + -0.00035381075576879084, + -0.00031243677949532866 + ], + "0.003": [ + -0.0643623024225235, + -0.004303464200347662, + -0.0016258403193205595, + -0.0013055813033133745, + -0.0011712429113686085, + -0.0009750650497153401, + -0.0010611845646053553, + -0.0009370018960908055 + ], + "0.01": [ + -0.19829359650611877, + -0.01426965557038784, + -0.005409521050751209, + -0.004344802349805832, + -0.0038992268964648247, + -0.0032464847899973392, + -0.003532196395099163, + -0.00311922375112772 + ] + }, + "state_pred_error_per_layer": [ + 5640.76416015625, + 3768.9912109375, + 2209.80126953125, + 1863.6328125, + 1833.0330810546875, + 2052.747802734375, + 1687.1876220703125, + 1871.18310546875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.186090153121948, + 1.1984385531425477, + 0.758064928817749, + 0.626275444984436, + 0.5633068831443787, + 0.5013768714904785, + 0.5079200323104859, + 0.5059850447654725, + 0.4841378322124481, + 0.519163568687439, + 0.5544459510803222, + 0.5611598224639892, + 0.5388422620296478, + 0.6585407733917237, + 0.576538342666626, + 0.600434935760498, + 0.6034886390686035, + 0.6376714500427246, + 0.6580952283859253, + 0.663741570186615, + 0.7861046495437622, + 0.7275902103424072, + 0.7628611448287964, + 0.8346376148223877, + 0.8310700666427613, + 0.8562221878051758, + 1.003050333881378, + 1.005180773639679, + 1.0375463592529297, + 0.9521340274810791, + 1.0032074150085448, + 1.0618027465820312, + 1.0746233934402465, + 1.0948340304374695, + 1.1240816584587097, + 1.0969329462051391, + 1.1547944499969482, + 1.0115770859718323, + 1.187496001434326, + 1.1422000102996825, + 1.2583707466125489, + 1.1105651211738587, + 1.149918165588379, + 1.156761019897461, + 1.0984439032554627, + 1.153316777420044, + 1.1259891437530518, + 1.1472719621658325, + 1.116767183303833, + 1.0828887168884278, + 1.06634891872406, + 1.1018301118850709, + 1.1700591009140016, + 1.119646194076538, + 1.1126467975616454, + 1.128969659423828, + 1.1335998802185059, + 1.116425537109375, + 1.1152625152587892, + 1.1043034273147583, + 1.1250763381958009, + 1.1375839376449586, + 1.1613730312347412, + 1.114402931690216, + 1.110203257751465, + 1.110114776992798, + 1.0994714338302611, + 1.10834795627594, + 1.0854792390823365, + 1.0907306499481202, + 1.0760109588623046, + 1.0793846405029297, + 1.0701058303833009, + 1.0693202518463134, + 1.0654688898086548, + 1.0643323517799377, + 1.062985421180725, + 1.063136572265625, + 1.0616274564743042, + 1.060890511226654 + ], + "train_acc": [ + 0.2037, + 0.5759, + 0.7201, + 0.7655, + 0.786, + 0.8129, + 0.8139, + 0.8149, + 0.8211, + 0.8163, + 0.8115, + 0.8102, + 0.8227, + 0.8002, + 0.8182, + 0.815, + 0.8163, + 0.8129, + 0.8129, + 0.8135, + 0.7906, + 0.7999, + 0.7921, + 0.769, + 0.7656, + 0.7611, + 0.7238, + 0.7113, + 0.6958, + 0.6976, + 0.6775, + 0.6548, + 0.6512, + 0.6319, + 0.6236, + 0.6178, + 0.611, + 0.6423, + 0.6127, + 0.61, + 0.5833, + 0.6211, + 0.612, + 0.6054, + 0.6155, + 0.6017, + 0.6061, + 0.5974, + 0.6079, + 0.6116, + 0.6099, + 0.6073, + 0.5914, + 0.5991, + 0.6026, + 0.5958, + 0.5946, + 0.6011, + 0.6002, + 0.6053, + 0.5985, + 0.5905, + 0.5887, + 0.5986, + 0.6012, + 0.6023, + 0.604, + 0.6011, + 0.6086, + 0.605, + 0.6125, + 0.6069, + 0.6108, + 0.6143, + 0.6148, + 0.6154, + 0.6165, + 0.6149, + 0.6145, + 0.616 + ], + "test_acc": [ + 0.4205, + 0.6445, + 0.6985, + 0.728, + 0.768, + 0.7555, + 0.7905, + 0.781, + 0.7895, + 0.7495, + 0.7755, + 0.767, + 0.7785, + 0.75, + 0.7695, + 0.7655, + 0.788, + 0.779, + 0.744, + 0.7345, + 0.7575, + 0.754, + 0.7015, + 0.701, + 0.7185, + 0.724, + 0.636, + 0.626, + 0.598, + 0.5585, + 0.579, + 0.579, + 0.5785, + 0.5585, + 0.5555, + 0.444, + 0.5675, + 0.4385, + 0.559, + 0.4735, + 0.5265, + 0.57, + 0.498, + 0.548, + 0.517, + 0.5415, + 0.5515, + 0.4515, + 0.5275, + 0.5605, + 0.5295, + 0.5445, + 0.5505, + 0.5395, + 0.5455, + 0.53, + 0.566, + 0.5735, + 0.579, + 0.587, + 0.56, + 0.569, + 0.575, + 0.5795, + 0.5845, + 0.576, + 0.584, + 0.5885, + 0.59, + 0.5785, + 0.5835, + 0.593, + 0.5875, + 0.5915, + 0.594, + 0.592, + 0.59, + 0.5935, + 0.5955, + 0.5935 + ], + "value_loss": [ + 2.972377465057373, + 0.9248018383979797, + 1.0020131734848023, + 1.001979987335205, + 0.9705457033157349, + 0.8233501838684082, + 0.7766179365158081, + 0.7434081115245819, + 0.6680281215190887, + 0.8222749937057495, + 0.9086565495491028, + 0.9337426007270813, + 0.8717771873474122, + 1.2898138553142549, + 1.0746097915649413, + 1.2781329341888428, + 1.1974793502807617, + 1.34198962059021, + 1.3165509941101075, + 1.5385431747436524, + 1.9559954346179962, + 1.8219638473510742, + 1.7863510093688966, + 2.057444320678711, + 1.9194623096466064, + 1.976530602836609, + 2.3657245763778687, + 2.159454160308838, + 1.9747343505859376, + 1.5638118370056153, + 1.2694459007263184, + 1.2683067232131957, + 1.1694433807373046, + 1.1675490615844726, + 1.0915654657363891, + 1.0240236600875854, + 1.7238075693130492, + 0.835702922821045, + 1.110375917816162, + 0.8499037637710571, + 1.055553258895874, + 1.0895272705078125, + 1.12765179977417, + 0.7910501505374908, + 0.6725261320114135, + 0.734961402130127, + 0.6772283415317535, + 0.6853561975479125, + 0.6990460660934448, + 0.8313457719802857, + 0.5796068740844726, + 0.6480168206691742, + 0.8037886819362641, + 0.5881471869468688, + 0.6110391419410706, + 0.5128450169563293, + 0.5585265712738037, + 0.5103896431922913, + 0.5027615876197815, + 0.5387080775737763, + 0.5066710983276367, + 0.5061055371284485, + 0.5857940488815307, + 0.47782063326835633, + 0.5022022886276245, + 0.45191595425605774, + 0.4483213914871216, + 0.44163735978603363, + 0.44864495878219607, + 0.4398085097312927, + 0.4156592011928558, + 0.4245777335166931, + 0.42239491229057313, + 0.4158617585659027, + 0.4056261803150177, + 0.3981911696434021, + 0.39951434321403506, + 0.40600771880149844, + 0.39831735172271726, + 0.3977136660575867 + ], + "term_loss": [ + 1.7086821298599244, + 0.6393537052154541, + 0.831955358505249, + 0.8549827503204346, + 0.8313716646194458, + 0.6740786487579346, + 0.6076947003364563, + 0.5965874532222748, + 0.538589419388771, + 0.6892606357574463, + 0.7693541362762452, + 0.7941495090007782, + 0.7356539968967438, + 1.1337381413698195, + 0.9334297341823578, + 1.133020539855957, + 1.0501272022247314, + 1.1906745010375976, + 1.1603767150878905, + 1.383775331878662, + 1.7672954069495201, + 1.618180365753174, + 1.5548997764587402, + 1.7815429141998291, + 1.634721337890625, + 1.6693853170394897, + 1.9992852979660034, + 1.7566577983856202, + 1.5732412117004395, + 1.1724922225952148, + 0.9129334537506103, + 0.9116888998031616, + 0.811285630607605, + 0.782278653216362, + 0.6845991757392883, + 0.5974405498027802, + 1.1749914863586426, + 0.455600013923645, + 0.733255504322052, + 0.520190512561798, + 0.697090616607666, + 0.744835383605957, + 0.7489512222290039, + 0.44376978453397753, + 0.3575445245265961, + 0.41143530030250547, + 0.36194814307689666, + 0.35318923025131227, + 0.3714102928161621, + 0.48353575496673584, + 0.2622438941001892, + 0.31617711095809936, + 0.45348238250017164, + 0.2884477474451065, + 0.3248059089899063, + 0.22525122106075288, + 0.27484396206140516, + 0.2325062701702118, + 0.22512192395329475, + 0.26193017570972443, + 0.2302307121038437, + 0.22658776865005492, + 0.29551011357307433, + 0.20677382897138596, + 0.22635481977462768, + 0.17875954384803772, + 0.1794549295425415, + 0.17492746146917343, + 0.1828258805513382, + 0.1739099319458008, + 0.15372597955465317, + 0.15907710464000702, + 0.15855794508755208, + 0.15342277257442474, + 0.14609964501857758, + 0.13945738344192504, + 0.136053040933609, + 0.1458153038263321, + 0.1393143364906311, + 0.13710964921712876 + ], + "bridge_loss": [ + 0.9758284360856575, + 0.06962661180198193, + 0.005672540656849742, + 0.003370350643992424, + 0.006644147405028343, + 0.030381520032882692, + 0.04909406066536903, + 0.026274551457166673, + 0.013745080161094665, + 0.013532327757775783, + 0.0138886878028512, + 0.013557788728922606, + 0.014762255641818047, + 0.01668152751326561, + 0.01626828481554985, + 0.01767303576171398, + 0.020321840810775756, + 0.019734235203266143, + 0.02249946554452181, + 0.022086227571964264, + 0.040416947451233864, + 0.06203577089309693, + 0.08303722366094589, + 0.11707051875591278, + 0.12063585679531097, + 0.13916499671936036, + 0.17566344423294067, + 0.20474205927848815, + 0.1913953489303589, + 0.1900377607345581, + 0.14244086827039718, + 0.12460256059169769, + 0.1259830789089203, + 0.147844007897377, + 0.16582468271255493, + 0.18581496963500976, + 0.3006300089836121, + 0.15080310106873512, + 0.12048298480510712, + 0.07477383016645908, + 0.08642990236282348, + 0.09502357883453369, + 0.12325514240264893, + 0.08798319578170777, + 0.06590155552625657, + 0.06488577566146851, + 0.06051054383516312, + 0.07300690015554429, + 0.07357583614587784, + 0.09772055714130401, + 0.0707737734824419, + 0.0786128630578518, + 0.09063167880773544, + 0.044709685909748074, + 0.03420306581407785, + 0.03227839771509171, + 0.028627947074174882, + 0.025130870291590692, + 0.02522470474541187, + 0.027251064124703406, + 0.023627802783250808, + 0.023905384761095046, + 0.02898607106804848, + 0.01962408951073885, + 0.024935207891464233, + 0.022261195167899133, + 0.020190077558159828, + 0.017063735301792622, + 0.02027609973549843, + 0.019097698336839677, + 0.017230739736557008, + 0.019787984344363213, + 0.020351601561903954, + 0.01930274936258793, + 0.016703577791899443, + 0.016038631775975226, + 0.021321783912181855, + 0.01768758919239044, + 0.017187132662534715, + 0.018799800185859205 + ], + "tgrad_loss": [ + 0.28786688737869265, + 0.2158215215921402, + 0.16438527557849883, + 0.14362689361572265, + 0.13252989099025728, + 0.11889001908302307, + 0.1198291732788086, + 0.12054610551595688, + 0.11569361996650696, + 0.11948202958106995, + 0.12541372295618058, + 0.12603530632257462, + 0.12136093652248382, + 0.13939418510198592, + 0.12491177189350128, + 0.12743936359882355, + 0.12703030982017516, + 0.13158088505268098, + 0.13367481677532195, + 0.13268162167072295, + 0.14828308132886886, + 0.14174770864248276, + 0.1484140252828598, + 0.1588308961868286, + 0.16410512266159058, + 0.16798028388023376, + 0.19077582602500914, + 0.19805429615974426, + 0.21009778094291687, + 0.20128185844421387, + 0.21407157855033873, + 0.23201526298522948, + 0.2321746678352356, + 0.23742639436721802, + 0.24114160361289977, + 0.2407681416273117, + 0.24818605904579163, + 0.2292998040676117, + 0.25663742961883546, + 0.25493942279815673, + 0.27203273811340334, + 0.24966830728054046, + 0.25544544095993044, + 0.2592971650838852, + 0.24908005418777465, + 0.25864032859802244, + 0.25476965675354, + 0.25916006617546083, + 0.25405994086265565, + 0.25008946247100833, + 0.24658920845985413, + 0.25322684478759766, + 0.2596746240615845, + 0.25498975529670714, + 0.25203017072677614, + 0.2553153970241547, + 0.25505466132164, + 0.2527525003910065, + 0.25241495661735536, + 0.24952683820724486, + 0.2528125834941864, + 0.25561238169670103, + 0.261297861289978, + 0.2514227141857147, + 0.2509122602939606, + 0.2508952157974243, + 0.2486763837337494, + 0.24964616248607635, + 0.24554297575950623, + 0.24680087909698487, + 0.2447024793624878, + 0.24571264839172363, + 0.24348536689281464, + 0.243136239695549, + 0.24282296109199525, + 0.24269515240192413, + 0.24213951697349548, + 0.2425048230648041, + 0.24181588273048402, + 0.24180421624183654 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.014968650415539742, + 0.08219218999147415, + 0.12315872311592102, + 0.1350458562374115, + 0.16176681220531464, + 0.1692444086074829, + 0.17282617092132568, + 0.17642942070960999 + ], + "perturbation_rho": [ + 0.09865723550319672, + 0.1636437624692917, + 0.19447889924049377, + 0.2091381549835205, + 0.2243458330631256, + 0.23168572783470154, + 0.2512606978416443, + 0.23721641302108765 + ], + "nudging": { + "0.001": [ + -0.0006243207026273012, + -0.0006085919449105859, + -0.0008320298511534929, + -0.0008824424585327506, + -0.000980146462097764, + -0.0010583256371319294, + -0.001075199106708169, + -0.0010938441846519709 + ], + "0.003": [ + -0.001858972478657961, + -0.001825807150453329, + -0.002494026906788349, + -0.0026476685889065266, + -0.0029380805790424347, + -0.0031721340492367744, + -0.003223641077056527, + -0.0032798685133457184 + ], + "0.01": [ + -0.006006492767482996, + -0.006066862493753433, + -0.008294559083878994, + -0.008802486583590508, + -0.009770728647708893, + -0.010544568300247192, + -0.010718668811023235, + -0.010904812254011631 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a0.5_L8_s456.json b/results/synth_ladder_v2_hi/synth_a0.5_L8_s456.json new file mode 100644 index 0000000..4d3fe23 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a0.5_L8_s456.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.1496125110149384, + 0.5061822664260864, + 0.4693412160873413, + 0.43734210863113404, + 0.3776036578655243, + 0.39574705362319945, + 0.3516918658494949, + 0.33453388838768006, + 0.3495379844665527, + 0.3402368752479553, + 0.3161138860940933, + 0.2867650896936655, + 0.24054993677139283, + 0.2714561710357666, + 0.25964800286293027, + 0.2755970516204834, + 0.24782800941467284, + 0.22855919575691222, + 0.21334439667463304, + 0.20634846214056016, + 0.19688657937049867, + 0.23594446697235108, + 0.23073553504943847, + 0.20792550567090512, + 0.1676195205926895, + 0.1842089424610138, + 0.18720704748630523, + 0.14316579525470732, + 0.17303093489408494, + 0.1381333925008774, + 0.13757353625297547, + 0.14679754115343094, + 0.13663861708641054, + 0.16062574342489241, + 0.11842985030412674, + 0.10145846538543701, + 0.09054735779762269, + 0.1080644615650177, + 0.12051263661384583, + 0.08496876339912414, + 0.09041771185398102, + 0.11978768072724343, + 0.08271067204475403, + 0.09710697619915008, + 0.09531720114350319, + 0.06220439117997885, + 0.05394122452735901, + 0.05304814251065254, + 0.04881165652275085, + 0.06747119562029838, + 0.051796284824609753, + 0.045333140206336976, + 0.04041213118433953, + 0.03992201315760612, + 0.03727436591982841, + 0.037020414257049564, + 0.03644478557109833, + 0.03349559764266014, + 0.033058264112472535, + 0.03204139881432056, + 0.02992909691929817, + 0.030789311078190804, + 0.028830358052253723, + 0.02774413277506828, + 0.027408198833465576, + 0.026751420867443084, + 0.02626628998219967, + 0.02568119297027588, + 0.02794391964673996, + 0.025825911223888397, + 0.025229841116070746, + 0.02475675569474697, + 0.02444171721935272, + 0.02418347292840481, + 0.023966037380695342, + 0.023791261124610903, + 0.02370161115527153, + 0.023618511060625316, + 0.023566739109903576, + 0.023538703203201294 + ], + "train_acc": [ + 0.6047, + 0.8052, + 0.8181, + 0.8276, + 0.8498, + 0.8476, + 0.862, + 0.863, + 0.8633, + 0.8678, + 0.8784, + 0.8865, + 0.9094, + 0.8962, + 0.8993, + 0.8902, + 0.9042, + 0.9135, + 0.9174, + 0.9199, + 0.9245, + 0.9116, + 0.9118, + 0.9205, + 0.9377, + 0.929, + 0.9273, + 0.9482, + 0.9329, + 0.95, + 0.9481, + 0.9471, + 0.9498, + 0.9397, + 0.9585, + 0.9669, + 0.9722, + 0.9615, + 0.9578, + 0.9738, + 0.9706, + 0.9567, + 0.9741, + 0.9684, + 0.9693, + 0.9856, + 0.9907, + 0.9901, + 0.9921, + 0.983, + 0.9894, + 0.9947, + 0.9951, + 0.9956, + 0.9973, + 0.9968, + 0.9967, + 0.9979, + 0.9981, + 0.9983, + 0.9988, + 0.9977, + 0.9988, + 0.999, + 0.9992, + 0.9993, + 0.9995, + 0.9994, + 0.9982, + 0.9996, + 0.9995, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9999, + 0.9999, + 0.9999, + 0.9999 + ], + "test_acc": [ + 0.761, + 0.7965, + 0.798, + 0.8105, + 0.808, + 0.8195, + 0.819, + 0.8365, + 0.8285, + 0.8275, + 0.8305, + 0.824, + 0.8395, + 0.8335, + 0.8365, + 0.8225, + 0.841, + 0.841, + 0.8395, + 0.845, + 0.842, + 0.833, + 0.8505, + 0.8415, + 0.849, + 0.8415, + 0.844, + 0.8435, + 0.8405, + 0.8505, + 0.8515, + 0.847, + 0.841, + 0.848, + 0.852, + 0.8585, + 0.8605, + 0.8535, + 0.857, + 0.854, + 0.8485, + 0.848, + 0.8455, + 0.8575, + 0.856, + 0.8575, + 0.8565, + 0.8585, + 0.8555, + 0.8515, + 0.8575, + 0.8595, + 0.8605, + 0.8595, + 0.861, + 0.8595, + 0.866, + 0.8605, + 0.861, + 0.8605, + 0.8575, + 0.8595, + 0.86, + 0.858, + 0.8575, + 0.8575, + 0.8565, + 0.8575, + 0.857, + 0.857, + 0.8565, + 0.854, + 0.855, + 0.8545, + 0.855, + 0.8555, + 0.8555, + 0.8555, + 0.8555, + 0.8555 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8810831904411316, + 0.8730225563049316, + 0.8656145334243774, + 0.8578245639801025, + 0.8490546345710754, + 0.8397257328033447, + 0.8311692476272583, + 0.8243355751037598 + ], + "perturbation_rho": [ + 0.9999987483024597, + 0.9999980330467224, + 0.9999955892562866, + 0.9999854564666748, + 0.9999719858169556, + 0.999948263168335, + 0.9998974204063416, + 0.9998607039451599 + ], + "nudging": { + "0.001": [ + -0.03612860292196274, + -0.02260003425180912, + -0.013746894896030426, + -0.008408663794398308, + -0.005443554371595383, + -0.003843091195449233, + -0.0029569226317107677, + -0.0024378034286201 + ], + "0.003": [ + -0.09868516772985458, + -0.06405734270811081, + -0.03987570106983185, + -0.024722333997488022, + -0.01612165942788124, + -0.011425917968153954, + -0.008809964172542095, + -0.007272382732480764 + ], + "0.01": [ + -0.23731596767902374, + -0.17453062534332275, + -0.11795195937156677, + -0.07674264907836914, + -0.05135927349328995, + -0.036901768296957016, + -0.028667811304330826, + -0.02376912161707878 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.1675753231048582, + 1.1856547933578492, + 0.7580281761169434, + 0.6381688435554504, + 0.5754390489578247, + 0.5642330053329467, + 0.5420730123996734, + 0.5234871512413025, + 0.5435975284576416, + 0.5557498501777649, + 0.5523532521486282, + 0.5620559630751609, + 0.557824009513855, + 0.6107632051467895, + 0.603276273059845, + 0.6159, + 0.6201973339080811, + 0.6276999963760376, + 0.721551043510437, + 0.7058568975448608, + 0.6804799362182617, + 0.8315831820487976, + 0.8213359106063842, + 0.7040662940979003, + 0.7242366206169129, + 0.7309036163330078, + 0.8841015676498413, + 0.7365514185905456, + 0.7004390016555786, + 0.7948915409207344, + 0.7725572082519532, + 0.7417861236095429, + 0.7524257236361503, + 0.7014043121337891, + 0.8019312177658081, + 0.7336400012016296, + 0.746234344291687, + 0.7332810028076172, + 0.7219296333312988, + 0.663898908996582, + 0.8586195873260498, + 0.766791400718689, + 0.8692042198181152, + 0.6851024099349976, + 0.7478959278404713, + 0.6670105101585388, + 0.6914398956298828, + 0.8393889261245727, + 0.7394916067123413, + 0.6740026753425599, + 0.6510983401298523, + 0.6899495806217194, + 0.6442845206975937, + 0.5954629945755004, + 0.6383736618518829, + 0.6042263046264649, + 0.6990487686634064, + 0.5667548357009887, + 0.6024624797821045, + 0.5855678743302822, + 0.5720387092590332, + 0.5841287456512451, + 0.5879881093502045, + 0.5573869585037231, + 0.5499968002319336, + 0.5739686104774475, + 0.5461770409703255, + 0.5319844762802124, + 0.5512453693389893, + 0.5292456346511841, + 0.528937708568573, + 0.5258590517044067, + 0.5199304915189743, + 0.5163791128158569, + 0.5159513384819031, + 0.5147338192939759, + 0.5139513021469116, + 0.5105164805054665, + 0.5090386550664902, + 0.5086064174175262 + ], + "train_acc": [ + 0.2113, + 0.5768, + 0.7207, + 0.7623, + 0.7827, + 0.7893, + 0.7994, + 0.8061, + 0.8041, + 0.8103, + 0.807, + 0.8079, + 0.8151, + 0.8028, + 0.8134, + 0.8128, + 0.8123, + 0.8091, + 0.7976, + 0.8004, + 0.8062, + 0.7834, + 0.7907, + 0.8099, + 0.8061, + 0.8062, + 0.7875, + 0.8111, + 0.811, + 0.7996, + 0.7993, + 0.808, + 0.8062, + 0.8152, + 0.7973, + 0.8111, + 0.8104, + 0.8107, + 0.8152, + 0.8178, + 0.7866, + 0.8024, + 0.7844, + 0.8167, + 0.8026, + 0.8254, + 0.8192, + 0.7921, + 0.809, + 0.8179, + 0.8206, + 0.8156, + 0.8235, + 0.8322, + 0.8207, + 0.83, + 0.8145, + 0.8345, + 0.8257, + 0.8301, + 0.8322, + 0.8341, + 0.8296, + 0.8373, + 0.8403, + 0.8335, + 0.8369, + 0.8424, + 0.8379, + 0.8438, + 0.841, + 0.8409, + 0.8451, + 0.8438, + 0.8447, + 0.8457, + 0.8451, + 0.8461, + 0.8469, + 0.8469 + ], + "test_acc": [ + 0.409, + 0.647, + 0.72, + 0.737, + 0.733, + 0.7465, + 0.7405, + 0.758, + 0.7695, + 0.744, + 0.7575, + 0.755, + 0.751, + 0.743, + 0.7635, + 0.765, + 0.756, + 0.7515, + 0.7465, + 0.72, + 0.724, + 0.7135, + 0.764, + 0.776, + 0.7465, + 0.663, + 0.738, + 0.756, + 0.7275, + 0.762, + 0.7695, + 0.7285, + 0.7305, + 0.7585, + 0.742, + 0.756, + 0.736, + 0.762, + 0.771, + 0.716, + 0.75, + 0.716, + 0.7745, + 0.75, + 0.7535, + 0.742, + 0.7085, + 0.746, + 0.75, + 0.7585, + 0.753, + 0.78, + 0.7735, + 0.7895, + 0.788, + 0.7515, + 0.7745, + 0.7725, + 0.784, + 0.783, + 0.7705, + 0.7865, + 0.781, + 0.798, + 0.7755, + 0.7975, + 0.802, + 0.7925, + 0.7955, + 0.7955, + 0.7945, + 0.7945, + 0.794, + 0.7985, + 0.797, + 0.798, + 0.8, + 0.799, + 0.7995, + 0.7985 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.027731137350201607, + 0.10604047030210495, + 0.13601002097129822, + 0.07596071809530258, + 0.0985877588391304, + 0.08992618322372437, + 0.1115533858537674, + 0.10418008267879486 + ], + "perturbation_rho": [ + -0.01300876960158348, + 0.12486347556114197, + 0.1899794042110443, + 0.08801613748073578, + 0.11934874951839447, + 0.15905101597309113, + 0.1374979466199875, + 0.167507603764534 + ], + "nudging": { + "0.001": [ + -0.00116775743663311, + -0.0005817725323140621, + -0.0004425079678185284, + -0.0002278374886373058, + -0.00030131125822663307, + -0.0003067472716793418, + -0.00033343967515975237, + -0.00031045585637912154 + ], + "0.003": [ + -0.003487181384116411, + -0.0017464003758504987, + -0.0013272382784634829, + -0.0006842178991064429, + -0.0009047683561220765, + -0.0009237582562491298, + -0.001001371769234538, + -0.0009321005782112479 + ], + "0.01": [ + -0.011210349388420582, + -0.00580610241740942, + -0.004417200107127428, + -0.002277099061757326, + -0.003015844151377678, + -0.0030763214454054832, + -0.003333096392452717, + -0.003100896719843149 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.6784069482803345, + 0.8538369147300721, + 0.6258324602127076, + 0.668401536655426, + 0.7467584712982178, + 0.8377721960067749, + 0.9246440408706665, + 0.9443994323730469, + 0.8772222507476807, + 0.8539061568260193, + 0.8640116756439209, + 0.8537434608459472, + 0.8456798457145691, + 0.8172312419891358, + 0.8153982551574707, + 0.8007552943229675, + 0.794915559387207, + 0.8125922817230224, + 0.8261112766265869, + 0.8598634362220764, + 0.8852636333465577, + 0.8463179750442504, + 0.8648002141952514, + 0.8659900695800781, + 0.8808840075492859, + 0.8678793494224548, + 0.8149205436706543, + 0.8051315529823303, + 0.7829432733535766, + 0.8025028318405152, + 0.806145126914978, + 0.7712487247467041, + 0.7314799781799316, + 0.7506569934844971, + 0.7251035878658295, + 0.7171359412193299, + 0.7223926441192627, + 0.7606710305213928, + 0.7542281196594238, + 0.7664629793167115, + 0.7547179684638977, + 0.7321481575012208, + 0.7432650357246399, + 0.759351619386673, + 0.7231213260650635, + 0.7028192038059234, + 0.7018617664337158, + 0.6897621598243714, + 0.6744844152450562, + 0.661704832649231, + 0.6507027347564698, + 0.651756622838974, + 0.6367372986793518, + 0.6331114406585694, + 0.621852323770523, + 0.6100035942077636, + 0.6207889963150024, + 0.6060253511428833, + 0.6061938572883606, + 0.5996559371948242, + 0.5985591208934784, + 0.594506115436554, + 0.5957340684890747, + 0.5967603279113769, + 0.5868529572486877, + 0.5819584226608276, + 0.5830897835254669, + 0.5751743601322175, + 0.5750890419960022, + 0.5712065260887146, + 0.5768221997261047, + 0.57174985704422, + 0.5698016437530518, + 0.5679710320472717, + 0.5670583985328674, + 0.5655418931007385, + 0.5647730830669403, + 0.564036203956604, + 0.5634859690189361, + 0.5633206834793091 + ], + "train_acc": [ + 0.3775, + 0.6775, + 0.7658, + 0.7622, + 0.7479, + 0.7153, + 0.683, + 0.6745, + 0.6916, + 0.6924, + 0.6903, + 0.6979, + 0.6947, + 0.7022, + 0.7023, + 0.7059, + 0.7174, + 0.7102, + 0.7041, + 0.7003, + 0.6969, + 0.7058, + 0.6969, + 0.6961, + 0.6944, + 0.7061, + 0.7134, + 0.7147, + 0.7232, + 0.7225, + 0.7195, + 0.7299, + 0.7416, + 0.7358, + 0.7423, + 0.7457, + 0.7415, + 0.7298, + 0.7298, + 0.7304, + 0.7341, + 0.7385, + 0.7345, + 0.7343, + 0.7411, + 0.7455, + 0.7503, + 0.7477, + 0.758, + 0.7611, + 0.7653, + 0.7635, + 0.769, + 0.769, + 0.7748, + 0.7762, + 0.7738, + 0.7796, + 0.7799, + 0.7829, + 0.7854, + 0.7821, + 0.7841, + 0.7834, + 0.7892, + 0.7867, + 0.7844, + 0.7916, + 0.7943, + 0.7908, + 0.7905, + 0.7918, + 0.7904, + 0.7928, + 0.7977, + 0.7965, + 0.7967, + 0.7968, + 0.7979, + 0.7976 + ], + "test_acc": [ + 0.5905, + 0.713, + 0.732, + 0.735, + 0.709, + 0.6775, + 0.632, + 0.668, + 0.6925, + 0.6775, + 0.668, + 0.654, + 0.6655, + 0.6685, + 0.6705, + 0.665, + 0.647, + 0.672, + 0.647, + 0.6545, + 0.666, + 0.669, + 0.6395, + 0.654, + 0.6495, + 0.6735, + 0.684, + 0.69, + 0.6515, + 0.6245, + 0.638, + 0.681, + 0.684, + 0.6905, + 0.6955, + 0.6795, + 0.679, + 0.6915, + 0.6655, + 0.683, + 0.6745, + 0.6925, + 0.6685, + 0.6965, + 0.6905, + 0.7015, + 0.7225, + 0.7035, + 0.713, + 0.7285, + 0.7095, + 0.727, + 0.717, + 0.7325, + 0.7405, + 0.742, + 0.7285, + 0.733, + 0.733, + 0.741, + 0.745, + 0.7425, + 0.741, + 0.7395, + 0.739, + 0.748, + 0.7505, + 0.743, + 0.7455, + 0.7465, + 0.7455, + 0.749, + 0.751, + 0.748, + 0.755, + 0.7485, + 0.7515, + 0.749, + 0.7505, + 0.7505 + ], + "state_pred_error": [ + 0.6772782639980316, + 0.19106789288520812, + 0.13515139267444612, + 0.13850510149002077, + 0.15888860702514648, + 0.1779759260416031, + 0.18962191469669343, + 0.19099906651973725, + 0.19079499611854553, + 0.1884487063884735, + 0.16957074830532073, + 0.1468679202079773, + 0.13275577713251113, + 0.12061098921298981, + 0.11245400367975235, + 0.1107190781712532, + 0.10698225569725037, + 0.10462268464565277, + 0.10515006263256073, + 0.1079078679561615, + 0.10459889571666718, + 0.09621057146787644, + 0.09101127699613572, + 0.0875964389204979, + 0.08520031116008758, + 0.07949715087413788, + 0.07065141149759292, + 0.059809070467948915, + 0.05204611879587173, + 0.04686824198961258, + 0.04378255767822266, + 0.04081880375742912, + 0.03798793787956238, + 0.0367397832930088, + 0.03546322963833809, + 0.03455261668562889, + 0.0339633260011673, + 0.033648267769813535, + 0.032997100949287414, + 0.03264095353484154, + 0.03156215361058712, + 0.03050885224044323, + 0.029427878975868224, + 0.028430858767032625, + 0.027126849246025084, + 0.025839528360962868, + 0.024351652067899705, + 0.022825814968347548, + 0.021286853644251823, + 0.019926348620653154, + 0.018836932730674744, + 0.017829388728737832, + 0.017018498905003072, + 0.01635422433912754, + 0.015619463436305523, + 0.015121812850236893, + 0.014551292099058628, + 0.014125415742397309, + 0.01379347063228488, + 0.013232204216718673, + 0.012918133257329463, + 0.012570921210944653, + 0.012321776081621647, + 0.011932332634925841, + 0.012032916615903378, + 0.011654329168796539, + 0.01127493067085743, + 0.010999307538568974, + 0.010814604671299457, + 0.010433502918481826, + 0.010403014844655991, + 0.010025098942220211, + 0.009788281431794166, + 0.009658125045895577, + 0.009502492478489876, + 0.00937487707734108, + 0.009174802857637405, + 0.00912027053758502, + 0.008794732482731342, + 0.008746991481631994 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8145060539245605, + 0.39495280385017395, + 0.15602949261665344, + 0.14954066276550293, + 0.1189848780632019, + 0.14297258853912354, + 0.11834269762039185, + 0.11334948241710663 + ], + "perturbation_rho": [ + 0.7131592035293579, + 0.31938445568084717, + 0.13574811816215515, + 0.13510501384735107, + 0.12680554389953613, + 0.13444143533706665, + 0.1260460913181305, + 0.09450235962867737 + ], + "nudging": { + "0.001": [ + -0.02241743914783001, + -0.0012560778995975852, + -0.00039777648635208607, + -0.00037799825076945126, + -0.0003125373332295567, + -0.00036414398346096277, + -0.00031964073423296213, + -0.00029873993480578065 + ], + "0.003": [ + -0.06559374928474426, + -0.0037621967494487762, + -0.001192728290334344, + -0.0011324514634907246, + -0.0009376248344779015, + -0.0010918397456407547, + -0.000958584132604301, + -0.0008956205565482378 + ], + "0.01": [ + -0.20040717720985413, + -0.012472910806536674, + -0.003969438374042511, + -0.003768536727875471, + -0.0031205681152641773, + -0.00363306887447834, + -0.0031901695765554905, + -0.002980557270348072 + ] + }, + "state_pred_error_per_layer": [ + 7208.7744140625, + 4043.077392578125, + 2431.6259765625, + 2036.907958984375, + 1977.547119140625, + 1708.2327880859375, + 1901.497314453125, + 1821.6331787109375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.169899132156372, + 1.197789729309082, + 0.7590794116973877, + 0.6422608478546142, + 0.584924817276001, + 0.5648346998214722, + 0.5388649930000305, + 0.5851700714111329, + 0.5517988770008088, + 0.525461665058136, + 0.5722274063110352, + 0.5967739044189453, + 0.599816835308075, + 0.6654899589538574, + 0.524122939491272, + 0.5636429683685302, + 0.7308413411140442, + 0.653116132569313, + 0.7010653434753418, + 0.7020271137237549, + 0.6951467881679535, + 0.7047059141159058, + 0.735547448348999, + 0.9342722967147827, + 0.8680836700439453, + 0.9131568016052246, + 0.9096203659534454, + 1.0347100614547728, + 0.9645821760177612, + 0.9702437899589539, + 0.9094774784564972, + 0.9601590196609497, + 1.0798742359161377, + 1.092118327331543, + 1.032936611366272, + 1.1091057176589967, + 1.0215610338211059, + 0.9568075794219971, + 1.0716010482788085, + 1.0599199287414551, + 1.2421540455818176, + 1.2023227766036988, + 1.1708740584373474, + 1.1385227828979492, + 1.1439118378639221, + 1.0960134803771973, + 1.1730884643554687, + 1.102697074317932, + 1.1464144012451172, + 1.0509382783889771, + 1.0821549007415772, + 1.164067378616333, + 1.0707063930511476, + 1.1033225898742676, + 1.1311242740631104, + 1.1095260940551759, + 1.103656944656372, + 1.093299767112732, + 1.1076723503112793, + 1.1251354174613952, + 1.1135358158111572, + 1.1405975442886354, + 1.1332505071640016, + 1.1395424041748048, + 1.1576629329681396, + 1.1703690267562865, + 1.1598464979171752, + 1.1532865390777587, + 1.1590178819656372, + 1.1575250087738038, + 1.1601745920181274, + 1.1568465393066407, + 1.1543491954803466, + 1.154213610458374, + 1.1500441106796264, + 1.1494695510864257, + 1.1487898721694947, + 1.1466926807403564, + 1.1453759771347045, + 1.144642575263977 + ], + "train_acc": [ + 0.214, + 0.572, + 0.7171, + 0.762, + 0.7828, + 0.7896, + 0.7977, + 0.7902, + 0.8043, + 0.8146, + 0.8075, + 0.8023, + 0.8098, + 0.7934, + 0.8285, + 0.8211, + 0.7869, + 0.8048, + 0.7953, + 0.7903, + 0.791, + 0.7912, + 0.7783, + 0.7442, + 0.7565, + 0.7494, + 0.7425, + 0.7158, + 0.7176, + 0.7073, + 0.709, + 0.6874, + 0.6568, + 0.6523, + 0.6548, + 0.631, + 0.6549, + 0.6643, + 0.6365, + 0.636, + 0.6048, + 0.611, + 0.6129, + 0.6199, + 0.6083, + 0.6216, + 0.6033, + 0.6136, + 0.607, + 0.6242, + 0.6212, + 0.5947, + 0.6192, + 0.6108, + 0.6008, + 0.6101, + 0.6167, + 0.6127, + 0.6161, + 0.6081, + 0.6131, + 0.6068, + 0.6051, + 0.6046, + 0.5949, + 0.597, + 0.5965, + 0.5993, + 0.5982, + 0.5988, + 0.5983, + 0.601, + 0.599, + 0.6012, + 0.5997, + 0.5996, + 0.6003, + 0.6001, + 0.6019, + 0.6011 + ], + "test_acc": [ + 0.4045, + 0.6525, + 0.71, + 0.7445, + 0.741, + 0.75, + 0.757, + 0.7435, + 0.7555, + 0.765, + 0.7525, + 0.7735, + 0.7285, + 0.772, + 0.7585, + 0.7385, + 0.719, + 0.734, + 0.76, + 0.7505, + 0.745, + 0.7105, + 0.711, + 0.717, + 0.708, + 0.694, + 0.6665, + 0.692, + 0.633, + 0.587, + 0.621, + 0.5625, + 0.586, + 0.536, + 0.4865, + 0.5185, + 0.5765, + 0.5355, + 0.6045, + 0.5395, + 0.514, + 0.476, + 0.553, + 0.528, + 0.5495, + 0.507, + 0.5325, + 0.479, + 0.547, + 0.558, + 0.4865, + 0.579, + 0.5495, + 0.492, + 0.536, + 0.5855, + 0.563, + 0.572, + 0.5725, + 0.562, + 0.5645, + 0.5625, + 0.559, + 0.54, + 0.551, + 0.5415, + 0.559, + 0.563, + 0.5585, + 0.5535, + 0.559, + 0.55, + 0.556, + 0.564, + 0.553, + 0.559, + 0.5535, + 0.5525, + 0.555, + 0.555 + ], + "value_loss": [ + 2.7866874431610107, + 0.9174076202392578, + 0.8914946027755737, + 0.9023974754333496, + 0.8192308839321136, + 0.7574673677444458, + 0.7969445713043213, + 0.9423759811401368, + 0.9109364691734314, + 0.808044982624054, + 0.9660812770843505, + 1.1082358276367188, + 1.1196660041809081, + 1.2880344915866853, + 0.9416150609016418, + 1.0244576909065246, + 1.7019867615699769, + 1.3895921471595765, + 1.5365349853515624, + 1.5349470893859862, + 1.5058123647689818, + 1.4833002822875976, + 1.5964698181152344, + 2.332591817855835, + 2.1592319396972655, + 2.3775140846252443, + 2.055455123615265, + 2.358651049351692, + 1.9399827407836914, + 1.801168231010437, + 1.4624209257125855, + 1.3816904611587524, + 2.3037928730010986, + 1.6289699904441834, + 1.1638665494918823, + 1.3711586618423461, + 1.3940555594444275, + 0.8574702676773072, + 0.915366801071167, + 0.8432927488327027, + 2.127538126420975, + 1.3269745040893555, + 1.3527723755836487, + 1.1931525053024292, + 1.2245771019935607, + 1.1547237043857574, + 0.9767586273193359, + 1.0432306060791015, + 0.8256955463409423, + 0.6316090171813965, + 0.6487793773651123, + 0.739714870929718, + 0.5902126419067383, + 0.6460893482208252, + 0.672758955001831, + 0.6674723028182984, + 0.6114201810836792, + 0.5738068954467773, + 0.6004385272026062, + 0.5945483853816986, + 0.5871271083831787, + 0.627871448135376, + 0.6086034240722656, + 0.5733864782333374, + 0.5696756621360779, + 0.6026423274040222, + 0.6132345210075378, + 0.5927936091423035, + 0.5670827034950257, + 0.564662850189209, + 0.5607326948165894, + 0.5638655605316162, + 0.5459429302215576, + 0.5456877880096436, + 0.5736805513381958, + 0.5470059418201446, + 0.5224333214044571, + 0.5464944786071777, + 0.5188668343544006, + 0.5412774887084961 + ], + "term_loss": [ + 1.63910704536438, + 0.6317383563995361, + 0.7112859618186951, + 0.7408633338928222, + 0.6577937492370606, + 0.5729757232189179, + 0.6305919244766235, + 0.7700344627380371, + 0.7500860171318054, + 0.6568901985168457, + 0.8059835026741028, + 0.9458411903381347, + 0.954459958934784, + 1.1104201313018798, + 0.7928285349845886, + 0.8695057340621948, + 1.5071396081924437, + 1.21288857524395, + 1.3495808773040772, + 1.3286071298122406, + 1.2826879957199098, + 1.2582777523040771, + 1.3444410652160645, + 1.9734292907714843, + 1.788304136276245, + 2.006763204574585, + 1.687252942943573, + 2.00210447653532, + 1.596301502227783, + 1.428968256187439, + 1.14496179561615, + 1.0461816717147827, + 1.8839465621948241, + 1.194931499004364, + 0.8141011932373047, + 0.9930688802719116, + 1.0058540163993837, + 0.5390169447898865, + 0.5843337638854981, + 0.5027120730400085, + 1.6004343148708344, + 0.8963684169769287, + 0.893130143404007, + 0.764038823890686, + 0.7726210286140441, + 0.7405953636407853, + 0.5840272753715515, + 0.6448911304473877, + 0.4747549978256226, + 0.3141033357620239, + 0.33270398921966554, + 0.4020488702058792, + 0.2790641488313675, + 0.3292891996383667, + 0.3515699282169342, + 0.34689451780319214, + 0.3006282347202301, + 0.27147112836837767, + 0.29616545426845553, + 0.28420736417770387, + 0.2826799100875855, + 0.3165199294090271, + 0.2988843548297882, + 0.2680483558177948, + 0.261594016623497, + 0.29058788201808927, + 0.29542932945489886, + 0.2805451308965683, + 0.2601419636726379, + 0.2575787572383881, + 0.25340069789886477, + 0.2539660128593445, + 0.23847104530334473, + 0.2382884523868561, + 0.2596001932859421, + 0.23661555552482605, + 0.2207985038548708, + 0.23649365541934966, + 0.21443204939365387, + 0.23150972747802734 + ], + "bridge_loss": [ + 0.851698666994652, + 0.05855167130827904, + 0.006215408114343882, + 0.0038532218255102634, + 0.011163550445437431, + 0.037724834394454954, + 0.02354336112141609, + 0.020078385154902935, + 0.01455264826565981, + 0.012083962416648865, + 0.012597031140327454, + 0.011899129335582256, + 0.01517092033624649, + 0.016714082181453704, + 0.01529124939441681, + 0.01617379978299141, + 0.02265110963135958, + 0.02179773365855217, + 0.025880517882108687, + 0.044521565622091294, + 0.05782247805893421, + 0.05953346390724182, + 0.07923136401176453, + 0.15373265982866288, + 0.17564270244836808, + 0.1691748236656189, + 0.1638057589173317, + 0.13287635965049266, + 0.12563166702985765, + 0.14815512808561326, + 0.09730534753799439, + 0.10153535420894623, + 0.16397418546676637, + 0.16828366361260413, + 0.09841816610097885, + 0.11215688467025757, + 0.13492409853935242, + 0.0738004425406456, + 0.0662885293841362, + 0.07449169340133667, + 0.24015194996595382, + 0.1427286093711853, + 0.1754998088359833, + 0.1464556162595749, + 0.16590757843255996, + 0.13885814949274064, + 0.10230485528707504, + 0.11841529335975647, + 0.0632941883802414, + 0.04624536537528038, + 0.04330551617741585, + 0.04858552278876305, + 0.0362572277367115, + 0.03532285144329071, + 0.03417909780740738, + 0.0386603756070137, + 0.03108417900800705, + 0.025329264031350614, + 0.0265734569311142, + 0.02687511657476425, + 0.023663357776403427, + 0.027196960085630415, + 0.02578365526199341, + 0.021047952508926392, + 0.021056697730720043, + 0.022916216899454594, + 0.02991764326095581, + 0.026238187783956528, + 0.019742111763358116, + 0.02061487686634064, + 0.019812159460783005, + 0.023762189900875093, + 0.021338633975386618, + 0.021927258050441743, + 0.029114572647213937, + 0.024936546593904495, + 0.01797967905253172, + 0.025368353989720344, + 0.020480678632855416, + 0.02621319934129715 + ], + "tgrad_loss": [ + 0.295881768321991, + 0.22711758861541748, + 0.17399323415756227, + 0.15768092048168184, + 0.15027358498573304, + 0.14676680796146394, + 0.1428092940092087, + 0.15226313366889954, + 0.14629780707359313, + 0.13907082080841066, + 0.14750074167251587, + 0.15049550247192384, + 0.15003512766361238, + 0.16090027875900267, + 0.1334952704668045, + 0.13877815887928008, + 0.17219604279994966, + 0.1549058295071125, + 0.161073606300354, + 0.16181839514374732, + 0.16530189299583434, + 0.16548906588554382, + 0.17279738521575927, + 0.2054298910856247, + 0.19528509845733644, + 0.2015760479450226, + 0.20439642648696899, + 0.22367020057439804, + 0.21804955558776856, + 0.22404484484195708, + 0.220153786444664, + 0.23397343626022338, + 0.2558721103668213, + 0.2657548138618469, + 0.25134719014167783, + 0.26593290541172027, + 0.25327744019031523, + 0.2446528902053833, + 0.2647445123195648, + 0.26608898282051086, + 0.2869518846511841, + 0.28787748503684996, + 0.2841424269676209, + 0.28265806045532227, + 0.28604849166870117, + 0.275270179605484, + 0.2904265064239502, + 0.2799241715431213, + 0.2876463684082031, + 0.27126030888557434, + 0.2727698717355728, + 0.2890804699420929, + 0.2748912615776062, + 0.2814773001670837, + 0.2870099315643311, + 0.2819174147605896, + 0.27970777044296263, + 0.277006508564949, + 0.27769961276054383, + 0.28346590518951414, + 0.2807838364601135, + 0.28415455718040467, + 0.28393541340827944, + 0.28429017095565795, + 0.287024947977066, + 0.2891382306098938, + 0.2878875425100327, + 0.2860102851390839, + 0.2871986273288727, + 0.28646921577453616, + 0.2875198390007019, + 0.2861373591423035, + 0.28613325204849244, + 0.2854720791339874, + 0.2849657874107361, + 0.28545383520126344, + 0.2836551445007324, + 0.2846324709892273, + 0.28395411243438723, + 0.28355456256866457 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03383665531873703, + 0.10378465056419373, + 0.1522345095872879, + 0.12050338089466095, + 0.12787620723247528, + 0.13963481783866882, + 0.14998120069503784, + 0.1584387719631195 + ], + "perturbation_rho": [ + 0.02018044888973236, + 0.14589767158031464, + 0.20607107877731323, + 0.18045580387115479, + 0.1894514560699463, + 0.16447019577026367, + 0.1924649477005005, + 0.2218032032251358 + ], + "nudging": { + "0.001": [ + -0.0010144492844119668, + -0.0008512640488334, + -0.0010741300648078322, + -0.0009214384481310844, + -0.0009110164828598499, + -0.0009800404077395797, + -0.0010496200993657112, + -0.0010793276596814394 + ], + "0.003": [ + -0.003022595774382353, + -0.0025523165240883827, + -0.003220552345737815, + -0.002765212208032608, + -0.002732472261413932, + -0.0029396198224276304, + -0.0031477869488298893, + -0.003236861899495125 + ], + "0.01": [ + -0.00981426052749157, + -0.00849075522273779, + -0.010712197050452232, + -0.009203735738992691, + -0.009092864580452442, + -0.00978156179189682, + -0.010470103472471237, + -0.010766083374619484 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L12_s123.json b/results/synth_ladder_v2_hi/synth_a1.0_L12_s123.json new file mode 100644 index 0000000..e1e1009 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L12_s123.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.238738206100464, + 0.6613351190567016, + 0.5395772783279419, + 0.4733346885681152, + 0.4231542590379715, + 0.3620361569643021, + 0.3230682401239872, + 0.2523321887969971, + 0.3470890686511993, + 0.25146674609184266, + 0.24440096678733825, + 0.1842203591823578, + 0.24344354785680772, + 0.11816815827786922, + 0.06866284420490265, + 0.08833205785751343, + 0.09207577448785305, + 0.0486494089782238, + 0.046294594306498765, + 0.027046850475668908, + 0.015711779367923735, + 0.012188610082678497, + 0.007740385116636753, + 0.00582380747757852, + 0.0050085094667971135, + 0.00443948317989707, + 0.004161420274153352, + 0.003766811668127775, + 0.0034422829911112786, + 0.0034336333803832533, + 0.0030249461911618708, + 0.002912200229614973, + 0.0027408694557845593, + 0.0024907449718564747, + 0.0023011812917888164, + 0.0021857335910201075, + 0.002056089808046818, + 0.0019683007838204505, + 0.0018585119150578975, + 0.001773246581107378, + 0.001690511012636125, + 0.0016192044278606772, + 0.0015656297475099563, + 0.0015094914896413684, + 0.001456394356675446, + 0.001409525142610073, + 0.001370351544767618, + 0.0013320897528901695, + 0.0012892388922162354, + 0.0012502161199226976, + 0.0012188509058207273, + 0.0011895375870168208, + 0.001164797018840909, + 0.0011384376548230649, + 0.001114835398364812, + 0.0010922997965477407, + 0.0010709371257573367, + 0.0010527558989822865, + 0.0010423784567043185, + 0.0010238841459155083, + 0.001007764333859086, + 0.00099469233751297, + 0.000982387449592352, + 0.0009712855339050292, + 0.000962210407666862, + 0.0009533346139825881, + 0.0009455815449357032, + 0.0009392593406140805, + 0.0009328387510031461, + 0.000927877208031714, + 0.0009235073435120285, + 0.0009196365909650922, + 0.000916477270424366, + 0.0009136286557652056, + 0.0009118279222398996, + 0.0009102091716602444, + 0.0009090610071085393, + 0.0009083506962284446, + 0.0009078968527726829, + 0.0009076604296453298 + ], + "train_acc": [ + 0.5545, + 0.7429, + 0.7953, + 0.8162, + 0.8395, + 0.8666, + 0.8809, + 0.9067, + 0.8711, + 0.9101, + 0.9094, + 0.938, + 0.911, + 0.9619, + 0.9852, + 0.974, + 0.9711, + 0.9893, + 0.9889, + 0.9964, + 0.9996, + 0.9994, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.711, + 0.7345, + 0.743, + 0.7465, + 0.749, + 0.7505, + 0.7575, + 0.759, + 0.7535, + 0.7525, + 0.748, + 0.751, + 0.7425, + 0.766, + 0.7635, + 0.7515, + 0.7645, + 0.7585, + 0.771, + 0.7665, + 0.765, + 0.7635, + 0.7695, + 0.767, + 0.77, + 0.7695, + 0.7695, + 0.77, + 0.7695, + 0.7655, + 0.766, + 0.7665, + 0.7655, + 0.7645, + 0.766, + 0.7665, + 0.7655, + 0.765, + 0.766, + 0.766, + 0.7665, + 0.7655, + 0.765, + 0.766, + 0.7655, + 0.7655, + 0.7645, + 0.764, + 0.765, + 0.766, + 0.767, + 0.765, + 0.7645, + 0.764, + 0.7635, + 0.7635, + 0.7635, + 0.7645, + 0.763, + 0.763, + 0.7635, + 0.7645, + 0.7625, + 0.764, + 0.7625, + 0.763, + 0.763, + 0.7625, + 0.761, + 0.7625, + 0.762, + 0.762, + 0.7615, + 0.7615, + 0.7615, + 0.7615, + 0.7615, + 0.7615, + 0.7615, + 0.7615 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.86488276720047, + 0.8622424006462097, + 0.8600971698760986, + 0.85722416639328, + 0.8523166179656982, + 0.8457985520362854, + 0.8359642028808594, + 0.828606367111206, + 0.8221874237060547, + 0.8125513792037964, + 0.80171799659729, + 0.7934804558753967 + ], + "perturbation_rho": [ + 0.9999992251396179, + 0.9999991655349731, + 0.9999990463256836, + 0.9999980330467224, + 0.9999971389770508, + 0.9999936819076538, + 0.9999881386756897, + 0.9999800324440002, + 0.9999632835388184, + 0.999937891960144, + 0.9999018311500549, + 0.9998522996902466 + ], + "nudging": { + "0.001": [ + -0.05972275882959366, + -0.04901757463812828, + -0.039307620376348495, + -0.03037886694073677, + -0.02256305143237114, + -0.016410548239946365, + -0.01194553542882204, + -0.008773503825068474, + -0.006583607289940119, + -0.0050867884419858456, + -0.004056186880916357, + -0.0033473381772637367 + ], + "0.003": [ + -0.1681329607963562, + -0.13970935344696045, + -0.11326389014720917, + -0.08840985596179962, + -0.06622078269720078, + -0.04846895486116409, + -0.03543655201792717, + -0.026105739176273346, + -0.01962977647781372, + -0.015187501907348633, + -0.012121773324906826, + -0.010009994730353355 + ], + "0.01": [ + -0.4491935074329376, + -0.38857996463775635, + -0.3270212411880493, + -0.26439201831817627, + -0.20410630106925964, + -0.15283547341823578, + -0.11351937055587769, + -0.08454076200723648, + -0.06403174996376038, + -0.04978282377123833, + -0.03986590355634689, + -0.032995663583278656 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.202339591217041, + 1.3197662359237672, + 0.9467211002349853, + 0.8428364715576172, + 0.7896131301879883, + 0.7633397129058838, + 0.7488100243568421, + 0.740450912284851, + 0.7766979461669922, + 0.785177182006836, + 0.8205275463104248, + 0.8195417936325073, + 0.8523592538833619, + 0.8628508913516998, + 0.8150059830665588, + 0.8488281514167786, + 0.8909374650001526, + 0.9010982797622681, + 0.8784109934806824, + 0.9215612866401672, + 0.9492555601119995, + 0.9399690055847167, + 0.9057739995956421, + 0.9514210477828979, + 0.9790562412261963, + 1.0058076820373536, + 1.074447036266327, + 0.9894476831436158, + 1.0674426013946534, + 0.9942384609222412, + 1.0341941476821899, + 0.9958202060699463, + 1.031863384246826, + 1.0247520631790161, + 1.0434253861427307, + 1.0245234265327454, + 1.032747696876526, + 1.0287066256523132, + 1.0981156536102294, + 1.0315956830978394, + 1.007985222530365, + 1.0512058019638062, + 1.109238450717926, + 1.0539381145238875, + 1.0085170584678649, + 0.9916242378234863, + 0.9867569475173951, + 1.0172756858825684, + 1.0578618814468383, + 0.986051445388794, + 1.0299558208465576, + 1.0038312606811524, + 0.9938522087097168, + 1.019758701324463, + 1.005025187397003, + 0.9923043254852295, + 0.9744973911285401, + 1.0040310264587402, + 0.9865996182441712, + 0.9762414364814759, + 0.9743295421600342, + 0.9790146026611328, + 0.9765340627670288, + 0.9596751022338867, + 0.9693172966003418, + 0.9597562124252319, + 0.9473907022476197, + 0.9487135580062867, + 0.9539228395462036, + 0.9419368682861328, + 0.9428634670257569, + 0.9420891220092773, + 0.9357248798370361, + 0.931165361404419, + 0.9303673110961914, + 0.9292953009605408, + 0.927647031211853, + 0.9273946614265441, + 0.9265368665695191, + 0.9260309785842895 + ], + "train_acc": [ + 0.1979, + 0.5343, + 0.6507, + 0.6875, + 0.7091, + 0.7175, + 0.7241, + 0.7294, + 0.7197, + 0.7169, + 0.7153, + 0.7131, + 0.7078, + 0.7083, + 0.7195, + 0.7154, + 0.7076, + 0.7037, + 0.7105, + 0.704, + 0.7021, + 0.7031, + 0.7096, + 0.6981, + 0.6947, + 0.6952, + 0.6824, + 0.6966, + 0.6853, + 0.6956, + 0.6917, + 0.6964, + 0.6918, + 0.6949, + 0.6958, + 0.6963, + 0.6897, + 0.6914, + 0.6832, + 0.6913, + 0.6921, + 0.6858, + 0.6735, + 0.6891, + 0.6964, + 0.6999, + 0.6977, + 0.6923, + 0.6861, + 0.6982, + 0.6883, + 0.6948, + 0.6937, + 0.6934, + 0.6957, + 0.6988, + 0.7001, + 0.6931, + 0.6994, + 0.6959, + 0.7026, + 0.7006, + 0.7007, + 0.7069, + 0.7045, + 0.7053, + 0.709, + 0.707, + 0.7033, + 0.7088, + 0.7057, + 0.7079, + 0.7123, + 0.7097, + 0.7125, + 0.7096, + 0.7121, + 0.712, + 0.7117, + 0.7117 + ], + "test_acc": [ + 0.395, + 0.5915, + 0.6425, + 0.661, + 0.6655, + 0.6825, + 0.679, + 0.6585, + 0.6505, + 0.6645, + 0.636, + 0.609, + 0.6505, + 0.664, + 0.6555, + 0.6495, + 0.666, + 0.655, + 0.641, + 0.638, + 0.634, + 0.6485, + 0.6025, + 0.63, + 0.6215, + 0.6465, + 0.63, + 0.588, + 0.623, + 0.617, + 0.6415, + 0.6425, + 0.624, + 0.6285, + 0.628, + 0.614, + 0.6305, + 0.5995, + 0.639, + 0.6465, + 0.6095, + 0.5865, + 0.622, + 0.643, + 0.6265, + 0.6425, + 0.638, + 0.6065, + 0.6305, + 0.644, + 0.6095, + 0.6435, + 0.632, + 0.6315, + 0.6345, + 0.641, + 0.64, + 0.6495, + 0.6425, + 0.64, + 0.6325, + 0.6365, + 0.6495, + 0.6335, + 0.6435, + 0.651, + 0.646, + 0.6435, + 0.638, + 0.6445, + 0.6415, + 0.647, + 0.6485, + 0.6455, + 0.6465, + 0.6485, + 0.649, + 0.6465, + 0.648, + 0.6485 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.003139778506010771, + 0.07545783370733261, + 0.07123857736587524, + 0.04737270250916481, + 0.07089244574308395, + 0.05843178555369377, + 0.10959646850824356, + 0.04730183631181717, + 0.05721074715256691, + 0.06935717165470123, + 0.04019004851579666, + 0.04955831170082092 + ], + "perturbation_rho": [ + -0.020620837807655334, + 0.0424807034432888, + 0.07906489074230194, + -0.014874707907438278, + 0.06078936904668808, + 0.006801994517445564, + 0.11016394942998886, + 0.07577681541442871, + 0.01940302737057209, + 0.0600065141916275, + 0.020656054839491844, + 0.04902234673500061 + ], + "nudging": { + "0.001": [ + 2.8067472157999873e-05, + -0.00044735506526194513, + -0.00028866907814517617, + -0.0001569169689901173, + -0.0002910669718403369, + -0.00020299921743571758, + -0.00038177313399501145, + -0.0001458294573239982, + -0.00017777856555767357, + -0.00023665392654947937, + -0.000140793330501765, + -0.00016380546730943024 + ], + "0.003": [ + 7.542525418102741e-05, + -0.0013394037960097194, + -0.0008648735238239169, + -0.00046930869575589895, + -0.0008721597259864211, + -0.0006091208197176456, + -0.001144462265074253, + -0.00043658187496475875, + -0.0005302035133354366, + -0.0007079149945639074, + -0.00042207835940644145, + -0.000491109793074429 + ], + "0.01": [ + 0.00014946935698390007, + -0.004455030895769596, + -0.0028790468350052834, + -0.0015581330517306924, + -0.0028997263871133327, + -0.0020245155319571495, + -0.003806713502854109, + -0.0014502943959087133, + -0.0017623959574848413, + -0.002352846320718527, + -0.001400630921125412, + -0.001629082253202796 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.749035419845581, + 1.0243288425445556, + 0.8783701831817627, + 0.909792195892334, + 0.9442022832870484, + 0.9765333101272583, + 1.0286593907356263, + 1.0600357536315919, + 1.0744477998733521, + 1.0949515160560608, + 1.107298709487915, + 1.105529815006256, + 1.1191591522216797, + 1.1270570775032043, + 1.1219041606903075, + 1.1523450615882873, + 1.1470273632049561, + 1.1214436004638673, + 1.113154112625122, + 1.1083291893005371, + 1.1125688663482667, + 1.0901233867645264, + 1.1175277576446534, + 1.1061762510299682, + 1.098485195541382, + 1.073400117111206, + 1.0892397708892823, + 1.0714881011962891, + 1.0761865495681762, + 1.0466925691604614, + 1.0452186401367187, + 1.0483840522766112, + 1.0655384910583496, + 1.0514549810409546, + 1.0704036350250243, + 1.039493140411377, + 1.0796428539276124, + 1.0604299968719482, + 1.069408202934265, + 1.069653288078308, + 1.061051636505127, + 1.0919126817703246, + 1.0595819647789002, + 1.044873174381256, + 1.0483424802780152, + 1.0358262340545654, + 1.0114229215621948, + 1.0345991500854492, + 1.0097949793815613, + 1.0033580027580262, + 1.0089688102722167, + 1.0225816150665283, + 1.0164037592887878, + 1.0124317664146423, + 1.0002467834472657, + 0.9989970367431641, + 1.0164838801383973, + 1.004414942932129, + 1.004607903289795, + 1.0115055170059204, + 1.0030508796691895, + 1.0010437889099122, + 0.9871210842132568, + 0.9881696207046509, + 0.9858065430641174, + 0.9832741060256958, + 0.9794693752288819, + 0.9825818849563599, + 0.9798864183425904, + 0.9814815460205079, + 0.9754757759094238, + 0.9757995666503906, + 0.9724037355422973, + 0.9745183243751526, + 0.9712728879928589, + 0.9709235038757325, + 0.9703462394714355, + 0.96921721534729, + 0.9688208660125732, + 0.9686514762878418 + ], + "train_acc": [ + 0.3634, + 0.6211, + 0.6854, + 0.6813, + 0.6738, + 0.6665, + 0.6452, + 0.6313, + 0.6285, + 0.6158, + 0.6087, + 0.6099, + 0.6038, + 0.5951, + 0.5951, + 0.5841, + 0.5923, + 0.6045, + 0.6012, + 0.6087, + 0.6088, + 0.6154, + 0.6041, + 0.6088, + 0.612, + 0.613, + 0.6176, + 0.6184, + 0.6114, + 0.6244, + 0.6234, + 0.623, + 0.6199, + 0.6204, + 0.6242, + 0.6274, + 0.6168, + 0.6209, + 0.6184, + 0.6194, + 0.6226, + 0.6174, + 0.6234, + 0.6247, + 0.6284, + 0.6284, + 0.6376, + 0.6326, + 0.6348, + 0.6392, + 0.6387, + 0.6324, + 0.6374, + 0.641, + 0.6435, + 0.6435, + 0.6384, + 0.6422, + 0.641, + 0.6427, + 0.6412, + 0.6426, + 0.6497, + 0.6502, + 0.6483, + 0.651, + 0.651, + 0.6484, + 0.6489, + 0.6511, + 0.6543, + 0.6493, + 0.6513, + 0.651, + 0.6536, + 0.6539, + 0.6524, + 0.652, + 0.6524, + 0.6533 + ], + "test_acc": [ + 0.529, + 0.647, + 0.6585, + 0.6455, + 0.64, + 0.6245, + 0.6135, + 0.6005, + 0.5845, + 0.5955, + 0.596, + 0.591, + 0.5615, + 0.551, + 0.537, + 0.549, + 0.56, + 0.553, + 0.554, + 0.5685, + 0.582, + 0.5715, + 0.5755, + 0.5575, + 0.584, + 0.5715, + 0.572, + 0.582, + 0.6025, + 0.5755, + 0.5965, + 0.592, + 0.5875, + 0.57, + 0.596, + 0.5795, + 0.582, + 0.558, + 0.5735, + 0.5855, + 0.5895, + 0.5995, + 0.5965, + 0.576, + 0.59, + 0.58, + 0.58, + 0.588, + 0.6025, + 0.587, + 0.604, + 0.5895, + 0.602, + 0.605, + 0.5935, + 0.6085, + 0.6035, + 0.609, + 0.605, + 0.596, + 0.5905, + 0.5965, + 0.6055, + 0.6015, + 0.5995, + 0.5985, + 0.593, + 0.6025, + 0.6085, + 0.6065, + 0.5995, + 0.604, + 0.6025, + 0.6035, + 0.602, + 0.605, + 0.6055, + 0.6075, + 0.6055, + 0.6055 + ], + "state_pred_error": [ + 0.6761728614807129, + 0.21007038679122925, + 0.15122513897418977, + 0.15703817780017854, + 0.16187702651023864, + 0.16339434959888458, + 0.16375452308654787, + 0.1625989185333252, + 0.18113663201332092, + 0.18272390701770783, + 0.1627283350467682, + 0.14700518136024476, + 0.13181535266637803, + 0.12005224347114563, + 0.11299885964393616, + 0.1068722818851471, + 0.10560559153556824, + 0.10757571039199829, + 0.10467144322395325, + 0.1023048233985901, + 0.09685005626678467, + 0.08491257979869843, + 0.07876403373479843, + 0.08301222360134125, + 0.08308529872894287, + 0.07449215137958527, + 0.06773201476931572, + 0.056569082129001615, + 0.04849699649810791, + 0.049368930143117905, + 0.04768026757240296, + 0.047298075234889984, + 0.04672931938171387, + 0.0405069172680378, + 0.03569790207147598, + 0.03157345391511917, + 0.027607627579569815, + 0.02504954431951046, + 0.02399016918540001, + 0.023421166968345643, + 0.023441646620631217, + 0.023209517675638197, + 0.02208724093735218, + 0.02086319588124752, + 0.01903458271920681, + 0.017419935330748558, + 0.016029068379104137, + 0.01474376180768013, + 0.014213219347596168, + 0.013581229855120181, + 0.01300986272096634, + 0.012749762377142907, + 0.012476563104987145, + 0.012336783754825591, + 0.012144882160425186, + 0.011600321805477142, + 0.011149377970397473, + 0.01074126893132925, + 0.01038957173228264, + 0.010054622607678174, + 0.009704671692848206, + 0.009379986931383609, + 0.00918807327747345, + 0.009165769296884537, + 0.008629796648025512, + 0.008511535508930683, + 0.008247988541424275, + 0.008038113085925579, + 0.007830396504700184, + 0.007626112474501133, + 0.007495704552531243, + 0.007370948339998722, + 0.007175249060243368, + 0.007102033820748329, + 0.006948738685995341, + 0.006806399586051702, + 0.006733712537586689, + 0.0066317357584834095, + 0.006558584788441658, + 0.006476805159449577 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.5538393259048462, + 0.4287089705467224, + 0.25277969241142273, + 0.2402075231075287, + 0.180599182844162, + 0.15653815865516663, + 0.1736883521080017, + 0.18825414776802063, + 0.1335570216178894, + 0.13271775841712952, + 0.15632027387619019, + 0.17869922518730164 + ], + "perturbation_rho": [ + 0.4586557149887085, + 0.4002187252044678, + 0.23149724304676056, + 0.21227607131004333, + 0.1842716634273529, + 0.16792945563793182, + 0.21390791237354279, + 0.19318881630897522, + 0.08300350606441498, + 0.10752588510513306, + 0.12254554033279419, + 0.14822974801063538 + ], + "nudging": { + "0.001": [ + -0.017140686511993408, + -0.0020858882926404476, + -0.000841023400425911, + -0.0007581148529425263, + -0.0005702057387679815, + -0.0004698220291174948, + -0.0005242021288722754, + -0.0005487058660946786, + -0.0003889029612764716, + -0.00041283376049250364, + -0.00047568423906341195, + -0.0005249952664598823 + ], + "0.003": [ + -0.05075468868017197, + -0.006247954908758402, + -0.0025209763552993536, + -0.002272759098559618, + -0.0017102723941206932, + -0.0014094945508986712, + -0.0015723016113042831, + -0.0016451808623969555, + -0.0011662597535178065, + -0.001238692319020629, + -0.0014261179603636265, + -0.0015746946446597576 + ], + "0.01": [ + -0.16128812730312347, + -0.02071414887905121, + -0.008381091989576817, + -0.007560182362794876, + -0.005691731348633766, + -0.0046913521364331245, + -0.005232630763202906, + -0.0054755983874201775, + -0.0038832086138427258, + -0.004123975522816181, + -0.004747895523905754, + -0.005240642465651035 + ] + }, + "state_pred_error_per_layer": [ + 8762.341796875, + 2348.0966796875, + 1278.38525390625, + 1081.769287109375, + 948.214599609375, + 985.5714111328125, + 775.6072387695312, + 713.37109375, + 927.2667846679688, + 1123.047119140625, + 1035.65966796875, + 864.7014770507812 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.204398078918457, + 1.3323631601333619, + 0.939462133026123, + 0.8349250438690186, + 0.798751298904419, + 0.7939926111221314, + 0.7538516298294068, + 0.7327921364307404, + 0.742140693473816, + 0.7984744975090027, + 0.7808600081443786, + 0.8111224076271057, + 0.818068535232544, + 0.8957202894210815, + 0.8786147340774536, + 0.8623664060592652, + 0.8652821689605713, + 0.9185279735088349, + 0.8737060611724854, + 0.940954065990448, + 0.9426063217163086, + 0.908225214099884, + 0.9119476990699769, + 0.8843687942504883, + 0.9302285919189454, + 0.9095543444633484, + 0.9696534498214722, + 0.9564951679229736, + 0.9960936920166016, + 1.0560175716400146, + 1.1218799053192139, + 1.1106456901550292, + 1.0888444778442383, + 1.108365227508545, + 1.1747237308502196, + 1.2570761484146118, + 1.2447720569610596, + 1.2861640047073364, + 1.345813150215149, + 1.2783869490623474, + 1.3102022647857665, + 1.3111451290130616, + 1.4334182024002076, + 1.3955786741256715, + 1.3985937965393067, + 1.4631241582870484, + 1.4292581964492799, + 1.4031433605194092, + 1.3756659330368042, + 1.3795376932144165, + 1.411164945602417, + 1.4335111087799073, + 1.4586236274719238, + 1.4378290100097657, + 1.4357496648788453, + 1.4363289024353028, + 1.4281649717330933, + 1.4307859104156495, + 1.4162574897766114, + 1.4109557525634766, + 1.4151159925460814, + 1.420570283126831, + 1.4031930568695068, + 1.409527113342285, + 1.4357126949310304, + 1.4103048273086547, + 1.4155527072906493, + 1.4083967643737794, + 1.4091735534667968, + 1.4099473182678222, + 1.4108677118301391, + 1.408898620223999, + 1.4091830333709716, + 1.4098944646835327, + 1.4084725885391236, + 1.409889715385437, + 1.4083553493499756, + 1.4081398155212401, + 1.4072429025650024, + 1.4070011655807495 + ], + "train_acc": [ + 0.1991, + 0.5286, + 0.6485, + 0.6923, + 0.7027, + 0.7121, + 0.7236, + 0.7332, + 0.7311, + 0.716, + 0.7232, + 0.7181, + 0.7132, + 0.7007, + 0.7034, + 0.7123, + 0.7171, + 0.7002, + 0.7115, + 0.6923, + 0.6879, + 0.6876, + 0.6828, + 0.6776, + 0.6602, + 0.6618, + 0.6434, + 0.6461, + 0.6328, + 0.6178, + 0.6044, + 0.6045, + 0.609, + 0.601, + 0.5795, + 0.5567, + 0.5526, + 0.5399, + 0.5257, + 0.5417, + 0.5249, + 0.5266, + 0.4915, + 0.4993, + 0.5061, + 0.4856, + 0.4925, + 0.4971, + 0.508, + 0.505, + 0.5012, + 0.4919, + 0.4814, + 0.4907, + 0.4888, + 0.4928, + 0.4872, + 0.4958, + 0.4988, + 0.4997, + 0.4948, + 0.4912, + 0.5021, + 0.4987, + 0.4862, + 0.4982, + 0.4953, + 0.5003, + 0.5009, + 0.4983, + 0.4985, + 0.4948, + 0.5005, + 0.499, + 0.4999, + 0.4979, + 0.4993, + 0.5032, + 0.5009, + 0.5014 + ], + "test_acc": [ + 0.397, + 0.5865, + 0.641, + 0.6645, + 0.638, + 0.674, + 0.681, + 0.6705, + 0.6525, + 0.669, + 0.666, + 0.654, + 0.6265, + 0.643, + 0.6705, + 0.648, + 0.6345, + 0.6565, + 0.6645, + 0.574, + 0.634, + 0.61, + 0.6255, + 0.6125, + 0.5815, + 0.5585, + 0.6005, + 0.6075, + 0.559, + 0.4235, + 0.448, + 0.5565, + 0.553, + 0.517, + 0.4805, + 0.5115, + 0.524, + 0.4995, + 0.518, + 0.501, + 0.5085, + 0.4275, + 0.453, + 0.49, + 0.464, + 0.471, + 0.4775, + 0.4765, + 0.4555, + 0.4755, + 0.4685, + 0.468, + 0.4685, + 0.4875, + 0.482, + 0.4705, + 0.479, + 0.479, + 0.4855, + 0.485, + 0.4695, + 0.4805, + 0.4875, + 0.4875, + 0.479, + 0.475, + 0.487, + 0.468, + 0.491, + 0.4805, + 0.476, + 0.491, + 0.489, + 0.4885, + 0.486, + 0.4915, + 0.485, + 0.489, + 0.4895, + 0.4905 + ], + "value_loss": [ + 3.072301338768005, + 1.0501791610717774, + 1.0778185897827148, + 1.0126153490543366, + 0.998683154296875, + 0.9888383563995361, + 0.8846181859016419, + 0.8152826041698455, + 0.8302651134490967, + 0.9819407861709595, + 0.9652068530082702, + 1.1237351128578186, + 1.0813433986663818, + 1.3806844716072082, + 1.2488904823303222, + 1.228573577594757, + 1.1786334270477294, + 1.2712596101760865, + 1.0855240513801574, + 1.2746817573547364, + 1.4511885639190674, + 1.154007823562622, + 1.1356486251831055, + 0.8443335267066956, + 0.837488655948639, + 0.6225753863334655, + 0.5785563923358917, + 0.7533490206718445, + 0.6095168882369996, + 0.7007707824707031, + 0.9116703001976013, + 1.3587798122406005, + 0.6592352680206299, + 0.7766882019996643, + 0.9818611496925354, + 0.9279026880264282, + 0.7442731433868408, + 1.069021375656128, + 1.0882310218811035, + 0.8840012928962707, + 1.0135157574653626, + 0.7696918965339661, + 0.7590476123809814, + 0.7395760213851928, + 0.8738672355651855, + 1.0812955352783202, + 0.6505666202068329, + 0.6151256795883179, + 0.7894958889007568, + 0.8141936486721039, + 0.7615871824264526, + 0.8084381361007691, + 0.6589969454288482, + 0.6014902378082275, + 0.5862701393127442, + 0.5811033900737762, + 0.5623021203994751, + 0.5565869275093078, + 0.5235150679111481, + 0.498365666103363, + 0.49131153430938723, + 0.4909665864467621, + 0.4629933397769928, + 0.4505445372581482, + 0.4790896162033081, + 0.5969956729888916, + 0.44423314423561094, + 0.43307222032547, + 0.4256617294311523, + 0.42464918003082275, + 0.41452328786849973, + 0.4117308448791504, + 0.492995530462265, + 0.43538717956542966, + 0.44797500500679016, + 0.45005082321166995, + 0.43216270017623903, + 0.4251728328704834, + 0.422374821472168, + 0.42473253202438355 + ], + "term_loss": [ + 1.7486166938781738, + 0.7108752704620361, + 0.8655158786773681, + 0.8239019277572632, + 0.8041402393341065, + 0.7661406455993652, + 0.6755866965293884, + 0.623099582517147, + 0.6441212059020996, + 0.7855478297710419, + 0.7730103199958801, + 0.9227579907894135, + 0.8809278240203857, + 1.1650211508274078, + 1.0323074983596803, + 1.0175812090992928, + 0.9653120155334473, + 1.043205972623825, + 0.861967781829834, + 0.9851467721462249, + 1.081189204788208, + 0.8166846063613892, + 0.7846175181388855, + 0.5201361804962158, + 0.4929544763326645, + 0.3175636313438416, + 0.2901056621313095, + 0.3790206042051315, + 0.28499682121276854, + 0.39165965728759766, + 0.5601075654983521, + 0.8508620109081269, + 0.33566083183288575, + 0.421619176197052, + 0.6050867574691773, + 0.515362792301178, + 0.3867789220809936, + 0.6784219856262207, + 0.6523104398727417, + 0.4651505504131317, + 0.5674913283348083, + 0.3531076382637024, + 0.3762776554107666, + 0.3760048986434937, + 0.5077781436920166, + 0.6820521322250366, + 0.31234550846815107, + 0.2759421797275543, + 0.4313824357509613, + 0.4397485457479954, + 0.38583696336746215, + 0.41842482051849367, + 0.2664445846557617, + 0.21906204319000244, + 0.2155111572265625, + 0.20474896924495697, + 0.19883680510520935, + 0.20494152598381044, + 0.17496985261440276, + 0.15888627536296845, + 0.1543628900051117, + 0.15332865059375764, + 0.13052898495197296, + 0.11957870311737061, + 0.14392558531761168, + 0.25379632194042206, + 0.11639134640097618, + 0.10945621439218521, + 0.10324780325889588, + 0.10286661281585693, + 0.09357965151071548, + 0.09110170931518077, + 0.1627564148902893, + 0.1111719566822052, + 0.12263777496814728, + 0.12426246918439865, + 0.1085665447294712, + 0.10199491771459579, + 0.09939227242469788, + 0.10016471980810165 + ], + "bridge_loss": [ + 1.0408418764609495, + 0.09791754142642022, + 0.01607361673563719, + 0.006360046429932117, + 0.014202374947071075, + 0.04166019638478756, + 0.03432967491745949, + 0.019949427074193955, + 0.011893661427497863, + 0.011133648046851158, + 0.010348413701355457, + 0.013049434357136487, + 0.010591996012628078, + 0.0145958656296134, + 0.016175279641151428, + 0.016993559893965723, + 0.020114685778319836, + 0.025630270735919475, + 0.029221688157320024, + 0.08149594967365265, + 0.15875441479682922, + 0.1295387010574341, + 0.14207587864398957, + 0.11591998620033264, + 0.12578484081625937, + 0.08755512158870697, + 0.05608815929889679, + 0.14551565287113188, + 0.08840978150367737, + 0.05767350391149521, + 0.09101119253635406, + 0.24997805795669556, + 0.06637025790214539, + 0.0923533808708191, + 0.10168245515823364, + 0.12557245763540267, + 0.07143535933494567, + 0.09773503345251083, + 0.1295747906923294, + 0.12344632883071899, + 0.1439121175765991, + 0.11409828340411186, + 0.06051087834537029, + 0.04596894909143448, + 0.05061739314496517, + 0.07255705659389496, + 0.015963772785663605, + 0.020752409666776658, + 0.045115634512901306, + 0.060058649122715, + 0.056574251520633695, + 0.06645108767151832, + 0.06612748733758926, + 0.06048111979663372, + 0.04903983753621578, + 0.05445499986112118, + 0.042946648034453395, + 0.030889016561210157, + 0.030506518384814264, + 0.022617575544118883, + 0.01963778121471405, + 0.018860915641486644, + 0.017245442955195905, + 0.01516037399172783, + 0.01477146714180708, + 0.027224332422018053, + 0.010273953337222337, + 0.00838120581805706, + 0.007192303487658501, + 0.0068658689022064205, + 0.0058338915776461366, + 0.006038547176122665, + 0.01565488623380661, + 0.009810619991272689, + 0.011464775865525008, + 0.011380115568637848, + 0.009845555101335049, + 0.009616777209192514, + 0.009775398235023021, + 0.011516085395216941 + ], + "tgrad_loss": [ + 0.2828427993297577, + 0.24138634746074678, + 0.196229097366333, + 0.18235337266921997, + 0.18034052944183349, + 0.18103751921653746, + 0.17470181679725647, + 0.17223359795808793, + 0.1742502421140671, + 0.1852593088388443, + 0.18184811897277833, + 0.1879276861667633, + 0.18982358770370483, + 0.20106744194030762, + 0.2004077008485794, + 0.19399881749153136, + 0.19320672080516815, + 0.20242335736751557, + 0.19433458232879638, + 0.2080390326499939, + 0.21124494104385377, + 0.2077845230102539, + 0.20895523295402527, + 0.2082773593902588, + 0.2187493396282196, + 0.21745663344860078, + 0.23236257095336915, + 0.22881276557445526, + 0.23611028518676758, + 0.2514376239776611, + 0.26055154542922976, + 0.25793972721099856, + 0.2572041809558868, + 0.2627156461000443, + 0.27509193930625914, + 0.28696743836402894, + 0.2860588630199432, + 0.29286437664031983, + 0.3063457974433899, + 0.29540441715717314, + 0.3021123158454895, + 0.3024859708786011, + 0.32225907711982726, + 0.31760216767787935, + 0.3154716930389404, + 0.3266863531112671, + 0.3222573429584503, + 0.3184310836315155, + 0.31299782562255857, + 0.3143864481925964, + 0.3191759672164917, + 0.32356222324371336, + 0.32642487545013427, + 0.3219470790863037, + 0.3217191444396973, + 0.32189942255020143, + 0.32051866216659547, + 0.3207563879013062, + 0.3180386944770813, + 0.31686181626319887, + 0.317310862159729, + 0.3187770200252533, + 0.3152189118385315, + 0.315805460357666, + 0.3203925657749176, + 0.3159750075340271, + 0.3175678468704224, + 0.31523480253219605, + 0.31522162137031556, + 0.3149166984081268, + 0.3151097435951233, + 0.31459059040546417, + 0.3145842257976532, + 0.31440460395812986, + 0.31387245659828183, + 0.31440823793411254, + 0.31375059900283814, + 0.31356113786697387, + 0.31320715007781985, + 0.3130517265796661 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0054779257625341415, + 0.004163481295108795, + -0.01823507994413376, + 0.06908583641052246, + 0.09582538902759552, + 0.15172168612480164, + 0.18814444541931152, + 0.21233659982681274, + 0.2397850900888443, + 0.26321661472320557, + 0.2640886902809143, + 0.2636783719062805 + ], + "perturbation_rho": [ + 0.05151631310582161, + 0.03990761935710907, + 0.02668120339512825, + 0.08933386206626892, + 0.12927217781543732, + 0.1893344521522522, + 0.20202970504760742, + 0.27141058444976807, + 0.2724490761756897, + 0.2844354808330536, + 0.2797800898551941, + 0.32699841260910034 + ], + "nudging": { + "0.001": [ + -0.0001630904444027692, + -9.781777043826878e-05, + 2.982819569297135e-05, + -0.0005619653384201229, + -0.0007587508298456669, + -0.0010895882733166218, + -0.0013035854790359735, + -0.0014455055352300406, + -0.0015995067078620195, + -0.0017208646750077605, + -0.0017206399934366345, + -0.0017194547690451145 + ], + "0.003": [ + -0.00048247227095998824, + -0.00029189756605774164, + 9.186804527416825e-05, + -0.0016840758034959435, + -0.002273733261972666, + -0.0032667750492691994, + -0.003907301928848028, + -0.004333460237830877, + -0.00479520158842206, + -0.005158073268830776, + -0.005157032050192356, + -0.005153942387551069 + ], + "0.01": [ + -0.0015225817915052176, + -0.0009501088643446565, + 0.00033305209944956005, + -0.005592360161244869, + -0.00755771528929472, + -0.010863769799470901, + -0.012987833470106125, + -0.014405487105250359, + -0.015937766060233116, + -0.017140284180641174, + -0.017137283459305763, + -0.01712280511856079 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L12_s42.json b/results/synth_ladder_v2_hi/synth_a1.0_L12_s42.json new file mode 100644 index 0000000..25bd6f4 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L12_s42.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.2167138540267943, + 0.6644192937850952, + 0.5506165061473847, + 0.48336037511825564, + 0.4182848771095276, + 0.40661907227039334, + 0.3424934825897217, + 0.35799139835834504, + 0.26511010785102845, + 0.23195732245445252, + 0.21270024724006653, + 0.2823052164077759, + 0.21164472794532777, + 0.13219849714040757, + 0.10133266744017601, + 0.06582562736868858, + 0.054910096859931944, + 0.0435772212266922, + 0.06975247826576234, + 0.09024971271753311, + 0.06281453031748534, + 0.0336100251019001, + 0.030896341681480408, + 0.013370775660872459, + 0.0070056052580475805, + 0.005166941817849874, + 0.004177044635638594, + 0.003664903662353754, + 0.0034957939501851797, + 0.0031688468992710113, + 0.00291866621337831, + 0.002714762531220913, + 0.002580664499104023, + 0.002398674404248595, + 0.0022654061004519464, + 0.002146232843864709, + 0.002038132343813777, + 0.001949047568999231, + 0.0018736178727820517, + 0.0017870874792337418, + 0.001717707582563162, + 0.0016691381417214871, + 0.0015940914524719119, + 0.0015403639724478125, + 0.0014816656844690442, + 0.0014313775778748096, + 0.0013872252825647593, + 0.0013475412249565125, + 0.0013132355155423283, + 0.0012787189619615673, + 0.0012495384665206074, + 0.0012182915758341551, + 0.0011908044705167412, + 0.0011678429022431373, + 0.0011426269576884807, + 0.0011216053618118167, + 0.0011020653950050473, + 0.001083208804158494, + 0.0010670971114188433, + 0.0010516460586339235, + 0.001039433507528156, + 0.0010266986285336315, + 0.0010152279118075967, + 0.0010044794451911003, + 0.0009945416286587716, + 0.0009859108565375208, + 0.000978297258168459, + 0.0009711428828537464, + 0.0009655707112513483, + 0.0009599804351106286, + 0.0009553508592769504, + 0.0009515129062347114, + 0.0009484084218507633, + 0.0009458189880475402, + 0.0009438993757590651, + 0.0009421453967690468, + 0.0009409848362207413, + 0.0009402696459554136, + 0.0009398385908454657, + 0.0009396035427227616 + ], + "train_acc": [ + 0.559, + 0.7404, + 0.787, + 0.8131, + 0.8387, + 0.8419, + 0.8708, + 0.8645, + 0.8993, + 0.9156, + 0.919, + 0.8953, + 0.9204, + 0.9563, + 0.9676, + 0.985, + 0.988, + 0.9916, + 0.9793, + 0.9696, + 0.9793, + 0.9926, + 0.9932, + 0.9992, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.7175, + 0.7345, + 0.7475, + 0.7525, + 0.7525, + 0.743, + 0.757, + 0.7615, + 0.7705, + 0.76, + 0.757, + 0.7545, + 0.759, + 0.76, + 0.768, + 0.7605, + 0.766, + 0.7695, + 0.7615, + 0.7475, + 0.7565, + 0.7525, + 0.762, + 0.758, + 0.7625, + 0.7645, + 0.763, + 0.7625, + 0.7615, + 0.765, + 0.761, + 0.7625, + 0.7595, + 0.761, + 0.7635, + 0.7615, + 0.7625, + 0.762, + 0.763, + 0.7625, + 0.763, + 0.7625, + 0.763, + 0.7635, + 0.761, + 0.7625, + 0.761, + 0.7625, + 0.762, + 0.7625, + 0.7625, + 0.7615, + 0.7605, + 0.761, + 0.7625, + 0.761, + 0.762, + 0.7615, + 0.7615, + 0.761, + 0.7615, + 0.761, + 0.7605, + 0.761, + 0.761, + 0.76, + 0.7605, + 0.76, + 0.762, + 0.7615, + 0.7615, + 0.7615, + 0.7615, + 0.7615, + 0.761, + 0.761, + 0.761, + 0.761, + 0.761, + 0.761 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9098777174949646, + 0.9046642780303955, + 0.8960509300231934, + 0.8827707171440125, + 0.8719829320907593, + 0.8605888485908508, + 0.8495617508888245, + 0.8414114117622375, + 0.8343594074249268, + 0.8291183114051819, + 0.8250235915184021, + 0.8201327323913574 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999990463256836, + 0.9999988675117493, + 0.9999977946281433, + 0.9999968409538269, + 0.9999942779541016, + 0.9999903440475464, + 0.9999786615371704, + 0.9999630451202393, + 0.9999446272850037, + 0.9999108910560608, + 0.9998850226402283 + ], + "nudging": { + "0.001": [ + -0.07562384009361267, + -0.062235549092292786, + -0.04947236552834511, + -0.037844814360141754, + -0.02797994762659073, + -0.020565558224916458, + -0.015074005350470543, + -0.01117792073637247, + -0.008472632616758347, + -0.006596862338483334, + -0.005293367430567741, + -0.004384535364806652 + ], + "0.003": [ + -0.21770286560058594, + -0.1805628389120102, + -0.1445462554693222, + -0.11127626150846481, + -0.0827074944972992, + -0.0610310398042202, + -0.044867098331451416, + -0.03334078937768936, + -0.025308270007371902, + -0.0197245292365551, + -0.015837673097848892, + -0.0131243746727705 + ], + "0.01": [ + -0.6227189302444458, + -0.5321269631385803, + -0.43762683868408203, + -0.34503036737442017, + -0.26150017976760864, + -0.1957385241985321, + -0.14543747901916504, + -0.10888919234275818, + -0.08308196067810059, + -0.06497863680124283, + -0.05229911208152771, + -0.043410398066043854 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.186298126029968, + 1.3170648136138916, + 0.9388262815475464, + 0.8259288063049316, + 0.7871681312561035, + 0.768296202325821, + 0.7554679615020752, + 0.7938834943771362, + 0.7564283534049988, + 0.7607723757743835, + 0.7925523330688476, + 0.8989389373779297, + 0.8784029937744141, + 0.8638933157920837, + 0.8698528030395508, + 0.8701005321502685, + 0.8684252815246583, + 0.9089286350250244, + 0.960618631362915, + 0.9822033012390137, + 1.020843323135376, + 0.9711806545257569, + 1.0430698785305024, + 1.0095568243026734, + 1.1050530094146729, + 1.069895089530945, + 1.1716613415718078, + 1.201347763824463, + 1.1283303380966188, + 1.1557568897247315, + 1.1250453087806702, + 1.1819004883766175, + 1.194346431541443, + 1.130011873483658, + 1.0376260078430175, + 1.0971675140380859, + 1.1035215358734132, + 1.1104521294593812, + 1.13454789352417, + 1.1742041780471801, + 1.2229691701889038, + 1.1794398748397827, + 1.1231036127090455, + 1.1594393963813783, + 1.1276930301189423, + 1.061903306388855, + 1.1229245660781861, + 1.073384938621521, + 1.0648032081604004, + 1.1271088062286376, + 1.068476490879059, + 1.0994879371643067, + 1.058270964050293, + 1.0784939964294433, + 1.0614496122360229, + 1.0508124362945557, + 1.065734383392334, + 1.0627044410705566, + 1.04440792427063, + 1.0639379348754883, + 1.0314187761306763, + 1.0538115164756774, + 1.0259352924346923, + 1.0052897773742675, + 0.9986613960266113, + 1.0119889862060547, + 0.9931197847366333, + 0.9905490432739258, + 0.9864775718688965, + 0.9887168021202087, + 0.9828311577796937, + 0.9784416509628295, + 0.9733598571777343, + 0.970889217376709, + 0.9696053255081176, + 0.9671486230850219, + 0.9651715932846069, + 0.9634749843597412, + 0.9624634768486023, + 0.9618757415771484 + ], + "train_acc": [ + 0.2057, + 0.5339, + 0.6457, + 0.6927, + 0.7074, + 0.7106, + 0.7227, + 0.7066, + 0.7186, + 0.7196, + 0.7107, + 0.6967, + 0.6987, + 0.7051, + 0.708, + 0.7071, + 0.7125, + 0.7034, + 0.6963, + 0.697, + 0.6885, + 0.6975, + 0.6901, + 0.694, + 0.6855, + 0.687, + 0.6777, + 0.6749, + 0.6809, + 0.6801, + 0.6866, + 0.6751, + 0.6789, + 0.6849, + 0.7045, + 0.6896, + 0.6886, + 0.6874, + 0.6841, + 0.6747, + 0.6727, + 0.6804, + 0.6875, + 0.6828, + 0.6875, + 0.6957, + 0.6864, + 0.6946, + 0.6966, + 0.6819, + 0.6936, + 0.6934, + 0.6954, + 0.6925, + 0.6991, + 0.6986, + 0.6928, + 0.6922, + 0.7001, + 0.695, + 0.6988, + 0.6989, + 0.7008, + 0.7025, + 0.7056, + 0.7027, + 0.7091, + 0.7075, + 0.7056, + 0.7094, + 0.7092, + 0.7108, + 0.7113, + 0.7103, + 0.7105, + 0.7119, + 0.712, + 0.7127, + 0.7119, + 0.7109 + ], + "test_acc": [ + 0.411, + 0.5885, + 0.6495, + 0.6605, + 0.6575, + 0.658, + 0.643, + 0.6645, + 0.6845, + 0.6295, + 0.612, + 0.5725, + 0.645, + 0.617, + 0.6705, + 0.663, + 0.6495, + 0.641, + 0.646, + 0.6305, + 0.6545, + 0.605, + 0.617, + 0.6125, + 0.6185, + 0.5835, + 0.6215, + 0.624, + 0.611, + 0.584, + 0.565, + 0.5905, + 0.5835, + 0.6395, + 0.6435, + 0.6235, + 0.6055, + 0.648, + 0.606, + 0.6105, + 0.6005, + 0.6235, + 0.5885, + 0.622, + 0.6285, + 0.6185, + 0.6225, + 0.644, + 0.628, + 0.6225, + 0.606, + 0.631, + 0.6295, + 0.6475, + 0.631, + 0.6455, + 0.6295, + 0.627, + 0.644, + 0.6445, + 0.627, + 0.6465, + 0.643, + 0.654, + 0.6615, + 0.6595, + 0.6365, + 0.6615, + 0.6505, + 0.661, + 0.657, + 0.653, + 0.6545, + 0.6515, + 0.6575, + 0.654, + 0.6565, + 0.656, + 0.6565, + 0.6555 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.019931811839342117, + 0.08357247710227966, + 0.07596792280673981, + 0.07454836368560791, + 0.08405900746583939, + 0.09273561835289001, + 0.08532143384218216, + 0.014841631054878235, + 0.05702097713947296, + 0.11365848034620285, + 0.0635562390089035, + 0.09192724525928497 + ], + "perturbation_rho": [ + -0.021908380091190338, + 0.08644437789916992, + 0.133758544921875, + 0.11560394614934921, + 0.09019643068313599, + 0.10901004821062088, + 0.05401141196489334, + 0.06626297533512115, + 0.10668720304965973, + 0.11482831090688705, + 0.07995637506246567, + 0.14062434434890747 + ], + "nudging": { + "0.001": [ + 0.0011563966982066631, + -0.0008197429706342518, + -0.00036967784399166703, + -0.00036756350891664624, + -0.0003487933427095413, + -0.0004525642143562436, + -0.0003745106514543295, + -0.00010148633737117052, + -0.00033267418621107936, + -0.00054067128803581, + -0.00029341079061850905, + -0.0004061080398969352 + ], + "0.003": [ + 0.00442184554412961, + -0.0024542496539652348, + -0.0011048256419599056, + -0.001102155540138483, + -0.0010442640632390976, + -0.0013546040281653404, + -0.0011223775800317526, + -0.00030574860284104943, + -0.0009935388807207346, + -0.0016202303813770413, + -0.0008805043180473149, + -0.0012169405817985535 + ], + "0.01": [ + 0.012093277648091316, + -0.00814887322485447, + -0.0036774289328604937, + -0.0036643892526626587, + -0.0034756590612232685, + -0.0045063551515340805, + -0.003735880134627223, + -0.00101565255317837, + -0.0033070247154682875, + -0.005390047561377287, + -0.0029281126335263252, + -0.004048082046210766 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7927106206893921, + 1.0314875890731812, + 0.8727929697036744, + 0.9138810105323791, + 0.9269397434234619, + 0.9882902357101441, + 1.054063469696045, + 1.1199199728012086, + 1.1510957370758057, + 1.147088790512085, + 1.1919541924476624, + 1.234068378829956, + 1.2097180450439453, + 1.1891298070907592, + 1.1807195945739746, + 1.2230972785949707, + 1.1718537767410278, + 1.1954543895721434, + 1.2653305320739745, + 1.2169406047821045, + 1.1939767074584962, + 1.1432181312561036, + 1.13808095703125, + 1.1338830974578857, + 1.1148282649993897, + 1.125065263557434, + 1.084688761138916, + 1.1044120174407959, + 1.1321100765228271, + 1.1385612312316895, + 1.1563688796997071, + 1.1437482376098633, + 1.1149125736236571, + 1.1060235730171204, + 1.0663122928619384, + 1.0548065941810607, + 1.037735648727417, + 1.040986361694336, + 1.0317749416351318, + 1.0356540889739991, + 1.0302827856063843, + 1.0450294395446778, + 1.046817469215393, + 1.054090824508667, + 1.0731036259651183, + 1.0649280383110047, + 1.0700508375167848, + 1.0669750782966614, + 1.0659932651519775, + 1.0457564308166505, + 1.0646298887252807, + 1.033217864227295, + 1.020263679790497, + 1.0093394360542298, + 0.9962293283462524, + 1.002608583831787, + 0.9913532760620117, + 0.9975923980712891, + 0.9923603912353516, + 0.9835381677627564, + 0.9838607303619384, + 0.9828417135238647, + 0.9760973712921143, + 0.9737089462280274, + 0.9740158191680908, + 0.9762706676483154, + 0.9749209213256836, + 0.9819463082313538, + 0.9734501623153686, + 0.9739530671119689, + 0.9739078194618225, + 0.9717803599357605, + 0.9706060266494752, + 0.9709286643981934, + 0.9693692140579223, + 0.9688454288482666, + 0.9685833683967591, + 0.968160081577301, + 0.9678136520385742, + 0.9676551561355591 + ], + "train_acc": [ + 0.3529, + 0.617, + 0.6865, + 0.684, + 0.6808, + 0.6645, + 0.6281, + 0.6079, + 0.5946, + 0.606, + 0.5938, + 0.5933, + 0.585, + 0.5874, + 0.5821, + 0.5693, + 0.585, + 0.5767, + 0.5594, + 0.5723, + 0.5785, + 0.5954, + 0.5957, + 0.6033, + 0.5983, + 0.5932, + 0.6125, + 0.6031, + 0.5973, + 0.6013, + 0.5975, + 0.5991, + 0.6068, + 0.6046, + 0.6157, + 0.6177, + 0.6224, + 0.6263, + 0.6237, + 0.6244, + 0.6273, + 0.6203, + 0.6219, + 0.6184, + 0.6144, + 0.6174, + 0.6135, + 0.6197, + 0.617, + 0.6202, + 0.6124, + 0.6257, + 0.6283, + 0.6294, + 0.6354, + 0.6396, + 0.6378, + 0.641, + 0.6431, + 0.6427, + 0.6436, + 0.6436, + 0.6449, + 0.6471, + 0.6451, + 0.6463, + 0.6456, + 0.6422, + 0.6467, + 0.6457, + 0.6461, + 0.6474, + 0.6446, + 0.6444, + 0.646, + 0.6458, + 0.6446, + 0.6441, + 0.6447, + 0.6456 + ], + "test_acc": [ + 0.519, + 0.664, + 0.6565, + 0.6705, + 0.636, + 0.619, + 0.579, + 0.5705, + 0.5865, + 0.5705, + 0.562, + 0.5375, + 0.561, + 0.558, + 0.5465, + 0.532, + 0.5275, + 0.486, + 0.5195, + 0.5395, + 0.55, + 0.573, + 0.556, + 0.5605, + 0.5615, + 0.574, + 0.5745, + 0.556, + 0.5575, + 0.556, + 0.5545, + 0.5625, + 0.5675, + 0.57, + 0.573, + 0.588, + 0.583, + 0.5995, + 0.593, + 0.5865, + 0.588, + 0.584, + 0.587, + 0.5745, + 0.578, + 0.584, + 0.581, + 0.577, + 0.578, + 0.5575, + 0.581, + 0.588, + 0.59, + 0.5965, + 0.5935, + 0.5995, + 0.607, + 0.6035, + 0.606, + 0.617, + 0.61, + 0.6075, + 0.616, + 0.616, + 0.6045, + 0.609, + 0.6005, + 0.6105, + 0.609, + 0.612, + 0.609, + 0.61, + 0.6095, + 0.6105, + 0.6115, + 0.6105, + 0.6135, + 0.6115, + 0.6115, + 0.612 + ], + "state_pred_error": [ + 0.6679646494865418, + 0.208888227891922, + 0.15699384171962738, + 0.1473097540616989, + 0.14668454189300537, + 0.14812699263095855, + 0.14335613057613372, + 0.13920899329185485, + 0.12979220235347746, + 0.128491516828537, + 0.13504859671592712, + 0.1396056207180023, + 0.13049439578056335, + 0.1227945753455162, + 0.11947583696842194, + 0.10677306697368621, + 0.09056728343963623, + 0.0806899295091629, + 0.07537768748998643, + 0.07152788438796998, + 0.06905149774551392, + 0.062417028772830965, + 0.06347229870557786, + 0.06624231204986572, + 0.06285614745020866, + 0.0503471009016037, + 0.04555290793180466, + 0.050627702116966246, + 0.05441606894731522, + 0.055547272217273715, + 0.062450043869018555, + 0.06494303442835808, + 0.06485141371488572, + 0.06386149806976318, + 0.05790943026542664, + 0.05235746785998344, + 0.04955936104059219, + 0.05004490375518799, + 0.04749767688512802, + 0.04710491924285889, + 0.0465313448369503, + 0.04374815753698349, + 0.04258050545454025, + 0.03991454938054085, + 0.0385970116853714, + 0.03645361765027046, + 0.034857989984750745, + 0.033499520513415336, + 0.03257660132646561, + 0.03282006865441799, + 0.03126014052629471, + 0.03070251874923706, + 0.02945106231868267, + 0.02763169339597225, + 0.026091488403081894, + 0.024555341643095016, + 0.023253344959020615, + 0.02221344622075558, + 0.021545387333631514, + 0.02069348260462284, + 0.02002821311056614, + 0.019566327910125254, + 0.019089816910028458, + 0.018679450111091137, + 0.01807071948647499, + 0.017758635139465333, + 0.017390955182909965, + 0.016965231823921203, + 0.01691897337138653, + 0.016519649094343187, + 0.01632954144179821, + 0.015909486715495587, + 0.015621637430787087, + 0.01549294995367527, + 0.01523477383106947, + 0.015047570972144604, + 0.014741873973608016, + 0.014865786504745484, + 0.0145689842492342, + 0.01426824083328247 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6137553453445435, + 0.458263099193573, + 0.30694735050201416, + 0.21984770894050598, + 0.18884725868701935, + 0.1519574671983719, + 0.14165323972702026, + 0.13691727817058563, + 0.1416233777999878, + 0.126474529504776, + 0.13544593751430511, + 0.15268874168395996 + ], + "perturbation_rho": [ + 0.5528259873390198, + 0.43722641468048096, + 0.3177984952926636, + 0.20145072042942047, + 0.17441785335540771, + 0.10548915714025497, + 0.16265320777893066, + 0.1351865828037262, + 0.16532285511493683, + 0.1285737156867981, + 0.14820542931556702, + 0.13290725648403168 + ], + "nudging": { + "0.001": [ + -0.017212403938174248, + -0.002171289175748825, + -0.0011191105004400015, + -0.0007672292995266616, + -0.0006296404171735048, + -0.0005172825185582042, + -0.00045882861013524234, + -0.00044813245767727494, + -0.0004553778562694788, + -0.00039569500950165093, + -0.00041053537279367447, + -0.0004746984923258424 + ], + "0.003": [ + -0.051028184592723846, + -0.006504997611045837, + -0.0033547731582075357, + -0.002300845691934228, + -0.0018879442941397429, + -0.0015519845765084028, + -0.001375660765916109, + -0.0013441899791359901, + -0.0013661098200827837, + -0.0011867693392559886, + -0.0012310168240219355, + -0.0014232922112569213 + ], + "0.01": [ + -0.16301177442073822, + -0.02157333306968212, + -0.011153988540172577, + -0.00765608623623848, + -0.006283854134380817, + -0.005166183691471815, + -0.0045799510553479195, + -0.004474613815546036, + -0.004547867923974991, + -0.003950329497456551, + -0.004098072648048401, + -0.004737637937068939 + ] + }, + "state_pred_error_per_layer": [ + 9663.3720703125, + 2355.42919921875, + 1189.673095703125, + 946.2671508789062, + 890.0131225585938, + 836.83837890625, + 765.7700805664062, + 776.2135009765625, + 909.9769287109375, + 744.7386474609375, + 809.6233520507812, + 764.1907958984375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.187571883392334, + 1.326188510799408, + 0.9483794553756714, + 0.8345242721557617, + 0.7889606231689453, + 0.7665260448455811, + 0.7712172222137451, + 0.7981748757362366, + 0.7899593097686768, + 0.7801628154754638, + 0.8586313926696777, + 0.8269656328201294, + 0.807786918926239, + 0.8667379869461059, + 0.899315183544159, + 0.9044795955657959, + 0.8931566469192505, + 0.9207966779708863, + 1.0783265449047088, + 1.0466851587295531, + 1.093337151145935, + 1.1578910236358642, + 1.167968105840683, + 1.23159896774292, + 1.2349544055938722, + 1.2180055444717408, + 1.3142979488372803, + 1.2654387786865235, + 1.171596767616272, + 1.2007275730133056, + 1.1795954244613647, + 1.1870033908843993, + 1.1767311180114746, + 1.2135950805664062, + 1.158268939971924, + 1.1288424992561341, + 1.1108321193695068, + 1.1112286039352417, + 1.175734718990326, + 1.2268269479751588, + 1.26170970993042, + 1.2978283054351807, + 1.238773140335083, + 1.2101145763397216, + 1.1873152170181274, + 1.2330628694534302, + 1.226954536819458, + 1.2110083309173585, + 1.1265845808029176, + 1.116980394744873, + 1.1078424495697021, + 1.1030315553665162, + 1.1111802764892578, + 1.1046845901489257, + 1.118118372440338, + 1.123797571182251, + 1.1151752515792848, + 1.1250915416717528, + 1.1366710498809816, + 1.1448557445526124, + 1.1518292568206787, + 1.159379100227356, + 1.1686466316223145, + 1.1710848539352416, + 1.1695413871765137, + 1.1633276565551758, + 1.1677356637954712, + 1.1538119668006896, + 1.1502773937225341, + 1.1475828493118285, + 1.1402593296051025, + 1.1347655990600587, + 1.1332295770645142, + 1.1308751027107238, + 1.1288191188812255, + 1.1274588232040406, + 1.1259936437606812, + 1.1247959713935851, + 1.1243038135528565, + 1.1238948013305663 + ], + "train_acc": [ + 0.2013, + 0.5327, + 0.6437, + 0.6861, + 0.704, + 0.7125, + 0.7112, + 0.7059, + 0.7086, + 0.7123, + 0.7009, + 0.7122, + 0.7157, + 0.706, + 0.703, + 0.7039, + 0.7054, + 0.7067, + 0.6783, + 0.68, + 0.6715, + 0.6585, + 0.6541, + 0.6474, + 0.6488, + 0.6484, + 0.6234, + 0.6167, + 0.6265, + 0.6152, + 0.6068, + 0.598, + 0.6005, + 0.5804, + 0.593, + 0.5996, + 0.6022, + 0.6074, + 0.5925, + 0.5753, + 0.5686, + 0.5582, + 0.5762, + 0.5799, + 0.5923, + 0.5848, + 0.5937, + 0.5908, + 0.6006, + 0.6011, + 0.6017, + 0.6061, + 0.6037, + 0.6052, + 0.6025, + 0.6042, + 0.6109, + 0.6127, + 0.6036, + 0.6001, + 0.6004, + 0.6013, + 0.6002, + 0.5997, + 0.5996, + 0.6016, + 0.6004, + 0.6023, + 0.6007, + 0.5986, + 0.6028, + 0.6049, + 0.605, + 0.6036, + 0.6054, + 0.6047, + 0.6046, + 0.6047, + 0.605, + 0.6055 + ], + "test_acc": [ + 0.411, + 0.5885, + 0.636, + 0.6585, + 0.67, + 0.65, + 0.667, + 0.6335, + 0.6685, + 0.673, + 0.6455, + 0.6705, + 0.6075, + 0.6715, + 0.6535, + 0.649, + 0.651, + 0.53, + 0.6265, + 0.601, + 0.605, + 0.627, + 0.622, + 0.5865, + 0.6085, + 0.594, + 0.5815, + 0.589, + 0.57, + 0.5685, + 0.5505, + 0.5145, + 0.459, + 0.478, + 0.528, + 0.564, + 0.553, + 0.5485, + 0.5305, + 0.501, + 0.5365, + 0.529, + 0.5225, + 0.5515, + 0.5195, + 0.5455, + 0.5615, + 0.582, + 0.5635, + 0.574, + 0.5735, + 0.5645, + 0.551, + 0.5465, + 0.5655, + 0.5755, + 0.5495, + 0.558, + 0.5565, + 0.549, + 0.55, + 0.5515, + 0.5405, + 0.537, + 0.5375, + 0.54, + 0.5495, + 0.5415, + 0.541, + 0.5485, + 0.5475, + 0.549, + 0.549, + 0.5525, + 0.5485, + 0.5505, + 0.552, + 0.552, + 0.5505, + 0.551 + ], + "value_loss": [ + 3.0176044733047487, + 1.0615758232116699, + 1.060210463142395, + 1.0228195582389832, + 1.010133931159973, + 0.9419147435188293, + 0.9213042179107666, + 0.983886623954773, + 0.9630082674980164, + 0.9914523235321044, + 1.2916864912033081, + 1.2033885765075683, + 1.1053708289146424, + 1.3117134510040283, + 1.4571176118850708, + 1.4822016599655152, + 1.4464408508300781, + 1.494612897491455, + 1.8919828211784362, + 1.818289499282837, + 2.0769482429504396, + 2.12258825340271, + 2.033720273256302, + 2.0954800230026245, + 2.042681290435791, + 1.6873159214019775, + 1.8694674877166748, + 1.7658453981399536, + 1.2227107414245606, + 1.1675872913360597, + 1.0477982774734498, + 1.0205717498779296, + 0.988148659324646, + 1.2007792435646056, + 1.2352806282043458, + 0.7386786937713623, + 0.6201939727783203, + 0.6657010184288025, + 0.6853000906467438, + 0.8492486668586731, + 0.9932778938293457, + 0.7683114501953126, + 0.7004810465812683, + 0.6364181649208069, + 0.7614990028381348, + 0.9295081817626953, + 0.9417757865428924, + 0.9216889915466309, + 1.110058699989319, + 0.6404524593353271, + 0.5510710064888, + 0.5543017141342164, + 0.5552202627182007, + 0.5762319219589234, + 0.5093711531162262, + 0.5778757699012756, + 0.5336550855636597, + 0.5517868465423584, + 0.5429261692523957, + 0.5305708591222763, + 0.5233953864097595, + 0.5504776068687439, + 0.539759356212616, + 0.549393851852417, + 0.5086777307510376, + 0.5206843482017517, + 0.5520425520896911, + 0.48353495416641235, + 0.4974589912414551, + 0.44917406425476075, + 0.43793688774108885, + 0.45631180305480956, + 0.4439697093963623, + 0.42663677763938906, + 0.42073239850997923, + 0.42288827419281005, + 0.41220576906204226, + 0.4032818036079407, + 0.39890543241500853, + 0.40481987361907956 + ], + "term_loss": [ + 1.7119286471366881, + 0.7037585079193115, + 0.8388954549789429, + 0.8274686014175415, + 0.8159207627296448, + 0.7364932671546937, + 0.7016430713653564, + 0.7591273450374604, + 0.7492439122200012, + 0.7837357002258301, + 1.0731903156280518, + 0.9902451916694641, + 0.8949025638103485, + 1.0940426338195801, + 1.2338541860580445, + 1.2540717607498169, + 1.2233770456314086, + 1.266107029724121, + 1.6277973073005676, + 1.5449570091247558, + 1.7487831764221191, + 1.7418235130310058, + 1.6319917914390565, + 1.6619985774993897, + 1.5998232263565064, + 1.291028978919983, + 1.443897636795044, + 1.282541985321045, + 0.8302469918251038, + 0.7786969506263733, + 0.6696095920085907, + 0.629389222240448, + 0.6078266143798828, + 0.7563104814052581, + 0.7805323437929154, + 0.4057512969493866, + 0.3186667461395264, + 0.36671760559082034, + 0.3813627925157547, + 0.5274563785791397, + 0.6265791069030762, + 0.42749316444396973, + 0.3737451464653015, + 0.3232894562005997, + 0.4397853298187256, + 0.603940721321106, + 0.6182400625228882, + 0.5936727350234985, + 0.729513829421997, + 0.3043965761899948, + 0.25340475018024444, + 0.27099439952373505, + 0.2766846051216125, + 0.29747566282749177, + 0.24260444918870927, + 0.3014756342887878, + 0.2654747169494629, + 0.2814042194366455, + 0.2751402094900608, + 0.2607534381270409, + 0.2544426300525665, + 0.2766920667171478, + 0.26777749214172364, + 0.27581927382946014, + 0.24122158317565917, + 0.25178992862701416, + 0.27741119154691696, + 0.22030126638412476, + 0.2316324962377548, + 0.19071975877285002, + 0.1823152543067932, + 0.196656636095047, + 0.186306823015213, + 0.16951884495019912, + 0.1646258558511734, + 0.16557776184082032, + 0.15581585245132445, + 0.1488703131914139, + 0.1448495783805847, + 0.14867231681346893 + ], + "bridge_loss": [ + 1.0148520425139926, + 0.10943376184105873, + 0.016118820284307004, + 0.00479079963862896, + 0.00932531143128872, + 0.022979111295938492, + 0.03275809189677238, + 0.030009772622585296, + 0.018097961828112602, + 0.01276451837271452, + 0.011840740299224854, + 0.011681876456737518, + 0.011498133054375649, + 0.012259974516928196, + 0.012814128774404526, + 0.016967138912528754, + 0.015625382725894452, + 0.016673024797439574, + 0.026665059140324594, + 0.040999473381042484, + 0.08775637840032577, + 0.13471563642024995, + 0.15264853343963622, + 0.17042632131576538, + 0.1846267404794693, + 0.1426714852333069, + 0.15643644499778747, + 0.21692225222587586, + 0.1381309385061264, + 0.13067246084213258, + 0.12024339685440064, + 0.12863199595212937, + 0.11999726004600525, + 0.1790491102874279, + 0.19895550255775452, + 0.07846425278186799, + 0.0521241464138031, + 0.050531299328804014, + 0.048225503075122834, + 0.0573767644226551, + 0.09494609681367874, + 0.06426656882762909, + 0.057834729897975924, + 0.04925961502492428, + 0.061063556718826295, + 0.05985300147533417, + 0.062644553732872, + 0.0668293038368225, + 0.13089194159507753, + 0.08827434695959091, + 0.051028902739286425, + 0.03809687232673168, + 0.033848379123210905, + 0.03457036361694336, + 0.02108327111005783, + 0.029492683643102646, + 0.02455984553694725, + 0.02582640761435032, + 0.021667973601818085, + 0.022328672303259373, + 0.02060983867049217, + 0.023895200684666634, + 0.022121075198054313, + 0.02329711413383484, + 0.017430856196582318, + 0.019568592843413352, + 0.025390091779083013, + 0.015601030120253562, + 0.019178162130713463, + 0.011871388348937034, + 0.011855170375108718, + 0.016089519263803958, + 0.014637802371382713, + 0.014631265115737915, + 0.014274802702665328, + 0.014835487592220307, + 0.014966160023212433, + 0.013275021009892226, + 0.013311498472094535, + 0.015895452450215817 + ], + "tgrad_loss": [ + 0.29082378821372984, + 0.2483835512638092, + 0.2051961945772171, + 0.1905601591825485, + 0.18488785667419433, + 0.1824423761844635, + 0.1869030656814575, + 0.1947495018005371, + 0.19566639924049378, + 0.1949521035194397, + 0.20665544452667237, + 0.20146149559020995, + 0.19897012882232665, + 0.20541083397865295, + 0.21044929957389832, + 0.21116275901794435, + 0.20743842515945435, + 0.21183283591270446, + 0.2375204436659813, + 0.23233302335739137, + 0.24040868864059448, + 0.24604910697937013, + 0.2490799533367157, + 0.2630551248550415, + 0.258231339263916, + 0.25361546020507814, + 0.2691334120750427, + 0.2663811700344086, + 0.2543328045845032, + 0.2582178777694702, + 0.2579452847003937, + 0.2625505379915237, + 0.26032478485107424, + 0.265419658946991, + 0.2557927810668945, + 0.2544631404399872, + 0.2494030824661255, + 0.24845211391448974, + 0.2557117907762527, + 0.26441551985740663, + 0.2717526791572571, + 0.2765517095565796, + 0.2689011663913727, + 0.2638690975189209, + 0.2606501162528992, + 0.26571446528434756, + 0.26089117522239685, + 0.2611869606494904, + 0.2496529348373413, + 0.2477815414428711, + 0.2466373523712158, + 0.2452104380130768, + 0.2446872700691223, + 0.24418589582443237, + 0.2456834303855896, + 0.24690745534896852, + 0.24362052619457245, + 0.244556223154068, + 0.24611798746585847, + 0.24748875288963318, + 0.2483429102420807, + 0.24989033243656159, + 0.24986078734397887, + 0.25027746453285216, + 0.25002529113292693, + 0.24932582616806032, + 0.24924127697944642, + 0.24763265438079834, + 0.24664833087921142, + 0.24658291368484497, + 0.24376646332740784, + 0.24356564955711366, + 0.2430250828266144, + 0.24248666682243347, + 0.24183174138069152, + 0.24247501969337462, + 0.24142375493049623, + 0.24113646895885468, + 0.2407443552494049, + 0.24025210301876068 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.050826266407966614, + 0.1324397623538971, + 0.19395378232002258, + 0.22954219579696655, + 0.24835197627544403, + 0.26261672377586365, + 0.2866933345794678, + 0.3069983422756195, + 0.3148944675922394, + 0.31817084550857544, + 0.3155951499938965, + 0.31555619835853577 + ], + "perturbation_rho": [ + 0.024354537948966026, + 0.23902058601379395, + 0.29458120465278625, + 0.31519168615341187, + 0.3208061456680298, + 0.38384467363357544, + 0.38460177183151245, + 0.4478553831577301, + 0.41032421588897705, + 0.452781081199646, + 0.43433815240859985, + 0.434899240732193 + ], + "nudging": { + "0.001": [ + -0.0018732836470007896, + -0.0014186109183356166, + -0.0016378036234527826, + -0.001764438347890973, + -0.0018913769163191319, + -0.002036110032349825, + -0.0021226275712251663, + -0.0021735229529440403, + -0.002216566586866975, + -0.0022331401705741882, + -0.002216600114479661, + -0.0022018395829945803 + ], + "0.003": [ + -0.005605676211416721, + -0.004251755774021149, + -0.004909512121230364, + -0.00528964027762413, + -0.005669655278325081, + -0.0061027128249406815, + -0.006363155320286751, + -0.006514269858598709, + -0.006643516011536121, + -0.006693107541650534, + -0.006642842199653387, + -0.006598594132810831 + ], + "0.01": [ + -0.018513288348913193, + -0.014132995158433914, + -0.016322217881679535, + -0.017585258930921555, + -0.018846090883016586, + -0.02027801051735878, + -0.021141095086932182, + -0.02164183184504509, + -0.02207053080201149, + -0.022233182564377785, + -0.02206714265048504, + -0.021919995546340942 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L12_s456.json b/results/synth_ladder_v2_hi/synth_a1.0_L12_s456.json new file mode 100644 index 0000000..dee781b --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L12_s456.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.2214362565994263, + 0.6880987966537475, + 0.573380104637146, + 0.504524497127533, + 0.4304532258987427, + 0.4075445725917816, + 0.3505498517990112, + 0.33131821126937866, + 0.316932852602005, + 0.2321077467918396, + 0.24117032368183136, + 0.18791021666526794, + 0.1795637712955475, + 0.22588226013183593, + 0.12590660848617555, + 0.0935815057039261, + 0.08925642510652543, + 0.06074653144180775, + 0.03752641976475716, + 0.029369706916809082, + 0.022727268996834755, + 0.013826664884388447, + 0.009437553413957358, + 0.006844828377664089, + 0.005729820974171161, + 0.005235948743671179, + 0.004590337446331978, + 0.004217684137821197, + 0.0039060393817722796, + 0.0036189329497516155, + 0.0033334961384534835, + 0.0030410941667854785, + 0.00281677149515599, + 0.002593890456110239, + 0.0025124770160764457, + 0.002334106710460037, + 0.0021957552917301654, + 0.0020749030753970145, + 0.0020024682715535165, + 0.0019192409418523312, + 0.001830386008322239, + 0.0017719921819865704, + 0.0016809766824357213, + 0.0016068122006952764, + 0.0015503323614597321, + 0.0014956797890365123, + 0.001446343973185867, + 0.001398251862078905, + 0.0013568441493436694, + 0.001320645131357014, + 0.0012880230963230133, + 0.0012557724336162209, + 0.0012244191642850637, + 0.001201738376915455, + 0.0011770459957420826, + 0.001153542260825634, + 0.0011285611988976598, + 0.0011068878036923707, + 0.0010875567765906452, + 0.0010707868609577417, + 0.001056193824671209, + 0.0010415504628792406, + 0.001029124596528709, + 0.001017341089528054, + 0.0010068201394751667, + 0.0009978911615908146, + 0.000990417231619358, + 0.0009832257608883082, + 0.00097659575836733, + 0.0009707848763093352, + 0.0009656708472408354, + 0.0009617022202350199, + 0.0009582118788734078, + 0.0009554196711629629, + 0.0009532522734254598, + 0.0009515513226389885, + 0.0009503170928917825, + 0.0009495424324646592, + 0.0009490435067564249, + 0.0009488068943843246 + ], + "train_acc": [ + 0.5591, + 0.7376, + 0.7816, + 0.8038, + 0.832, + 0.8395, + 0.865, + 0.8744, + 0.8816, + 0.9157, + 0.907, + 0.9327, + 0.9345, + 0.918, + 0.9564, + 0.9711, + 0.9739, + 0.9841, + 0.9937, + 0.9955, + 0.9983, + 0.9998, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.714, + 0.733, + 0.739, + 0.7415, + 0.749, + 0.7445, + 0.7555, + 0.753, + 0.758, + 0.764, + 0.7605, + 0.763, + 0.751, + 0.7495, + 0.76, + 0.758, + 0.7535, + 0.762, + 0.763, + 0.7595, + 0.7655, + 0.766, + 0.7655, + 0.7665, + 0.7635, + 0.7635, + 0.7625, + 0.763, + 0.765, + 0.765, + 0.765, + 0.7605, + 0.762, + 0.7625, + 0.7625, + 0.7625, + 0.765, + 0.7625, + 0.761, + 0.7635, + 0.763, + 0.762, + 0.7645, + 0.762, + 0.7625, + 0.762, + 0.7615, + 0.761, + 0.7605, + 0.762, + 0.761, + 0.7625, + 0.761, + 0.763, + 0.7615, + 0.76, + 0.7615, + 0.761, + 0.7605, + 0.76, + 0.7585, + 0.7605, + 0.7595, + 0.76, + 0.7605, + 0.76, + 0.761, + 0.7615, + 0.7605, + 0.761, + 0.761, + 0.7615, + 0.762, + 0.762, + 0.762, + 0.762, + 0.762, + 0.762, + 0.762, + 0.762 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8338037729263306, + 0.8328856229782104, + 0.8300410509109497, + 0.823561429977417, + 0.8153207302093506, + 0.8093391060829163, + 0.8022103309631348, + 0.797042727470398, + 0.7909072041511536, + 0.7847579121589661, + 0.7778322100639343, + 0.7729053497314453 + ], + "perturbation_rho": [ + 0.9999991059303284, + 0.999998927116394, + 0.9999983906745911, + 0.9999978542327881, + 0.999996542930603, + 0.9999936819076538, + 0.9999876022338867, + 0.9999791383743286, + 0.9999581575393677, + 0.9999358057975769, + 0.9998983144760132, + 0.9998669624328613 + ], + "nudging": { + "0.001": [ + -0.06551718711853027, + -0.05436878278851509, + -0.04374578222632408, + -0.03377873823046684, + -0.02519271895289421, + -0.018464749678969383, + -0.01353352889418602, + -0.010026221163570881, + -0.007582810707390308, + -0.0058988286182284355, + -0.004728769883513451, + -0.003913772292435169 + ], + "0.003": [ + -0.18775689601898193, + -0.15706855058670044, + -0.1273409128189087, + -0.09902073442935944, + -0.07429663836956024, + -0.05470982939004898, + -0.040235307067632675, + -0.029878726229071617, + -0.022634346038103104, + -0.017627287656068802, + -0.01414164062589407, + -0.011711093597114086 + ], + "0.01": [ + -0.5344969034194946, + -0.45930254459381104, + -0.3820700943470001, + -0.30436116456985474, + -0.2331882268190384, + -0.17455099523067474, + -0.12991222739219666, + -0.09728521853685379, + -0.07412658631801605, + -0.05795694515109062, + -0.04662308096885681, + -0.03868289291858673 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.207177610397339, + 1.3553162548065185, + 0.9701127763748169, + 0.8732295251846314, + 0.8323645715236664, + 0.7960227321624755, + 0.7760959873199463, + 0.7735449209213257, + 0.8278698476791382, + 0.7780323928833007, + 0.7878356379508972, + 0.8351406150817872, + 0.8288927593231201, + 0.8574019664764404, + 0.9053186392784118, + 0.8401385468482971, + 0.9288690845489502, + 0.9082258205413818, + 0.9345129062652587, + 0.9014082008361817, + 0.9392737476348877, + 0.9890750411033631, + 0.9745229903221131, + 1.012724796485901, + 1.0476140842437744, + 1.0703742972373962, + 1.0096880889892579, + 1.0171483258247376, + 0.993707428073883, + 1.0268911544799804, + 1.0893181150436402, + 1.0987916242599487, + 1.1768492286682128, + 1.0336660877227783, + 1.0487600833892823, + 1.0165627954006196, + 1.0527002319335939, + 1.0847500762939453, + 1.0983065540313721, + 1.1062523952484131, + 1.1631684410095215, + 1.0733569494247437, + 1.0690837306976317, + 1.0478396898269653, + 1.0268214958190918, + 1.0501665784835816, + 1.0577228107452392, + 1.0538366958618164, + 1.0179664922714233, + 1.0134689270019532, + 0.9985476385116577, + 1.0454052556991578, + 1.0207467739105225, + 1.0244656821250915, + 0.9939537384033204, + 1.0521814125061035, + 1.0026006247520447, + 0.9790403079986573, + 1.0003239252090455, + 0.9621838529586793, + 0.9900179187774658, + 0.9625193190574646, + 0.9366787405014038, + 0.9520282551765442, + 0.9402749418258667, + 0.9276724267959595, + 0.926775997543335, + 0.9376771799087524, + 0.9245368611335755, + 0.9217848522186279, + 0.9227305391311645, + 0.9204626731872558, + 0.9151489919662475, + 0.9102424224853516, + 0.9097598545074463, + 0.9079971894264222, + 0.905090577507019, + 0.9043300183296203, + 0.9026400138854981, + 0.9020073030471801 + ], + "train_acc": [ + 0.1971, + 0.5182, + 0.6448, + 0.6792, + 0.6936, + 0.7075, + 0.7157, + 0.7152, + 0.7044, + 0.7158, + 0.7198, + 0.7091, + 0.711, + 0.7059, + 0.6962, + 0.7185, + 0.697, + 0.709, + 0.7009, + 0.7141, + 0.7042, + 0.6947, + 0.7025, + 0.695, + 0.6896, + 0.6896, + 0.6981, + 0.7002, + 0.6978, + 0.6927, + 0.6839, + 0.6831, + 0.6728, + 0.6945, + 0.6934, + 0.7016, + 0.6898, + 0.6859, + 0.6837, + 0.6842, + 0.6775, + 0.687, + 0.6887, + 0.6933, + 0.6962, + 0.692, + 0.6919, + 0.6894, + 0.6975, + 0.6978, + 0.6962, + 0.6928, + 0.6957, + 0.6958, + 0.6997, + 0.6891, + 0.6983, + 0.7021, + 0.6988, + 0.7051, + 0.6999, + 0.7047, + 0.7081, + 0.7054, + 0.7081, + 0.7125, + 0.7133, + 0.7084, + 0.7098, + 0.7114, + 0.7082, + 0.7122, + 0.7119, + 0.7132, + 0.7132, + 0.7142, + 0.7158, + 0.7147, + 0.7147, + 0.7152 + ], + "test_acc": [ + 0.3905, + 0.579, + 0.641, + 0.641, + 0.628, + 0.6535, + 0.659, + 0.6255, + 0.6425, + 0.6445, + 0.6375, + 0.6555, + 0.654, + 0.619, + 0.6675, + 0.6245, + 0.6405, + 0.6555, + 0.673, + 0.6335, + 0.6435, + 0.633, + 0.641, + 0.619, + 0.6355, + 0.658, + 0.6185, + 0.644, + 0.6485, + 0.6035, + 0.589, + 0.614, + 0.6475, + 0.6145, + 0.6325, + 0.6305, + 0.6445, + 0.623, + 0.62, + 0.609, + 0.644, + 0.6335, + 0.616, + 0.6435, + 0.626, + 0.617, + 0.6195, + 0.6375, + 0.6395, + 0.658, + 0.6355, + 0.657, + 0.6365, + 0.6435, + 0.63, + 0.651, + 0.6595, + 0.643, + 0.6525, + 0.647, + 0.6515, + 0.66, + 0.654, + 0.6595, + 0.66, + 0.6645, + 0.6615, + 0.668, + 0.664, + 0.6545, + 0.6665, + 0.6665, + 0.6655, + 0.6625, + 0.666, + 0.665, + 0.6685, + 0.6695, + 0.6705, + 0.6705 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.04563574492931366, + 0.07466404139995575, + 0.07062304764986038, + 0.07941032946109772, + 0.08478259295225143, + 0.1176375150680542, + 0.051365386694669724, + 0.07094398140907288, + 0.06898803263902664, + 0.07310269773006439, + 0.0635182335972786, + 0.11305823177099228 + ], + "perturbation_rho": [ + 0.026268895715475082, + 0.03733495995402336, + 0.07775422930717468, + 0.12396883964538574, + 0.05687103420495987, + 0.13703036308288574, + -0.0030320845544338226, + 0.08171480149030685, + 0.06336408108472824, + 0.09909991919994354, + 0.06059148907661438, + 0.12057653069496155 + ], + "nudging": { + "0.001": [ + -0.0016007821541279554, + -0.0005322497454471886, + -0.00031997537007555366, + -0.00037323293508961797, + -0.000361767306458205, + -0.0004932747106067836, + -0.00017937232041731477, + -0.0002972582005895674, + -0.0003065706114284694, + -0.0003170697018504143, + -0.000248884956818074, + -0.00045291916467249393 + ], + "0.003": [ + -0.004783018957823515, + -0.0015951856039464474, + -0.0009565058862790465, + -0.0011192618403583765, + -0.0010866662487387657, + -0.0014763758517801762, + -0.0005387155106291175, + -0.0008894718484953046, + -0.0009208020055666566, + -0.000954244751483202, + -0.0007453658035956323, + -0.0013566396664828062 + ], + "0.01": [ + -0.015672076493501663, + -0.0053095086477696896, + -0.0031822575256228447, + -0.003722358262166381, + -0.0036155935376882553, + -0.004913205746561289, + -0.0017889357404783368, + -0.002959918463602662, + -0.003063073381781578, + -0.003171245101839304, + -0.0024787387810647488, + -0.004513401538133621 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7777370233535768, + 1.039262655735016, + 0.8970872451782227, + 0.9651401982307434, + 0.963715316581726, + 0.9871692520141602, + 1.0162057588577271, + 1.0440610739707947, + 1.0629752737998963, + 1.0943596759796144, + 1.1322574831008911, + 1.1550358348846435, + 1.1498169647216796, + 1.0954011442184448, + 1.1236124910354615, + 1.1751378925323486, + 1.1859121335983276, + 1.1846929653167724, + 1.2153968069076537, + 1.1254301585197448, + 1.1320601383209228, + 1.1558818790435792, + 1.133813604736328, + 1.1268145646095276, + 1.1400998264312745, + 1.0998258207321168, + 1.0921298738479615, + 1.0851680498123168, + 1.0914192169189454, + 1.0816248546600342, + 1.0882935146331787, + 1.0556492755889892, + 1.0454220704078674, + 1.0455451524734498, + 1.0445414920806886, + 1.0483357555389405, + 1.057666886138916, + 1.0440490622520446, + 1.0286948212623597, + 1.036337445449829, + 1.054752719116211, + 1.03532038230896, + 1.0384975449562073, + 1.0404673326492309, + 1.041804114151001, + 1.0244333234786986, + 1.0268776634216308, + 1.031060266494751, + 1.0237797790527343, + 1.0266751319885254, + 1.0234112846374512, + 1.0229099086761475, + 1.0279601011276245, + 1.0144617162704468, + 1.0212466983795165, + 1.0155485634803771, + 1.0136163455963134, + 1.0249474774360656, + 1.0065589557647705, + 1.006953769683838, + 1.0076389682769775, + 1.0087233503341675, + 1.000064527130127, + 1.0004527723312377, + 1.0012750885009765, + 1.0030569223403931, + 0.9993479643821717, + 0.9943592184066773, + 0.9925341587066651, + 0.9925664705276489, + 0.9892626775741578, + 0.9883018711090088, + 0.9872277095794678, + 0.9865430347442627, + 0.9849344594955445, + 0.9844682892799378, + 0.9840617263793945, + 0.9834357357025146, + 0.9830780168533325, + 0.9829166003227234 + ], + "train_acc": [ + 0.3546, + 0.6171, + 0.6761, + 0.6705, + 0.6713, + 0.6597, + 0.6514, + 0.635, + 0.6289, + 0.6197, + 0.6115, + 0.5982, + 0.5987, + 0.6114, + 0.5955, + 0.5854, + 0.5868, + 0.5799, + 0.5763, + 0.5979, + 0.5943, + 0.5958, + 0.6015, + 0.6004, + 0.6039, + 0.611, + 0.6139, + 0.6125, + 0.609, + 0.6141, + 0.6158, + 0.6242, + 0.6266, + 0.6278, + 0.6316, + 0.6286, + 0.6254, + 0.6351, + 0.6368, + 0.6323, + 0.6252, + 0.6313, + 0.6321, + 0.628, + 0.6275, + 0.6354, + 0.6371, + 0.6314, + 0.6355, + 0.637, + 0.6368, + 0.6366, + 0.6366, + 0.6398, + 0.6375, + 0.6408, + 0.6381, + 0.6356, + 0.6412, + 0.6429, + 0.6404, + 0.6428, + 0.6433, + 0.6423, + 0.6424, + 0.6418, + 0.644, + 0.6422, + 0.6459, + 0.6459, + 0.6462, + 0.6452, + 0.6476, + 0.6465, + 0.6483, + 0.6461, + 0.6473, + 0.6477, + 0.648, + 0.6484 + ], + "test_acc": [ + 0.5575, + 0.608, + 0.6735, + 0.626, + 0.6365, + 0.6265, + 0.6, + 0.601, + 0.5965, + 0.5965, + 0.581, + 0.5795, + 0.5845, + 0.5935, + 0.5525, + 0.5735, + 0.563, + 0.5485, + 0.5615, + 0.569, + 0.572, + 0.5765, + 0.5625, + 0.569, + 0.581, + 0.572, + 0.574, + 0.574, + 0.594, + 0.5745, + 0.591, + 0.6005, + 0.6115, + 0.6095, + 0.595, + 0.582, + 0.598, + 0.5855, + 0.598, + 0.5945, + 0.596, + 0.601, + 0.5955, + 0.5815, + 0.5915, + 0.597, + 0.588, + 0.5995, + 0.5845, + 0.5995, + 0.5955, + 0.589, + 0.5965, + 0.618, + 0.6, + 0.6025, + 0.609, + 0.6025, + 0.605, + 0.6045, + 0.601, + 0.6105, + 0.611, + 0.6055, + 0.6025, + 0.6035, + 0.597, + 0.598, + 0.605, + 0.598, + 0.6025, + 0.6035, + 0.603, + 0.601, + 0.6025, + 0.6045, + 0.6035, + 0.6025, + 0.6025, + 0.6015 + ], + "state_pred_error": [ + 0.6630272414207459, + 0.2079629589319229, + 0.16196079077720643, + 0.1663352201938629, + 0.1627671336174011, + 0.1762225886821747, + 0.1813463003873825, + 0.17045307669639587, + 0.16121247019767762, + 0.15743737254142762, + 0.16037912952899933, + 0.14473771260976792, + 0.1326150424480438, + 0.12846465719938277, + 0.11744894111156463, + 0.11671908056735993, + 0.11889441428184509, + 0.12293256052732468, + 0.11396846870183945, + 0.10545692546367645, + 0.10248748415708542, + 0.08661013205051422, + 0.07915450052022933, + 0.09114358839988708, + 0.08691594620943069, + 0.08266509202718735, + 0.08061882747411728, + 0.07838099582195282, + 0.07678124432563782, + 0.075958416223526, + 0.07330761730670929, + 0.07064944109916688, + 0.06765280425548553, + 0.06359503600597381, + 0.06085543820858002, + 0.059145973962545395, + 0.057147851037979126, + 0.05545796197652817, + 0.05472242616415024, + 0.05328660033941269, + 0.052086339628696444, + 0.0522535075366497, + 0.052079638755321504, + 0.05211708617210388, + 0.0511810753941536, + 0.04935787490606308, + 0.046508885717391965, + 0.044714570379257204, + 0.043279960918426515, + 0.042027167618274686, + 0.04071626418828964, + 0.03979887268543243, + 0.03903335108757019, + 0.03792436560988426, + 0.03741062755584717, + 0.03643448035120964, + 0.03576543673872948, + 0.0351304425060749, + 0.03429401182532311, + 0.03371152082681656, + 0.03313189471960068, + 0.03265186365842819, + 0.032182833680510524, + 0.0312529805958271, + 0.030570048174262048, + 0.029929270273447037, + 0.029457912415266036, + 0.028828839021921158, + 0.028277097725868224, + 0.028308763039112093, + 0.02776089369058609, + 0.026589947140216827, + 0.026290152072906494, + 0.025718347430229188, + 0.025397347101569177, + 0.02519998631477356, + 0.02490392438173294, + 0.024270719787478447, + 0.024019235450029375, + 0.02374415186047554 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.5561584234237671, + 0.39794063568115234, + 0.20452159643173218, + 0.14641982316970825, + 0.11315252631902695, + 0.12314423173666, + 0.11100500077009201, + 0.11256138980388641, + 0.12550771236419678, + 0.11898934841156006, + 0.11000233888626099, + 0.10332056879997253 + ], + "perturbation_rho": [ + 0.4663659632205963, + 0.38622361421585083, + 0.20298895239830017, + 0.1521472930908203, + 0.10572830587625504, + 0.14532539248466492, + 0.1235864907503128, + 0.12295880913734436, + 0.1263602077960968, + 0.1123446375131607, + 0.14707674086093903, + 0.1404699832201004 + ], + "nudging": { + "0.001": [ + -0.01762799359858036, + -0.0021035720128566027, + -0.00075343600474298, + -0.0005018080701120198, + -0.00037483975756913424, + -0.00040054353303276, + -0.00037695514038205147, + -0.0003710503806360066, + -0.00040657291538082063, + -0.0003865875187329948, + -0.00035775359719991684, + -0.00033668274409137666 + ], + "0.003": [ + -0.05237508937716484, + -0.006302305497229099, + -0.0022594095207750797, + -0.0015049520879983902, + -0.001124655595049262, + -0.0012015008833259344, + -0.00113069883082062, + -0.0011128759942948818, + -0.0012195921735838056, + -0.001159440609626472, + -0.0010727422777563334, + -0.0010099414503201842 + ], + "0.01": [ + -0.16852372884750366, + -0.020911922678351402, + -0.007518916856497526, + -0.005010381806641817, + -0.0037449360825121403, + -0.004001074004918337, + -0.0037657374050468206, + -0.0037060989998281, + -0.00406123511493206, + -0.003861584234982729, + -0.0035726726055145264, + -0.0033634149003773928 + ] + }, + "state_pred_error_per_layer": [ + 16351.89453125, + 3139.08837890625, + 1824.6005859375, + 1391.949462890625, + 1295.1900634765625, + 1149.4605712890625, + 981.4422607421875, + 921.3729248046875, + 954.6389770507812, + 1032.970703125, + 1065.58984375, + 1272.3818359375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.207360833930969, + 1.3511120353698731, + 0.9661354298591613, + 0.8680098114967346, + 0.8263119333267211, + 0.7979276044845581, + 0.7925828973770142, + 0.7783180428504943, + 0.7965024029731751, + 0.7947660594463348, + 0.7717324380874634, + 0.8037697998046875, + 0.8354542464256287, + 0.8516409687042237, + 0.883002855014801, + 0.8535399710655213, + 0.9378591158866882, + 0.9240535995960235, + 0.920214697265625, + 1.0051448905944824, + 0.896866081237793, + 0.964885433959961, + 1.036075691986084, + 1.0164314723968506, + 1.1041621470451355, + 1.0689070242881775, + 1.1327576055526734, + 1.3177466125488282, + 1.3560321712493897, + 1.2767763432502746, + 1.1126590032577515, + 1.0944596376419067, + 1.1537445356369018, + 1.1305477544784546, + 1.162183289718628, + 1.110354697036743, + 1.138338935279846, + 1.0938628067016603, + 1.0949970287322999, + 1.1010143295288086, + 1.1742381256103516, + 1.1792693685531617, + 1.1362173608779906, + 1.1625488094329834, + 1.1804513359069824, + 1.1834693833351135, + 1.1848550859451294, + 1.1936074775695802, + 1.1980674312591553, + 1.2182542015075684, + 1.2160317821502686, + 1.2099562562942505, + 1.2189889129638671, + 1.2211134176254272, + 1.1966558967590333, + 1.2248574840545654, + 1.204994546699524, + 1.2041459096908569, + 1.2023766017913817, + 1.210695701599121, + 1.2113554904937744, + 1.205434011077881, + 1.2068788354873656, + 1.2005671588897706, + 1.203082329940796, + 1.1969014379501344, + 1.2014315116882324, + 1.188254769706726, + 1.1834532361984254, + 1.1865405479431153, + 1.1853660331726075, + 1.180847424697876, + 1.1774358226776123, + 1.173608071899414, + 1.1725929969787598, + 1.171435493850708, + 1.1699126182556152, + 1.1699759094238282, + 1.168540977859497, + 1.1682494367599487 + ], + "train_acc": [ + 0.1977, + 0.5172, + 0.64, + 0.6814, + 0.6953, + 0.7097, + 0.7096, + 0.7174, + 0.7107, + 0.7156, + 0.7238, + 0.7169, + 0.7142, + 0.7094, + 0.7077, + 0.7179, + 0.6979, + 0.7028, + 0.7047, + 0.6864, + 0.7106, + 0.6876, + 0.6734, + 0.6686, + 0.6469, + 0.6496, + 0.6328, + 0.6153, + 0.6178, + 0.6298, + 0.6242, + 0.6312, + 0.6123, + 0.6315, + 0.618, + 0.6186, + 0.6135, + 0.6144, + 0.6056, + 0.6093, + 0.5855, + 0.5801, + 0.5917, + 0.5761, + 0.5702, + 0.5688, + 0.5723, + 0.5661, + 0.5684, + 0.5549, + 0.5581, + 0.5567, + 0.5572, + 0.5518, + 0.5626, + 0.5541, + 0.5579, + 0.5572, + 0.5623, + 0.5514, + 0.5565, + 0.5607, + 0.5585, + 0.559, + 0.5538, + 0.564, + 0.5567, + 0.5616, + 0.5637, + 0.5666, + 0.5637, + 0.5619, + 0.5675, + 0.5666, + 0.5669, + 0.5694, + 0.5697, + 0.5686, + 0.5695, + 0.5689 + ], + "test_acc": [ + 0.3955, + 0.5785, + 0.6265, + 0.652, + 0.6485, + 0.621, + 0.6335, + 0.6655, + 0.67, + 0.689, + 0.6655, + 0.626, + 0.638, + 0.644, + 0.6145, + 0.6285, + 0.667, + 0.645, + 0.644, + 0.6665, + 0.662, + 0.643, + 0.627, + 0.615, + 0.6205, + 0.5915, + 0.528, + 0.5505, + 0.575, + 0.5655, + 0.552, + 0.57, + 0.5755, + 0.581, + 0.582, + 0.5765, + 0.553, + 0.5395, + 0.5435, + 0.558, + 0.535, + 0.5635, + 0.5525, + 0.5505, + 0.526, + 0.544, + 0.5335, + 0.5235, + 0.5315, + 0.5345, + 0.5095, + 0.5005, + 0.4775, + 0.5465, + 0.526, + 0.533, + 0.5515, + 0.5615, + 0.5635, + 0.5495, + 0.5475, + 0.5435, + 0.5485, + 0.5485, + 0.5555, + 0.5515, + 0.566, + 0.5585, + 0.554, + 0.551, + 0.5565, + 0.5555, + 0.549, + 0.554, + 0.5525, + 0.5605, + 0.5575, + 0.558, + 0.5575, + 0.5585 + ], + "value_loss": [ + 2.8914731563568115, + 1.0116421065330505, + 0.9792686163425446, + 0.9698389565467834, + 0.9745230066776276, + 0.9593441887855529, + 0.9914514320373535, + 0.9008937696456909, + 0.9442315740585328, + 0.9354399297237396, + 0.9357834646224975, + 1.0310763645172119, + 1.1280350433349609, + 1.1904344772338866, + 1.3550069772720337, + 1.3053666845321654, + 1.4593678120613098, + 1.4700158073425293, + 1.3546633718490602, + 1.6431034988403321, + 1.3852640265464782, + 1.322731337928772, + 1.518436873435974, + 1.1696343566894531, + 1.454881266784668, + 1.370015459060669, + 1.363555002975464, + 1.872614532470703, + 2.4025319738388062, + 3.2879290182590486, + 1.1695105950355529, + 1.0109361934661865, + 1.1540400910377502, + 1.209294234085083, + 1.211466327047348, + 0.8347042934417724, + 0.8668873561859131, + 0.8094220149993896, + 0.741839238357544, + 0.6732744760513306, + 0.7854546588897705, + 0.6755673208236694, + 0.5728948916435241, + 0.6133837251663208, + 0.6896575976371765, + 0.6329740990638733, + 0.5643162271499634, + 0.5344781528472901, + 0.6565200087070465, + 0.5923100409507751, + 0.5163188346862793, + 0.5435176980018616, + 0.532232845401764, + 0.5047218198776245, + 0.47310378370285033, + 0.45587757511138916, + 0.4523937116146088, + 0.4488687247276306, + 0.445998570728302, + 0.4277126375198364, + 0.43870710592269896, + 0.406502858543396, + 0.5107559196472168, + 0.42902055196762084, + 0.3890920462608337, + 0.38705502166748046, + 0.4119320761680603, + 0.38806987524032593, + 0.3780417576313019, + 0.3852014954566956, + 0.3755380168914795, + 0.3765079488277435, + 0.3590162860870361, + 0.36511458950042724, + 0.3516147146701813, + 0.3548973054409027, + 0.3555239068031311, + 0.3550170949459076, + 0.3455959125518799, + 0.3557061047077179 + ], + "term_loss": [ + 1.6602315026283263, + 0.6487982746124268, + 0.7606359968185424, + 0.7683342950582505, + 0.7632556185245514, + 0.7351340337753296, + 0.7646495252609253, + 0.6887249355316162, + 0.7335731735229493, + 0.7274465770244598, + 0.7336520937919617, + 0.8231202568054199, + 0.9113656562805176, + 0.9691344513893128, + 1.131781807899475, + 1.0871996644496917, + 1.2227107072830201, + 1.2319942425727843, + 1.1140453166007995, + 1.3427057041168213, + 1.0584808224439621, + 0.9781823832035065, + 1.124849826812744, + 0.8163653163909912, + 1.0391017780303955, + 0.9161141554832458, + 0.9728089346885681, + 1.4108687118530274, + 1.913311016893387, + 2.474852797269821, + 0.7707266288757324, + 0.6442933590888977, + 0.7695344947814942, + 0.8129353022575379, + 0.7860277270078659, + 0.4854595648765564, + 0.5304397300720215, + 0.48523606872558595, + 0.4136289978981018, + 0.3496486745357513, + 0.43072265305519103, + 0.3545576292037964, + 0.2707749304056168, + 0.30003291432857515, + 0.3649471400976181, + 0.3097132356643677, + 0.24948634128570557, + 0.21672172679901122, + 0.31764200187921526, + 0.2645720922470093, + 0.1943810030221939, + 0.21808994147777558, + 0.20612887120246887, + 0.1831600733757019, + 0.1579606840133667, + 0.13959807016849518, + 0.13821850581765174, + 0.1346768367767334, + 0.13379685539007186, + 0.11722139341831207, + 0.12373274766206742, + 0.1021266034603119, + 0.18962102710008621, + 0.12173434302210807, + 0.0886700010061264, + 0.08855389852523804, + 0.10985714473724366, + 0.09126245896220207, + 0.08464143277704715, + 0.08802928638458252, + 0.08116196565628052, + 0.08235352320671081, + 0.06943840010166168, + 0.07480848977863788, + 0.06362296106815338, + 0.06547020068168641, + 0.0663039342880249, + 0.06582048626542092, + 0.0589083580493927, + 0.06590610226392746 + ], + "bridge_loss": [ + 0.9331698284233862, + 0.11649462137520314, + 0.015715979816019535, + 0.00671334265768528, + 0.018271303272247314, + 0.03326347976624966, + 0.03348449106514454, + 0.020532348553836347, + 0.013244135062396526, + 0.009722792905569077, + 0.008876127330958843, + 0.009582126937806607, + 0.011055101352930068, + 0.011870610010623932, + 0.013375742612779141, + 0.0155577556848526, + 0.019751004827022554, + 0.017863361442089082, + 0.027747771644592287, + 0.07066093260645867, + 0.11650513218641281, + 0.12101610896587371, + 0.15459786736965178, + 0.11606869056224824, + 0.15967000955343247, + 0.19558869359493256, + 0.11933131771087646, + 0.16814801473617555, + 0.19006015786528588, + 0.5340570589244366, + 0.13764213082790375, + 0.10621524007320404, + 0.11688521416187286, + 0.13697189807891846, + 0.16142817224264144, + 0.08553076691031455, + 0.06714614820480347, + 0.058368180775642396, + 0.06367164892554283, + 0.058401806330680844, + 0.07510955965518952, + 0.04296272074580192, + 0.030555253785848616, + 0.03590657195448876, + 0.0444308792591095, + 0.040885373382270336, + 0.031827708619832994, + 0.031135463285446165, + 0.05048181757330895, + 0.03556546043753624, + 0.029527773827314377, + 0.033380622804164886, + 0.032867836010456085, + 0.029423796927928923, + 0.026511628997325898, + 0.02286296658962965, + 0.02306612728089094, + 0.02427403473854065, + 0.022651293496787548, + 0.02018927168995142, + 0.023878360521793367, + 0.015088292667269706, + 0.031936795590817926, + 0.018752254104614258, + 0.010989018613100051, + 0.011456697177141905, + 0.014083520233631134, + 0.010883450951427221, + 0.00928245914876461, + 0.01226512822508812, + 0.009397232201695442, + 0.009936634358018637, + 0.006541926475614309, + 0.008306315709650517, + 0.006603296869248152, + 0.008167878417670726, + 0.008434691524505615, + 0.00860220458805561, + 0.006883558386564255, + 0.010093027733266353 + ], + "tgrad_loss": [ + 0.2980718096733093, + 0.24634920997619628, + 0.2029166358470917, + 0.19479132684469222, + 0.1929960819721222, + 0.19094667139053345, + 0.19331741120815277, + 0.1916364851951599, + 0.19741427063941955, + 0.19827055424451828, + 0.19325523676872253, + 0.19837397718429564, + 0.20561428740024568, + 0.20942940578460692, + 0.20984943301677703, + 0.20260925273895264, + 0.21690608932971955, + 0.22015822021961212, + 0.2128702841281891, + 0.22973685836791993, + 0.21027806951999664, + 0.22353285098075867, + 0.23898917541503906, + 0.23720036025047303, + 0.25610947241783144, + 0.25831260244846344, + 0.2714147402048111, + 0.29359780797958374, + 0.29916080503463743, + 0.2790191856145859, + 0.2611418417930603, + 0.2604275827884674, + 0.26762038497924806, + 0.25938703508377076, + 0.2640104354381561, + 0.2637139617919922, + 0.2693014838695526, + 0.2658177710533142, + 0.2645385955810547, + 0.26522399611473085, + 0.27962244243621825, + 0.27804697461128236, + 0.27156470761299134, + 0.27744423763751985, + 0.2802795831680298, + 0.28237549018859864, + 0.28300217514038084, + 0.2866209662437439, + 0.28839618926048277, + 0.29217248883247376, + 0.2924100575447083, + 0.2920471329689026, + 0.29323613867759707, + 0.2921379543304443, + 0.2886314691543579, + 0.2934165405750275, + 0.2911090755939484, + 0.28991785345077514, + 0.28955041818618776, + 0.290301975774765, + 0.29109600009918213, + 0.2892879591941834, + 0.2891980986595154, + 0.2885339534759521, + 0.28943302466869353, + 0.2870444281578064, + 0.2879914128303528, + 0.28592396450042723, + 0.2841178658246994, + 0.284907079744339, + 0.28497882013320924, + 0.28421779255867, + 0.2830359622001648, + 0.2819997839927673, + 0.2813884559631348, + 0.2812592257499695, + 0.2807852788448334, + 0.2805944046497345, + 0.2798039969444275, + 0.2797069767475128 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.05994441360235214, + 0.19127817451953888, + 0.25874069333076477, + 0.31905949115753174, + 0.31442493200302124, + 0.3214789927005768, + 0.368133008480072, + 0.38988351821899414, + 0.4050426781177521, + 0.416469931602478, + 0.4253390431404114, + 0.4322451949119568 + ], + "perturbation_rho": [ + 0.1191493421792984, + 0.31643322110176086, + 0.4170604646205902, + 0.42330044507980347, + 0.4319503903388977, + 0.42732322216033936, + 0.46659332513809204, + 0.487338662147522, + 0.496512234210968, + 0.4787842035293579, + 0.5010949969291687, + 0.5059125423431396 + ], + "nudging": { + "0.001": [ + -0.0016103468369692564, + -0.0018254828173667192, + -0.0021413436625152826, + -0.0023662694729864597, + -0.0023437764029949903, + -0.0023424234241247177, + -0.002533233491703868, + -0.002567564370110631, + -0.00262308563105762, + -0.002670108340680599, + -0.0027196200098842382, + -0.002735825488343835 + ], + "0.003": [ + -0.004815170541405678, + -0.005469394847750664, + -0.0064151170663535595, + -0.007090517785400152, + -0.007022828795015812, + -0.007019806653261185, + -0.007589289918541908, + -0.007691953331232071, + -0.007857399061322212, + -0.007999258115887642, + -0.008147023618221283, + -0.008196018636226654 + ], + "0.01": [ + -0.015865826979279518, + -0.018151750788092613, + -0.021288521587848663, + -0.02352731302380562, + -0.023306310176849365, + -0.02329857647418976, + -0.025182321667671204, + -0.025520823895931244, + -0.026067661121487617, + -0.026535863056778908, + -0.027021951973438263, + -0.02718108892440796 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L2_s123.json b/results/synth_ladder_v2_hi/synth_a1.0_L2_s123.json new file mode 100644 index 0000000..17c5ae1 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L2_s123.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.91867273311615, + 1.1479057174682616, + 0.7667448886871338, + 0.6092986298084259, + 0.5399450777053832, + 0.4998543502807617, + 0.4701059171676636, + 0.44774744348526, + 0.433194176864624, + 0.4138288654327393, + 0.38988096828460694, + 0.37067162165641787, + 0.35758755187988284, + 0.3432540241241455, + 0.32265024185180663, + 0.31479289903640745, + 0.2948722456932068, + 0.2916181824684143, + 0.26947770991325376, + 0.26305155229568483, + 0.2504066630601883, + 0.23246315641403198, + 0.22475692710876466, + 0.21131145256757736, + 0.19484182257652283, + 0.1904493874311447, + 0.17960406827926637, + 0.1701004672050476, + 0.15617957714796066, + 0.1445945238351822, + 0.1391076461791992, + 0.13091985216140747, + 0.12840345685482024, + 0.1167986627459526, + 0.1053664587020874, + 0.1000328464448452, + 0.09326313433647156, + 0.09093141227960587, + 0.08538822884559631, + 0.08038766567707062, + 0.07611644887924195, + 0.07148764984607696, + 0.06654568490982056, + 0.062096750885248186, + 0.058967465686798094, + 0.05627817189693451, + 0.05370346330404282, + 0.05124748470783234, + 0.04963369052410126, + 0.048742957431077955, + 0.045943583583831785, + 0.04393785551190376, + 0.04209109454154968, + 0.040698669242858886, + 0.039860168999433516, + 0.03850054189264775, + 0.03725776370763779, + 0.03654853151440621, + 0.03559232919216156, + 0.03459027769565582, + 0.033881497570872304, + 0.03315351962447166, + 0.03260607058405876, + 0.032083336877822874, + 0.03177986741065979, + 0.03131906301379204, + 0.03093072702884674, + 0.030623940539360045, + 0.030301975291967393, + 0.03005140163898468, + 0.029858090263605117, + 0.0296798649340868, + 0.02952518635392189, + 0.02939634127020836, + 0.02930180861055851, + 0.029228065556287767, + 0.029173334753513337, + 0.02913727904856205, + 0.029115084266662598, + 0.029103587424755096 + ], + "train_acc": [ + 0.3489, + 0.6623, + 0.7738, + 0.8007, + 0.809, + 0.8183, + 0.8298, + 0.832, + 0.8382, + 0.847, + 0.8588, + 0.8646, + 0.8689, + 0.8788, + 0.8876, + 0.8885, + 0.8985, + 0.8966, + 0.9061, + 0.9087, + 0.9133, + 0.9254, + 0.9282, + 0.9339, + 0.9436, + 0.9446, + 0.948, + 0.9528, + 0.9619, + 0.9665, + 0.9683, + 0.9737, + 0.9716, + 0.9784, + 0.9853, + 0.9846, + 0.9887, + 0.9888, + 0.9903, + 0.9923, + 0.9938, + 0.9947, + 0.9964, + 0.9974, + 0.9979, + 0.9985, + 0.9989, + 0.9991, + 0.9989, + 0.9988, + 0.9993, + 0.9998, + 0.9994, + 0.9997, + 0.9997, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 0.9999, + 1.0, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.5505, + 0.719, + 0.762, + 0.7795, + 0.7805, + 0.7905, + 0.7925, + 0.79, + 0.7925, + 0.8, + 0.801, + 0.805, + 0.802, + 0.799, + 0.805, + 0.8105, + 0.8055, + 0.8095, + 0.811, + 0.8165, + 0.8135, + 0.8105, + 0.808, + 0.8095, + 0.8175, + 0.808, + 0.813, + 0.8105, + 0.816, + 0.8165, + 0.812, + 0.806, + 0.8045, + 0.808, + 0.8115, + 0.81, + 0.8085, + 0.8065, + 0.808, + 0.8095, + 0.807, + 0.809, + 0.8085, + 0.8115, + 0.8115, + 0.809, + 0.811, + 0.811, + 0.8095, + 0.8095, + 0.81, + 0.811, + 0.808, + 0.8095, + 0.81, + 0.81, + 0.8105, + 0.8105, + 0.813, + 0.812, + 0.811, + 0.809, + 0.8105, + 0.8095, + 0.809, + 0.811, + 0.81, + 0.811, + 0.809, + 0.8095, + 0.8095, + 0.809, + 0.81, + 0.809, + 0.809, + 0.809, + 0.809, + 0.809, + 0.809, + 0.809 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9615377187728882, + 0.9503427743911743 + ], + "perturbation_rho": [ + 0.9999992847442627, + 0.9999980926513672 + ], + "nudging": { + "0.001": [ + -0.039457522332668304, + -0.024251405149698257 + ], + "0.003": [ + -0.112161785364151, + -0.07042354345321655 + ], + "0.01": [ + -0.3078651428222656, + -0.20883342623710632 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2375081497192384, + 1.7361759670257568, + 1.2429127569198608, + 0.9395764049530029, + 0.7808661069869995, + 0.6961161418914795, + 0.6507503452301026, + 0.6232247513771058, + 0.6140826705932617, + 0.6100598525047303, + 0.6097840148925782, + 0.6079091403961182, + 0.6147353491783142, + 0.625060820388794, + 0.6120452221870423, + 0.6118313233852386, + 0.6170345478057861, + 0.6308931268692016, + 0.6096509483337402, + 0.6289821960449219, + 0.6240285701751709, + 0.6105122757911682, + 0.6274244334220886, + 0.624420170545578, + 0.6367384799957275, + 0.6205670486450195, + 0.6451194002628327, + 0.6397207110404969, + 0.6331547710895539, + 0.6178243230819702, + 0.6200193851470948, + 0.6195074583053589, + 0.6206575379371643, + 0.634155012702942, + 0.615179602432251, + 0.6146862535953522, + 0.6101961803436279, + 0.6337929145812988, + 0.6142671315193177, + 0.6192339191436768, + 0.6337637168884277, + 0.6212720799446106, + 0.6151982610702514, + 0.6175067305564881, + 0.6094939004898071, + 0.6124663307189941, + 0.6089740102767944, + 0.6123239847183227, + 0.6024780527114868, + 0.6105386233329773, + 0.6048168488502502, + 0.6060228562355041, + 0.6015618727684021, + 0.6025503917694092, + 0.606540693283081, + 0.6046217224121094, + 0.6020105275154114, + 0.5989886571884155, + 0.5957996716499329, + 0.5930134090423584, + 0.5924007635116577, + 0.5917772497177124, + 0.5893407508850098, + 0.5879429389953613, + 0.5886952852249145, + 0.5894091831207275, + 0.5875062602043152, + 0.5855383790969849, + 0.588559229850769, + 0.5866112979888916, + 0.5849664820671081, + 0.5839488779067993, + 0.5831396820545196, + 0.5823268011569976, + 0.5813585290908814, + 0.5809845569610596, + 0.5809995307922363, + 0.5807093320846558, + 0.580496221113205, + 0.5803627859115601 + ], + "train_acc": [ + 0.1817, + 0.4247, + 0.5944, + 0.6799, + 0.7242, + 0.743, + 0.7568, + 0.7621, + 0.7633, + 0.7658, + 0.765, + 0.7691, + 0.7663, + 0.7644, + 0.7655, + 0.7648, + 0.765, + 0.76, + 0.7687, + 0.7625, + 0.7632, + 0.7672, + 0.76, + 0.7618, + 0.7565, + 0.7633, + 0.7548, + 0.7574, + 0.7599, + 0.7656, + 0.7647, + 0.7638, + 0.7623, + 0.7576, + 0.7634, + 0.7656, + 0.7698, + 0.7589, + 0.7686, + 0.7666, + 0.7616, + 0.7627, + 0.7646, + 0.7651, + 0.7654, + 0.7664, + 0.7662, + 0.7668, + 0.7677, + 0.7666, + 0.7709, + 0.7704, + 0.771, + 0.7701, + 0.7652, + 0.7687, + 0.7699, + 0.7706, + 0.7726, + 0.7751, + 0.7733, + 0.772, + 0.7766, + 0.7765, + 0.7755, + 0.7768, + 0.7744, + 0.7762, + 0.7779, + 0.7769, + 0.7777, + 0.7789, + 0.7769, + 0.7779, + 0.7789, + 0.7794, + 0.7796, + 0.7797, + 0.7797, + 0.7794 + ], + "test_acc": [ + 0.3, + 0.5165, + 0.615, + 0.6725, + 0.703, + 0.7205, + 0.7365, + 0.736, + 0.747, + 0.73, + 0.7455, + 0.7245, + 0.733, + 0.745, + 0.7425, + 0.7435, + 0.7225, + 0.734, + 0.738, + 0.7425, + 0.737, + 0.737, + 0.733, + 0.745, + 0.7465, + 0.7335, + 0.7105, + 0.7395, + 0.7435, + 0.743, + 0.7315, + 0.739, + 0.719, + 0.75, + 0.738, + 0.737, + 0.719, + 0.7325, + 0.734, + 0.7345, + 0.737, + 0.7355, + 0.7375, + 0.739, + 0.7385, + 0.7325, + 0.7485, + 0.7315, + 0.7385, + 0.7455, + 0.7365, + 0.7405, + 0.739, + 0.742, + 0.739, + 0.736, + 0.7445, + 0.743, + 0.7455, + 0.7405, + 0.745, + 0.7405, + 0.7495, + 0.745, + 0.74, + 0.741, + 0.7475, + 0.738, + 0.7465, + 0.7445, + 0.7395, + 0.746, + 0.745, + 0.745, + 0.7445, + 0.743, + 0.7425, + 0.7445, + 0.745, + 0.7455 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.057878345251083374, + 0.044283460825681686 + ], + "perturbation_rho": [ + 0.047237616032361984, + 0.057848647236824036 + ], + "nudging": { + "0.001": [ + -0.001372040482237935, + -0.00028313416987657547 + ], + "0.003": [ + -0.004096671007573605, + -0.0008487798040732741 + ], + "0.01": [ + -0.013432648032903671, + -0.0028225481510162354 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.112877722930908, + 1.3453919006347657, + 0.8530845092773438, + 0.6524277864456177, + 0.5891991994857788, + 0.5847635634422302, + 0.592608453655243, + 0.6057582305908203, + 0.6155280767440796, + 0.6204281776428223, + 0.6222802136421204, + 0.6336911476135254, + 0.6332369559764862, + 0.6409030424118042, + 0.6451990050315857, + 0.6432888597488403, + 0.6504793170452118, + 0.6488698028564454, + 0.6648889320373536, + 0.6648780859947204, + 0.6609582979202271, + 0.6829509294509888, + 0.6857342351913452, + 0.6814190738677979, + 0.7037225786209107, + 0.6873076982498169, + 0.6848377838134766, + 0.7062060134887695, + 0.6998137535095215, + 0.7062244556427002, + 0.6963958681583404, + 0.7014524417877197, + 0.7018667848587036, + 0.7262831351280212, + 0.7100254920959472, + 0.7035775151729584, + 0.7036934041023254, + 0.7135613971710205, + 0.7221006870269775, + 0.7178686738967895, + 0.7212300780296326, + 0.714849740409851, + 0.7274992438316346, + 0.7240300461053848, + 0.714347897529602, + 0.7246765565872192, + 0.7239525049209595, + 0.7174782312393189, + 0.7213153991699218, + 0.728120307636261, + 0.7173239303588868, + 0.7183942793846131, + 0.7177051811218261, + 0.7196143941879273, + 0.7186342420101166, + 0.7172569666862488, + 0.7178284223556518, + 0.7189222101211548, + 0.7157055911064147, + 0.7150581773281097, + 0.7151817399978637, + 0.7204799012184143, + 0.7162576667785645, + 0.7143902016639709, + 0.7139085925102234, + 0.7124319374084472, + 0.713122578048706, + 0.7114446897506714, + 0.7103520916938781, + 0.7107818853378296, + 0.7102423515319825, + 0.7096256306648254, + 0.7096317663192749, + 0.7086990943908691, + 0.7084270180702209, + 0.7081380405426025, + 0.707952843284607, + 0.707770827293396, + 0.707584428024292, + 0.7075364337921143 + ], + "train_acc": [ + 0.2434, + 0.5738, + 0.712, + 0.7633, + 0.7744, + 0.7804, + 0.777, + 0.7713, + 0.7682, + 0.7693, + 0.7672, + 0.7633, + 0.7613, + 0.7616, + 0.7578, + 0.7572, + 0.753, + 0.7544, + 0.7468, + 0.7481, + 0.749, + 0.7422, + 0.741, + 0.7439, + 0.7354, + 0.7391, + 0.7405, + 0.734, + 0.7368, + 0.7353, + 0.737, + 0.7375, + 0.7347, + 0.7272, + 0.734, + 0.7322, + 0.7385, + 0.7289, + 0.7345, + 0.731, + 0.7283, + 0.7305, + 0.731, + 0.7284, + 0.7312, + 0.7256, + 0.7282, + 0.7321, + 0.7276, + 0.7278, + 0.7271, + 0.7316, + 0.7358, + 0.7299, + 0.7307, + 0.7343, + 0.7326, + 0.7313, + 0.7348, + 0.7314, + 0.7322, + 0.7278, + 0.7332, + 0.734, + 0.7326, + 0.7349, + 0.7342, + 0.7325, + 0.7354, + 0.734, + 0.7355, + 0.7345, + 0.7333, + 0.7353, + 0.7337, + 0.7358, + 0.7349, + 0.7344, + 0.7351, + 0.7349 + ], + "test_acc": [ + 0.4185, + 0.6385, + 0.722, + 0.753, + 0.7545, + 0.7595, + 0.754, + 0.7555, + 0.746, + 0.7515, + 0.7455, + 0.749, + 0.741, + 0.7415, + 0.7325, + 0.7375, + 0.7325, + 0.734, + 0.7025, + 0.7235, + 0.704, + 0.7255, + 0.715, + 0.7095, + 0.723, + 0.7215, + 0.7085, + 0.7045, + 0.696, + 0.6995, + 0.7005, + 0.6985, + 0.6945, + 0.7, + 0.694, + 0.699, + 0.7085, + 0.707, + 0.688, + 0.695, + 0.688, + 0.695, + 0.7025, + 0.704, + 0.7, + 0.6935, + 0.7025, + 0.699, + 0.701, + 0.6995, + 0.707, + 0.698, + 0.6995, + 0.703, + 0.6975, + 0.701, + 0.702, + 0.704, + 0.703, + 0.697, + 0.6985, + 0.701, + 0.7035, + 0.703, + 0.697, + 0.705, + 0.699, + 0.705, + 0.7045, + 0.703, + 0.7045, + 0.705, + 0.7035, + 0.7045, + 0.704, + 0.705, + 0.7045, + 0.704, + 0.704, + 0.704 + ], + "state_pred_error": [ + 0.8095995555877685, + 0.3882428121566772, + 0.2308805763721466, + 0.18112203476428987, + 0.1711174297809601, + 0.16875883374214173, + 0.16341322889328003, + 0.15181930413246156, + 0.14281459897756577, + 0.13198619084358215, + 0.12386900899410248, + 0.11684971523284912, + 0.1063781147480011, + 0.10181989614963531, + 0.09462909796237945, + 0.09080729238986969, + 0.09330907866954803, + 0.08593169351816177, + 0.08261528482437133, + 0.08104809004068375, + 0.07903132175207138, + 0.0811789864897728, + 0.07889583976268769, + 0.07535211365222931, + 0.07496694247722625, + 0.07436191855669022, + 0.07170565111637116, + 0.07015852246284485, + 0.06947937307357788, + 0.07390546046495437, + 0.0672236066699028, + 0.0676369900584221, + 0.06531769858598709, + 0.06412407599687577, + 0.06779091021418572, + 0.061958674085140227, + 0.06110408489704132, + 0.05947654608488083, + 0.05972578684091568, + 0.0575266836643219, + 0.056766388463974, + 0.05588359162211418, + 0.05469989988803863, + 0.05403341302871704, + 0.05278837133646011, + 0.05157833698987961, + 0.0505847239613533, + 0.04964255269765854, + 0.04889418448805809, + 0.047440138363838195, + 0.04654076889753342, + 0.04614740904569626, + 0.04542005708217621, + 0.045353537750244144, + 0.044121516728401186, + 0.04308061329722405, + 0.04115980257987976, + 0.04113629130125046, + 0.03981171528100967, + 0.039929159170389174, + 0.0388361143887043, + 0.03803186722993851, + 0.03724679838418961, + 0.03623849350214005, + 0.03561221360564232, + 0.035675781297683715, + 0.034312749603390695, + 0.03334942335486412, + 0.03278148359060287, + 0.033142901480197905, + 0.03213295520246029, + 0.031465019971132276, + 0.03125819475650787, + 0.03060810247063637, + 0.03033074073791504, + 0.029707073709368707, + 0.028831332409381866, + 0.028942875340580942, + 0.02833888658285141, + 0.02753113317489624 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6596157550811768, + 0.3606003522872925 + ], + "perturbation_rho": [ + 0.5883278250694275, + 0.3191852569580078 + ], + "nudging": { + "0.001": [ + -0.017385665327310562, + -0.002226560842245817 + ], + "0.003": [ + -0.051287051290273666, + -0.006665656343102455 + ], + "0.01": [ + -0.16100725531578064, + -0.02204928547143936 + ] + }, + "state_pred_error_per_layer": [ + 4266.72509765625, + 268.82733154296875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2380937477111815, + 1.7368752170562745, + 1.247110534477234, + 0.9422531213760376, + 0.7818900457382202, + 0.6963684833049775, + 0.6489226391792298, + 0.6235558547019958, + 0.6110991809844971, + 0.6021781756877899, + 0.6104926061630249, + 0.6089201513290405, + 0.6008785103797912, + 0.6032293972492218, + 0.6087587015151977, + 0.6239664590835571, + 0.6048972602844238, + 0.6251128030776978, + 0.6191382528305054, + 0.6513575605392457, + 0.6536323498725891, + 0.6655845951080323, + 0.697906189918518, + 0.7237542797088623, + 0.7615356777191162, + 0.7806874334335328, + 0.7626848733901977, + 0.7719258213043213, + 0.8015456851005555, + 0.7952612302780151, + 0.8358330780029297, + 0.8377494823455811, + 0.8617944671630859, + 0.893122191619873, + 0.9658586881637573, + 0.951087232875824, + 0.9932956078529358, + 0.973046259021759, + 1.0269800101280213, + 1.091286882019043, + 1.049387868309021, + 1.039117106819153, + 1.0862663068771363, + 1.1109466655731202, + 1.1169811058044434, + 1.1130835620880126, + 1.140358045768738, + 1.1365852942466736, + 1.166709309577942, + 1.1524968084335327, + 1.1656600997924804, + 1.1640733276367188, + 1.1447783031463623, + 1.1532186569213867, + 1.1554683305740356, + 1.1585779469490052, + 1.1513005790710449, + 1.1763495040893555, + 1.1652228436470031, + 1.160971817779541, + 1.1603875598907472, + 1.1720654415130616, + 1.1610611295700073, + 1.1604611679077148, + 1.1669549285888672, + 1.1649753171920776, + 1.1652250712394714, + 1.1625843957901, + 1.1613554042816163, + 1.1618295280456543, + 1.1623823530197144, + 1.1611020141601562, + 1.1617642910003663, + 1.160661350440979, + 1.1612861026763917, + 1.1604403768539429, + 1.1600851245880126, + 1.1589638542175293, + 1.1586398794174195, + 1.1584538543701173 + ], + "train_acc": [ + 0.1805, + 0.4295, + 0.5854, + 0.6816, + 0.7232, + 0.7453, + 0.7578, + 0.7627, + 0.767, + 0.7698, + 0.7674, + 0.7712, + 0.7689, + 0.7693, + 0.7697, + 0.7636, + 0.7694, + 0.7637, + 0.7683, + 0.7552, + 0.7546, + 0.7502, + 0.7414, + 0.7298, + 0.7152, + 0.7063, + 0.7053, + 0.7096, + 0.6956, + 0.6988, + 0.6823, + 0.683, + 0.6722, + 0.6676, + 0.6425, + 0.6452, + 0.6316, + 0.6408, + 0.6223, + 0.6103, + 0.6161, + 0.6207, + 0.61, + 0.6007, + 0.594, + 0.5997, + 0.5949, + 0.5917, + 0.5845, + 0.5866, + 0.5824, + 0.5815, + 0.5852, + 0.5848, + 0.582, + 0.5831, + 0.5847, + 0.5705, + 0.578, + 0.5773, + 0.5786, + 0.5773, + 0.5763, + 0.5778, + 0.5759, + 0.5758, + 0.5752, + 0.5768, + 0.5778, + 0.5789, + 0.5765, + 0.5752, + 0.5796, + 0.5757, + 0.5738, + 0.5774, + 0.5767, + 0.5783, + 0.5772, + 0.5771 + ], + "test_acc": [ + 0.297, + 0.5115, + 0.6125, + 0.6815, + 0.712, + 0.7225, + 0.7345, + 0.744, + 0.748, + 0.7445, + 0.749, + 0.745, + 0.7505, + 0.7335, + 0.7315, + 0.7335, + 0.7405, + 0.7455, + 0.7215, + 0.73, + 0.7215, + 0.6985, + 0.719, + 0.697, + 0.6825, + 0.681, + 0.666, + 0.669, + 0.6695, + 0.652, + 0.6475, + 0.6345, + 0.611, + 0.578, + 0.6175, + 0.6025, + 0.609, + 0.582, + 0.56, + 0.557, + 0.5955, + 0.548, + 0.5675, + 0.5615, + 0.543, + 0.5465, + 0.5425, + 0.512, + 0.5365, + 0.546, + 0.5385, + 0.527, + 0.5405, + 0.5505, + 0.5325, + 0.5365, + 0.536, + 0.5295, + 0.53, + 0.54, + 0.5285, + 0.5275, + 0.5385, + 0.521, + 0.526, + 0.5285, + 0.5265, + 0.535, + 0.531, + 0.537, + 0.5325, + 0.54, + 0.5395, + 0.533, + 0.5335, + 0.541, + 0.533, + 0.5345, + 0.5365, + 0.536 + ], + "value_loss": [ + 2.8999951864242552, + 0.7982039636611938, + 0.6231087951660156, + 0.6235683647155762, + 0.6510119610786438, + 0.6574029609680175, + 0.661902648639679, + 0.7232611547470092, + 0.7032762868881226, + 0.6919255361557007, + 0.7005036912918091, + 0.6871883411884308, + 0.6459709981918335, + 0.6207397105693817, + 0.5787431469917297, + 0.5738487885951996, + 0.49071356387138365, + 0.4994966497421265, + 0.5125479884147645, + 0.5344232748031617, + 0.5196464547634124, + 0.5054446277618408, + 0.5345541868209839, + 0.5356824696063995, + 0.5677979762077332, + 0.5936019785881043, + 0.616796201133728, + 0.5785986241340637, + 0.5595448421478272, + 0.5678593179702759, + 0.5715507450580597, + 0.6120299976348877, + 0.5863943153381348, + 0.620256681060791, + 0.7131400769233703, + 0.6758115397930146, + 0.7279217919349671, + 0.6957201073169709, + 0.7316431989669799, + 0.910994045162201, + 0.7714889019966126, + 0.7304159112930297, + 0.7455276274681091, + 0.7825681743621826, + 0.7847769620895386, + 0.7706142486572266, + 0.7944970536231994, + 0.755725611782074, + 0.7909631139755249, + 0.767102459526062, + 0.7675446573257446, + 0.7427639607429505, + 0.7238150234222412, + 0.7105594779968262, + 0.7095693937301636, + 0.7146307023525238, + 0.7035578219413757, + 0.7189086032867431, + 0.7045238473415375, + 0.7113368612289429, + 0.6826634825706482, + 0.7114790539741516, + 0.6764884037971497, + 0.6730886434555053, + 0.6832352916717529, + 0.6705672347068786, + 0.6654141647815704, + 0.661842516708374, + 0.6488363645553589, + 0.6599813184738159, + 0.6824844323158265, + 0.6469198275566101, + 0.6482479458808899, + 0.6483881031036377, + 0.6463980459213257, + 0.6377046259403228, + 0.6387022176742554, + 0.6419951785087585, + 0.6271527135848999, + 0.6294826040267945 + ], + "term_loss": [ + 1.6536145017623902, + 0.2872389350891113, + 0.2957951427459717, + 0.3277177954673767, + 0.35520133118629454, + 0.35080455672740934, + 0.3522775351524353, + 0.4084164577126503, + 0.3896090238571167, + 0.37719122750759126, + 0.3783260108947754, + 0.3623295561790466, + 0.3226280775785446, + 0.2973626697540283, + 0.25232165038585663, + 0.2382216954112053, + 0.16664299157857895, + 0.1696927706718445, + 0.18322805758714675, + 0.18419794851541518, + 0.16826269830465318, + 0.14073927689790725, + 0.1580813282728195, + 0.1483071831703186, + 0.16409634435176848, + 0.1795245831489563, + 0.20835158178806304, + 0.1586458904504776, + 0.12719613885879516, + 0.13672583611011505, + 0.1154970666050911, + 0.15508873583078384, + 0.11837394280433655, + 0.13465832443237305, + 0.1757084409713745, + 0.15625774239301682, + 0.18290834587812424, + 0.15941560641527175, + 0.17247684068679808, + 0.3142263666391373, + 0.19758950917720794, + 0.16822293348312378, + 0.16599564211368562, + 0.18643067319393158, + 0.1906030725479126, + 0.17354270300865174, + 0.190151411318779, + 0.16186344304680825, + 0.18504287223815918, + 0.16807004487514496, + 0.1641414586544037, + 0.14297979036569594, + 0.1323266510486603, + 0.11856548438072205, + 0.11844867148399353, + 0.12127343907505274, + 0.11366841349601746, + 0.11914558122456073, + 0.11114272320270538, + 0.11924513355195522, + 0.09191340049505234, + 0.11707625112533569, + 0.09362382492423058, + 0.08999293868541718, + 0.09747600502967835, + 0.08926903312206268, + 0.08351160589009524, + 0.0834198350906372, + 0.07212909150123596, + 0.08118207498788833, + 0.10144669079780579, + 0.07279943599700928, + 0.07422557829022408, + 0.0754525229036808, + 0.072295490193367, + 0.06723054624646901, + 0.06944241292476654, + 0.07294909111261368, + 0.062184989684820176, + 0.06573917962312699 + ], + "bridge_loss": [ + 0.9464236948174454, + 0.18291140983104706, + 0.040363617214560506, + 0.011110359174013137, + 0.014245689526200294, + 0.023089023917913436, + 0.026216036486625672, + 0.025270551985502245, + 0.02219347151517868, + 0.022526981167495252, + 0.02307244484424591, + 0.02531819911599159, + 0.026737871503829957, + 0.02819551814943552, + 0.02993385853767395, + 0.03290943032503128, + 0.03119678609371185, + 0.031117037105560304, + 0.03405936537981033, + 0.04018406002521515, + 0.04106122210025787, + 0.04750789144039154, + 0.04383225578665733, + 0.040461724130809305, + 0.03670376715362072, + 0.03275604227185249, + 0.028076053726673125, + 0.03254394011795521, + 0.02899654289186001, + 0.027491856512427332, + 0.03153896740376949, + 0.03142815798521042, + 0.027842609399557114, + 0.031923864197731015, + 0.04680985162556171, + 0.04004504739642143, + 0.047192381888628, + 0.04468500956296921, + 0.04510729597210884, + 0.061515051746368406, + 0.04885982053875923, + 0.045153148594498635, + 0.044507554531097414, + 0.05041837334632873, + 0.04725242199897766, + 0.054280938601493835, + 0.05214150484800339, + 0.04225666461288929, + 0.04533897556066513, + 0.040540956717729566, + 0.042374949568510054, + 0.039801810497045516, + 0.03651453158855438, + 0.03338572339117527, + 0.03220605453252792, + 0.03330056329071522, + 0.03362610780000687, + 0.0321112134590745, + 0.031176293939352034, + 0.03122947336435318, + 0.03098687102794647, + 0.031619531428813935, + 0.02434463834017515, + 0.02416698544025421, + 0.024347744315862657, + 0.022427195864915848, + 0.022219545251131057, + 0.02096850683093071, + 0.01963008977174759, + 0.021793972712755204, + 0.02480321912765503, + 0.018299329644441604, + 0.019186521348357202, + 0.01893142442405224, + 0.019846682327985764, + 0.01753948959261179, + 0.017655849578976632, + 0.01780163335800171, + 0.015271758063137532, + 0.01474373927861452 + ], + "tgrad_loss": [ + 0.2999570077896118, + 0.3280536154747009, + 0.2869500336647034, + 0.28474021162986757, + 0.2815649441242218, + 0.2835093786716461, + 0.28340907335281373, + 0.28957414956092836, + 0.29147378697395326, + 0.2922073318719864, + 0.29910522994995115, + 0.29954058151245117, + 0.2966050533294678, + 0.2951815227985382, + 0.29648763222694396, + 0.30271766862869265, + 0.29287378659248353, + 0.2986868423938751, + 0.2952605631351471, + 0.31004127130508424, + 0.3103225353717804, + 0.31719745807647703, + 0.3326406021118164, + 0.34691356320381167, + 0.36699786424636843, + 0.38132135572433473, + 0.3803685675859451, + 0.38740879821777346, + 0.40335216054916384, + 0.4036416297912598, + 0.42451471338272095, + 0.4255130994796753, + 0.4401777680397034, + 0.45367448930740356, + 0.49062178344726565, + 0.47950875129699705, + 0.49782106022834777, + 0.4916194935798645, + 0.5140590587615966, + 0.5352526268959046, + 0.5250395781517029, + 0.5170398303031921, + 0.5350244320869446, + 0.5457191298484803, + 0.546921465921402, + 0.5427906059265136, + 0.5522041378021241, + 0.5516055016517639, + 0.5605812623023987, + 0.5584914489746093, + 0.5610282512664795, + 0.5599823703765869, + 0.5549738362312316, + 0.5586082744121551, + 0.5589146682739258, + 0.5600566972255707, + 0.5562633040428162, + 0.5676518079757691, + 0.5622048275470733, + 0.5608622529029846, + 0.5597632151603699, + 0.5627832710266113, + 0.5585199429988861, + 0.5589287233352661, + 0.5614115441322327, + 0.558871001625061, + 0.5596830134391785, + 0.5574541716575623, + 0.557077182006836, + 0.5570052715301513, + 0.5562345240592956, + 0.5558210565567017, + 0.5548358437061309, + 0.5540041534423829, + 0.5542558710098267, + 0.5529345960140228, + 0.5516039566040039, + 0.5512444511413574, + 0.5496959585189819, + 0.5489996829986572 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3330497741699219, + 0.6669624447822571 + ], + "perturbation_rho": [ + 0.38148215413093567, + 0.652411937713623 + ], + "nudging": { + "0.001": [ + -0.008725257590413094, + -0.005841934122145176 + ], + "0.003": [ + -0.026054667308926582, + -0.01747780293226242 + ], + "0.01": [ + -0.08540114760398865, + -0.05768381431698799 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L2_s42.json b/results/synth_ladder_v2_hi/synth_a1.0_L2_s42.json new file mode 100644 index 0000000..9108ab1 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L2_s42.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.946318034172058, + 1.1516875396728516, + 0.7581935514450073, + 0.605016669845581, + 0.5396797653198242, + 0.4972745149612427, + 0.47234574098587034, + 0.4495224585533142, + 0.4272374426364899, + 0.40758763122558594, + 0.39252452518939973, + 0.36916465797424314, + 0.36600809767246245, + 0.3410687928676605, + 0.32793644909858705, + 0.31304756975173953, + 0.3007715271472931, + 0.28627579979896545, + 0.2755886849164963, + 0.2579380422592163, + 0.25807462005615234, + 0.24107852401733398, + 0.22887857472896575, + 0.21563715391159058, + 0.2035831698536873, + 0.18830533595085144, + 0.17980405967235566, + 0.1690865597963333, + 0.1624095736503601, + 0.14769727175235747, + 0.14151963140964507, + 0.13674119498729706, + 0.12849826879501342, + 0.11771546969413757, + 0.11224533882141113, + 0.10299252641201019, + 0.09757299244403839, + 0.09114479880332947, + 0.08575093656778336, + 0.08185386205613614, + 0.0756724079966545, + 0.07218986920118332, + 0.07176458925008773, + 0.06660606263875961, + 0.061819399589300154, + 0.058563033843040464, + 0.055636672776937485, + 0.05303103420138359, + 0.05044965471625328, + 0.04851883066296577, + 0.046696959590911864, + 0.045260662871599196, + 0.043802720510959625, + 0.04223582611083984, + 0.04100226702690125, + 0.039826682758331296, + 0.03853288550376892, + 0.03745495624542236, + 0.036505805373191834, + 0.035624118888378145, + 0.0349866281747818, + 0.034375298815965655, + 0.03376467539072037, + 0.033166321152448656, + 0.03267900042831898, + 0.03222526069879532, + 0.0318170808583498, + 0.031466467666625975, + 0.031191858434677124, + 0.030932255566120146, + 0.030712535017728807, + 0.030533779421448706, + 0.030381300014257432, + 0.03024109920859337, + 0.030137208765745164, + 0.030061321771889925, + 0.03000315922498703, + 0.029963677549362182, + 0.02994104051887989, + 0.029928466534614562 + ], + "train_acc": [ + 0.3257, + 0.6596, + 0.769, + 0.7981, + 0.8069, + 0.8192, + 0.8248, + 0.8293, + 0.8386, + 0.8518, + 0.8547, + 0.864, + 0.8627, + 0.8793, + 0.8817, + 0.8875, + 0.893, + 0.8973, + 0.9031, + 0.9135, + 0.9086, + 0.9203, + 0.9247, + 0.93, + 0.9403, + 0.946, + 0.9502, + 0.9538, + 0.957, + 0.9651, + 0.9677, + 0.9686, + 0.9732, + 0.9792, + 0.9798, + 0.9861, + 0.9867, + 0.9888, + 0.9909, + 0.991, + 0.9941, + 0.9952, + 0.9935, + 0.9954, + 0.9966, + 0.9976, + 0.9984, + 0.9987, + 0.999, + 0.9989, + 0.9993, + 0.999, + 0.9993, + 0.9993, + 0.9995, + 0.9996, + 0.9993, + 0.9994, + 0.9996, + 0.9995, + 0.9996, + 0.9997, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998, + 0.9998 + ], + "test_acc": [ + 0.5395, + 0.703, + 0.755, + 0.763, + 0.755, + 0.768, + 0.765, + 0.7725, + 0.77, + 0.772, + 0.782, + 0.781, + 0.7805, + 0.785, + 0.7875, + 0.791, + 0.7895, + 0.7865, + 0.7925, + 0.794, + 0.791, + 0.7955, + 0.79, + 0.7975, + 0.8015, + 0.799, + 0.801, + 0.7965, + 0.787, + 0.7945, + 0.793, + 0.7915, + 0.788, + 0.794, + 0.797, + 0.7965, + 0.7925, + 0.797, + 0.795, + 0.795, + 0.7965, + 0.795, + 0.7945, + 0.792, + 0.7935, + 0.794, + 0.7925, + 0.792, + 0.7905, + 0.79, + 0.791, + 0.789, + 0.79, + 0.788, + 0.7905, + 0.79, + 0.7885, + 0.79, + 0.7895, + 0.791, + 0.7905, + 0.792, + 0.7895, + 0.7915, + 0.793, + 0.7925, + 0.791, + 0.791, + 0.791, + 0.791, + 0.791, + 0.791, + 0.791, + 0.7905, + 0.791, + 0.792, + 0.792, + 0.7915, + 0.7915, + 0.7915 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.937772274017334, + 0.9376006126403809 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999986886978149 + ], + "nudging": { + "0.001": [ + -0.04965643584728241, + -0.030679266899824142 + ], + "0.003": [ + -0.14321433007717133, + -0.08988389372825623 + ], + "0.01": [ + -0.4167234003543854, + -0.27598124742507935 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.282194623565674, + 1.8021317630767821, + 1.290370544052124, + 0.9686317783355712, + 0.7942994188308716, + 0.7037483291625977, + 0.6552832854270935, + 0.6296794363975525, + 0.6148017653465271, + 0.6100365350723267, + 0.6096824949026107, + 0.604195829296112, + 0.6080462079524994, + 0.6034878133773803, + 0.6054122657775879, + 0.6029368188858032, + 0.6196025349617005, + 0.6137223323822022, + 0.6131332286834716, + 0.607370358657837, + 0.6205254472732544, + 0.6207848463058472, + 0.6232059438705444, + 0.6186815485954285, + 0.6224006581783295, + 0.6181600985527038, + 0.6084850495815277, + 0.6079479592323304, + 0.629641656780243, + 0.6227955137252807, + 0.6316008956909179, + 0.6274790578842163, + 0.6385569313049316, + 0.6368639594554901, + 0.6237436760902405, + 0.6281486724853516, + 0.6293207456588745, + 0.6216304894447326, + 0.6239378217697144, + 0.6469531507015228, + 0.6208334467887878, + 0.6244380719184875, + 0.6174096193313598, + 0.6198301626205445, + 0.6222816544532775, + 0.6192285632133484, + 0.6139031839370728, + 0.6136475460052491, + 0.6211447484016418, + 0.6104061424255371, + 0.6133950750350952, + 0.6175869959831238, + 0.6119502241134643, + 0.6125527906417847, + 0.6169743155002594, + 0.6045381330490113, + 0.6027683501243591, + 0.6022960813522339, + 0.6013002532958984, + 0.6025074361801147, + 0.5996582602500915, + 0.5981982765197754, + 0.5991991576194763, + 0.5996488208770752, + 0.595704001712799, + 0.5946896816253662, + 0.5987521299839019, + 0.592281983089447, + 0.5919814961433411, + 0.5917617532730103, + 0.5915903926849365, + 0.5901475148677826, + 0.5897085474967957, + 0.5893317813873291, + 0.5883101566314697, + 0.5882777759075165, + 0.5877544073104859, + 0.587434159374237, + 0.5873497516155243, + 0.5872392297744751 + ], + "train_acc": [ + 0.1615, + 0.3999, + 0.5808, + 0.6687, + 0.7161, + 0.7409, + 0.7516, + 0.7604, + 0.7653, + 0.7674, + 0.7681, + 0.7689, + 0.767, + 0.7713, + 0.7724, + 0.7726, + 0.7652, + 0.7648, + 0.7675, + 0.766, + 0.7639, + 0.7664, + 0.7614, + 0.7654, + 0.7661, + 0.764, + 0.7739, + 0.7688, + 0.7627, + 0.764, + 0.7612, + 0.7644, + 0.7603, + 0.7611, + 0.7638, + 0.7587, + 0.7605, + 0.761, + 0.7654, + 0.7567, + 0.7658, + 0.7671, + 0.7691, + 0.7652, + 0.7656, + 0.7674, + 0.7658, + 0.7699, + 0.7617, + 0.7703, + 0.7686, + 0.7653, + 0.7677, + 0.7681, + 0.7659, + 0.771, + 0.7726, + 0.7735, + 0.7712, + 0.7739, + 0.7732, + 0.7758, + 0.7719, + 0.7712, + 0.774, + 0.7726, + 0.7726, + 0.7759, + 0.7776, + 0.7775, + 0.7778, + 0.7776, + 0.7772, + 0.7772, + 0.7778, + 0.7764, + 0.7777, + 0.7786, + 0.7785, + 0.7784 + ], + "test_acc": [ + 0.265, + 0.5165, + 0.6045, + 0.6645, + 0.697, + 0.7095, + 0.7115, + 0.7185, + 0.7185, + 0.7185, + 0.7125, + 0.716, + 0.7215, + 0.716, + 0.7115, + 0.7095, + 0.7125, + 0.706, + 0.699, + 0.6985, + 0.718, + 0.7035, + 0.7025, + 0.699, + 0.7015, + 0.6985, + 0.712, + 0.709, + 0.699, + 0.696, + 0.705, + 0.713, + 0.698, + 0.704, + 0.6915, + 0.6945, + 0.6965, + 0.694, + 0.6945, + 0.69, + 0.7055, + 0.697, + 0.7045, + 0.693, + 0.7075, + 0.698, + 0.693, + 0.6945, + 0.7015, + 0.697, + 0.699, + 0.6975, + 0.699, + 0.7035, + 0.6985, + 0.7035, + 0.699, + 0.703, + 0.699, + 0.7045, + 0.703, + 0.7085, + 0.7005, + 0.701, + 0.699, + 0.7025, + 0.707, + 0.701, + 0.704, + 0.7065, + 0.7045, + 0.705, + 0.705, + 0.7045, + 0.7035, + 0.705, + 0.7045, + 0.7035, + 0.7035, + 0.7025 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.005922339856624603, + 0.020320668816566467 + ], + "perturbation_rho": [ + -0.003393532708287239, + 0.013989023864269257 + ], + "nudging": { + "0.001": [ + -1.6870606486918405e-05, + -0.0001334029802819714 + ], + "0.003": [ + -3.559933975338936e-05, + -0.0004005617811344564 + ], + "0.01": [ + 5.659737507812679e-05, + -0.0013348986394703388 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.135848754119873, + 1.3642803058624267, + 0.8708873195648194, + 0.6620696384429932, + 0.5891413642883301, + 0.57967520570755, + 0.5887710757732392, + 0.5980366667747498, + 0.6088974040985108, + 0.6177972668647767, + 0.6234511965751648, + 0.6228584952354431, + 0.6300664884567261, + 0.6292729211807251, + 0.6327571807861329, + 0.6370973803520202, + 0.6390834430217743, + 0.6375089395999909, + 0.6519857896804809, + 0.6564193545341491, + 0.6642557950973511, + 0.6591811975479126, + 0.6635806708335876, + 0.6719323859214783, + 0.681973802947998, + 0.6752701175689697, + 0.6823263836860657, + 0.680218187904358, + 0.6895751893997193, + 0.6950895532131195, + 0.690692015838623, + 0.7078337843418121, + 0.693129168510437, + 0.6974928091049194, + 0.7008464097976684, + 0.7004407194137573, + 0.696805198431015, + 0.7037288009643554, + 0.696394179725647, + 0.7049403734207154, + 0.718198802280426, + 0.7099995137214661, + 0.7002471772193909, + 0.7115488752365112, + 0.7011648622512817, + 0.705596800327301, + 0.7055955667495728, + 0.7068639204978943, + 0.712410222530365, + 0.7061294185638428, + 0.7098195759773255, + 0.7036320822715759, + 0.7083044646263122, + 0.7005896663665772, + 0.7051161972999572, + 0.7042372000694275, + 0.7064647805690766, + 0.703298209953308, + 0.7030874502182007, + 0.7018115946769714, + 0.7009259914398194, + 0.7010174451828003, + 0.7004158262252808, + 0.7019228082180023, + 0.6986435826301575, + 0.6975876085281372, + 0.6982375308990478, + 0.6989794599533081, + 0.6969254281044006, + 0.6955446625709534, + 0.696240187549591, + 0.6952586332321167, + 0.6951992818832398, + 0.6944246446609497, + 0.6940418438911438, + 0.6938989589691162, + 0.6935289325714111, + 0.6932655550956726, + 0.6931727689743042, + 0.6930741609573364 + ], + "train_acc": [ + 0.231, + 0.5519, + 0.704, + 0.7597, + 0.7786, + 0.776, + 0.7753, + 0.7712, + 0.7689, + 0.7718, + 0.7668, + 0.7683, + 0.7644, + 0.7634, + 0.7586, + 0.7587, + 0.7535, + 0.7585, + 0.7496, + 0.7509, + 0.7513, + 0.7463, + 0.7498, + 0.7442, + 0.7432, + 0.7474, + 0.7412, + 0.7453, + 0.7404, + 0.7381, + 0.7374, + 0.7304, + 0.7417, + 0.7382, + 0.7395, + 0.738, + 0.7394, + 0.7367, + 0.7336, + 0.7345, + 0.7327, + 0.7336, + 0.7406, + 0.7313, + 0.7329, + 0.7331, + 0.7364, + 0.7362, + 0.7308, + 0.7342, + 0.7326, + 0.7363, + 0.734, + 0.7356, + 0.7308, + 0.7347, + 0.7327, + 0.7349, + 0.735, + 0.7372, + 0.7391, + 0.7353, + 0.7343, + 0.7373, + 0.7375, + 0.7371, + 0.738, + 0.7376, + 0.7359, + 0.7372, + 0.7369, + 0.7367, + 0.7383, + 0.7383, + 0.7371, + 0.7378, + 0.7377, + 0.7377, + 0.7376, + 0.7377 + ], + "test_acc": [ + 0.4135, + 0.627, + 0.7015, + 0.731, + 0.732, + 0.7305, + 0.715, + 0.7105, + 0.7035, + 0.7215, + 0.7115, + 0.7095, + 0.711, + 0.7055, + 0.694, + 0.6975, + 0.7035, + 0.693, + 0.701, + 0.6925, + 0.696, + 0.689, + 0.691, + 0.688, + 0.6935, + 0.6805, + 0.6875, + 0.686, + 0.6855, + 0.669, + 0.682, + 0.685, + 0.67, + 0.6755, + 0.676, + 0.6715, + 0.6735, + 0.6815, + 0.6735, + 0.6615, + 0.6705, + 0.678, + 0.673, + 0.6755, + 0.679, + 0.6795, + 0.671, + 0.669, + 0.675, + 0.665, + 0.6725, + 0.674, + 0.676, + 0.671, + 0.674, + 0.6665, + 0.676, + 0.6755, + 0.679, + 0.6815, + 0.6775, + 0.673, + 0.6775, + 0.6755, + 0.6745, + 0.673, + 0.674, + 0.6755, + 0.675, + 0.676, + 0.6755, + 0.673, + 0.673, + 0.675, + 0.6745, + 0.6725, + 0.673, + 0.674, + 0.6735, + 0.6735 + ], + "state_pred_error": [ + 0.8063683609008789, + 0.3884696524143219, + 0.2311003609418869, + 0.18046433920860291, + 0.16924471125602722, + 0.16555276873111724, + 0.1602503327846527, + 0.15167320017814637, + 0.140824283182621, + 0.1298466329574585, + 0.11834586684703827, + 0.11143888697624206, + 0.10435668296813964, + 0.10323678240776062, + 0.0928786245584488, + 0.08840008661746979, + 0.08519339587688446, + 0.08778857303857804, + 0.08263514815568924, + 0.08055064792633057, + 0.07980460293293, + 0.07705434393882751, + 0.07739766277074814, + 0.07446456137895584, + 0.0734913741350174, + 0.07287049880027771, + 0.07218570121526718, + 0.07035595026016235, + 0.07018024356365204, + 0.0692975877046585, + 0.06897079907655716, + 0.06649487104415894, + 0.06588162162899971, + 0.06435961349010468, + 0.06434023708701134, + 0.06222202478647232, + 0.0626620704293251, + 0.06185628715753555, + 0.05922087868452072, + 0.057531780862808225, + 0.05768225061893463, + 0.0554687408208847, + 0.054569963669776914, + 0.05414690698385238, + 0.05308204159736633, + 0.05163135576248169, + 0.05053922039270401, + 0.049180154889822005, + 0.04925686872601509, + 0.047615612363815306, + 0.046402145498991014, + 0.04576419175863266, + 0.045621140229702, + 0.04635717123746872, + 0.04377198639512062, + 0.043869176548719406, + 0.04219145889282227, + 0.04124122514724732, + 0.04061387507915497, + 0.04018232229351997, + 0.039839565473794934, + 0.03889179226756096, + 0.03857449699044228, + 0.03783939574360847, + 0.03660583376288414, + 0.03604392006397247, + 0.03533379606604576, + 0.03495548709630966, + 0.03465898452997208, + 0.0342097640991211, + 0.0333374612390995, + 0.03270132002830505, + 0.03256121125221252, + 0.03309162433743477, + 0.03434458671808243, + 0.031629494720697406, + 0.030447168147563933, + 0.029967701929807664, + 0.029437697196006776, + 0.028844930332899095 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6727198958396912, + 0.3693685829639435 + ], + "perturbation_rho": [ + 0.6028042435646057, + 0.36745399236679077 + ], + "nudging": { + "0.001": [ + -0.02099989913403988, + -0.0025365445762872696 + ], + "0.003": [ + -0.06207232177257538, + -0.007595579605549574 + ], + "0.01": [ + -0.19608698785305023, + -0.025156188756227493 + ] + }, + "state_pred_error_per_layer": [ + 4083.197509765625, + 262.47991943359375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2804126327514647, + 1.7985749383926393, + 1.2908005512237548, + 0.9662449172019959, + 0.7956621127128601, + 0.7016273497581482, + 0.6522905420303344, + 0.6255401084899902, + 0.6117714551925659, + 0.6128746815681457, + 0.6068986643791199, + 0.6044070498466492, + 0.6102572951316834, + 0.6062020353317261, + 0.6156517067909241, + 0.6126874660491943, + 0.6097104368209839, + 0.6174453516960144, + 0.6185816154479981, + 0.6438342502593994, + 0.6368237316131592, + 0.6804909427642822, + 0.6997053329467774, + 0.7258448196411132, + 0.7487138278961182, + 0.7556256717681885, + 0.7934631998062134, + 0.802038497543335, + 0.8157362140655517, + 0.8650238488197327, + 0.8622131116867066, + 0.8802598802566528, + 0.9258453697204589, + 0.9959634174346924, + 0.9478269100189209, + 1.0003521003723144, + 1.077512856578827, + 1.0192589988708496, + 1.028103258895874, + 1.0586500679016113, + 1.0699232969284058, + 1.0799424433708191, + 1.0838925231933594, + 1.1248778113365174, + 1.1027689414978028, + 1.1598035910606384, + 1.1366910076141357, + 1.1348427181243896, + 1.1708768878936768, + 1.1435981479644775, + 1.1552022342681885, + 1.2040845465660095, + 1.1642921708106995, + 1.1581912057876587, + 1.1544302150726318, + 1.1856851593017579, + 1.1730238010406495, + 1.1706515258789063, + 1.175933620452881, + 1.2015250160217286, + 1.179624587059021, + 1.18775200214386, + 1.1831196794509888, + 1.1909604908943177, + 1.1947224998474122, + 1.1949542335510255, + 1.1888987186431885, + 1.1910899550437928, + 1.1911025504112243, + 1.195369605255127, + 1.193122798538208, + 1.194731010055542, + 1.1899194046020507, + 1.1925264017105102, + 1.191719772720337, + 1.1909632276535034, + 1.189614386367798, + 1.1892432201385499, + 1.188741414451599, + 1.1885441581726075 + ], + "train_acc": [ + 0.1623, + 0.4052, + 0.5791, + 0.6702, + 0.7173, + 0.7455, + 0.7557, + 0.7621, + 0.7675, + 0.7666, + 0.7696, + 0.7723, + 0.7664, + 0.7713, + 0.7708, + 0.7678, + 0.7703, + 0.7652, + 0.7695, + 0.7575, + 0.7586, + 0.7436, + 0.734, + 0.7259, + 0.723, + 0.7172, + 0.703, + 0.6981, + 0.6893, + 0.6707, + 0.6709, + 0.6653, + 0.6557, + 0.6313, + 0.644, + 0.623, + 0.6036, + 0.6162, + 0.613, + 0.6077, + 0.6007, + 0.5952, + 0.598, + 0.5809, + 0.5939, + 0.571, + 0.583, + 0.5811, + 0.5635, + 0.5749, + 0.578, + 0.5625, + 0.5689, + 0.5734, + 0.5731, + 0.5696, + 0.5712, + 0.5682, + 0.5694, + 0.5553, + 0.5659, + 0.5635, + 0.566, + 0.5599, + 0.5604, + 0.5627, + 0.5634, + 0.5593, + 0.5621, + 0.5604, + 0.5607, + 0.5593, + 0.5635, + 0.5619, + 0.5657, + 0.5614, + 0.5632, + 0.565, + 0.5645, + 0.5642 + ], + "test_acc": [ + 0.268, + 0.513, + 0.6075, + 0.6595, + 0.696, + 0.7095, + 0.7215, + 0.7145, + 0.723, + 0.72, + 0.7195, + 0.7195, + 0.723, + 0.713, + 0.708, + 0.718, + 0.711, + 0.7065, + 0.7095, + 0.694, + 0.6845, + 0.6965, + 0.654, + 0.6715, + 0.67, + 0.655, + 0.6405, + 0.6595, + 0.6045, + 0.612, + 0.62, + 0.5865, + 0.5695, + 0.5475, + 0.5605, + 0.528, + 0.5695, + 0.5465, + 0.552, + 0.5245, + 0.525, + 0.5495, + 0.5245, + 0.549, + 0.5255, + 0.4805, + 0.5195, + 0.484, + 0.532, + 0.522, + 0.5115, + 0.5325, + 0.5325, + 0.5145, + 0.494, + 0.5195, + 0.5155, + 0.5115, + 0.5065, + 0.511, + 0.513, + 0.524, + 0.5115, + 0.5165, + 0.5135, + 0.508, + 0.513, + 0.502, + 0.5045, + 0.504, + 0.5175, + 0.514, + 0.5145, + 0.5165, + 0.51, + 0.5135, + 0.5115, + 0.5125, + 0.513, + 0.5125 + ], + "value_loss": [ + 2.940468542289734, + 0.79788527135849, + 0.6377222188949585, + 0.68224133644104, + 0.7263548100471496, + 0.7324671993255615, + 0.7309100345611572, + 0.717535104560852, + 0.7103414190292359, + 0.6660294913291931, + 0.6247495171546936, + 0.5396882646560669, + 0.4996064971446991, + 0.45136471157073976, + 0.4529336892604828, + 0.4058929618358612, + 0.391290897321701, + 0.39949184267520904, + 0.40146105794906617, + 0.4176544015884399, + 0.3929467046737671, + 0.4356102319717407, + 0.44995045413970947, + 0.4677547811985016, + 0.506061519908905, + 0.4956396166801453, + 0.5163082196235657, + 0.5677194129943848, + 0.5988344200134277, + 0.599899713230133, + 0.5649642105102539, + 0.597481498336792, + 0.62520577750206, + 0.7375187145233154, + 0.624705169582367, + 0.6632982563972473, + 0.7675839500427246, + 0.669120393371582, + 0.6651788431167602, + 0.7156087099552154, + 0.696215266418457, + 0.6955457643985749, + 0.6779295589447022, + 0.7293293210983276, + 0.6809166513442994, + 0.764018877029419, + 0.7062238107681275, + 0.685149402809143, + 0.7134047386169433, + 0.6853949756622314, + 0.6999969066619873, + 0.7731949109077454, + 0.6987295764446259, + 0.6907983577728272, + 0.6681401613235474, + 0.7007834080696106, + 0.6814730290412903, + 0.661990501499176, + 0.6626340481758117, + 0.705364034461975, + 0.6682385860443115, + 0.6713524225234986, + 0.6693500059127807, + 0.6651503324508667, + 0.6654500586509705, + 0.6543948979377746, + 0.6422414421081543, + 0.6383527196884156, + 0.6420085886001586, + 0.6456019569396972, + 0.6395301539421081, + 0.6431583649635315, + 0.6233767694473267, + 0.6305849503517151, + 0.6271460248947144, + 0.6468473421096802, + 0.6199060997486114, + 0.6318170052528381, + 0.6215379253387451, + 0.6212269179344178 + ], + "term_loss": [ + 1.6892825514793397, + 0.28991217994689944, + 0.30822358050346377, + 0.3786318918466568, + 0.42494087133407593, + 0.42721891040802, + 0.4199708504676819, + 0.4035639883041382, + 0.3996427752017975, + 0.3595923094034195, + 0.33094902596473696, + 0.2548507522583008, + 0.21975787994861604, + 0.17496245877742767, + 0.173782960999012, + 0.12534335107803346, + 0.1120484961271286, + 0.11436202818453312, + 0.11488216164112092, + 0.11582057362794876, + 0.08930488972663879, + 0.10528950003981591, + 0.10394810205698013, + 0.10426158441305161, + 0.12753498150110246, + 0.10871876295804977, + 0.11132348638176918, + 0.14436086015701294, + 0.14408548067808152, + 0.13344688698649407, + 0.10571571690440178, + 0.13017865498065948, + 0.13939437173306943, + 0.20552679252624512, + 0.11907351903915406, + 0.13748738572597505, + 0.19904934087991716, + 0.13540437815189363, + 0.12853734107017517, + 0.1618148654460907, + 0.13909575666189194, + 0.13520186334848405, + 0.12121448392868042, + 0.1466166281223297, + 0.12041640423536301, + 0.16912428863048554, + 0.13152958631515502, + 0.11219572712182999, + 0.12457058460712434, + 0.10920219086408615, + 0.1173021228313446, + 0.16791136612892152, + 0.11367217564582825, + 0.10726595187187195, + 0.09067037861347199, + 0.11207262431383133, + 0.09823015294075012, + 0.08530473515987397, + 0.08550616343021393, + 0.10875923759937287, + 0.08709428926706314, + 0.08641628972291947, + 0.08627706418037415, + 0.08137298605442048, + 0.0812585338205099, + 0.07228367166519165, + 0.06536642589569092, + 0.0619819268733263, + 0.06462425166070461, + 0.06505866675376892, + 0.06278609230518341, + 0.0658116526722908, + 0.0513275152683258, + 0.056986387073993686, + 0.05485347003340721, + 0.07127472396492958, + 0.050447821268439295, + 0.06053386932611465, + 0.05252971643209457, + 0.05304660900235176 + ], + "bridge_loss": [ + 0.9279641841857811, + 0.16856330198049546, + 0.039708731412887575, + 0.010337709330767393, + 0.011771508574485778, + 0.022529736855626106, + 0.03331982454061508, + 0.03982229630947113, + 0.03738117287158966, + 0.03454190602302551, + 0.027281567510962487, + 0.024664730344712733, + 0.023858268588781355, + 0.025735928761959077, + 0.0272073194026947, + 0.02882993689775467, + 0.027838965237140655, + 0.028774000322818755, + 0.02812835749387741, + 0.03022514525949955, + 0.030929905086755752, + 0.03656129573583603, + 0.04052359770536423, + 0.04557864816188812, + 0.04997927314043045, + 0.050188125783205036, + 0.04993401603698731, + 0.05739394021034241, + 0.07838522285223007, + 0.06485828175544739, + 0.05224925307035446, + 0.0506726308375597, + 0.051239190012216565, + 0.0647153436422348, + 0.053563565707206724, + 0.05078575596809387, + 0.06262156112790107, + 0.04680149354934692, + 0.04500690677165985, + 0.049841736525297164, + 0.046847368633747104, + 0.04284440612792969, + 0.03791265842914581, + 0.046439746141433716, + 0.03537028197050095, + 0.04456134281158447, + 0.03218785969913006, + 0.030664079475402832, + 0.03130132013559341, + 0.029161811190843583, + 0.032022461515665054, + 0.03898258820772171, + 0.02969357035756111, + 0.02903288689851761, + 0.02478138956427574, + 0.0249088092982769, + 0.02389162595272064, + 0.019117333182692528, + 0.018994592445343732, + 0.023708287239074706, + 0.019777522890269756, + 0.018769464632868767, + 0.020211394253373146, + 0.017110029135644435, + 0.017269017577171326, + 0.014731672486662864, + 0.012424837739765644, + 0.01189460586681962, + 0.01335356667637825, + 0.014654298931360246, + 0.012049511376023293, + 0.012707741624116897, + 0.009858337254822254, + 0.010841082896292209, + 0.011562466982007026, + 0.015217449271678925, + 0.009477784027159214, + 0.01224556357562542, + 0.011088584440946578, + 0.010462266248464584 + ], + "tgrad_loss": [ + 0.32322183175086977, + 0.33940978274345396, + 0.2897899122238159, + 0.29327174363136294, + 0.28964242973327636, + 0.28271855030059817, + 0.27761935591697695, + 0.27414881958961484, + 0.27331746387481687, + 0.27189527068138125, + 0.26651892404556277, + 0.2601727846622467, + 0.25599034695625306, + 0.25066632494926455, + 0.25194340829849243, + 0.2517196734428406, + 0.2514034350395203, + 0.25635581159591675, + 0.25845054063796996, + 0.2716086819887161, + 0.2727119073867798, + 0.29375943875312804, + 0.30547875442504885, + 0.31791454901695254, + 0.32854726486206054, + 0.3367327250480652, + 0.3550507174730301, + 0.36596461181640627, + 0.37636372227668763, + 0.4015945445537567, + 0.40699923944473265, + 0.41663020915985105, + 0.4345722186088562, + 0.46727658042907716, + 0.4520680808544159, + 0.4750251211166382, + 0.5059130459785461, + 0.4869145246505737, + 0.49163460040092466, + 0.5039521028518676, + 0.5102721470355988, + 0.5174995000839233, + 0.5188024171829224, + 0.5362729483604431, + 0.5251299654006958, + 0.5503332437992096, + 0.5425063617706298, + 0.5422895937919616, + 0.5575328386306763, + 0.5470309760093689, + 0.5506723180770874, + 0.5663009528160096, + 0.5553638293266296, + 0.5544995170593262, + 0.5526883927822113, + 0.563801976966858, + 0.5593512482643127, + 0.5575684350967407, + 0.5581332973480224, + 0.5728965188980103, + 0.5613667737007141, + 0.5661666715621948, + 0.5628615488052369, + 0.5666673162460327, + 0.5669225110054016, + 0.5673795532226562, + 0.5644501794815063, + 0.5644761901378632, + 0.5640307699203492, + 0.5658889928817749, + 0.5646945568084717, + 0.5646389728546143, + 0.5621909219741821, + 0.5627574834823609, + 0.5607300892829895, + 0.5603551671981811, + 0.559980492067337, + 0.5590375660896302, + 0.5579196195602417, + 0.5577180406570434 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.39126425981521606, + 0.7445269823074341 + ], + "perturbation_rho": [ + 0.44417524337768555, + 0.7429547905921936 + ], + "nudging": { + "0.001": [ + -0.009039473719894886, + -0.006878397427499294 + ], + "0.003": [ + -0.027019120752811432, + -0.020580623298883438 + ], + "0.01": [ + -0.08887787163257599, + -0.06797216832637787 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L2_s456.json b/results/synth_ladder_v2_hi/synth_a1.0_L2_s456.json new file mode 100644 index 0000000..3e9ec33 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L2_s456.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.9560056144714355, + 1.1671714973449707, + 0.7729741273880005, + 0.6163077599525452, + 0.5501252895355224, + 0.5102293436050415, + 0.47986490659713743, + 0.4551184079170227, + 0.4281283717632294, + 0.41059817826747896, + 0.3900598440170288, + 0.3775464247703552, + 0.35782486624717713, + 0.34545214071273805, + 0.32954725866317747, + 0.312077562713623, + 0.3001769031524658, + 0.2857774089574814, + 0.268246430015564, + 0.2654800416946411, + 0.24711972908973695, + 0.23591814823150634, + 0.22430862407684327, + 0.21694810314178467, + 0.19728492946624757, + 0.19133227586746215, + 0.18050886018276216, + 0.16754731903076173, + 0.15603712682724, + 0.14723092963695525, + 0.1393954524040222, + 0.13442619478702544, + 0.12217882280349732, + 0.11515008834600449, + 0.10545161597728729, + 0.0976712616443634, + 0.09565990908145905, + 0.08852378897666931, + 0.08450308041572571, + 0.07969852757751941, + 0.07292226366400718, + 0.06799264116883277, + 0.06508905214071274, + 0.061624961662292484, + 0.05785034103393555, + 0.05549244320392609, + 0.053127787148952485, + 0.050860308933258054, + 0.048702414500713345, + 0.04664224576950073, + 0.04522364996671677, + 0.04416376640796661, + 0.04225023184418678, + 0.0404514856338501, + 0.039005454522371294, + 0.03781551446318626, + 0.03683884832262993, + 0.035825042724609374, + 0.034970838397741316, + 0.03423578343987465, + 0.03352795054614544, + 0.03287497969865799, + 0.0322679201349616, + 0.03175261213183403, + 0.03134917322397232, + 0.03098049667477608, + 0.030580134057998656, + 0.03025078364908695, + 0.029965906804800033, + 0.029746233332157136, + 0.029537916985154154, + 0.029368729928135873, + 0.029206447684764863, + 0.029097266083955766, + 0.028998262310028076, + 0.028925995123386384, + 0.028875470691919328, + 0.028838179144263267, + 0.028815924447774886, + 0.028804841729998587 + ], + "train_acc": [ + 0.3249, + 0.6552, + 0.7598, + 0.7934, + 0.8034, + 0.8132, + 0.8258, + 0.8368, + 0.8409, + 0.8468, + 0.8571, + 0.8623, + 0.8682, + 0.8719, + 0.882, + 0.8883, + 0.8916, + 0.9008, + 0.9064, + 0.9096, + 0.9171, + 0.9213, + 0.9265, + 0.9316, + 0.9423, + 0.9439, + 0.9489, + 0.9549, + 0.9613, + 0.9653, + 0.9682, + 0.9692, + 0.9762, + 0.9794, + 0.9845, + 0.9883, + 0.9886, + 0.9905, + 0.9913, + 0.9924, + 0.9951, + 0.9961, + 0.9968, + 0.9974, + 0.9982, + 0.9984, + 0.9985, + 0.9992, + 0.9991, + 0.9992, + 0.9993, + 0.9993, + 0.9994, + 0.9996, + 0.9996, + 0.9998, + 0.9998, + 0.9999, + 0.9999, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.5485, + 0.7015, + 0.7495, + 0.7625, + 0.768, + 0.769, + 0.775, + 0.774, + 0.779, + 0.7795, + 0.782, + 0.7905, + 0.788, + 0.7875, + 0.7895, + 0.7925, + 0.7875, + 0.797, + 0.797, + 0.796, + 0.8025, + 0.799, + 0.7925, + 0.802, + 0.7925, + 0.7925, + 0.7965, + 0.796, + 0.802, + 0.7975, + 0.8, + 0.7925, + 0.799, + 0.7945, + 0.7965, + 0.797, + 0.791, + 0.793, + 0.795, + 0.7905, + 0.7945, + 0.796, + 0.795, + 0.793, + 0.7945, + 0.796, + 0.7925, + 0.794, + 0.7945, + 0.7935, + 0.7905, + 0.7905, + 0.7845, + 0.788, + 0.7885, + 0.789, + 0.7895, + 0.7885, + 0.79, + 0.7905, + 0.791, + 0.791, + 0.79, + 0.7905, + 0.79, + 0.789, + 0.789, + 0.791, + 0.79, + 0.79, + 0.791, + 0.7905, + 0.791, + 0.7905, + 0.791, + 0.79, + 0.7905, + 0.7905, + 0.7905, + 0.7905 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9291538000106812, + 0.9242061376571655 + ], + "perturbation_rho": [ + 0.9999991059303284, + 0.9999985694885254 + ], + "nudging": { + "0.001": [ + -0.045578956604003906, + -0.02785908617079258 + ], + "0.003": [ + -0.13051706552505493, + -0.0812857374548912 + ], + "0.01": [ + -0.36666756868362427, + -0.24512334167957306 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2925382926940916, + 1.7889437934875487, + 1.260253756904602, + 0.9539756924629211, + 0.7977886853218079, + 0.7140761584281922, + 0.6654267780303955, + 0.6397091209411621, + 0.6243139269828797, + 0.6154428773880005, + 0.6143751846313477, + 0.6155710045814514, + 0.6156138698577881, + 0.6219459392547607, + 0.6182852596759796, + 0.6140298984527588, + 0.6210012950897217, + 0.6292118134498597, + 0.6216321679115295, + 0.6227944535255432, + 0.6250838468551636, + 0.6302425016403198, + 0.6193829513549804, + 0.6351193978309632, + 0.6367992011070251, + 0.650238129234314, + 0.6344584981918335, + 0.6519463251113892, + 0.6449099941253662, + 0.6615370457649231, + 0.6371989486694336, + 0.6602863219261169, + 0.6565528917312622, + 0.6482889573097229, + 0.6413513114929199, + 0.6494462338447571, + 0.6409127470016479, + 0.6464275256156922, + 0.648155325126648, + 0.6618475336074829, + 0.6339232350826264, + 0.6367729577064514, + 0.6629635499000549, + 0.6310218623638153, + 0.6272157665252686, + 0.6426493437290192, + 0.6343029105186463, + 0.626497606754303, + 0.6296635850906372, + 0.6324865888595581, + 0.625750997543335, + 0.6378193023681641, + 0.6297788947105408, + 0.6210315748214722, + 0.624997318649292, + 0.6212919867515564, + 0.6215335542201996, + 0.6199177579879761, + 0.6204080033302307, + 0.6204842404842377, + 0.6156154773712158, + 0.6164784337997437, + 0.6144172075271607, + 0.61289912109375, + 0.6115792436599732, + 0.6114538358688355, + 0.6116359647274018, + 0.6083082750320434, + 0.6086608262062073, + 0.6079776787757873, + 0.6070331044197083, + 0.6068843227386475, + 0.6061222413063049, + 0.6054628374576568, + 0.604520062637329, + 0.6041548914432525, + 0.6038100759506225, + 0.6035206285476684, + 0.6033140742301941, + 0.6032149271965027 + ], + "train_acc": [ + 0.1535, + 0.405, + 0.5877, + 0.6723, + 0.7129, + 0.7316, + 0.7494, + 0.7562, + 0.7635, + 0.7636, + 0.7659, + 0.7655, + 0.7659, + 0.7638, + 0.7629, + 0.7636, + 0.7632, + 0.761, + 0.7595, + 0.7621, + 0.7619, + 0.7576, + 0.7662, + 0.7592, + 0.7583, + 0.7543, + 0.7593, + 0.7561, + 0.7595, + 0.7512, + 0.7575, + 0.7494, + 0.7525, + 0.7562, + 0.756, + 0.7541, + 0.7569, + 0.7583, + 0.7539, + 0.7511, + 0.7617, + 0.7574, + 0.7493, + 0.7613, + 0.7607, + 0.752, + 0.7581, + 0.7592, + 0.7602, + 0.7593, + 0.7591, + 0.7563, + 0.7569, + 0.7631, + 0.7601, + 0.7629, + 0.763, + 0.7645, + 0.7651, + 0.7623, + 0.7671, + 0.7636, + 0.7652, + 0.7662, + 0.7644, + 0.766, + 0.769, + 0.7658, + 0.7697, + 0.7674, + 0.7685, + 0.7671, + 0.7688, + 0.7701, + 0.7691, + 0.7691, + 0.7701, + 0.7697, + 0.7701, + 0.77 + ], + "test_acc": [ + 0.2575, + 0.5275, + 0.6195, + 0.6685, + 0.6845, + 0.701, + 0.7085, + 0.72, + 0.7235, + 0.7225, + 0.7265, + 0.7345, + 0.7315, + 0.73, + 0.7255, + 0.723, + 0.7285, + 0.729, + 0.726, + 0.728, + 0.73, + 0.718, + 0.717, + 0.725, + 0.7125, + 0.7275, + 0.705, + 0.7205, + 0.7095, + 0.7145, + 0.721, + 0.718, + 0.7235, + 0.7245, + 0.7205, + 0.711, + 0.7185, + 0.7225, + 0.721, + 0.726, + 0.719, + 0.726, + 0.7235, + 0.7175, + 0.707, + 0.7215, + 0.719, + 0.718, + 0.723, + 0.7265, + 0.718, + 0.719, + 0.726, + 0.7185, + 0.7165, + 0.7215, + 0.721, + 0.723, + 0.7265, + 0.7255, + 0.726, + 0.724, + 0.728, + 0.7225, + 0.7245, + 0.7255, + 0.7245, + 0.727, + 0.724, + 0.7245, + 0.7265, + 0.729, + 0.7285, + 0.7305, + 0.73, + 0.73, + 0.729, + 0.731, + 0.73, + 0.73 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.02131858840584755, + 0.03880482539534569 + ], + "perturbation_rho": [ + 0.006325956434011459, + 0.07241131365299225 + ], + "nudging": { + "0.001": [ + -0.0007009014952927828, + -0.00027983251493424177 + ], + "0.003": [ + -0.002087946515530348, + -0.0008400778751820326 + ], + "0.01": [ + -0.006775922141969204, + -0.002794599626213312 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.1408685943603514, + 1.3764964288711548, + 0.8937187995910645, + 0.6806521401405334, + 0.6063734632492065, + 0.5921373236656189, + 0.6012698959350586, + 0.6085097344875335, + 0.618865624332428, + 0.6229370524406433, + 0.6271081844329834, + 0.6296928139686584, + 0.6329344481468201, + 0.6373940747737884, + 0.6441978803634644, + 0.6502310201644897, + 0.6577924034118653, + 0.6638825251579284, + 0.6633781417846679, + 0.662655659198761, + 0.671446533203125, + 0.6748080488204956, + 0.6730749175071716, + 0.6885585793495178, + 0.6853348649978638, + 0.6937937314987183, + 0.7025538193225861, + 0.6914417263031006, + 0.6994074465751648, + 0.7016401989936829, + 0.7077653275966644, + 0.7140635179519653, + 0.719589767742157, + 0.7156314441680908, + 0.7186767238616943, + 0.7123939609527588, + 0.7217615343093872, + 0.7193854808807373, + 0.7269024057388306, + 0.7369294118881226, + 0.7207375118255616, + 0.7266824924468994, + 0.731508938407898, + 0.725278225517273, + 0.7310970863819123, + 0.7277004768371582, + 0.7388540773391724, + 0.7262511849403381, + 0.7372460752487182, + 0.7248942784309387, + 0.7235971044540406, + 0.7246456790924072, + 0.7409098614692688, + 0.7274047603607178, + 0.7256083255767822, + 0.7254483180999756, + 0.7276198521614075, + 0.726950217628479, + 0.725731752204895, + 0.7291518458366394, + 0.7226115200996399, + 0.7278635671615601, + 0.7244456878662109, + 0.7224804187774658, + 0.7225179643630981, + 0.7228940364837646, + 0.721614897441864, + 0.7204741502761841, + 0.7193958771705627, + 0.7201352106094361, + 0.7190518887519837, + 0.7184531566619873, + 0.7180235387802124, + 0.7173173397064209, + 0.7167859954833984, + 0.7164597539424896, + 0.7162381525039673, + 0.7160966100692749, + 0.7159361206054687, + 0.7158677879333496 + ], + "train_acc": [ + 0.2242, + 0.5483, + 0.693, + 0.7528, + 0.7704, + 0.7716, + 0.7678, + 0.7698, + 0.7661, + 0.7652, + 0.7631, + 0.7655, + 0.7626, + 0.7634, + 0.7573, + 0.7524, + 0.7496, + 0.7523, + 0.7482, + 0.7508, + 0.7477, + 0.7456, + 0.7467, + 0.7432, + 0.7436, + 0.7385, + 0.7362, + 0.7417, + 0.741, + 0.7403, + 0.7365, + 0.7338, + 0.7302, + 0.7333, + 0.7367, + 0.7347, + 0.7324, + 0.731, + 0.729, + 0.7291, + 0.7328, + 0.7293, + 0.726, + 0.7307, + 0.7315, + 0.7312, + 0.7276, + 0.7278, + 0.7248, + 0.7315, + 0.7328, + 0.7319, + 0.7249, + 0.7287, + 0.7328, + 0.7342, + 0.7285, + 0.7311, + 0.7316, + 0.7284, + 0.7332, + 0.7295, + 0.7326, + 0.7339, + 0.7349, + 0.7327, + 0.7321, + 0.7348, + 0.7331, + 0.7339, + 0.7336, + 0.7336, + 0.7346, + 0.736, + 0.7342, + 0.7352, + 0.7351, + 0.7353, + 0.7355, + 0.7359 + ], + "test_acc": [ + 0.4415, + 0.6245, + 0.6935, + 0.725, + 0.7325, + 0.7305, + 0.7295, + 0.735, + 0.723, + 0.723, + 0.7235, + 0.722, + 0.716, + 0.7185, + 0.708, + 0.708, + 0.712, + 0.7085, + 0.713, + 0.7005, + 0.702, + 0.7055, + 0.7015, + 0.6855, + 0.6955, + 0.695, + 0.687, + 0.692, + 0.6915, + 0.691, + 0.6865, + 0.6765, + 0.685, + 0.686, + 0.6875, + 0.6875, + 0.6865, + 0.678, + 0.675, + 0.6825, + 0.6795, + 0.6825, + 0.6835, + 0.679, + 0.681, + 0.6775, + 0.677, + 0.672, + 0.6755, + 0.6765, + 0.6815, + 0.6765, + 0.672, + 0.6775, + 0.678, + 0.675, + 0.675, + 0.682, + 0.6735, + 0.6745, + 0.6785, + 0.669, + 0.6865, + 0.677, + 0.6775, + 0.6735, + 0.6715, + 0.675, + 0.6725, + 0.6735, + 0.6755, + 0.677, + 0.677, + 0.676, + 0.6765, + 0.676, + 0.675, + 0.675, + 0.675, + 0.6755 + ], + "state_pred_error": [ + 0.8080644834518432, + 0.39239263830184934, + 0.23570088872909545, + 0.18436644830703736, + 0.17015166330337525, + 0.16577841153144837, + 0.15891898512840272, + 0.14670312795639037, + 0.13382397260665893, + 0.1253697662591934, + 0.11607049119472504, + 0.10657218925952912, + 0.09855207993984222, + 0.0928174996972084, + 0.08665878224372864, + 0.08460470433235169, + 0.08135875176787376, + 0.07774004120826722, + 0.07695613958835602, + 0.075308149933815, + 0.07403676271438599, + 0.0740367253780365, + 0.07511613126993179, + 0.06968745267391205, + 0.06773570336103439, + 0.06727046658992768, + 0.06653650290369988, + 0.06482027760744095, + 0.06515331575870514, + 0.0638981928229332, + 0.0620466558098793, + 0.06260543761253357, + 0.06213358806967735, + 0.06028746428489685, + 0.05951403741836548, + 0.05873561415076256, + 0.05801951932907105, + 0.05811610379815101, + 0.05617883744239807, + 0.05539749718904495, + 0.054504805290699, + 0.0535935148537159, + 0.053170457899570464, + 0.05185950981974602, + 0.051334794068336485, + 0.05101199344396591, + 0.050492712152004245, + 0.05117302381396294, + 0.04784535982608795, + 0.04772583312392235, + 0.04679878767132759, + 0.045225712451338766, + 0.04433399237394333, + 0.043538872480392454, + 0.04340486377477646, + 0.04172027028799057, + 0.040727964186668394, + 0.04038996203541756, + 0.04039305700659752, + 0.040595778387784956, + 0.0387884624004364, + 0.03819443533420563, + 0.037498074996471405, + 0.03695043048858643, + 0.036768312060832975, + 0.03635304583311081, + 0.03555620402693749, + 0.034702681583166126, + 0.03439524923563003, + 0.033875951832532884, + 0.032905505937337876, + 0.0324125466644764, + 0.031943915390968323, + 0.03169405475258827, + 0.03094981493651867, + 0.031065510040521622, + 0.03044595140218735, + 0.0299276578605175, + 0.029405312579870224, + 0.02933962969481945 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.669547975063324, + 0.3677923083305359 + ], + "perturbation_rho": [ + 0.6219363808631897, + 0.33943480253219604 + ], + "nudging": { + "0.001": [ + -0.02052037976682186, + -0.002662357408553362 + ], + "0.003": [ + -0.06065082550048828, + -0.007972602732479572 + ], + "0.01": [ + -0.19162335991859436, + -0.026401527225971222 + ] + }, + "state_pred_error_per_layer": [ + 3936.27783203125, + 288.300537109375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2930677429199218, + 1.7906015796661376, + 1.2635988039970398, + 0.9581242958068847, + 0.8003487806320191, + 0.7156089757919312, + 0.6689188489913941, + 0.643795274734497, + 0.6305122444152832, + 0.623988843202591, + 0.6187444662094116, + 0.6178006851196289, + 0.6173453359603882, + 0.6273444614410401, + 0.6134593425750733, + 0.6198339825630188, + 0.6272809553146362, + 0.6293932919502259, + 0.6404480037689209, + 0.6594240272521973, + 0.659067080116272, + 0.6821993915557861, + 0.6791766733169555, + 0.734606586265564, + 0.7313875273704529, + 0.7563578330993652, + 0.7668250580310821, + 0.8190950353622437, + 0.826333743095398, + 0.9198218053817749, + 0.896049147605896, + 0.9007102657318116, + 0.9501289850234985, + 0.9285598526000977, + 0.9668602191925049, + 0.998112233543396, + 0.9962548406600952, + 1.025565596961975, + 1.0426634029388429, + 1.1057414449691771, + 1.06785728225708, + 1.127798579788208, + 1.095726201725006, + 1.1017658351898194, + 1.1498224843978881, + 1.1459971050262452, + 1.1370128602981568, + 1.149132413482666, + 1.1653138580322266, + 1.1741461233139039, + 1.1763445219039916, + 1.1848371679306031, + 1.1794607717514038, + 1.1951260248184203, + 1.1707811889648438, + 1.198930864906311, + 1.2012914625167848, + 1.206768136692047, + 1.204185746574402, + 1.2064070075988769, + 1.2319160966873168, + 1.2115518913269043, + 1.2102981552124024, + 1.221316057395935, + 1.2108774530410766, + 1.216943055343628, + 1.2206229318618775, + 1.2132027009963988, + 1.2105617532730102, + 1.2109660068511963, + 1.2121095266342163, + 1.2105155519485473, + 1.2125362398147583, + 1.2109583696365356, + 1.2117174470901488, + 1.211683067703247, + 1.2104114021301269, + 1.2101064739227294, + 1.209652373123169, + 1.209543790435791 + ], + "train_acc": [ + 0.154, + 0.4077, + 0.5905, + 0.6696, + 0.7103, + 0.7321, + 0.7438, + 0.7522, + 0.7595, + 0.7621, + 0.7628, + 0.7618, + 0.766, + 0.7603, + 0.7657, + 0.7652, + 0.7642, + 0.7582, + 0.7593, + 0.7481, + 0.7532, + 0.7425, + 0.7412, + 0.7202, + 0.7208, + 0.7118, + 0.7112, + 0.6904, + 0.6906, + 0.6662, + 0.6651, + 0.6607, + 0.6499, + 0.6509, + 0.636, + 0.6327, + 0.6251, + 0.6248, + 0.6112, + 0.5911, + 0.6054, + 0.5861, + 0.5939, + 0.597, + 0.574, + 0.574, + 0.5828, + 0.5792, + 0.5716, + 0.571, + 0.5708, + 0.5644, + 0.5659, + 0.564, + 0.5724, + 0.5651, + 0.5621, + 0.5623, + 0.5635, + 0.5608, + 0.5521, + 0.5568, + 0.5596, + 0.553, + 0.559, + 0.5588, + 0.5573, + 0.5606, + 0.5627, + 0.5631, + 0.5594, + 0.5612, + 0.5637, + 0.5609, + 0.5609, + 0.5635, + 0.5612, + 0.5626, + 0.5622, + 0.5622 + ], + "test_acc": [ + 0.2615, + 0.529, + 0.614, + 0.661, + 0.692, + 0.7, + 0.714, + 0.72, + 0.7285, + 0.7265, + 0.731, + 0.7265, + 0.716, + 0.726, + 0.7255, + 0.727, + 0.7255, + 0.718, + 0.7035, + 0.727, + 0.707, + 0.692, + 0.684, + 0.6745, + 0.655, + 0.6735, + 0.6505, + 0.626, + 0.6035, + 0.65, + 0.6145, + 0.626, + 0.624, + 0.5915, + 0.6, + 0.5885, + 0.592, + 0.5785, + 0.547, + 0.5985, + 0.553, + 0.558, + 0.5605, + 0.556, + 0.568, + 0.5725, + 0.5595, + 0.576, + 0.5515, + 0.521, + 0.554, + 0.545, + 0.558, + 0.5545, + 0.539, + 0.555, + 0.5535, + 0.5615, + 0.549, + 0.5325, + 0.55, + 0.546, + 0.544, + 0.5395, + 0.5525, + 0.549, + 0.545, + 0.55, + 0.548, + 0.548, + 0.548, + 0.549, + 0.5445, + 0.5435, + 0.549, + 0.543, + 0.5435, + 0.543, + 0.545, + 0.544 + ], + "value_loss": [ + 3.2248993295669557, + 0.7993324143409729, + 0.6241890686035156, + 0.6834478240966797, + 0.7149497946739197, + 0.7328285658836364, + 0.7252531176567077, + 0.7242275772094726, + 0.6944476741790772, + 0.6577629441261291, + 0.5848735992431641, + 0.5314478209733963, + 0.5021982323169708, + 0.46592460460662843, + 0.43146484746932984, + 0.42146070685386655, + 0.4119085889816284, + 0.39813878288269045, + 0.41772686648368834, + 0.4242308696746826, + 0.4232831803321838, + 0.4443666146278381, + 0.4284376886367798, + 0.48585635566711427, + 0.5515175453186035, + 0.48890927267074585, + 0.5025943306922913, + 0.5741351163864136, + 0.5820644855499267, + 0.6837124898910523, + 0.6473771015167237, + 0.6066724607467652, + 0.6526529814243317, + 0.6264799011230469, + 0.6441321707725525, + 0.6961791508674622, + 0.6708058875083923, + 0.7160791521072387, + 0.7070828273773193, + 0.7737439245223999, + 0.6961604730606079, + 0.759050937461853, + 0.7100138769149781, + 0.7116358661174774, + 0.7559867481231689, + 0.7568133228302002, + 0.7395440124511719, + 0.7170330075263978, + 0.7338975098609924, + 0.7261011720657349, + 0.720359804058075, + 0.7117862114906311, + 0.6998868808746338, + 0.7118762451171875, + 0.6942419066429139, + 0.708058609008789, + 0.6941633409500122, + 0.692590379858017, + 0.6789092469215393, + 0.6850510005950927, + 0.716767284488678, + 0.68156391954422, + 0.6771818018913269, + 0.6850450862884522, + 0.6689441861152648, + 0.7021669523239136, + 0.657691025352478, + 0.6575634796142578, + 0.6773880264282227, + 0.6467782649993896, + 0.6400901229858399, + 0.6624997299194336, + 0.649611467552185, + 0.6397799256324768, + 0.641498973274231, + 0.6482289396286011, + 0.6444473560333251, + 0.630499946641922, + 0.6389780987739563, + 0.6262330022811889 + ], + "term_loss": [ + 1.8183423800468446, + 0.29775885496139526, + 0.3068508393764496, + 0.39105849962234496, + 0.42729952583312986, + 0.4394968143463135, + 0.4197773234128952, + 0.4148836517333984, + 0.3934750539779663, + 0.36719825417995455, + 0.29819075326919553, + 0.24998210138082505, + 0.22208165415525435, + 0.18075168552398682, + 0.14858310407996178, + 0.1344268194437027, + 0.12288439840078354, + 0.10251754094362259, + 0.11906026402711868, + 0.10960771135091782, + 0.10353840012550354, + 0.11309561696052552, + 0.0958007196843624, + 0.1258739206790924, + 0.17593133050203325, + 0.11036868476867676, + 0.11591389536857605, + 0.16073772571086883, + 0.15807414741516113, + 0.21683111358880996, + 0.17209635527133943, + 0.13972420678138733, + 0.15794085698723792, + 0.13904727120399474, + 0.13483572725057602, + 0.1666991223335266, + 0.1425665506362915, + 0.16871983683109285, + 0.14408435807228087, + 0.18444827466011046, + 0.1321460841655731, + 0.16269202904701233, + 0.13014199110269548, + 0.1294034091487527, + 0.1440461580991745, + 0.15523652358055115, + 0.14207189916372298, + 0.12285058436393738, + 0.13586411867141723, + 0.1288945063829422, + 0.12319473965168, + 0.11254922043085099, + 0.10359074312001466, + 0.11389455975294113, + 0.10458315942287445, + 0.1094145234465599, + 0.09637801191806793, + 0.09371047725081444, + 0.08351869256496429, + 0.08925566356182098, + 0.10697866353988647, + 0.08361842547655106, + 0.08154404339790344, + 0.08493596833944321, + 0.0752170923113823, + 0.10030660749673843, + 0.06409129187166691, + 0.06702304346561432, + 0.08525947888493537, + 0.0602948613345623, + 0.056035476887226106, + 0.07380687378048897, + 0.06269274026155472, + 0.05782889631986618, + 0.05753139565885067, + 0.062405730831623075, + 0.06079903078079223, + 0.0512572136759758, + 0.05954945843219757, + 0.049621654653549195 + ], + "bridge_loss": [ + 1.1121261556328157, + 0.18033452768325806, + 0.044868849658966065, + 0.014689313915371895, + 0.01023074924647808, + 0.01922336928844452, + 0.03395731185674667, + 0.03782916660308838, + 0.03113397532105446, + 0.022801124688982963, + 0.02172847282886505, + 0.020213665278255938, + 0.022226871091127396, + 0.025470469930768014, + 0.028755379277467727, + 0.029124588099122047, + 0.02939661954641342, + 0.029101639929413795, + 0.02919348032474518, + 0.03238499325215816, + 0.032242322093248364, + 0.03024594938158989, + 0.026401079308986664, + 0.024576114797592162, + 0.03187911439538002, + 0.02190283774137497, + 0.02207313554286957, + 0.023493554462492464, + 0.027907810562849043, + 0.03462046889662743, + 0.04101263058185577, + 0.03280288675427437, + 0.03566813161671162, + 0.03487102485895157, + 0.03985436806678772, + 0.04859413042068481, + 0.044892528000473976, + 0.05330698952078819, + 0.05985534909963608, + 0.06091915727853775, + 0.05097657561898231, + 0.055695305168628695, + 0.05239534618854523, + 0.053533487647771834, + 0.06308192758560181, + 0.056202594065666196, + 0.052459887611866, + 0.04611912113130093, + 0.04382932303547859, + 0.039009837090969085, + 0.037849784502387046, + 0.035277613407373426, + 0.03421798730790615, + 0.03130286419391632, + 0.030226914799213408, + 0.02961234229207039, + 0.02709128211736679, + 0.025383359724283218, + 0.02319343387782574, + 0.02375578812658787, + 0.025886915796995164, + 0.02316858033835888, + 0.021137660603225233, + 0.02238177977204323, + 0.019515478390455247, + 0.026733190059661866, + 0.016641176676750184, + 0.017249585717916488, + 0.020065816271305083, + 0.015035193768143653, + 0.013222106355428696, + 0.017796086595952512, + 0.016782105472683908, + 0.013273935839533806, + 0.014949301466345787, + 0.01761808745712042, + 0.016150817796587943, + 0.01291478123217821, + 0.013207211822271346, + 0.011661755262315273 + ], + "tgrad_loss": [ + 0.29443079996109006, + 0.32123903341293336, + 0.2724693781852722, + 0.2777000066757202, + 0.27741951839923856, + 0.27410838158130646, + 0.2715184868335724, + 0.27151475338935854, + 0.26983864469528196, + 0.267763564658165, + 0.2649543730735779, + 0.261252060508728, + 0.2578897050380707, + 0.259702449131012, + 0.254126366353035, + 0.257909298157692, + 0.25962757234573364, + 0.2665196026802063, + 0.26947312445640564, + 0.2822381624221802, + 0.2875024567604065, + 0.3010250496864319, + 0.306235889339447, + 0.33540631856918335, + 0.34370709981918335, + 0.3566377507209778, + 0.3646072976827621, + 0.3899038382530212, + 0.39608252487182616, + 0.43226090650558474, + 0.43426811542510985, + 0.43414536876678467, + 0.4590439986228943, + 0.4525616018295288, + 0.4694420761108398, + 0.4808858978271484, + 0.4833468080043793, + 0.4940523235321045, + 0.5031431226730346, + 0.5283764887332916, + 0.5130378133773804, + 0.5406636076927185, + 0.5274765404701233, + 0.5286989701747894, + 0.5488586637496948, + 0.5453742033958435, + 0.5450122264862061, + 0.5480633078575134, + 0.5542040694236755, + 0.5581968259811402, + 0.5593152769088745, + 0.5639593736648559, + 0.5620781542778015, + 0.5666788202285766, + 0.559431838798523, + 0.5690317416191101, + 0.5706940474510193, + 0.5734965413570404, + 0.5721971173286438, + 0.5720395500183105, + 0.5839017023563385, + 0.5747769118309021, + 0.5745000981330871, + 0.5777273398399353, + 0.5742116190910339, + 0.5751271549224853, + 0.5769585556983948, + 0.5732908483505249, + 0.5720627280235291, + 0.5714482112884521, + 0.5708325432777405, + 0.5708967746734619, + 0.5701366203308106, + 0.5686770866394043, + 0.5690182728767395, + 0.5682051241397857, + 0.5674975052833557, + 0.5663279546737671, + 0.5662214254856109, + 0.5649495909690857 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.35489675402641296, + 0.6773503422737122 + ], + "perturbation_rho": [ + 0.4646533727645874, + 0.7230339646339417 + ], + "nudging": { + "0.001": [ + -0.007704081013798714, + -0.005977225489914417 + ], + "0.003": [ + -0.023026108741760254, + -0.017880568280816078 + ], + "0.01": [ + -0.07572861015796661, + -0.059002168476581573 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L4_s123.json b/results/synth_ladder_v2_hi/synth_a1.0_L4_s123.json new file mode 100644 index 0000000..ca9c224 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L4_s123.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.6485030268669127, + 0.7620264513015748, + 0.5550794436454773, + 0.48446305503845216, + 0.4474473762512207, + 0.4145241394519806, + 0.3731674439430237, + 0.3462322264909744, + 0.3150002685546875, + 0.2903987177371979, + 0.26924062194824216, + 0.23645675805807115, + 0.19837250323295594, + 0.18251929836273192, + 0.18135696101188659, + 0.15074845348596572, + 0.11649558038413525, + 0.09285263032913207, + 0.09888959465026856, + 0.08603223395347595, + 0.06269924810230731, + 0.046742530822753904, + 0.04394126555845142, + 0.031720275783538816, + 0.026758466351032257, + 0.023394752728939056, + 0.019812115742266177, + 0.01714037846326828, + 0.015127740550041199, + 0.013289766156673431, + 0.01228538273870945, + 0.012052093788981437, + 0.01026724858507514, + 0.00912058850824833, + 0.00848468861579895, + 0.00808774781525135, + 0.0072535969689488415, + 0.0068384970754385, + 0.0065235509559512135, + 0.00603497141264379, + 0.00568141555711627, + 0.005382864147424698, + 0.005199306092783808, + 0.00492797272503376, + 0.004693482632003724, + 0.004515291118621826, + 0.004368959432840347, + 0.004224653296917677, + 0.004046281071379781, + 0.003903051765821874, + 0.0037841040194034575, + 0.0036743775807321073, + 0.0035745090641081333, + 0.003476204214990139, + 0.0033944160878658296, + 0.0033240677129477265, + 0.0032490688487887384, + 0.0031777531236410143, + 0.0031181889969855545, + 0.0030590228272601963, + 0.003005053073912859, + 0.0029609910145401955, + 0.0029263747449964285, + 0.0028864801935851573, + 0.0028537690378725527, + 0.002823205841332674, + 0.002794191201776266, + 0.0027695251271128655, + 0.0027482865223661065, + 0.0027297443959861992, + 0.002714714765176177, + 0.0027010637482628224, + 0.0026901938542723655, + 0.0026811452329158782, + 0.00267406751178205, + 0.0026686322901397943, + 0.0026645718470215797, + 0.0026618377018719913, + 0.0026602591374889017, + 0.0026594095595180987 + ], + "train_acc": [ + 0.4485, + 0.7375, + 0.7923, + 0.8155, + 0.8282, + 0.8423, + 0.8571, + 0.8716, + 0.8789, + 0.89, + 0.9023, + 0.9173, + 0.9347, + 0.9407, + 0.9378, + 0.9517, + 0.9694, + 0.9813, + 0.9738, + 0.9822, + 0.9909, + 0.9955, + 0.9962, + 0.999, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.665, + 0.768, + 0.783, + 0.7825, + 0.783, + 0.794, + 0.787, + 0.7995, + 0.789, + 0.793, + 0.796, + 0.795, + 0.797, + 0.793, + 0.8005, + 0.7975, + 0.7935, + 0.7945, + 0.7905, + 0.791, + 0.796, + 0.7935, + 0.792, + 0.7925, + 0.7915, + 0.7905, + 0.788, + 0.793, + 0.788, + 0.789, + 0.79, + 0.7865, + 0.7905, + 0.788, + 0.788, + 0.788, + 0.789, + 0.7835, + 0.788, + 0.7865, + 0.7855, + 0.786, + 0.7855, + 0.787, + 0.786, + 0.786, + 0.7845, + 0.783, + 0.7845, + 0.784, + 0.7845, + 0.7855, + 0.7865, + 0.787, + 0.787, + 0.7865, + 0.7855, + 0.7865, + 0.786, + 0.786, + 0.787, + 0.7865, + 0.7855, + 0.7855, + 0.7865, + 0.786, + 0.786, + 0.787, + 0.7865, + 0.7865, + 0.7865, + 0.7865, + 0.786, + 0.786, + 0.786, + 0.786, + 0.786, + 0.786, + 0.786, + 0.786 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8610074520111084, + 0.8541143536567688, + 0.8321727514266968, + 0.7993940114974976 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999986886978149, + 0.9999971389770508, + 0.9999833703041077 + ], + "nudging": { + "0.001": [ + -0.061208125203847885, + -0.048201389610767365, + -0.027980640530586243, + -0.012230003252625465 + ], + "0.003": [ + -0.1748121678829193, + -0.13912320137023926, + -0.08209913969039917, + -0.03633902221918106 + ], + "0.01": [ + -0.492245614528656, + -0.40577083826065063, + -0.25304561853408813, + -0.117084801197052 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.244384346008301, + 1.6658402580261231, + 1.122510219192505, + 0.8736206652641296, + 0.7597340629577637, + 0.6988716425895691, + 0.6796123376846314, + 0.6578597159862518, + 0.6504812906265259, + 0.6735348190307617, + 0.6848076729774475, + 0.6858792749404907, + 0.6815519685745239, + 0.6852759933471679, + 0.7381223386764526, + 0.7184744972229004, + 0.6851869500160217, + 0.7189444061279296, + 0.7768984985351562, + 0.728230765914917, + 0.7206257730484009, + 0.7248182010650634, + 0.7614868778228759, + 0.7475514825820923, + 0.7896351873397827, + 0.7320388195991516, + 0.7398907415866852, + 0.7591429317474365, + 0.7483150260925293, + 0.7531359097480774, + 0.7545860271453857, + 0.8287553598403931, + 0.7648152837753296, + 0.771906914806366, + 0.7739894755363464, + 0.7938769704818726, + 0.7921385692596435, + 0.7916910556793213, + 0.8290664767742157, + 0.7879267723083496, + 0.8088912184476852, + 0.798623261642456, + 0.800121602153778, + 0.7935735574245453, + 0.7912781294822693, + 0.8075062445163727, + 0.7912796350479125, + 0.7820112172603607, + 0.787954132270813, + 0.7751848423004151, + 0.7753581878662109, + 0.7797921692848205, + 0.7868508473396302, + 0.7874830360412598, + 0.7783025196075439, + 0.7713859317302704, + 0.7603790185928345, + 0.7596016332626343, + 0.7514689461231232, + 0.7495272707939148, + 0.7444016216278077, + 0.7518722133636475, + 0.7441502522945405, + 0.7440012859344483, + 0.7390048952102661, + 0.739477536201477, + 0.7372656646728516, + 0.734891752910614, + 0.7310723892688751, + 0.728121880531311, + 0.7290601845741272, + 0.7274617082595826, + 0.7263197314262391, + 0.7242576133728027, + 0.7240845788955689, + 0.7236108267784118, + 0.7226919463157654, + 0.7218466625213623, + 0.7212368441104889, + 0.7210169439315796 + ], + "train_acc": [ + 0.1771, + 0.4329, + 0.5991, + 0.6748, + 0.7141, + 0.7359, + 0.7439, + 0.7517, + 0.7556, + 0.7448, + 0.7473, + 0.7457, + 0.7492, + 0.7504, + 0.7355, + 0.7435, + 0.7536, + 0.7422, + 0.7257, + 0.7412, + 0.743, + 0.7378, + 0.73, + 0.7369, + 0.7233, + 0.7438, + 0.7408, + 0.736, + 0.7384, + 0.7424, + 0.7353, + 0.7203, + 0.7372, + 0.7362, + 0.7369, + 0.7316, + 0.7361, + 0.7297, + 0.7274, + 0.7303, + 0.7311, + 0.7304, + 0.7304, + 0.7325, + 0.7398, + 0.7282, + 0.7346, + 0.7348, + 0.7357, + 0.7391, + 0.7357, + 0.7392, + 0.7322, + 0.7313, + 0.7375, + 0.736, + 0.7434, + 0.7412, + 0.7436, + 0.7417, + 0.7455, + 0.7431, + 0.745, + 0.7429, + 0.7461, + 0.7436, + 0.7447, + 0.7457, + 0.7459, + 0.748, + 0.7469, + 0.747, + 0.7516, + 0.7472, + 0.7476, + 0.7486, + 0.7501, + 0.7492, + 0.7493, + 0.7499 + ], + "test_acc": [ + 0.2955, + 0.537, + 0.639, + 0.6815, + 0.7015, + 0.713, + 0.7055, + 0.7105, + 0.694, + 0.6975, + 0.6945, + 0.7035, + 0.6945, + 0.637, + 0.695, + 0.6955, + 0.696, + 0.6375, + 0.6905, + 0.7005, + 0.7, + 0.697, + 0.6775, + 0.6955, + 0.691, + 0.6925, + 0.6785, + 0.6975, + 0.673, + 0.6935, + 0.6645, + 0.683, + 0.6875, + 0.679, + 0.6825, + 0.6765, + 0.6835, + 0.685, + 0.675, + 0.668, + 0.6735, + 0.6695, + 0.675, + 0.684, + 0.675, + 0.655, + 0.6665, + 0.662, + 0.6705, + 0.68, + 0.6675, + 0.6695, + 0.67, + 0.6585, + 0.6675, + 0.684, + 0.6655, + 0.669, + 0.678, + 0.677, + 0.68, + 0.674, + 0.675, + 0.677, + 0.676, + 0.675, + 0.6775, + 0.6795, + 0.6795, + 0.6785, + 0.682, + 0.6765, + 0.677, + 0.677, + 0.679, + 0.6825, + 0.68, + 0.6825, + 0.6825, + 0.682 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.008613362908363342, + 0.039367884397506714, + 0.07619941979646683, + 0.0912623256444931 + ], + "perturbation_rho": [ + -0.007624803110957146, + 0.008791688829660416, + 0.13103844225406647, + 0.12304534018039703 + ], + "nudging": { + "0.001": [ + 0.0005033417255617678, + -0.00032083888072520494, + -0.0003624922828748822, + -0.0004093719180673361 + ], + "0.003": [ + 0.0015421062707901, + -0.0009612979483790696, + -0.0010858506429940462, + -0.0012270397273823619 + ], + "0.01": [ + 0.005509334150701761, + -0.003195145633071661, + -0.0036095697432756424, + -0.004080047365278006 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.9460896991729737, + 1.02048748588562, + 0.6666754946231842, + 0.5997845686912536, + 0.6188174986362457, + 0.6522882369995118, + 0.702923126411438, + 0.7500360467910766, + 0.7784844299316406, + 0.8033292488098145, + 0.8202642150878906, + 0.8388009960174561, + 0.8644936017990112, + 0.8621721601486206, + 0.8420976860046386, + 0.8441275070190429, + 0.8518479587554931, + 0.8519618356704712, + 0.8573237961769103, + 0.8466630826950073, + 0.8620194334030151, + 0.872311677646637, + 0.8844598554611206, + 0.8897781185150146, + 0.8986350463867188, + 0.9107674625396729, + 0.9466994457244873, + 0.937027760887146, + 0.9229575090408325, + 0.9407363571166992, + 0.9483418552398681, + 0.9390256658554077, + 0.9403314212799072, + 0.9275119705200195, + 0.9150855571746827, + 0.9282055849075317, + 0.9308360594749451, + 0.9139512258529663, + 0.932987433052063, + 0.9214247636795044, + 0.9115749345779419, + 0.9211696140289307, + 0.9204665400505065, + 0.9168176971912384, + 0.9151170783996582, + 0.9214367736816407, + 0.9209912311553955, + 0.9118391947746277, + 0.9123114767074585, + 0.92075571975708, + 0.9061430419921875, + 0.9054867052078247, + 0.8936779041290284, + 0.9038484088897705, + 0.9033261381149292, + 0.8901759426116943, + 0.8972558786392212, + 0.8854782384872436, + 0.8886939645767212, + 0.8866627412796021, + 0.8855161333084106, + 0.8790008495330811, + 0.8785218952178955, + 0.87869962849617, + 0.8714217117309571, + 0.8715060123443603, + 0.8701889377593994, + 0.866465859413147, + 0.8666391557693481, + 0.8658134422302246, + 0.8639697080612183, + 0.8635739400863648, + 0.8614107210159302, + 0.8612226030349731, + 0.860686711883545, + 0.8599462993621826, + 0.8594131113052368, + 0.8590457509994507, + 0.8588304187774658, + 0.8587044605255127 + ], + "train_acc": [ + 0.3069, + 0.631, + 0.745, + 0.7677, + 0.7673, + 0.7585, + 0.7431, + 0.7285, + 0.7221, + 0.711, + 0.7088, + 0.6988, + 0.6899, + 0.6911, + 0.6931, + 0.6895, + 0.6821, + 0.6871, + 0.6841, + 0.6861, + 0.685, + 0.6788, + 0.681, + 0.6818, + 0.6734, + 0.6787, + 0.6673, + 0.668, + 0.6761, + 0.6688, + 0.6658, + 0.6669, + 0.6636, + 0.6717, + 0.6721, + 0.6659, + 0.6707, + 0.6746, + 0.6666, + 0.6708, + 0.6728, + 0.6736, + 0.6688, + 0.6701, + 0.6778, + 0.6721, + 0.6728, + 0.6757, + 0.6743, + 0.6693, + 0.6738, + 0.6802, + 0.6788, + 0.6783, + 0.677, + 0.6837, + 0.677, + 0.6814, + 0.6807, + 0.6834, + 0.6819, + 0.6821, + 0.683, + 0.6832, + 0.6838, + 0.6858, + 0.6834, + 0.6856, + 0.6852, + 0.6866, + 0.6868, + 0.687, + 0.6865, + 0.6889, + 0.6866, + 0.6866, + 0.6872, + 0.6871, + 0.6874, + 0.6876 + ], + "test_acc": [ + 0.522, + 0.686, + 0.7305, + 0.725, + 0.7175, + 0.7205, + 0.6945, + 0.692, + 0.6795, + 0.6775, + 0.6695, + 0.657, + 0.657, + 0.6595, + 0.662, + 0.6585, + 0.64, + 0.648, + 0.6455, + 0.6335, + 0.6255, + 0.6325, + 0.6285, + 0.6225, + 0.6235, + 0.62, + 0.6245, + 0.624, + 0.628, + 0.6205, + 0.6235, + 0.6265, + 0.6115, + 0.6265, + 0.6175, + 0.6205, + 0.6225, + 0.6235, + 0.621, + 0.628, + 0.628, + 0.6265, + 0.624, + 0.625, + 0.6195, + 0.6285, + 0.632, + 0.6255, + 0.623, + 0.6335, + 0.6115, + 0.6285, + 0.6285, + 0.632, + 0.626, + 0.6255, + 0.6265, + 0.628, + 0.6265, + 0.635, + 0.634, + 0.629, + 0.632, + 0.633, + 0.6325, + 0.6295, + 0.6325, + 0.632, + 0.636, + 0.6265, + 0.6335, + 0.6305, + 0.6315, + 0.634, + 0.6325, + 0.6295, + 0.631, + 0.6315, + 0.6305, + 0.6305 + ], + "state_pred_error": [ + 0.7793568561077118, + 0.3118565825223923, + 0.20360799007415772, + 0.17635596759319305, + 0.16408502702713013, + 0.1599778488636017, + 0.16032327077388764, + 0.16038565831184387, + 0.15718616988658904, + 0.1544437967300415, + 0.15516557030677797, + 0.15298717787265778, + 0.1504029001235962, + 0.14225415984392167, + 0.13645789219141005, + 0.12674877222776412, + 0.11889368886947632, + 0.11306129736900329, + 0.10757653653621674, + 0.10412199894189834, + 0.09768045265674591, + 0.09353149293661117, + 0.09076726281642913, + 0.08965073142051697, + 0.08674556518793106, + 0.08478252203464508, + 0.08322861977815628, + 0.08022089281082154, + 0.07800674693584442, + 0.07719690150022507, + 0.07593471973538399, + 0.07448869940042496, + 0.07324682236909866, + 0.07216234427690506, + 0.07157725752592087, + 0.06850798486471177, + 0.06744037889242173, + 0.06449633466005325, + 0.06279489300251007, + 0.060556842333078384, + 0.05860834004878998, + 0.056899214422702786, + 0.05532535774707794, + 0.053600450432300564, + 0.05157438895106316, + 0.05032240780591965, + 0.049856857776641846, + 0.04676780249476433, + 0.04521846981048584, + 0.04605005966424942, + 0.04307681691348553, + 0.04080379275083542, + 0.03996113035082817, + 0.03907167859077454, + 0.03806798343658447, + 0.036509654211997984, + 0.03606395539045334, + 0.03462406445145607, + 0.033797594472765924, + 0.03285828292965889, + 0.03233671128153801, + 0.03190984711050987, + 0.03070613071322441, + 0.030161835169792175, + 0.029909810426831246, + 0.02907034457921982, + 0.028224628251791, + 0.0277183085501194, + 0.028236137807369232, + 0.026743644657731058, + 0.026232112246751784, + 0.02569632602930069, + 0.025446067842841147, + 0.025489903342723847, + 0.024715018486976624, + 0.024953959307074548, + 0.02375960406959057, + 0.023399142843484877, + 0.023335635387897492, + 0.022959388345479965 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.5847928524017334, + 0.3501134514808655, + 0.17105570435523987, + 0.15130013227462769 + ], + "perturbation_rho": [ + 0.5387442708015442, + 0.3080189526081085, + 0.17941737174987793, + 0.20768526196479797 + ], + "nudging": { + "0.001": [ + -0.017160478979349136, + -0.0019152601016685367, + -0.0006842610309831798, + -0.0005889273015782237 + ], + "0.003": [ + -0.05081973969936371, + -0.00573696568608284, + -0.002051552291959524, + -0.0017658264841884375 + ], + "0.01": [ + -0.16164088249206543, + -0.01902196928858757, + -0.006823995150625706, + -0.005875328555703163 + ] + }, + "state_pred_error_per_layer": [ + 10103.57421875, + 1132.8861083984375, + 636.5859375, + 537.355224609375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2463353088378906, + 1.6628951946258546, + 1.1295779554367065, + 0.8783353236198426, + 0.7639653888702392, + 0.7047067642211914, + 0.6768319065093994, + 0.68182680311203, + 0.6602677572250366, + 0.6724473495483398, + 0.6855211343765258, + 0.6726006875991821, + 0.7052314999580384, + 0.7074386056900024, + 0.7129003076553345, + 0.7024357145309448, + 0.7227834997177124, + 0.7313135984420777, + 0.7373644021987915, + 0.7224393496513367, + 0.7700278699874878, + 0.7357270636558533, + 0.8003145306587219, + 0.8743129741668701, + 0.9247114940643311, + 0.9404189452171325, + 0.915456344985962, + 0.9703503519058227, + 1.0076803161621093, + 1.0813798515319824, + 1.1350637050628662, + 1.1440386219978333, + 1.1056740509033203, + 1.166263697052002, + 1.2001307735443114, + 1.227112310028076, + 1.2333890773773193, + 1.3325600746154784, + 1.314357687187195, + 1.3420076190948487, + 1.3500135983467103, + 1.434612279510498, + 1.4547458221435547, + 1.5096508449554444, + 1.5078580778121948, + 1.591580895614624, + 1.496910350227356, + 1.450836026954651, + 1.4903024017333983, + 1.4724365951538085, + 1.4564998203277588, + 1.4475345220565796, + 1.4865602378845215, + 1.4574821096420287, + 1.4633408412933349, + 1.4454458599090576, + 1.4607100917816163, + 1.4355232284545898, + 1.4373876348495482, + 1.447427599143982, + 1.4473964019775392, + 1.4408766548156737, + 1.4291354480743408, + 1.4133699844360352, + 1.426364598274231, + 1.4254159889221192, + 1.4199595382690429, + 1.422476571083069, + 1.4094791442871093, + 1.4061016763687133, + 1.4055855443954468, + 1.4035878326416016, + 1.402430838394165, + 1.3991222805023193, + 1.3999051294326783, + 1.3970819057464599, + 1.3952340185165406, + 1.3938718709945679, + 1.3935380973815918, + 1.3929829921722412 + ], + "train_acc": [ + 0.1808, + 0.4377, + 0.5916, + 0.6766, + 0.716, + 0.7362, + 0.7476, + 0.7486, + 0.7527, + 0.7524, + 0.7446, + 0.7487, + 0.7415, + 0.7441, + 0.7413, + 0.7448, + 0.7382, + 0.7389, + 0.7355, + 0.743, + 0.7278, + 0.7372, + 0.7243, + 0.7026, + 0.6916, + 0.6858, + 0.6794, + 0.665, + 0.6553, + 0.6355, + 0.6132, + 0.6106, + 0.6108, + 0.5876, + 0.581, + 0.5631, + 0.5618, + 0.5438, + 0.5425, + 0.5328, + 0.5346, + 0.5133, + 0.5039, + 0.4927, + 0.4913, + 0.4756, + 0.4905, + 0.4983, + 0.4826, + 0.4915, + 0.4942, + 0.4966, + 0.4945, + 0.4911, + 0.4899, + 0.4916, + 0.4894, + 0.4955, + 0.4961, + 0.4848, + 0.4874, + 0.4913, + 0.4996, + 0.5021, + 0.5002, + 0.4975, + 0.496, + 0.4951, + 0.4993, + 0.4999, + 0.501, + 0.5021, + 0.5, + 0.5032, + 0.5005, + 0.5015, + 0.505, + 0.5026, + 0.5038, + 0.504 + ], + "test_acc": [ + 0.286, + 0.5365, + 0.6435, + 0.684, + 0.6895, + 0.717, + 0.7055, + 0.7145, + 0.706, + 0.695, + 0.702, + 0.6775, + 0.695, + 0.6835, + 0.703, + 0.6965, + 0.6885, + 0.6755, + 0.6835, + 0.6775, + 0.684, + 0.689, + 0.667, + 0.6625, + 0.64, + 0.649, + 0.636, + 0.627, + 0.6065, + 0.592, + 0.5795, + 0.593, + 0.5605, + 0.571, + 0.523, + 0.5305, + 0.503, + 0.5135, + 0.521, + 0.518, + 0.4995, + 0.491, + 0.4555, + 0.4515, + 0.452, + 0.4625, + 0.509, + 0.475, + 0.497, + 0.4865, + 0.4855, + 0.476, + 0.4865, + 0.488, + 0.4805, + 0.4825, + 0.499, + 0.4955, + 0.487, + 0.497, + 0.4805, + 0.4785, + 0.4875, + 0.481, + 0.4945, + 0.4895, + 0.4905, + 0.4995, + 0.489, + 0.4975, + 0.496, + 0.5045, + 0.4955, + 0.4995, + 0.507, + 0.5015, + 0.5025, + 0.5015, + 0.5025, + 0.502 + ], + "value_loss": [ + 2.911659792137146, + 0.8996274837493896, + 0.7878434350967407, + 0.833689813041687, + 0.8365230781555176, + 0.8657572345733643, + 0.908541974067688, + 0.8480338787078857, + 0.8042462064743042, + 0.8133011533737182, + 0.8212067371368408, + 0.7808171772003174, + 0.8961290629386902, + 0.8653587206840515, + 0.8886142436981201, + 0.8761268617630005, + 0.884904754447937, + 0.8448927827835083, + 0.7980134412765503, + 0.6888658224105835, + 0.7473662647247314, + 0.65811010055542, + 0.7839856298923492, + 0.880495791387558, + 0.9084092624664306, + 0.8530173231601715, + 0.7625637437820435, + 1.0123852161407472, + 0.7736059984683991, + 0.8328087013244629, + 0.8140958374023437, + 0.8670786144256591, + 0.7377396880626679, + 0.7568698725700378, + 0.8068661364555358, + 0.7318669836044311, + 0.8281291389465332, + 0.8503475652694702, + 0.7644144630432129, + 0.7720902391433716, + 0.7514402165412902, + 0.9521960460662842, + 0.8458146006584167, + 0.891452622795105, + 0.8914439929962158, + 1.057370574760437, + 0.8315652293205261, + 0.7571992207050323, + 0.7947545112609863, + 0.7905970148086547, + 0.7850572494506836, + 0.7695828517913819, + 0.7652045320510864, + 0.7695798728942871, + 0.7152940567016601, + 0.6907661506652832, + 0.7097496647834778, + 0.6639136574745178, + 0.6959176488876343, + 0.6530081424713134, + 0.6744708864212036, + 0.7077253155708313, + 0.6539039137840271, + 0.6366007213592529, + 0.6607606963157654, + 0.6579708410263061, + 0.6630125551223754, + 0.6548057119369507, + 0.6407008107185364, + 0.6340464912891388, + 0.6079182727813721, + 0.6078491495132446, + 0.597375852394104, + 0.5983859522819519, + 0.5880393584251404, + 0.5987486978530884, + 0.5848587021827698, + 0.5729552617073059, + 0.5823435966968536, + 0.5799021621704101 + ], + "term_loss": [ + 1.6125608334541321, + 0.3840840371608734, + 0.48750869870185853, + 0.5739233162879944, + 0.583460131931305, + 0.611264087486267, + 0.6456350657463074, + 0.5810235898971557, + 0.5565879321813584, + 0.5670145713806153, + 0.5748216830253601, + 0.5389469696044922, + 0.6412990503311157, + 0.611316840839386, + 0.6310292453765869, + 0.6179455483436584, + 0.6184575637817383, + 0.5764782516479492, + 0.527465288066864, + 0.41762967494726183, + 0.4613805497169495, + 0.3795637038946152, + 0.48266787681579587, + 0.5520704276800156, + 0.5708891902923584, + 0.5130272762060165, + 0.4277731086730957, + 0.6448732345700264, + 0.4158886254787445, + 0.4512560091495514, + 0.42728045053482056, + 0.47845339875221254, + 0.36093939908742906, + 0.3623666671514511, + 0.3938521237373352, + 0.30772404375076295, + 0.38484077141284945, + 0.3804583154678345, + 0.3062211089849472, + 0.31390601534843443, + 0.29931726670265196, + 0.46709287190437315, + 0.3718694251537323, + 0.4082421121120453, + 0.4114425645828247, + 0.5396676266670227, + 0.3574508339881897, + 0.30055283591747284, + 0.3261272901535034, + 0.32341902742385864, + 0.31227895908355713, + 0.3047007039070129, + 0.2977863587141037, + 0.2951382811933756, + 0.25380487928390505, + 0.2323027446269989, + 0.2462068591594696, + 0.21350320754051208, + 0.23597208461761474, + 0.19863421688079835, + 0.21512561297416688, + 0.24010928027629852, + 0.19815546962618827, + 0.1846117480993271, + 0.20065309627056122, + 0.20074695563316344, + 0.20255926916599273, + 0.19159356966018676, + 0.183841939163208, + 0.17822789697647096, + 0.1608728482246399, + 0.16112907934188841, + 0.15298778686523437, + 0.1534871971011162, + 0.14573802747726441, + 0.1528574206352234, + 0.14455881164073944, + 0.13546503726243972, + 0.1438804125547409, + 0.1424343505382538 + ], + "bridge_loss": [ + 0.9979561433154623, + 0.1923502779841423, + 0.03369875200092792, + 0.010089649520814419, + 0.017109860217571257, + 0.026464090970158578, + 0.03847438667416572, + 0.03879255889952183, + 0.022746800869703293, + 0.015745803397893905, + 0.012550205962359905, + 0.011100650027394295, + 0.01492225005030632, + 0.013557523837685584, + 0.015981767566502093, + 0.017492658911645413, + 0.016710551595687868, + 0.020652121636271475, + 0.021984567886590957, + 0.027721646511554718, + 0.02861447253227234, + 0.029199581980705262, + 0.036015259969234464, + 0.0433954286724329, + 0.04418629710674286, + 0.04494130345731974, + 0.04159592981934548, + 0.05838559107780456, + 0.03970318132787943, + 0.043886014127731326, + 0.03409061102867127, + 0.03418889250457287, + 0.02945999857187271, + 0.029395705950260163, + 0.04250650172829628, + 0.045237154906988146, + 0.06208780016303062, + 0.06760461230278016, + 0.05713116898536682, + 0.05177076178789139, + 0.0454777575224638, + 0.06035384655445814, + 0.045845873348414896, + 0.04476448094546795, + 0.04259207730293274, + 0.0661571847498417, + 0.04104372414797545, + 0.03152658507525921, + 0.03633371991813183, + 0.04221771730184555, + 0.048432806301116946, + 0.043537792390584945, + 0.04238384801149368, + 0.05086035580188036, + 0.0377189158320427, + 0.039344362449645995, + 0.04182275475263596, + 0.03353696493506431, + 0.042798616722226145, + 0.03527422734498978, + 0.04015132822394371, + 0.049883893620967866, + 0.040538436710834506, + 0.04075850441455841, + 0.04582972603738308, + 0.044166031336784366, + 0.0475761167883873, + 0.048364759862422946, + 0.04714719864577055, + 0.04529150511026382, + 0.03810691610574722, + 0.03794098879098892, + 0.03586618504524231, + 0.03720670894086361, + 0.03536857309937477, + 0.038663346046209336, + 0.035329807829856875, + 0.031151742255687714, + 0.03266222105920315, + 0.03182844363451004 + ], + "tgrad_loss": [ + 0.3011428183555603, + 0.32319316704273227, + 0.2666359860420227, + 0.24967685322761535, + 0.23595308814048768, + 0.22802906050682067, + 0.224432515001297, + 0.22821773476600646, + 0.22491148040294648, + 0.23054077467918396, + 0.2338348491191864, + 0.2307695638656616, + 0.23990776176452636, + 0.24048435621261596, + 0.24160322992801667, + 0.24068865609169007, + 0.24973663783073424, + 0.24776240782737732, + 0.24856358866691589, + 0.243514501452446, + 0.2573712419271469, + 0.24934680943489074, + 0.26530250334739686, + 0.28502992734909055, + 0.2933337756156921, + 0.2950487338542938, + 0.293194704246521, + 0.3091263904094696, + 0.31801419608592985, + 0.33766667613983153, + 0.3527247706413269, + 0.35443632416725157, + 0.3473402920246124, + 0.36510749626159666, + 0.3705075058937073, + 0.3789057858467102, + 0.3812005734443665, + 0.4022846411705017, + 0.4010621870994568, + 0.40641346549987795, + 0.4066451931238174, + 0.42474932079315186, + 0.4280993054389954, + 0.43844602947235106, + 0.4374093544960022, + 0.45154575901031496, + 0.43307066822052004, + 0.4251198007583618, + 0.43229349727630617, + 0.4249602687358856, + 0.42434548816680906, + 0.42134435329437253, + 0.42503432445526124, + 0.42358124074935916, + 0.4237702589035034, + 0.4191190438270569, + 0.4217200475215912, + 0.4168734808921814, + 0.4171469500541687, + 0.4190996997833252, + 0.41919394392967224, + 0.4177321403503418, + 0.4152100051879883, + 0.4112304693222046, + 0.4142778721809387, + 0.41305785455703736, + 0.41287716846466066, + 0.41484738330841064, + 0.4097116720199585, + 0.41052708587646486, + 0.4089385024547577, + 0.40877908191680906, + 0.4085218800544739, + 0.4076920410633087, + 0.40693275775909427, + 0.4072279285430908, + 0.40497008571624754, + 0.4063384813308716, + 0.4058009665966034, + 0.4056393639087677 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.1632033884525299, + 0.4602273404598236, + 0.4661305546760559, + 0.47359973192214966 + ], + "perturbation_rho": [ + 0.20324298739433289, + 0.5429707169532776, + 0.5653814077377319, + 0.5405630469322205 + ], + "nudging": { + "0.001": [ + -0.004459770396351814, + -0.0037539242766797543, + -0.003678151872009039, + -0.0036794268526136875 + ], + "0.003": [ + -0.013349814340472221, + -0.011245567351579666, + -0.011020736768841743, + -0.011023622006177902 + ], + "0.01": [ + -0.04415123537182808, + -0.037312425673007965, + -0.03657253086566925, + -0.036583565175533295 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L4_s42.json b/results/synth_ladder_v2_hi/synth_a1.0_L4_s42.json new file mode 100644 index 0000000..fa96d0f --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L4_s42.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7025919662475586, + 0.7795055631637573, + 0.5677913279533386, + 0.5046968063354492, + 0.4608808174133301, + 0.4361949195861816, + 0.40271503200531006, + 0.362711107635498, + 0.33460533142089843, + 0.31974913997650145, + 0.28304471197128295, + 0.26439799995422364, + 0.23186020562648774, + 0.20645251512527465, + 0.1854053668022156, + 0.1883622447013855, + 0.1564298264503479, + 0.13204074223041534, + 0.10547249886989593, + 0.10665607880353928, + 0.08874446132183075, + 0.07009058383703232, + 0.05733880244493485, + 0.043911282253265384, + 0.03912401325702667, + 0.03387549254000187, + 0.02815464017689228, + 0.02348671322837472, + 0.019660550662875174, + 0.017395093828439713, + 0.015793408343195914, + 0.014198495180904866, + 0.012760633385181427, + 0.0120456358730793, + 0.011391607284545899, + 0.010471956431865692, + 0.009712862337380647, + 0.008671599093079567, + 0.008101777815818787, + 0.007641905176639557, + 0.0070717818230390545, + 0.006704615060985088, + 0.006303096756339073, + 0.006046279940009117, + 0.00574500061199069, + 0.005459648424386978, + 0.005366687068715691, + 0.005106282755732537, + 0.0048983019106090065, + 0.004707646728307009, + 0.004541327039897442, + 0.004420189782977104, + 0.004278477553278208, + 0.004159028781205416, + 0.0040608737718313935, + 0.003950595530960709, + 0.003842289924249053, + 0.0037566692493855953, + 0.003692386071756482, + 0.003627489294856787, + 0.0035626379638910295, + 0.003507125860080123, + 0.0034519337229430677, + 0.0034051366314291954, + 0.0033655297085642814, + 0.003327148025482893, + 0.0032939382158219815, + 0.003263653342053294, + 0.0032373780891299248, + 0.0032149843648076057, + 0.0031963624887168408, + 0.0031805660903453828, + 0.003166854461468756, + 0.0031557184338569643, + 0.003146645697206259, + 0.003140145140886307, + 0.0031351621329784394, + 0.0031318566258996725, + 0.0031298461467027666, + 0.0031287998259067534 + ], + "train_acc": [ + 0.4243, + 0.7371, + 0.7887, + 0.8026, + 0.82, + 0.832, + 0.8453, + 0.8624, + 0.8743, + 0.881, + 0.8937, + 0.907, + 0.9186, + 0.9333, + 0.9397, + 0.9326, + 0.9481, + 0.9624, + 0.9761, + 0.971, + 0.9793, + 0.9886, + 0.9935, + 0.9975, + 0.9981, + 0.9988, + 0.9996, + 0.9999, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.6665, + 0.765, + 0.759, + 0.7695, + 0.7725, + 0.7735, + 0.777, + 0.783, + 0.7815, + 0.7765, + 0.7895, + 0.781, + 0.7895, + 0.785, + 0.7865, + 0.786, + 0.789, + 0.7905, + 0.792, + 0.7855, + 0.7905, + 0.792, + 0.7955, + 0.7895, + 0.7915, + 0.793, + 0.7905, + 0.79, + 0.791, + 0.788, + 0.7935, + 0.792, + 0.79, + 0.7925, + 0.792, + 0.79, + 0.7855, + 0.791, + 0.788, + 0.789, + 0.79, + 0.7885, + 0.7895, + 0.7895, + 0.7915, + 0.7895, + 0.792, + 0.7905, + 0.7915, + 0.789, + 0.7885, + 0.789, + 0.789, + 0.7885, + 0.7885, + 0.788, + 0.7875, + 0.7875, + 0.787, + 0.7875, + 0.787, + 0.7875, + 0.7875, + 0.7865, + 0.787, + 0.7875, + 0.7865, + 0.7875, + 0.787, + 0.788, + 0.7875, + 0.788, + 0.7875, + 0.7875, + 0.7875, + 0.7875, + 0.7875, + 0.7875, + 0.7875, + 0.7875 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8902335166931152, + 0.8886877298355103, + 0.8827626705169678, + 0.8678592443466187 + ], + "perturbation_rho": [ + 0.9999993443489075, + 0.9999990463256836, + 0.9999973773956299, + 0.9999867081642151 + ], + "nudging": { + "0.001": [ + -0.05980858951807022, + -0.047062948346138, + -0.02711305394768715, + -0.011864672414958477 + ], + "0.003": [ + -0.17234034836292267, + -0.13683676719665527, + -0.07991128414869308, + -0.035327523946762085 + ], + "0.01": [ + -0.49256381392478943, + -0.4056996703147888, + -0.2497977763414383, + -0.11465895175933838 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2805367691040037, + 1.6415521514892577, + 1.0540750062942505, + 0.8191366905212403, + 0.720514697265625, + 0.6729900581359863, + 0.6483235983848572, + 0.6373948863983154, + 0.6437193074226379, + 0.6749926948547363, + 0.6499340630531311, + 0.6586005910873413, + 0.6826166941642762, + 0.6718164960861206, + 0.675482904624939, + 0.6877107390403747, + 0.7121948526382447, + 0.7166374977111817, + 0.7339209732055664, + 0.7540338826179505, + 0.7380614143371582, + 0.760818413734436, + 0.7298965669393539, + 0.745001176738739, + 0.7385975076675415, + 0.7762571002960205, + 0.7398200908660889, + 0.7519381859302521, + 0.7321780063629151, + 0.7773449554443359, + 0.84277982339859, + 0.784512722492218, + 0.7535494892120361, + 0.7960302189826965, + 0.7641264217376709, + 0.8023091213226319, + 0.7795416162490845, + 0.7875791462898254, + 0.760817495918274, + 0.7777634320259095, + 0.752805848312378, + 0.7481458770751953, + 0.7761073146820069, + 0.8001040952682495, + 0.7761383037567139, + 0.7439687911987305, + 0.7440207496643066, + 0.744167911529541, + 0.7687978046417236, + 0.7441968929290772, + 0.72595838098526, + 0.7307925410270691, + 0.7274970026016235, + 0.7375823734283448, + 0.7422896279573441, + 0.7248193643569947, + 0.7262517263412476, + 0.7219201570510865, + 0.7164952000141144, + 0.7161007792472839, + 0.7057839481353759, + 0.7116451340675354, + 0.708030333328247, + 0.711191120147705, + 0.7084746857643127, + 0.7060219361305237, + 0.7035173624038696, + 0.7019980341911316, + 0.6986017496109008, + 0.6976793788909912, + 0.6944869701385498, + 0.6933993984222412, + 0.6916578367948533, + 0.6894085638046265, + 0.689437709903717, + 0.68888226146698, + 0.6875977687835694, + 0.6869268341064453, + 0.6862103477478028, + 0.6858732402801514 + ], + "train_acc": [ + 0.1637, + 0.4532, + 0.6262, + 0.6939, + 0.7262, + 0.7438, + 0.7515, + 0.7572, + 0.7574, + 0.7472, + 0.7561, + 0.7538, + 0.7522, + 0.7545, + 0.7545, + 0.7499, + 0.7451, + 0.7464, + 0.7449, + 0.7378, + 0.7428, + 0.7358, + 0.7379, + 0.7375, + 0.7425, + 0.7304, + 0.7404, + 0.7376, + 0.741, + 0.7343, + 0.718, + 0.725, + 0.7363, + 0.7261, + 0.7303, + 0.7238, + 0.7288, + 0.7261, + 0.7343, + 0.7289, + 0.7322, + 0.7365, + 0.728, + 0.7232, + 0.7339, + 0.7365, + 0.7335, + 0.7383, + 0.7344, + 0.7359, + 0.7378, + 0.7373, + 0.7406, + 0.7376, + 0.7332, + 0.7401, + 0.7417, + 0.7442, + 0.745, + 0.7417, + 0.7427, + 0.7461, + 0.7451, + 0.7423, + 0.7436, + 0.7439, + 0.7452, + 0.7474, + 0.7481, + 0.7489, + 0.7489, + 0.7508, + 0.7484, + 0.7516, + 0.7485, + 0.7492, + 0.7498, + 0.7506, + 0.7498, + 0.7502 + ], + "test_acc": [ + 0.2825, + 0.546, + 0.6555, + 0.684, + 0.71, + 0.713, + 0.7245, + 0.723, + 0.7205, + 0.7245, + 0.7095, + 0.703, + 0.7015, + 0.709, + 0.714, + 0.699, + 0.712, + 0.692, + 0.681, + 0.701, + 0.69, + 0.703, + 0.6915, + 0.692, + 0.677, + 0.6985, + 0.6885, + 0.699, + 0.6855, + 0.6565, + 0.679, + 0.704, + 0.678, + 0.694, + 0.679, + 0.6945, + 0.6745, + 0.6855, + 0.69, + 0.676, + 0.701, + 0.6765, + 0.6765, + 0.685, + 0.699, + 0.6915, + 0.6885, + 0.686, + 0.696, + 0.695, + 0.6985, + 0.701, + 0.6925, + 0.6985, + 0.6985, + 0.694, + 0.701, + 0.705, + 0.695, + 0.7085, + 0.6975, + 0.697, + 0.697, + 0.705, + 0.707, + 0.707, + 0.705, + 0.6975, + 0.701, + 0.6995, + 0.707, + 0.7065, + 0.707, + 0.7055, + 0.706, + 0.705, + 0.7055, + 0.706, + 0.7065, + 0.7075 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.026215966790914536, + 0.05776425451040268, + 0.07666948437690735, + 0.08296040445566177 + ], + "perturbation_rho": [ + 0.04998716711997986, + 0.09949691593647003, + 0.049676910042762756, + 0.012540214695036411 + ], + "nudging": { + "0.001": [ + -0.0008748910040594637, + -0.00038322899490594864, + -0.0003354061918798834, + -0.00033481494756415486 + ], + "0.003": [ + -0.0026117637753486633, + -0.0011494184145703912, + -0.001006446429528296, + -0.0010040509514510632 + ], + "0.01": [ + -0.008544353768229485, + -0.0038241599686443806, + -0.0033461027778685093, + -0.003339859191328287 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.007753798675537, + 1.0622356224060059, + 0.69143017578125, + 0.6239932517051697, + 0.6335793426036834, + 0.674501599407196, + 0.7154178378105164, + 0.7578475559234619, + 0.785428904247284, + 0.7806968556404114, + 0.79781559009552, + 0.8039525414466858, + 0.8008891497612, + 0.796566740322113, + 0.8047402942657471, + 0.8085960758209229, + 0.8045371704101563, + 0.809913685798645, + 0.8109244365692139, + 0.822509958267212, + 0.8186556421279907, + 0.8206361956596374, + 0.8208891757965088, + 0.8155913323402405, + 0.8365351364135742, + 0.8417284649848938, + 0.8479398907661438, + 0.8543629753112792, + 0.8356543054580688, + 0.8371729434967041, + 0.849026389503479, + 0.8420911851882935, + 0.8437719006538391, + 0.8468664903640747, + 0.8579279032707214, + 0.8493580184936523, + 0.8420408730506896, + 0.8348710892677307, + 0.8287518863677978, + 0.8248524719238282, + 0.8344216783523559, + 0.8304245887756347, + 0.8186835735321045, + 0.8134511299133301, + 0.8171366225242614, + 0.8118591390132904, + 0.7982140255451202, + 0.7970935890197753, + 0.8015208456993103, + 0.7964595051288604, + 0.7967358273506164, + 0.8013176858901978, + 0.7927464712142944, + 0.7874492823600769, + 0.7888918502807617, + 0.8002659862518311, + 0.7785984733581542, + 0.7800743109226227, + 0.7750258285522461, + 0.7772714210510254, + 0.7739788970470428, + 0.7726497331619263, + 0.7723067853927612, + 0.7742076810836792, + 0.7713943565368653, + 0.769815579032898, + 0.7686135004043579, + 0.7663217308044433, + 0.7666474376678467, + 0.7653638418197631, + 0.7640022378921508, + 0.7641778549194336, + 0.7632465696334839, + 0.7620238209724426, + 0.7611095140457154, + 0.7607381951332093, + 0.7604392482757568, + 0.7600468851089478, + 0.7597837959289551, + 0.7596640625 + ], + "train_acc": [ + 0.282, + 0.6144, + 0.7404, + 0.7629, + 0.7625, + 0.7517, + 0.7434, + 0.7292, + 0.7245, + 0.7223, + 0.714, + 0.7117, + 0.7112, + 0.7079, + 0.7049, + 0.7033, + 0.7077, + 0.7012, + 0.6989, + 0.6952, + 0.6962, + 0.6999, + 0.698, + 0.6975, + 0.6959, + 0.6925, + 0.6911, + 0.6866, + 0.6941, + 0.6978, + 0.6929, + 0.6954, + 0.6926, + 0.6886, + 0.6905, + 0.6921, + 0.6969, + 0.6961, + 0.698, + 0.6998, + 0.694, + 0.6983, + 0.6999, + 0.7023, + 0.7011, + 0.7013, + 0.7085, + 0.7072, + 0.7043, + 0.7048, + 0.7031, + 0.7082, + 0.7094, + 0.7102, + 0.7084, + 0.7038, + 0.7109, + 0.7132, + 0.7136, + 0.7117, + 0.7123, + 0.715, + 0.7131, + 0.7154, + 0.7138, + 0.7148, + 0.7167, + 0.7178, + 0.7177, + 0.7184, + 0.7179, + 0.7185, + 0.7178, + 0.7189, + 0.7205, + 0.72, + 0.7207, + 0.7208, + 0.7205, + 0.7206 + ], + "test_acc": [ + 0.498, + 0.672, + 0.737, + 0.731, + 0.728, + 0.7105, + 0.698, + 0.7015, + 0.681, + 0.675, + 0.678, + 0.6765, + 0.68, + 0.6555, + 0.6635, + 0.6635, + 0.67, + 0.656, + 0.6685, + 0.662, + 0.662, + 0.667, + 0.671, + 0.6555, + 0.651, + 0.644, + 0.6565, + 0.641, + 0.6445, + 0.651, + 0.6485, + 0.653, + 0.6455, + 0.6365, + 0.652, + 0.6585, + 0.6445, + 0.654, + 0.6615, + 0.6605, + 0.6585, + 0.6565, + 0.6545, + 0.662, + 0.663, + 0.6595, + 0.664, + 0.6625, + 0.6565, + 0.662, + 0.645, + 0.6535, + 0.67, + 0.6685, + 0.67, + 0.6605, + 0.6615, + 0.667, + 0.668, + 0.668, + 0.662, + 0.664, + 0.6615, + 0.664, + 0.6595, + 0.666, + 0.6635, + 0.6625, + 0.66, + 0.6635, + 0.661, + 0.666, + 0.6635, + 0.664, + 0.665, + 0.663, + 0.6625, + 0.662, + 0.662, + 0.6625 + ], + "state_pred_error": [ + 0.7827486207008362, + 0.31122149848937986, + 0.20405255806446077, + 0.1785473354101181, + 0.16711481635570527, + 0.1693767168521881, + 0.1746032564878464, + 0.17555798501968384, + 0.17862845754623413, + 0.17690453650951385, + 0.17425159878730773, + 0.16519148182868956, + 0.15421706743240357, + 0.1434457843542099, + 0.13330313999652862, + 0.12446385669708251, + 0.11768645570278168, + 0.11164422111511231, + 0.10441685699224472, + 0.10158415093421937, + 0.09517893229722976, + 0.09017173348665238, + 0.08772520488500594, + 0.08342612677812576, + 0.08160507142543792, + 0.0786071489572525, + 0.07716105241775513, + 0.07485365310907365, + 0.07317224496603011, + 0.07141792141199112, + 0.06897861013412476, + 0.06749274585247039, + 0.06598065556287766, + 0.06508338479995728, + 0.06346238186359406, + 0.06226500202417374, + 0.060549116563796995, + 0.06055630297660828, + 0.05884025704264641, + 0.05801897701025009, + 0.05669505831003189, + 0.055699084228277206, + 0.05481746277809143, + 0.05341801876425743, + 0.05295276014208793, + 0.05195536425709724, + 0.050695552802085875, + 0.050078516376018525, + 0.04883329871296883, + 0.048564964467287065, + 0.047450669956207274, + 0.04657022901773453, + 0.04643023025393486, + 0.04527272279858589, + 0.045131425642967224, + 0.04429114927649498, + 0.04370682866573334, + 0.04249126278758049, + 0.04206086259484291, + 0.04127250732779503, + 0.04066784818768501, + 0.04100679843425751, + 0.03984400656223297, + 0.039111772429943084, + 0.03872905417084694, + 0.03760358746051788, + 0.037533375626802444, + 0.03731676592230797, + 0.03687030100226402, + 0.03601930988430977, + 0.0353958393573761, + 0.035445755779743196, + 0.03499365764260292, + 0.0341682822406292, + 0.03401557675898075, + 0.03333400482535362, + 0.033034325659275054, + 0.032180927592515944, + 0.03222785183191299, + 0.031816003906726835 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6404350996017456, + 0.4214136302471161, + 0.18068093061447144, + 0.15130802989006042 + ], + "perturbation_rho": [ + 0.5499319434165955, + 0.368219256401062, + 0.21391229331493378, + 0.1835726499557495 + ], + "nudging": { + "0.001": [ + -0.020009398460388184, + -0.0023713181726634502, + -0.0006903400644659996, + -0.0005570724606513977 + ], + "0.003": [ + -0.05908045917749405, + -0.007099837996065617, + -0.00206951005384326, + -0.0016702794237062335 + ], + "0.01": [ + -0.18587297201156616, + -0.0235043503344059, + -0.00688221026211977, + -0.005556063260883093 + ] + }, + "state_pred_error_per_layer": [ + 10066.107421875, + 1273.9140625, + 696.594482421875, + 612.3014526367188 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2802715728759764, + 1.6388436302185059, + 1.053798963165283, + 0.8138567586898804, + 0.716612920665741, + 0.6672540647506714, + 0.6528224432945251, + 0.6466248464584351, + 0.6415921350479126, + 0.664950927734375, + 0.6627229480743408, + 0.685637841796875, + 0.6988411318778992, + 0.6790707836151123, + 0.6934760662078857, + 0.7018385746002197, + 0.7308993638992309, + 0.719111060333252, + 0.8150796144485474, + 0.7402855098724366, + 0.7425731256484985, + 0.7482444780349732, + 0.7917413208007813, + 0.8034436722755433, + 0.847063459777832, + 0.8898068056106567, + 0.8742546170234681, + 0.8931990461349487, + 0.979162103843689, + 1.0233091241836547, + 1.0456207696914672, + 1.088154921579361, + 1.0924738161087035, + 1.1280992248535155, + 1.14695910320282, + 1.1968199752807618, + 1.1404859788894652, + 1.1790920137405396, + 1.112723836708069, + 1.1557879085540772, + 1.1529123931884766, + 1.1391218341827392, + 1.1959625034332275, + 1.1819099002838134, + 1.1729866676330567, + 1.164624983406067, + 1.1626405437469483, + 1.199929854774475, + 1.2018864694595337, + 1.1927341426849365, + 1.1924728622436525, + 1.1670917442321778, + 1.1843838939666749, + 1.188602296257019, + 1.181069985961914, + 1.1662905952453613, + 1.1854075830459594, + 1.1842269680976867, + 1.175111684703827, + 1.1727143672943114, + 1.1815870304107665, + 1.1729837955474853, + 1.1755547443389893, + 1.1800736003875731, + 1.1686390336036683, + 1.164267241859436, + 1.164349419593811, + 1.1732585205078125, + 1.1630031745910645, + 1.1624063230514525, + 1.1623846691131592, + 1.159834877204895, + 1.1611515955924987, + 1.1584980821609496, + 1.1587893016815185, + 1.157638655281067, + 1.1562239799499512, + 1.1557205964565278, + 1.1550566940307616, + 1.1548286571502686 + ], + "train_acc": [ + 0.1636, + 0.4547, + 0.6239, + 0.6951, + 0.7301, + 0.7466, + 0.7497, + 0.7534, + 0.7585, + 0.7523, + 0.7578, + 0.7492, + 0.7447, + 0.7551, + 0.7497, + 0.7441, + 0.7418, + 0.7432, + 0.7177, + 0.7372, + 0.7402, + 0.7386, + 0.7254, + 0.714, + 0.6966, + 0.6781, + 0.6838, + 0.6829, + 0.6653, + 0.6634, + 0.6556, + 0.6476, + 0.6373, + 0.6204, + 0.6179, + 0.6068, + 0.6152, + 0.6036, + 0.6106, + 0.5958, + 0.5993, + 0.5934, + 0.5778, + 0.5834, + 0.5835, + 0.5844, + 0.582, + 0.5718, + 0.5675, + 0.5709, + 0.5721, + 0.5806, + 0.5738, + 0.5671, + 0.5744, + 0.5787, + 0.5667, + 0.5667, + 0.5721, + 0.5704, + 0.5729, + 0.571, + 0.5721, + 0.566, + 0.5693, + 0.5734, + 0.5722, + 0.5718, + 0.5726, + 0.5753, + 0.5723, + 0.5739, + 0.5712, + 0.5708, + 0.5741, + 0.5722, + 0.5735, + 0.573, + 0.5736, + 0.5732 + ], + "test_acc": [ + 0.273, + 0.547, + 0.6555, + 0.6975, + 0.713, + 0.7265, + 0.719, + 0.712, + 0.7275, + 0.7135, + 0.7205, + 0.715, + 0.7025, + 0.7075, + 0.6945, + 0.711, + 0.7125, + 0.6925, + 0.7055, + 0.698, + 0.691, + 0.679, + 0.672, + 0.671, + 0.6555, + 0.6525, + 0.6495, + 0.6265, + 0.6235, + 0.6095, + 0.616, + 0.6085, + 0.609, + 0.576, + 0.569, + 0.6095, + 0.5785, + 0.596, + 0.5725, + 0.5615, + 0.566, + 0.5295, + 0.5305, + 0.559, + 0.5535, + 0.5695, + 0.548, + 0.549, + 0.5485, + 0.5275, + 0.5555, + 0.5525, + 0.547, + 0.557, + 0.549, + 0.558, + 0.557, + 0.549, + 0.5365, + 0.55, + 0.556, + 0.559, + 0.551, + 0.558, + 0.5575, + 0.5525, + 0.5515, + 0.5475, + 0.5565, + 0.5555, + 0.563, + 0.5545, + 0.5575, + 0.56, + 0.5625, + 0.558, + 0.56, + 0.5595, + 0.558, + 0.558 + ], + "value_loss": [ + 2.8735111057281495, + 0.8335682413101196, + 0.769390998840332, + 0.8538553759574891, + 0.8522886907577515, + 0.8185532119750977, + 0.8277693967819214, + 0.7784229893684387, + 0.7300227233886719, + 0.7802330356597901, + 0.769332304763794, + 0.8283760873794556, + 0.7907809033870697, + 0.6976581485748291, + 0.7120382925987244, + 0.6482724099636078, + 0.6534354884147644, + 0.593892509841919, + 0.7452015276908874, + 0.5669822316169739, + 0.5777508046627045, + 0.5676485029220582, + 0.6005406673431396, + 0.5610708597183227, + 0.6180012318134308, + 0.6325548360347748, + 0.5494541264533996, + 0.5714878581047058, + 0.7139776704788208, + 0.8037148260116577, + 0.7602687382698059, + 0.8407878190994262, + 0.7761835197448731, + 0.7896560256004334, + 0.7990566373825073, + 0.8447199113845825, + 0.7247003343582153, + 0.7957295311450958, + 0.6422031284332276, + 0.6728523059368133, + 0.6348221732616425, + 0.5987496240615845, + 0.6573260497093201, + 0.6036061918258667, + 0.5928497138023376, + 0.5621949359416961, + 0.5422956010818482, + 0.5782992021560669, + 0.5750265427589416, + 0.5459153981685638, + 0.5251600515365601, + 0.4968988045692444, + 0.5020302026748658, + 0.48168242778778075, + 0.4782550555229187, + 0.458009272813797, + 0.48891592626571656, + 0.4619943362236023, + 0.45534752962589264, + 0.4502370168685913, + 0.47029722967147825, + 0.4379799751281738, + 0.4465416639328003, + 0.44245663313865663, + 0.44536621041297914, + 0.4246152039527893, + 0.4194586960792541, + 0.4330580853462219, + 0.4234344777107239, + 0.40113246874809266, + 0.40549428577423097, + 0.4139835561752319, + 0.4035360648393631, + 0.40140957350730894, + 0.39820902795791624, + 0.39226190814971923, + 0.3981349976539612, + 0.3976579602479935, + 0.40020361919403075, + 0.38718592133522034 + ], + "term_loss": [ + 1.6547700959205627, + 0.3569759086608887, + 0.4995730664730072, + 0.613328255558014, + 0.6194977837085723, + 0.579716089630127, + 0.5759899250984192, + 0.5267154250264168, + 0.49604031887054445, + 0.5482948890686035, + 0.5394840831756592, + 0.5940117561340332, + 0.5486331809043884, + 0.46233955211639405, + 0.46987221883535385, + 0.39907051919698716, + 0.3999391771793365, + 0.3417030059814453, + 0.4683563796043396, + 0.30888337712287905, + 0.31755629993677137, + 0.30828637447357177, + 0.33097629477381707, + 0.28669681071043013, + 0.32924925060272214, + 0.3282053912878036, + 0.2512664660692215, + 0.26445692427158357, + 0.3812099160194397, + 0.4540276463031769, + 0.412122430229187, + 0.4838629661560059, + 0.4123155319213867, + 0.4150680226564407, + 0.41444860229492186, + 0.45303762993812563, + 0.35541438927650454, + 0.4120818091392517, + 0.2860383835077286, + 0.31014277563095094, + 0.27963082504272463, + 0.25354453073143957, + 0.29737128577232363, + 0.2565148003578186, + 0.24667102131843566, + 0.21899679546356202, + 0.20547868233919145, + 0.22946879208087922, + 0.22265157461166382, + 0.20190087502002715, + 0.18589250744581223, + 0.1647626592874527, + 0.16500887289047242, + 0.14553676958084105, + 0.14562038345336914, + 0.12770656932592392, + 0.15042840227484702, + 0.12728065757751464, + 0.12067141379714012, + 0.11855436496734618, + 0.13056303629875182, + 0.10663774018287658, + 0.11145729880332947, + 0.10661706770658493, + 0.10924380402565002, + 0.09346218340396881, + 0.0898735906124115, + 0.09771707606911659, + 0.09121034116744996, + 0.07615747270733118, + 0.07712909548282623, + 0.0854458722114563, + 0.0757170934215188, + 0.07425090863108635, + 0.07251303234994412, + 0.06824812455177307, + 0.07342738398313522, + 0.07247738439813256, + 0.07439423036575317, + 0.06566130868196488 + ], + "bridge_loss": [ + 0.9250297847082954, + 0.17875594335198403, + 0.024584124499559403, + 0.009463803791999816, + 0.012518692496418952, + 0.02811788408756256, + 0.04102186490893364, + 0.03981322860121727, + 0.02342328687310219, + 0.014045343008637428, + 0.014091408693790436, + 0.01357993180155754, + 0.016431021589040758, + 0.018039470773935317, + 0.02248061062693596, + 0.02640794592499733, + 0.02815555126667023, + 0.02941792515516281, + 0.03211450355052948, + 0.031108583983778953, + 0.032093208335340025, + 0.030620017021894454, + 0.031579648739099506, + 0.030231001940369606, + 0.03265896959304809, + 0.038522472846508025, + 0.035252166825532914, + 0.039083953332901, + 0.05084649066925049, + 0.058725530803203585, + 0.057208517038822175, + 0.06136698402166366, + 0.06703151053190232, + 0.07173536076545715, + 0.07859825726747513, + 0.07978210234642029, + 0.06855812752246856, + 0.07676569232344628, + 0.06038619836568832, + 0.05801328845620155, + 0.052716735702753065, + 0.043914621901512144, + 0.04799848956018686, + 0.039276413369178774, + 0.03984246690273285, + 0.03797423206567764, + 0.03278059434294701, + 0.036813641035556795, + 0.039771160554885866, + 0.03320262667536736, + 0.028382191380858422, + 0.026151864609122277, + 0.02777043187022209, + 0.025728233271837233, + 0.02371621637940407, + 0.024555341345071792, + 0.028544853276014328, + 0.024363518065214158, + 0.026727474239468575, + 0.023022234451770783, + 0.03015930926799774, + 0.02283631842434406, + 0.026408934420347214, + 0.025617169830203058, + 0.028104463522136212, + 0.024197242438793183, + 0.022750669395923614, + 0.02691462599337101, + 0.02528082738518715, + 0.01895334949493408, + 0.02164241167008877, + 0.022592386800050736, + 0.021976949539780615, + 0.02176335347890854, + 0.020175418317317964, + 0.019235759457945825, + 0.02052777136415243, + 0.020854398973286153, + 0.021812593013048172, + 0.01777836950570345 + ], + "tgrad_loss": [ + 0.2937112254619598, + 0.29783638520240785, + 0.24523381710052491, + 0.23106331899166108, + 0.22027222232818602, + 0.21071923723220826, + 0.21075760734081267, + 0.2118943401813507, + 0.21055911660194396, + 0.21789281148910522, + 0.2157568175792694, + 0.22078439950942993, + 0.2257167013168335, + 0.2172791259288788, + 0.21968546645641326, + 0.22279394526481627, + 0.22534075746536256, + 0.22277158393859864, + 0.24473064098358155, + 0.22699026865959168, + 0.22810129499435425, + 0.22874211015701293, + 0.23798472149372102, + 0.2441430545091629, + 0.2560930178642273, + 0.2658269679546356, + 0.26293549556732176, + 0.2679469756603241, + 0.2819212636470795, + 0.29096164264678953, + 0.29093779606819153, + 0.2955578689336777, + 0.2968364751815796, + 0.3028526331424713, + 0.3060097746372223, + 0.3119001868247986, + 0.3007278199195862, + 0.306882026720047, + 0.29577854566574097, + 0.3046962371826172, + 0.3024746113777161, + 0.3012904730796814, + 0.3119562791347504, + 0.3078149768829346, + 0.3063362253189087, + 0.3052239120483398, + 0.3040363299369812, + 0.3120167656898499, + 0.31260380606651306, + 0.31081189460754394, + 0.31088535375595094, + 0.30598428030014035, + 0.30925089569091796, + 0.3104174225330353, + 0.30891845417022706, + 0.3057473627090454, + 0.30994266691207883, + 0.31035016078948974, + 0.3079486409187317, + 0.30866041717529297, + 0.3095748833656311, + 0.3085059157371521, + 0.30867542929649355, + 0.310222395324707, + 0.3080179396867752, + 0.30695577449798583, + 0.306834437084198, + 0.3084263841152191, + 0.3069433072566986, + 0.3060216453075409, + 0.3067227794647217, + 0.30594529614448546, + 0.30584202256202697, + 0.30539531021118166, + 0.3055205769062042, + 0.3047780241012573, + 0.3041798396587372, + 0.3043261778593063, + 0.30399679365158083, + 0.30374624242782594 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.17809242010116577, + 0.5349531173706055, + 0.5522423982620239, + 0.5664830207824707 + ], + "perturbation_rho": [ + 0.22843755781650543, + 0.5910820364952087, + 0.6707864999771118, + 0.638596773147583 + ], + "nudging": { + "0.001": [ + -0.004492362029850483, + -0.00375316827557981, + -0.0035423573572188616, + -0.003583954880014062 + ], + "0.003": [ + -0.01343991793692112, + -0.011238809674978256, + -0.010609426535665989, + -0.010733431205153465 + ], + "0.01": [ + -0.044362872838974, + -0.03722546622157097, + -0.03515344485640526, + -0.0355607345700264 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L4_s456.json b/results/synth_ladder_v2_hi/synth_a1.0_L4_s456.json new file mode 100644 index 0000000..6147814 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L4_s456.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.6721104705810548, + 0.7631012835502624, + 0.5599466526031495, + 0.5009647348403931, + 0.44250268206596377, + 0.4112984040737152, + 0.37521746096611025, + 0.35069607543945314, + 0.32816796259880066, + 0.28571113114356994, + 0.26920412228107454, + 0.23822724075317384, + 0.2403384908914566, + 0.19125519732236862, + 0.16398012406826018, + 0.14183301560282707, + 0.11679492046833038, + 0.11636687972545624, + 0.0922450327694416, + 0.07265362660884857, + 0.0646497187614441, + 0.06649317836761474, + 0.05584645546674728, + 0.03784047375321388, + 0.030665161864459514, + 0.02323187246620655, + 0.020697732216119768, + 0.01984555126428604, + 0.01643712175488472, + 0.014849836444854736, + 0.012898893329501152, + 0.011405612179636955, + 0.010688650423288345, + 0.010941692940890788, + 0.00924009888395667, + 0.008266829562187194, + 0.007798123356699944, + 0.007352828028798103, + 0.006834007120877505, + 0.0063644687902182345, + 0.00597649103552103, + 0.005696629038453102, + 0.00541699848882854, + 0.005169383949041367, + 0.004989086370170116, + 0.004769640618562699, + 0.0046363350734114645, + 0.004409096204489469, + 0.004235530799627304, + 0.004112518234550953, + 0.004026416325569153, + 0.0038965860821306704, + 0.0037635557891800998, + 0.00364411306977272, + 0.0035582759173586965, + 0.0034678645484149456, + 0.0034067507416009903, + 0.003331349766626954, + 0.003267878529988229, + 0.0032062796097248793, + 0.003156200988590717, + 0.003108995720744133, + 0.0030637201324105264, + 0.0030205708354711534, + 0.002985149787738919, + 0.0029531347144395115, + 0.0029254953995347024, + 0.0029017341434955596, + 0.0028784529194235803, + 0.0028606591559946536, + 0.0028430704237893223, + 0.0028297565318644046, + 0.0028177733197808264, + 0.002808107787370682, + 0.0028007785379886626, + 0.0027947440318763254, + 0.0027906116507947446, + 0.0027877884034067392, + 0.002786100262776017, + 0.0027851809598505497 + ], + "train_acc": [ + 0.4351, + 0.7466, + 0.7912, + 0.8118, + 0.8313, + 0.8447, + 0.8567, + 0.8703, + 0.8784, + 0.9005, + 0.9017, + 0.9151, + 0.9117, + 0.9381, + 0.9491, + 0.9615, + 0.9722, + 0.9694, + 0.9811, + 0.9884, + 0.9905, + 0.9899, + 0.9915, + 0.9975, + 0.9992, + 0.9999, + 1.0, + 0.9995, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.6795, + 0.754, + 0.7735, + 0.7805, + 0.7865, + 0.787, + 0.788, + 0.785, + 0.791, + 0.7955, + 0.7885, + 0.7945, + 0.787, + 0.7945, + 0.7965, + 0.795, + 0.7985, + 0.7915, + 0.7945, + 0.791, + 0.792, + 0.791, + 0.7915, + 0.7945, + 0.796, + 0.788, + 0.791, + 0.79, + 0.7925, + 0.792, + 0.7895, + 0.7935, + 0.791, + 0.789, + 0.793, + 0.791, + 0.792, + 0.7915, + 0.7905, + 0.7925, + 0.793, + 0.794, + 0.7905, + 0.7915, + 0.79, + 0.79, + 0.7915, + 0.79, + 0.793, + 0.793, + 0.791, + 0.7945, + 0.794, + 0.793, + 0.7925, + 0.794, + 0.792, + 0.7905, + 0.79, + 0.7895, + 0.792, + 0.7915, + 0.7925, + 0.792, + 0.792, + 0.7925, + 0.7925, + 0.7925, + 0.7925, + 0.793, + 0.7925, + 0.7925, + 0.792, + 0.7915, + 0.7925, + 0.792, + 0.792, + 0.792, + 0.792, + 0.792 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8668075799942017, + 0.8621845245361328, + 0.8550785779953003, + 0.8370286226272583 + ], + "perturbation_rho": [ + 0.9999995827674866, + 0.9999990463256836, + 0.999997615814209, + 0.9999850988388062 + ], + "nudging": { + "0.001": [ + -0.05954365432262421, + -0.04705682024359703, + -0.02751990780234337, + -0.01213783212006092 + ], + "0.003": [ + -0.17067265510559082, + -0.13620686531066895, + -0.0808744877576828, + -0.036085594445466995 + ], + "0.01": [ + -0.4802546799182892, + -0.3984469175338745, + -0.2503964900970459, + -0.11649051308631897 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2574989524841307, + 1.6380552871704102, + 1.0905220043182373, + 0.8434843078613281, + 0.7422607097625732, + 0.6838733669281006, + 0.6608151784896851, + 0.6541139087677001, + 0.6700486952781677, + 0.6548487804412841, + 0.6903288414001465, + 0.6872687412261963, + 0.7067448139190674, + 0.6931972984313964, + 0.7313086133956909, + 0.7074429125785827, + 0.7189123779296875, + 0.7329434277057648, + 0.7488891769409179, + 0.7615507186889648, + 0.7562071540832519, + 0.7549555555343628, + 0.772114220046997, + 0.7851960697174072, + 0.7795265257835389, + 0.7939942949295044, + 0.7774659820079803, + 0.8024665214061737, + 0.7958273443222046, + 0.8216977993011475, + 0.8670008243560791, + 0.8302605041503907, + 0.8018192520141602, + 0.818106721830368, + 0.7778735799789429, + 0.8109884427070617, + 0.8029882509231567, + 0.7874313503265381, + 0.7778594578742981, + 0.7777205188751221, + 0.8068863299846649, + 0.780433825969696, + 0.7781887583732605, + 0.7730012133598327, + 0.769133717250824, + 0.7593815219879151, + 0.7997064087867737, + 0.782936147928238, + 0.7640992984771728, + 0.7745265226364135, + 0.7642938511848449, + 0.7603380409240723, + 0.7646475133419037, + 0.751522674369812, + 0.7650270447731018, + 0.7674694633483887, + 0.7579075176239014, + 0.7549170202255249, + 0.7451096672534943, + 0.7400417304992676, + 0.7386390338897705, + 0.727668257522583, + 0.7409649150848389, + 0.7316446098327637, + 0.7244855234146118, + 0.7241755498886109, + 0.7200836553573609, + 0.7214753667831421, + 0.7202660327911377, + 0.7165880686283111, + 0.7148458456993103, + 0.7100509027481079, + 0.7098775724411011, + 0.7100581963539123, + 0.708662319278717, + 0.7074518667221069, + 0.7055805969238281, + 0.7049286954879761, + 0.7044133127212524, + 0.7041960348129273 + ], + "train_acc": [ + 0.1772, + 0.452, + 0.6052, + 0.6909, + 0.7204, + 0.743, + 0.753, + 0.751, + 0.7511, + 0.7583, + 0.7472, + 0.7483, + 0.7455, + 0.7476, + 0.7404, + 0.7448, + 0.7447, + 0.7427, + 0.7342, + 0.7382, + 0.7419, + 0.7362, + 0.7394, + 0.7329, + 0.7374, + 0.7314, + 0.7371, + 0.7304, + 0.7337, + 0.7245, + 0.7187, + 0.7191, + 0.729, + 0.7308, + 0.7314, + 0.724, + 0.7301, + 0.7352, + 0.7325, + 0.7365, + 0.7319, + 0.7365, + 0.737, + 0.7367, + 0.7384, + 0.7407, + 0.7294, + 0.7387, + 0.7397, + 0.7325, + 0.738, + 0.738, + 0.7356, + 0.7392, + 0.7364, + 0.7387, + 0.7374, + 0.7368, + 0.7402, + 0.7425, + 0.7449, + 0.7465, + 0.7412, + 0.743, + 0.7442, + 0.7456, + 0.7468, + 0.745, + 0.7466, + 0.748, + 0.7493, + 0.7503, + 0.7517, + 0.75, + 0.7512, + 0.7515, + 0.7518, + 0.7503, + 0.7516, + 0.7519 + ], + "test_acc": [ + 0.309, + 0.543, + 0.6365, + 0.6885, + 0.7, + 0.7145, + 0.714, + 0.714, + 0.716, + 0.6965, + 0.705, + 0.6995, + 0.698, + 0.686, + 0.7, + 0.703, + 0.704, + 0.697, + 0.693, + 0.676, + 0.677, + 0.6665, + 0.6905, + 0.6885, + 0.6755, + 0.6875, + 0.681, + 0.677, + 0.6845, + 0.652, + 0.6575, + 0.692, + 0.6525, + 0.6685, + 0.6775, + 0.678, + 0.682, + 0.67, + 0.669, + 0.6635, + 0.677, + 0.68, + 0.675, + 0.678, + 0.671, + 0.667, + 0.6665, + 0.677, + 0.671, + 0.671, + 0.669, + 0.6855, + 0.679, + 0.6725, + 0.664, + 0.673, + 0.6785, + 0.6795, + 0.6755, + 0.6755, + 0.688, + 0.684, + 0.684, + 0.686, + 0.673, + 0.6795, + 0.6815, + 0.6785, + 0.674, + 0.68, + 0.6825, + 0.683, + 0.6785, + 0.6755, + 0.6765, + 0.683, + 0.6805, + 0.6815, + 0.6815, + 0.68 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.001797341974452138, + 0.06668862700462341, + 0.05448886379599571, + 0.09004470705986023 + ], + "perturbation_rho": [ + -0.01287321001291275, + 0.007983170449733734, + 0.10568365454673767, + 0.12522897124290466 + ], + "nudging": { + "0.001": [ + -0.0001986024435609579, + -0.0004886264214292169, + -0.0003064559423364699, + -0.000437408743891865 + ], + "0.003": [ + -0.0005703098722733557, + -0.0014648186042904854, + -0.0009188501280732453, + -0.001311213942244649 + ], + "0.01": [ + -0.0016110537108033895, + -0.004868227988481522, + -0.0030549662187695503, + -0.004361548461019993 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.970423934173584, + 1.0188906314849853, + 0.6803888530254364, + 0.6183670483589172, + 0.6407907210350037, + 0.675392436504364, + 0.7211614998817444, + 0.7503331409454346, + 0.7658470903396607, + 0.78841116065979, + 0.8109269844055176, + 0.8219402812957763, + 0.8228919342041016, + 0.8259679775238037, + 0.8465613422393798, + 0.8502985542297363, + 0.8594941413879394, + 0.8541229305267334, + 0.8707549245834351, + 0.8710284989356994, + 0.8676784825325012, + 0.8654314409255981, + 0.847813544845581, + 0.8484393062591553, + 0.8654967462539673, + 0.8576792402267456, + 0.8482211884498596, + 0.8531449937820434, + 0.8563604249954223, + 0.8368509140014648, + 0.8605183853149414, + 0.8388536148071289, + 0.8804149766921997, + 0.8480586463928222, + 0.838437174987793, + 0.8545515079498291, + 0.8535089003562927, + 0.8567220569610595, + 0.8433004068374634, + 0.8453849071502686, + 0.8383244281768799, + 0.8520817733764648, + 0.8613478240966796, + 0.8393393857955933, + 0.8388194683074951, + 0.8312189640045166, + 0.8367521869659423, + 0.8318347694396973, + 0.8283476368904114, + 0.8408833297729492, + 0.835852100944519, + 0.8230558944702149, + 0.8201510600090027, + 0.8144685863494873, + 0.8189937896728515, + 0.8204439929962158, + 0.8067114233970643, + 0.8116221212387085, + 0.8106674427986145, + 0.8022418712615966, + 0.7973626476287842, + 0.7976334384918213, + 0.8014879680633545, + 0.7981612595558166, + 0.7937649499893189, + 0.7902321870803833, + 0.7896893333435059, + 0.792438854598999, + 0.7878884392738342, + 0.7869910089492798, + 0.7866397365570068, + 0.7847629238128662, + 0.7840681342124939, + 0.783345707321167, + 0.7829301319122315, + 0.7823859727859497, + 0.7819064727783203, + 0.7816107426643372, + 0.7811750866889954, + 0.7810312837600708 + ], + "train_acc": [ + 0.2987, + 0.6326, + 0.7384, + 0.7635, + 0.7608, + 0.752, + 0.739, + 0.7292, + 0.7226, + 0.7148, + 0.7083, + 0.7011, + 0.7004, + 0.6955, + 0.6874, + 0.6843, + 0.6841, + 0.6859, + 0.6828, + 0.6814, + 0.6789, + 0.6862, + 0.6884, + 0.6901, + 0.6848, + 0.688, + 0.6941, + 0.6957, + 0.6931, + 0.7012, + 0.6928, + 0.6995, + 0.6831, + 0.6954, + 0.7021, + 0.6914, + 0.6947, + 0.6912, + 0.6951, + 0.6947, + 0.6961, + 0.6885, + 0.6895, + 0.6978, + 0.6978, + 0.6951, + 0.6949, + 0.6957, + 0.6969, + 0.6962, + 0.6955, + 0.6991, + 0.7018, + 0.7031, + 0.696, + 0.6985, + 0.7039, + 0.7033, + 0.7045, + 0.701, + 0.7066, + 0.708, + 0.7076, + 0.7037, + 0.7087, + 0.7092, + 0.7073, + 0.7101, + 0.7095, + 0.7096, + 0.7095, + 0.7118, + 0.7094, + 0.7102, + 0.7117, + 0.7089, + 0.7102, + 0.7095, + 0.7106, + 0.7106 + ], + "test_acc": [ + 0.5375, + 0.696, + 0.736, + 0.7335, + 0.728, + 0.7125, + 0.702, + 0.6935, + 0.6735, + 0.673, + 0.6755, + 0.6665, + 0.671, + 0.6575, + 0.6495, + 0.656, + 0.6575, + 0.6585, + 0.6585, + 0.647, + 0.6555, + 0.6535, + 0.661, + 0.6695, + 0.6645, + 0.676, + 0.673, + 0.649, + 0.6695, + 0.6595, + 0.66, + 0.6585, + 0.636, + 0.657, + 0.6365, + 0.651, + 0.6575, + 0.658, + 0.658, + 0.6615, + 0.65, + 0.644, + 0.6525, + 0.654, + 0.6425, + 0.638, + 0.6455, + 0.6455, + 0.6465, + 0.6515, + 0.6505, + 0.6475, + 0.6525, + 0.644, + 0.65, + 0.655, + 0.6475, + 0.652, + 0.6515, + 0.6495, + 0.6595, + 0.649, + 0.6575, + 0.6505, + 0.6525, + 0.652, + 0.6505, + 0.6525, + 0.6535, + 0.6545, + 0.657, + 0.6535, + 0.655, + 0.652, + 0.653, + 0.651, + 0.652, + 0.6525, + 0.651, + 0.651 + ], + "state_pred_error": [ + 0.7786139750480652, + 0.3122247148036957, + 0.20072943181991576, + 0.17233864879608154, + 0.15799049963951112, + 0.1520016979455948, + 0.15061514353752137, + 0.15201976532936096, + 0.15393238065242767, + 0.15233531470298767, + 0.1529501548051834, + 0.1518586612224579, + 0.14777747428417207, + 0.1396225711941719, + 0.13393001658916473, + 0.12688448318243026, + 0.11889619739055633, + 0.11048878728151322, + 0.10281732966899872, + 0.09756427093744278, + 0.09126090179681778, + 0.08596743443012238, + 0.0826011387348175, + 0.07700357694625855, + 0.07508404291868209, + 0.07156078473329544, + 0.06937397572994232, + 0.06786044591665268, + 0.06689649878144265, + 0.0628541961312294, + 0.061125951021909715, + 0.059071518713235856, + 0.05804442538022995, + 0.05559697550535202, + 0.05349199259877205, + 0.0510828118801117, + 0.050134736907482144, + 0.050006070119142536, + 0.04583842672109604, + 0.04389976638555527, + 0.04246980703473091, + 0.04128407181501389, + 0.03976263640522957, + 0.03883026147484779, + 0.03822557154297829, + 0.03655906445980072, + 0.03534454255104065, + 0.034419277024269106, + 0.03396104025840759, + 0.03280952478647232, + 0.031770370733737945, + 0.03110829921364784, + 0.030244355934858323, + 0.029577301198244095, + 0.02884054028391838, + 0.0280285452991724, + 0.02734226542413235, + 0.02653370050191879, + 0.02591722692847252, + 0.02562211912572384, + 0.024784083288908004, + 0.02415384087264538, + 0.023749950650334358, + 0.023075414776802063, + 0.022662506771087648, + 0.022168341422080993, + 0.0219087354272604, + 0.021405927726626396, + 0.021224218714237214, + 0.020873518934845924, + 0.020796752271056176, + 0.020648898005485535, + 0.01995813894569874, + 0.01966182319521904, + 0.0194194305062294, + 0.018996354737877846, + 0.01872855971157551, + 0.018467084999382495, + 0.018039076521992683, + 0.018002220337092877 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6501579284667969, + 0.4189426302909851, + 0.1800653487443924, + 0.1647701859474182 + ], + "perturbation_rho": [ + 0.5907484292984009, + 0.36159276962280273, + 0.19337056577205658, + 0.1794498711824417 + ], + "nudging": { + "0.001": [ + -0.019326727837324142, + -0.002377996686846018, + -0.0006870059878565371, + -0.000631407368928194 + ], + "0.003": [ + -0.05702997371554375, + -0.007118801586329937, + -0.002059582155197859, + -0.0018930428195744753 + ], + "0.01": [ + -0.1790994107723236, + -0.023556631058454514, + -0.006848426535725594, + -0.0062964376993477345 + ] + }, + "state_pred_error_per_layer": [ + 7107.7138671875, + 890.22314453125, + 493.5357360839844, + 407.69677734375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2540888969421387, + 1.6410298145294189, + 1.0899561918258667, + 0.8455374429702759, + 0.7378649179458618, + 0.6901313011169433, + 0.6735435390472412, + 0.6544258743286133, + 0.6543777503967285, + 0.6590329810142517, + 0.6783974195480347, + 0.6698754477500916, + 0.6935008029937744, + 0.716245794391632, + 0.6978517965316773, + 0.7255995491027832, + 0.7385436865806579, + 0.7370423707962036, + 0.7421768573760986, + 0.7866301471710205, + 0.7981218069076538, + 0.7994531000137329, + 0.850463445854187, + 0.8955202503204346, + 0.8870052036285401, + 0.8269047240257263, + 0.837711269569397, + 0.8814192169189453, + 0.9286035356521607, + 1.0078046418190003, + 0.9495850528717041, + 0.9831599643707275, + 1.0586618783950805, + 1.0358479290008544, + 1.060762398147583, + 1.0723051456451416, + 1.1363716716766357, + 1.080968037033081, + 1.134492848777771, + 1.1133343200683594, + 1.154938784980774, + 1.1417428504943847, + 1.1993848468780517, + 1.1748576559066772, + 1.1947654231071472, + 1.2083104314804076, + 1.2755975540161133, + 1.2453838123321532, + 1.2651009052276612, + 1.2496138525009155, + 1.2461695442199707, + 1.2764700059890748, + 1.2867469375610352, + 1.304604454421997, + 1.3014329265594482, + 1.3248945934295655, + 1.33621167678833, + 1.3619223628997803, + 1.3417739696502686, + 1.3370944692611695, + 1.3508729553222656, + 1.355317646408081, + 1.3528772338867188, + 1.3464540214538574, + 1.3568033025741577, + 1.343411579322815, + 1.347543560028076, + 1.3430934253692628, + 1.3378395433425903, + 1.3415356441497803, + 1.3368797145843505, + 1.334293141937256, + 1.3349700309753418, + 1.3334004755020141, + 1.3332426280975342, + 1.33172604637146, + 1.3308066741943358, + 1.3304414348602296, + 1.3295167798995973, + 1.3292806955337524 + ], + "train_acc": [ + 0.1748, + 0.4499, + 0.6102, + 0.6889, + 0.7225, + 0.7409, + 0.7502, + 0.7518, + 0.7565, + 0.7574, + 0.7488, + 0.7508, + 0.743, + 0.7405, + 0.7472, + 0.7427, + 0.7371, + 0.7393, + 0.7409, + 0.7318, + 0.7263, + 0.7189, + 0.7077, + 0.6892, + 0.6857, + 0.7034, + 0.6947, + 0.6808, + 0.66, + 0.6346, + 0.6524, + 0.6394, + 0.6107, + 0.6184, + 0.6119, + 0.6065, + 0.587, + 0.6025, + 0.5811, + 0.5889, + 0.5741, + 0.5813, + 0.5675, + 0.5699, + 0.5636, + 0.5586, + 0.5374, + 0.5432, + 0.5426, + 0.5476, + 0.5501, + 0.5398, + 0.5383, + 0.5309, + 0.5355, + 0.52, + 0.5204, + 0.5127, + 0.5132, + 0.5169, + 0.5118, + 0.5122, + 0.5094, + 0.5203, + 0.5167, + 0.5177, + 0.5163, + 0.5199, + 0.5187, + 0.5212, + 0.5216, + 0.519, + 0.5225, + 0.5223, + 0.5225, + 0.5227, + 0.525, + 0.5242, + 0.5248, + 0.5255 + ], + "test_acc": [ + 0.31, + 0.5485, + 0.645, + 0.6845, + 0.7065, + 0.707, + 0.71, + 0.7125, + 0.717, + 0.709, + 0.701, + 0.698, + 0.691, + 0.7055, + 0.698, + 0.698, + 0.7, + 0.6845, + 0.669, + 0.656, + 0.683, + 0.6625, + 0.645, + 0.6275, + 0.626, + 0.631, + 0.6235, + 0.5625, + 0.5655, + 0.586, + 0.6095, + 0.5555, + 0.5475, + 0.5435, + 0.569, + 0.484, + 0.558, + 0.5495, + 0.5545, + 0.5155, + 0.548, + 0.514, + 0.513, + 0.532, + 0.4845, + 0.5125, + 0.5315, + 0.47, + 0.5255, + 0.525, + 0.499, + 0.5145, + 0.4825, + 0.497, + 0.4915, + 0.505, + 0.453, + 0.4795, + 0.4955, + 0.495, + 0.4815, + 0.496, + 0.497, + 0.4835, + 0.4905, + 0.492, + 0.494, + 0.49, + 0.4895, + 0.4885, + 0.4845, + 0.4925, + 0.4845, + 0.484, + 0.49, + 0.4865, + 0.4895, + 0.4905, + 0.489, + 0.487 + ], + "value_loss": [ + 3.067925698852539, + 0.8872503746986389, + 0.784230032157898, + 0.8464786403656006, + 0.8567787155151367, + 0.8420232248306274, + 0.8107911947250366, + 0.76327637424469, + 0.7439310749053956, + 0.7632134145736694, + 0.8066229679107666, + 0.7526053647041321, + 0.8069936139583588, + 0.8536850826263428, + 0.7878379513263702, + 0.8329431747436523, + 0.8027177619695663, + 0.7358918642997742, + 0.7229702713966369, + 0.7154047614097595, + 0.7539727543354035, + 0.6649943606376648, + 0.6917212394714356, + 0.7406036077499389, + 0.6360067028522491, + 0.5150869111537933, + 0.5327004407882691, + 0.4914137007713318, + 0.5129998965263367, + 0.5935896294116974, + 0.4661740849494934, + 0.4586599859714508, + 0.5206927395820617, + 0.5325411680221558, + 0.5089368036270142, + 0.5612850030899048, + 0.6255286026954651, + 0.4715394420623779, + 0.537113422870636, + 0.4809487106323242, + 0.5100893694877624, + 0.491378253364563, + 0.5363532768249512, + 0.4960866286277771, + 0.4698116518497467, + 0.4960141607284546, + 0.5674628148078918, + 0.5025658918380738, + 0.5430127717494965, + 0.5158628129005433, + 0.48981055545806884, + 0.5012782106876373, + 0.4980415323257446, + 0.5117126678466797, + 0.4960208126068115, + 0.5151057609558105, + 0.5090823886871337, + 0.5225202934265136, + 0.5217664462089538, + 0.5103578377723694, + 0.4982886472702026, + 0.5127610027790069, + 0.5053389938354492, + 0.4992716392040253, + 0.4872829970359802, + 0.4732895241737366, + 0.47746601195335386, + 0.49208361549377444, + 0.46516202363967896, + 0.467171999502182, + 0.4678579177856445, + 0.4566397163391113, + 0.46912312126159667, + 0.46011261644363405, + 0.46119874806404115, + 0.45755069794654846, + 0.45454912757873533, + 0.46414966630935667, + 0.46496015009880065, + 0.46226135368347165 + ], + "term_loss": [ + 1.7594063854694366, + 0.37591145000457765, + 0.5036363396644592, + 0.6062044906616211, + 0.6242774119853973, + 0.6045010264396667, + 0.5617577237606048, + 0.5238085851669312, + 0.5167714694976807, + 0.536994783115387, + 0.5744672933578491, + 0.5201116055488586, + 0.567726757800579, + 0.6057433352708816, + 0.5440834599018097, + 0.5835855722904205, + 0.5459397554039955, + 0.47647206230163575, + 0.4662741364479065, + 0.44569241828918454, + 0.476298482632637, + 0.3910742021560669, + 0.4032438316345215, + 0.44340121884346007, + 0.34564229555130005, + 0.24595328629016877, + 0.2536192675590515, + 0.20336173225641252, + 0.2100383534669876, + 0.2641002653121948, + 0.15515764528512954, + 0.13755231359004974, + 0.17821311106681823, + 0.19600526194572448, + 0.17045617690086365, + 0.2182028594017029, + 0.25423940081596375, + 0.1316945064663887, + 0.17203917299509047, + 0.1263727828025818, + 0.1424735504388809, + 0.1306004422903061, + 0.15452624399662018, + 0.1187472231388092, + 0.09432517062425613, + 0.1164723228931427, + 0.1585537355899811, + 0.1041444504737854, + 0.13414050550460815, + 0.11696476354598999, + 0.09393293557167053, + 0.09930002460479737, + 0.09558204698562622, + 0.10497297461628914, + 0.09059979002475739, + 0.10161748363077641, + 0.09518039667606354, + 0.10102285161018372, + 0.10330084440708161, + 0.09370956559181214, + 0.08114260835647583, + 0.09380301012992859, + 0.08571744566559791, + 0.0824426296055317, + 0.071114610221982, + 0.061979551124572756, + 0.06477263647913933, + 0.0772924101471901, + 0.05530736327469349, + 0.05676423398256302, + 0.05725909180641174, + 0.04929078468978405, + 0.05781498133838177, + 0.050458201050758364, + 0.051463548076152804, + 0.04791119509935379, + 0.045457855463027955, + 0.05178614779412746, + 0.05226057640612125, + 0.049428026616573334 + ], + "bridge_loss": [ + 1.0179481054047559, + 0.20606108825802802, + 0.03427657631635666, + 0.010473076432943344, + 0.016603080600500107, + 0.02517593368291855, + 0.03693295772075653, + 0.028744317154586314, + 0.014567548152804375, + 0.012067488829791546, + 0.012867180669307709, + 0.012119705080986023, + 0.014082370281219482, + 0.018210298416018487, + 0.02226397890150547, + 0.02276896116733551, + 0.025944879484176637, + 0.030690657392144202, + 0.030334649151563645, + 0.0356466594517231, + 0.0373953173071146, + 0.03450476716756821, + 0.03414955579042435, + 0.03280657273828983, + 0.028484632873535157, + 0.021447348003461958, + 0.026165857848525046, + 0.022548073571920395, + 0.023626256749033927, + 0.03081165543794632, + 0.024572184744477272, + 0.024584364867210388, + 0.026557748287916183, + 0.0237947801977396, + 0.019455672904849054, + 0.018987117165327073, + 0.029922924302518368, + 0.01343661539554596, + 0.02296329292356968, + 0.017573897647857665, + 0.02051718008518219, + 0.016063079220056533, + 0.022041453886032104, + 0.02147355371117592, + 0.014992918160557747, + 0.01587340624332428, + 0.02909149942398071, + 0.02134713576436043, + 0.027834608449041842, + 0.021670415142178535, + 0.018895103727281093, + 0.017823033079504967, + 0.016468752840161322, + 0.015435275170207024, + 0.015470961254835129, + 0.017179324565827846, + 0.01504898190498352, + 0.017772416092455386, + 0.018987592327594758, + 0.018407849557697774, + 0.015608608210086822, + 0.01722142017632723, + 0.01781987230181694, + 0.017794143831729888, + 0.014897557091712952, + 0.01346850597858429, + 0.014480280113220214, + 0.018174419306218624, + 0.013706611354649068, + 0.014696067751944064, + 0.015800623482465744, + 0.013735510259866714, + 0.01802016984522343, + 0.01632189666777849, + 0.01686810880601406, + 0.017228992500901222, + 0.01766794673204422, + 0.021452254375815393, + 0.022196426358819007, + 0.022721626716852187 + ], + "tgrad_loss": [ + 0.29057118844985963, + 0.30527783031463623, + 0.24631710891723632, + 0.22980107893943785, + 0.21589822309017181, + 0.21234626097679138, + 0.2121005094051361, + 0.21072347102165223, + 0.21259205179214477, + 0.2141511384963989, + 0.2192884954929352, + 0.22037405626773834, + 0.22518448123931883, + 0.22973145468235015, + 0.22149051184654237, + 0.22658863916397096, + 0.2308331280350685, + 0.22872914137840272, + 0.2263614887237549, + 0.23406568908691405, + 0.24027895650863648, + 0.23941539039611817, + 0.2543278500080109, + 0.26439581327438355, + 0.26187977333068846, + 0.24768628034591675, + 0.2529153157234192, + 0.2655038944244385, + 0.2793352873802185, + 0.298677712726593, + 0.28644425497055054, + 0.29652330493927004, + 0.31592187337875366, + 0.3127411260604858, + 0.3190249535560608, + 0.3240950348377228, + 0.34136627588272095, + 0.3264083216667175, + 0.3421109504699707, + 0.33700203189849853, + 0.3470986408233643, + 0.3447147289276123, + 0.359785578918457, + 0.3558658477306366, + 0.3604935604095459, + 0.36366842856407167, + 0.37981757740974426, + 0.3770743095874786, + 0.38103766255378724, + 0.3772276309490204, + 0.37698251342773437, + 0.3841551516532898, + 0.38599073448181154, + 0.39130441913604735, + 0.38995005826950074, + 0.39630895295143126, + 0.3988530141830444, + 0.40372502479553224, + 0.3994780075073242, + 0.39824042444229124, + 0.4015374305725098, + 0.40173657608032226, + 0.40180167770385744, + 0.3990348654270172, + 0.4012708299636841, + 0.3978414667129517, + 0.3982130952835083, + 0.39661678586006166, + 0.3961480514526367, + 0.3957116979598999, + 0.3947981976032257, + 0.3936134231567383, + 0.3932879699230194, + 0.3933325177192688, + 0.3928670913696289, + 0.3924105140209198, + 0.39142332553863524, + 0.3909112627029419, + 0.39050314569473266, + 0.39011170201301576 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.20670706033706665, + 0.594096302986145, + 0.6002212762832642, + 0.6189069747924805 + ], + "perturbation_rho": [ + 0.24109239876270294, + 0.6317664384841919, + 0.6270265579223633, + 0.6285783648490906 + ], + "nudging": { + "0.001": [ + -0.0037710254546254873, + -0.004560340661555529, + -0.004485958255827427, + -0.004530656151473522 + ], + "0.003": [ + -0.011285749264061451, + -0.013657940551638603, + -0.013435271568596363, + -0.013568824157118797 + ], + "0.01": [ + -0.03731346130371094, + -0.04525235667824745, + -0.044518306851387024, + -0.04495714232325554 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L8_s123.json b/results/synth_ladder_v2_hi/synth_a1.0_L8_s123.json new file mode 100644 index 0000000..a363017 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L8_s123.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.3597605170249938, + 0.6515352805137634, + 0.5761591612815857, + 0.5036653388023377, + 0.4378750482082367, + 0.3986785667896271, + 0.3651514029026032, + 0.32824506731033326, + 0.3065573793888092, + 0.25960179257392885, + 0.22397090587615967, + 0.18577685337066652, + 0.17314567223787308, + 0.13219234380722045, + 0.2145008885383606, + 0.14060048987865448, + 0.1320132321357727, + 0.15602792205810548, + 0.08493568333983421, + 0.04347894575595856, + 0.04405979743897915, + 0.026510945428907872, + 0.017329008316993712, + 0.014953341521322727, + 0.011717742429673671, + 0.010508880212903023, + 0.009168952202051878, + 0.008036357240378857, + 0.007489554305374622, + 0.006532931604981422, + 0.00620891650468111, + 0.005510815745592117, + 0.005301155371963978, + 0.004775684664398432, + 0.00437106367573142, + 0.004044459429383278, + 0.003801189873740077, + 0.003582138231769204, + 0.003404493835568428, + 0.003254202524572611, + 0.0030735614743083715, + 0.0029319060567766426, + 0.0028157311901450158, + 0.0027169062765315176, + 0.0026012683637440205, + 0.0024921510376036166, + 0.0024171145718544724, + 0.002337812060303986, + 0.0022599145282059907, + 0.0021856731843203307, + 0.00212739445772022, + 0.002071296547073871, + 0.0020127466212958097, + 0.00196753548104316, + 0.0019216904461383819, + 0.0018877944979816676, + 0.0018499503599479794, + 0.0018118849888443948, + 0.001789958526287228, + 0.0017553682591766118, + 0.0017257725574076177, + 0.0017022816266864537, + 0.00168052331879735, + 0.0016581403171643614, + 0.001639620173163712, + 0.001623599848151207, + 0.0016086858851835132, + 0.0015953668985515834, + 0.0015842857133597135, + 0.001574385955557227, + 0.0015660683127120137, + 0.001558823443762958, + 0.0015531524984166026, + 0.0015484464213252067, + 0.0015443269031122327, + 0.0015414506535977126, + 0.001539355414081365, + 0.001538024666160345, + 0.0015371435042470694, + 0.001536688283085823 + ], + "train_acc": [ + 0.5267, + 0.7494, + 0.7766, + 0.8091, + 0.8373, + 0.846, + 0.8606, + 0.8759, + 0.8863, + 0.9065, + 0.9204, + 0.9385, + 0.9412, + 0.9602, + 0.9215, + 0.9529, + 0.9556, + 0.9471, + 0.9748, + 0.9941, + 0.9925, + 0.9989, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.7505, + 0.7575, + 0.758, + 0.7665, + 0.7615, + 0.7685, + 0.7675, + 0.7595, + 0.7745, + 0.7615, + 0.765, + 0.7595, + 0.764, + 0.7675, + 0.763, + 0.746, + 0.7585, + 0.764, + 0.763, + 0.776, + 0.771, + 0.769, + 0.772, + 0.7795, + 0.7725, + 0.7755, + 0.7765, + 0.772, + 0.773, + 0.7735, + 0.7745, + 0.774, + 0.7705, + 0.773, + 0.773, + 0.7735, + 0.7765, + 0.775, + 0.7735, + 0.7725, + 0.774, + 0.772, + 0.774, + 0.772, + 0.7705, + 0.7725, + 0.772, + 0.772, + 0.7725, + 0.7725, + 0.773, + 0.773, + 0.773, + 0.7745, + 0.773, + 0.771, + 0.772, + 0.772, + 0.77, + 0.772, + 0.7715, + 0.771, + 0.771, + 0.7715, + 0.772, + 0.7715, + 0.7715, + 0.7705, + 0.7715, + 0.771, + 0.7715, + 0.771, + 0.7715, + 0.771, + 0.7715, + 0.7715, + 0.7715, + 0.7715, + 0.7715, + 0.7715 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8705248832702637, + 0.8637571334838867, + 0.8509291410446167, + 0.8393645286560059, + 0.8308560848236084, + 0.8178726434707642, + 0.800449013710022, + 0.780108630657196 + ], + "perturbation_rho": [ + 0.9999995231628418, + 0.9999995827674866, + 0.9999989867210388, + 0.9999984502792358, + 0.9999953508377075, + 0.9999901056289673, + 0.9999750852584839, + 0.9999430179595947 + ], + "nudging": { + "0.001": [ + -0.06178125739097595, + -0.05145343393087387, + -0.040026240050792694, + -0.028534352779388428, + -0.018970515578985214, + -0.012147586792707443, + -0.007833496667444706, + -0.0053112502209842205 + ], + "0.003": [ + -0.17677445709705353, + -0.14845409989356995, + -0.11653909087181091, + -0.0838426947593689, + -0.056151725351810455, + -0.03613904491066933, + -0.02337692305445671, + -0.015877680853009224 + ], + "0.01": [ + -0.5067576169967651, + -0.4360688626766205, + -0.3518902063369751, + -0.26053690910339355, + -0.1787266880273819, + -0.1170111671090126, + -0.07650406658649445, + -0.052279047667980194 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.286389960861206, + 1.5046793308258057, + 1.003141529273987, + 0.8502165521621704, + 0.79491765127182, + 0.7619345289707183, + 0.7414057087898255, + 0.7364994804382324, + 0.7720167747497558, + 0.762273980808258, + 0.7816535405158996, + 0.8181071807861328, + 0.8168456993103027, + 0.8073886169433594, + 0.8274958035469056, + 0.8190181507110595, + 0.8747408109664917, + 0.9060320697784424, + 0.8967771499633789, + 0.8795616693496704, + 0.9533623218059539, + 0.9225506632804871, + 0.8967089427947998, + 1.0248757438659668, + 0.9947487607955933, + 1.0210036689758302, + 0.9943507525444031, + 0.9633036288261414, + 1.059937081384659, + 1.017498482131958, + 1.0583956523895264, + 1.0057311573028564, + 1.0065682273864747, + 1.0264606199264525, + 0.9849345092773437, + 1.0307427364349364, + 1.0011034609794616, + 1.0081669438362122, + 1.0175197954177857, + 1.049601664352417, + 1.0101221143722534, + 1.0102649535179138, + 1.0285917793273927, + 1.0752605737686156, + 1.0722829106330871, + 1.013289751815796, + 1.0027215727806091, + 0.9726143455982208, + 0.9526057465553284, + 1.0113349676132202, + 1.0276539045333861, + 0.9834941878318787, + 0.979356449508667, + 0.9529389619827271, + 0.9780878620147705, + 0.9671504787445069, + 0.9552891291618347, + 0.9549959115982055, + 0.9576946084022522, + 0.9455600605010986, + 0.945126536655426, + 0.9525565906047821, + 0.942156244468689, + 0.9393270302772522, + 0.9270951150894166, + 0.9252788740158081, + 0.9220846809387208, + 0.9299989045143128, + 0.9116277715682983, + 0.9150181134700776, + 0.9048595577239991, + 0.9056384092330932, + 0.9041959270477294, + 0.9009678789138794, + 0.9005821381568909, + 0.898265645122528, + 0.8972719952583313, + 0.8961263038635254, + 0.8954417029380798, + 0.8950483352661133 + ], + "train_acc": [ + 0.1682, + 0.4702, + 0.632, + 0.6851, + 0.7067, + 0.7165, + 0.7266, + 0.734, + 0.7213, + 0.7267, + 0.7244, + 0.7156, + 0.7148, + 0.7218, + 0.7179, + 0.7252, + 0.7109, + 0.7081, + 0.7083, + 0.7121, + 0.6998, + 0.7084, + 0.7135, + 0.696, + 0.6957, + 0.6912, + 0.7041, + 0.7055, + 0.6957, + 0.6988, + 0.6907, + 0.6998, + 0.6982, + 0.6939, + 0.704, + 0.6938, + 0.7025, + 0.6989, + 0.6988, + 0.6956, + 0.6967, + 0.6992, + 0.6908, + 0.6888, + 0.6808, + 0.7012, + 0.6984, + 0.7053, + 0.7083, + 0.6966, + 0.6956, + 0.7002, + 0.7045, + 0.7086, + 0.7024, + 0.707, + 0.7061, + 0.7049, + 0.7, + 0.7084, + 0.7063, + 0.7042, + 0.7075, + 0.7088, + 0.7096, + 0.7082, + 0.7103, + 0.7108, + 0.712, + 0.7136, + 0.717, + 0.7138, + 0.7123, + 0.7121, + 0.7125, + 0.7124, + 0.7132, + 0.7141, + 0.7138, + 0.7138 + ], + "test_acc": [ + 0.316, + 0.5695, + 0.6415, + 0.682, + 0.6865, + 0.7005, + 0.688, + 0.6815, + 0.677, + 0.6925, + 0.694, + 0.691, + 0.682, + 0.6885, + 0.667, + 0.639, + 0.6545, + 0.647, + 0.6855, + 0.6465, + 0.6645, + 0.6715, + 0.63, + 0.655, + 0.63, + 0.6585, + 0.666, + 0.664, + 0.64, + 0.641, + 0.632, + 0.6545, + 0.6605, + 0.6435, + 0.602, + 0.6495, + 0.6465, + 0.6625, + 0.64, + 0.6735, + 0.654, + 0.6435, + 0.612, + 0.621, + 0.6465, + 0.6645, + 0.656, + 0.663, + 0.636, + 0.639, + 0.647, + 0.662, + 0.654, + 0.646, + 0.6435, + 0.662, + 0.6725, + 0.6515, + 0.6605, + 0.6575, + 0.6595, + 0.6725, + 0.665, + 0.656, + 0.668, + 0.67, + 0.66, + 0.6705, + 0.664, + 0.67, + 0.671, + 0.6665, + 0.666, + 0.667, + 0.6685, + 0.6665, + 0.67, + 0.6705, + 0.6695, + 0.67 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.006531993858516216, + 0.06646430492401123, + 0.03470785170793533, + 0.06075863167643547, + 0.08359120786190033, + 0.10361115634441376, + 0.07729409635066986, + 0.08058023452758789 + ], + "perturbation_rho": [ + -0.009454472921788692, + 0.027615420520305634, + 0.016344428062438965, + 0.07737872004508972, + 0.07998150587081909, + 0.10012705624103546, + 0.06766189634799957, + 0.10667626559734344 + ], + "nudging": { + "0.001": [ + 0.0007423138595186174, + -0.0004339630249887705, + -0.000128742161905393, + -0.00022700021509081125, + -0.00032891874434426427, + -0.0003692444588523358, + -0.0002555775863584131, + -0.0003090384416282177 + ], + "0.003": [ + 0.0022933646105229855, + -0.0012996066361665726, + -0.00038488200516439974, + -0.0006815677043050528, + -0.000985405407845974, + -0.001108917174860835, + -0.0007655198569409549, + -0.000927455781493336 + ], + "0.01": [ + 0.008429424837231636, + -0.004321999382227659, + -0.0012797827366739511, + -0.0022665630094707012, + -0.003274995367974043, + -0.0036867314483970404, + -0.0025471593253314495, + -0.0030862612184137106 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7888231441497802, + 0.9241861874580384, + 0.7240635061264038, + 0.7652610589981079, + 0.8191699273109436, + 0.8505851211547851, + 0.8939923881530761, + 0.9012255577087402, + 0.9081583255767822, + 0.9199252265930176, + 0.9214971921920776, + 0.9398935409545899, + 0.9513171270370483, + 0.9611785633087159, + 0.9746305106163025, + 0.9664869049072266, + 0.9556780141830444, + 0.9599577611923218, + 0.9653084876060486, + 0.9609654689788818, + 0.9881143209457397, + 0.9882149921417236, + 0.9909763618469238, + 0.9672609125137329, + 0.9692873673439026, + 0.9848963592529297, + 0.9834712471008301, + 0.9938116626739502, + 0.9761260354995728, + 0.9862309640884399, + 0.9964988097190857, + 0.9895741086959838, + 1.0031852451324463, + 0.9945528154373169, + 0.9938870990753174, + 0.9850039566040039, + 0.982766799736023, + 0.9940546441078186, + 0.9699371845245361, + 1.0030255681037903, + 0.9629069705963135, + 0.9917603145599365, + 0.9868170715332031, + 0.9635244643211365, + 0.9542290064811707, + 0.9522285627365112, + 0.959105701637268, + 0.9572865758895874, + 0.9609386156082154, + 0.9519588193893432, + 0.9662731432914734, + 0.9482017148971558, + 0.9449867942810058, + 0.9475737733840942, + 0.9366802082061768, + 0.9512895627021789, + 0.9357378484725952, + 0.9315478944778443, + 0.930592444229126, + 0.925588726234436, + 0.9228597645759582, + 0.918616138458252, + 0.920361442565918, + 0.9141858814239502, + 0.9206330242156983, + 0.912045624256134, + 0.9115395063400269, + 0.9120437767028808, + 0.9089287811756134, + 0.9052299271583557, + 0.9062120104789734, + 0.9052583214759826, + 0.903732003068924, + 0.9017038101196289, + 0.9016088019371032, + 0.900925235080719, + 0.9002337282180786, + 0.89950648021698, + 0.899344504737854, + 0.8991525621414185 + ], + "train_acc": [ + 0.3518, + 0.6507, + 0.7278, + 0.7221, + 0.7157, + 0.704, + 0.6837, + 0.6747, + 0.6723, + 0.672, + 0.6664, + 0.6583, + 0.6557, + 0.6516, + 0.6463, + 0.6463, + 0.6498, + 0.6501, + 0.6474, + 0.653, + 0.6426, + 0.6447, + 0.6445, + 0.6507, + 0.6485, + 0.6467, + 0.6437, + 0.6427, + 0.6479, + 0.6483, + 0.6431, + 0.6429, + 0.6416, + 0.6448, + 0.6449, + 0.646, + 0.6441, + 0.6436, + 0.6521, + 0.6445, + 0.6551, + 0.6524, + 0.6439, + 0.6597, + 0.6584, + 0.6558, + 0.6528, + 0.6547, + 0.6585, + 0.6601, + 0.6553, + 0.6599, + 0.6603, + 0.6637, + 0.6623, + 0.6554, + 0.6631, + 0.6682, + 0.6642, + 0.6686, + 0.6645, + 0.6711, + 0.672, + 0.6707, + 0.6677, + 0.6712, + 0.6738, + 0.6701, + 0.6731, + 0.6735, + 0.6748, + 0.6746, + 0.6743, + 0.6749, + 0.6778, + 0.6736, + 0.6769, + 0.676, + 0.6765, + 0.6766 + ], + "test_acc": [ + 0.58, + 0.696, + 0.719, + 0.706, + 0.6865, + 0.67, + 0.6525, + 0.648, + 0.639, + 0.622, + 0.626, + 0.6225, + 0.6215, + 0.628, + 0.612, + 0.628, + 0.6145, + 0.6255, + 0.6265, + 0.6135, + 0.6095, + 0.6135, + 0.621, + 0.6175, + 0.626, + 0.6125, + 0.6105, + 0.6065, + 0.604, + 0.599, + 0.5715, + 0.6055, + 0.5985, + 0.6065, + 0.616, + 0.6205, + 0.5945, + 0.6145, + 0.6205, + 0.62, + 0.61, + 0.619, + 0.609, + 0.6145, + 0.616, + 0.612, + 0.617, + 0.5945, + 0.6145, + 0.605, + 0.611, + 0.6145, + 0.6095, + 0.616, + 0.6075, + 0.6085, + 0.6185, + 0.6165, + 0.6155, + 0.6145, + 0.616, + 0.622, + 0.6225, + 0.6185, + 0.626, + 0.6225, + 0.6215, + 0.6255, + 0.622, + 0.626, + 0.6245, + 0.6255, + 0.628, + 0.625, + 0.628, + 0.6275, + 0.6295, + 0.629, + 0.6295, + 0.63 + ], + "state_pred_error": [ + 0.7095542505741119, + 0.2204969837665558, + 0.15315507028102876, + 0.1501929506778717, + 0.1680251207113266, + 0.18483844525814055, + 0.1927951848268509, + 0.18053169043064118, + 0.15416607925891876, + 0.13751740345954894, + 0.13204463099241256, + 0.137019335603714, + 0.14018229098320006, + 0.13985622874498368, + 0.13382404689788818, + 0.12563955969810486, + 0.11495544098615647, + 0.10729084681272506, + 0.0991292914390564, + 0.0913941947221756, + 0.08400755655765534, + 0.07665130922794341, + 0.06990957274436951, + 0.06544679455757141, + 0.06332790016531945, + 0.059688883173465726, + 0.05787863445281982, + 0.05242338265180588, + 0.04925893352627754, + 0.0445285712659359, + 0.03784902328848839, + 0.03432314455509186, + 0.03293032890856266, + 0.0331594014942646, + 0.033307562443614006, + 0.03299136911034584, + 0.033409500086307525, + 0.033616409802436825, + 0.03379755539298058, + 0.033649980002641675, + 0.032497336408495905, + 0.03118463564515114, + 0.02951844048500061, + 0.02854375030398369, + 0.026753420197963715, + 0.025368909916281702, + 0.024291560703516006, + 0.023437905433773994, + 0.022952947756648065, + 0.02232878315448761, + 0.02181797335743904, + 0.021106301710009576, + 0.020409608674049378, + 0.019760580214858055, + 0.019138308236002922, + 0.018568420615792273, + 0.01808371136188507, + 0.01727056083083153, + 0.016739256817102432, + 0.016109547036886215, + 0.015664903444051744, + 0.015091081549227238, + 0.014631217294931411, + 0.014197941839694977, + 0.013777997905015946, + 0.01357243129312992, + 0.013283110724389553, + 0.012890019401907921, + 0.012523587247729302, + 0.012299926532804966, + 0.012003950168192386, + 0.01177265168428421, + 0.011549191689491272, + 0.011507066878676414, + 0.011230636714398862, + 0.011101334499567747, + 0.010917466147243976, + 0.010862733283638954, + 0.010788837406039238, + 0.010658458246290683 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6138853430747986, + 0.41074037551879883, + 0.25203365087509155, + 0.20834164321422577, + 0.16624599695205688, + 0.15929004549980164, + 0.15449269115924835, + 0.175917387008667 + ], + "perturbation_rho": [ + 0.5534218549728394, + 0.3554393947124481, + 0.28831934928894043, + 0.1869889795780182, + 0.14766299724578857, + 0.176305890083313, + 0.1294843554496765, + 0.16089865565299988 + ], + "nudging": { + "0.001": [ + -0.015559096820652485, + -0.0017606341280043125, + -0.0007992807659320533, + -0.0006281178793869913, + -0.0004932679585181177, + -0.00045871903421357274, + -0.0004438266041688621, + -0.000502013775985688 + ], + "0.003": [ + -0.04605434834957123, + -0.005273702088743448, + -0.002395393792539835, + -0.0018838276155292988, + -0.0014792272122576833, + -0.0013755084946751595, + -0.0013307692715898156, + -0.0015053658280521631 + ], + "0.01": [ + -0.14630448818206787, + -0.017482426017522812, + -0.00796731747686863, + -0.006267632823437452, + -0.00492177763953805, + -0.00457757618278265, + -0.004429594613611698, + -0.00500995060428977 + ] + }, + "state_pred_error_per_layer": [ + 7478.478515625, + 1555.7657470703125, + 846.884521484375, + 607.9534301757812, + 659.867919921875, + 614.796630859375, + 546.969482421875, + 518.796142578125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.285308999633789, + 1.4970221282958984, + 0.9958043640136719, + 0.8577417706489563, + 0.7985360019683838, + 0.7742141094207764, + 0.7541868792533875, + 0.7383458856582642, + 0.7444160983085633, + 0.7699382993698121, + 0.7617377349853516, + 0.8131803276062012, + 0.8340744517326355, + 0.8096075185775757, + 0.8233888305664062, + 0.8715233425140381, + 0.8412395213127136, + 0.8587033317565917, + 0.9323606998443603, + 0.9511387075424195, + 0.9220583269119262, + 0.9964756969451904, + 1.047953590965271, + 1.1211483845710755, + 1.1204530166625977, + 1.0928433876991273, + 1.1379628707885743, + 1.1724885011672974, + 1.11281310005188, + 1.0867287273406983, + 1.1001608766555786, + 1.064141231918335, + 1.0878272228240966, + 1.1576579273223877, + 1.1238960628509522, + 1.1606859970092773, + 1.1523268983840942, + 1.1631495752334595, + 1.1449461145401, + 1.2007387851715088, + 1.1955321371078491, + 1.1975843044281005, + 1.2237273839950562, + 1.2380825258255004, + 1.2528655261993409, + 1.2506139860153198, + 1.2446461044311523, + 1.2601920402526856, + 1.260292972946167, + 1.2225133561134338, + 1.1815817672729492, + 1.1279201912879944, + 1.1294625114440917, + 1.126245882987976, + 1.1246654704093932, + 1.1226116451263428, + 1.1226808778762818, + 1.1285088397979737, + 1.134099857711792, + 1.1264239824295044, + 1.1293188371658325, + 1.1205401794433594, + 1.119812659072876, + 1.1148133518218994, + 1.1078978939056396, + 1.1084100891113282, + 1.1039220796585083, + 1.106314839553833, + 1.1013267883300781, + 1.0988227684020997, + 1.0977583408355713, + 1.101661016845703, + 1.0976945793151855, + 1.1002184070587158, + 1.099597325706482, + 1.0982094870567323, + 1.098354042339325, + 1.0976181301116943, + 1.0973274658203125, + 1.0970626482963561 + ], + "train_acc": [ + 0.1665, + 0.4746, + 0.6308, + 0.6803, + 0.7017, + 0.7154, + 0.7205, + 0.7292, + 0.73, + 0.7237, + 0.7274, + 0.7147, + 0.7123, + 0.7201, + 0.7199, + 0.7116, + 0.7175, + 0.7182, + 0.7036, + 0.7017, + 0.6986, + 0.6771, + 0.661, + 0.6447, + 0.6427, + 0.6598, + 0.6551, + 0.6497, + 0.6566, + 0.6492, + 0.6392, + 0.6489, + 0.6354, + 0.6221, + 0.6365, + 0.6315, + 0.6316, + 0.6282, + 0.6354, + 0.6243, + 0.6263, + 0.6224, + 0.6126, + 0.613, + 0.6049, + 0.6047, + 0.5997, + 0.5934, + 0.5851, + 0.5892, + 0.5947, + 0.6053, + 0.6035, + 0.6011, + 0.6009, + 0.5983, + 0.5968, + 0.5938, + 0.5937, + 0.5964, + 0.5939, + 0.5953, + 0.5948, + 0.5983, + 0.6019, + 0.5955, + 0.5977, + 0.5985, + 0.5988, + 0.6014, + 0.6007, + 0.5982, + 0.6019, + 0.6017, + 0.6018, + 0.601, + 0.6003, + 0.6017, + 0.6011, + 0.6004 + ], + "test_acc": [ + 0.316, + 0.563, + 0.64, + 0.6705, + 0.6875, + 0.685, + 0.6855, + 0.695, + 0.6965, + 0.687, + 0.693, + 0.6385, + 0.68, + 0.6835, + 0.68, + 0.6845, + 0.6595, + 0.6695, + 0.648, + 0.6475, + 0.613, + 0.6205, + 0.617, + 0.6065, + 0.6275, + 0.6195, + 0.6055, + 0.625, + 0.6255, + 0.597, + 0.61, + 0.5655, + 0.592, + 0.577, + 0.5845, + 0.591, + 0.6035, + 0.6095, + 0.5905, + 0.5985, + 0.5995, + 0.5795, + 0.5785, + 0.5825, + 0.573, + 0.572, + 0.576, + 0.564, + 0.5665, + 0.5555, + 0.5655, + 0.5595, + 0.565, + 0.561, + 0.5715, + 0.5725, + 0.567, + 0.5575, + 0.566, + 0.559, + 0.5665, + 0.565, + 0.571, + 0.566, + 0.564, + 0.566, + 0.5705, + 0.569, + 0.572, + 0.5725, + 0.566, + 0.5685, + 0.5685, + 0.5695, + 0.571, + 0.5675, + 0.569, + 0.5695, + 0.569, + 0.5695 + ], + "value_loss": [ + 3.1271000915527343, + 0.9862023504257202, + 0.999002813911438, + 1.0425576148986817, + 1.0681012689590454, + 1.03996553068161, + 0.9741387175559998, + 0.9252232690811157, + 0.9215318450927734, + 1.0047331087112428, + 0.9920830215454102, + 1.0844781509399415, + 1.1991877380371094, + 1.1131661165237428, + 1.208943075942993, + 1.3144514158248901, + 1.2510551253318787, + 1.2366151815414428, + 1.4193125873565673, + 1.4414832863807678, + 1.234130789375305, + 1.1814983905792236, + 1.181002953338623, + 1.3016531824111939, + 1.1382783500671387, + 1.170673362350464, + 1.5918773588180541, + 1.2830027442932128, + 1.0921055715560912, + 1.0236657138824463, + 0.9862152492523193, + 0.849021138381958, + 0.9729941846847534, + 1.055552239227295, + 0.9573497166633606, + 0.979692142868042, + 0.8536088975906372, + 0.9205917440414428, + 0.9167158931732178, + 1.0006125350952149, + 0.9375052051544189, + 0.9362507380485535, + 0.8874157619476318, + 0.8648644126415252, + 0.9101438512802124, + 0.8190106260299682, + 0.8930434572219849, + 0.7672423245429992, + 0.7594193473815918, + 0.6917994091033935, + 0.6012004543304443, + 0.5240080141067505, + 0.5561031037807465, + 0.4888970242500305, + 0.45605546112060547, + 0.4390888867855072, + 0.43424798107147217, + 0.44492525901794433, + 0.43093778166770935, + 0.4075843402862549, + 0.41335898056030274, + 0.4024799570083618, + 0.4438731932640076, + 0.4120406524181366, + 0.3898531212806702, + 0.36487685375213624, + 0.4172193419456482, + 0.38758800344467165, + 0.34658458247184754, + 0.3497850526809692, + 0.34360920906066894, + 0.3693427942276001, + 0.34669516372680664, + 0.3415595028400421, + 0.3338581629753113, + 0.33175049436092374, + 0.32902164781093596, + 0.3372193983078003, + 0.34403223628997803, + 0.32433377566337585 + ], + "term_loss": [ + 1.7688616269111632, + 0.5567039131641388, + 0.7618842126846314, + 0.8274082384109497, + 0.8563696183204651, + 0.8081515713214874, + 0.7371555940628052, + 0.702651878452301, + 0.7090443038940429, + 0.7881656875610351, + 0.7814326080322266, + 0.8664573314666748, + 0.9778367706298828, + 0.8968942291259766, + 0.9918186021804809, + 1.08866188955307, + 1.0337607520103456, + 1.0145263776779174, + 1.178224391078949, + 1.1919040661811828, + 0.9849708090305328, + 0.8907354804992675, + 0.8850929956436158, + 0.9636733260154724, + 0.8116515071868896, + 0.8471049592018127, + 1.2205944297790527, + 0.9197152666568756, + 0.730262474155426, + 0.6721193412780762, + 0.6394133093833924, + 0.5264073338508606, + 0.6090341857910156, + 0.6560073004722595, + 0.5808387887001037, + 0.6305022970199585, + 0.5382268703460693, + 0.608380263376236, + 0.6007443336486816, + 0.6557021521091461, + 0.5751603908538818, + 0.5770105336666107, + 0.5359605489730835, + 0.5291802062988281, + 0.573161884689331, + 0.5040334848880768, + 0.5644822202682495, + 0.46114305610656736, + 0.4538517463684082, + 0.402396319103241, + 0.3250580922603607, + 0.2615281641483307, + 0.29292033083438873, + 0.2369567009449005, + 0.20991090397834777, + 0.19518582130670548, + 0.19080099306106568, + 0.19688191146850587, + 0.18551543823480607, + 0.16424798595905304, + 0.16575304796695708, + 0.1589976065158844, + 0.19366324095726012, + 0.1671199806332588, + 0.15091914472579956, + 0.1298795120716095, + 0.169755113196373, + 0.14672498960494995, + 0.1157905509352684, + 0.11689144127368926, + 0.11296927728652954, + 0.13240787162780762, + 0.11255746988058091, + 0.10960722550153733, + 0.10443557546138764, + 0.10119444595873356, + 0.09986090980172158, + 0.10406229302883148, + 0.1090045433819294, + 0.09466714213788509 + ], + "bridge_loss": [ + 1.0573119517879341, + 0.15241351038217543, + 0.01608453490436077, + 0.0064939980387687685, + 0.00945009122788906, + 0.0323205705165863, + 0.04268855847716332, + 0.030068882912397385, + 0.01993687737584114, + 0.01725001146569848, + 0.013776662385463715, + 0.013469882538914681, + 0.014333608262240886, + 0.013788160926103592, + 0.015742842441797255, + 0.01819062510430813, + 0.017548553105443718, + 0.019768079090118407, + 0.027314204022288322, + 0.03441775139570236, + 0.038058071267604826, + 0.06389330162107945, + 0.0633503836274147, + 0.09107995666265488, + 0.08258416488170624, + 0.0874572071313858, + 0.13215684812664985, + 0.12343537128567696, + 0.12941908707618713, + 0.12270671548843384, + 0.11486915047168732, + 0.09825265907049179, + 0.13369894971847535, + 0.1591746563911438, + 0.14571076006889344, + 0.1132983045578003, + 0.08243037438392639, + 0.08029556272029877, + 0.08846713262796402, + 0.1103203533411026, + 0.1305971376657486, + 0.12747013745307922, + 0.11351788620948791, + 0.09815907695889473, + 0.09737673666477203, + 0.0758411329627037, + 0.08800876551866531, + 0.06460359013080597, + 0.06309500212669372, + 0.05380393154621124, + 0.0478264770925045, + 0.04128478689193726, + 0.042341444367170335, + 0.03188926424384117, + 0.025954529893398286, + 0.025412592981755733, + 0.02477064228951931, + 0.028199707794189455, + 0.025668095329403878, + 0.02380155615210533, + 0.02794931230545044, + 0.024946860378980636, + 0.0320184164583683, + 0.02804033151268959, + 0.023456422537565233, + 0.019551472708582877, + 0.03227331275343895, + 0.025733040750026703, + 0.016958685997128485, + 0.019350963592529295, + 0.017583922302722932, + 0.023359004205465318, + 0.021352820153534412, + 0.018858864906430243, + 0.017002299439907075, + 0.018063389497995377, + 0.01701616567224264, + 0.02123323907852173, + 0.023313335365056993, + 0.018076158130913973 + ], + "tgrad_loss": [ + 0.300926530790329, + 0.27708493127822875, + 0.2210340663909912, + 0.20865537734031678, + 0.2022815556526184, + 0.19949339275360106, + 0.19429456148147584, + 0.19250250487327575, + 0.1925506702899933, + 0.19931740417480467, + 0.19687375478744507, + 0.20455093593597412, + 0.20701736421585082, + 0.2024837209701538, + 0.20138162145614624, + 0.20759890670776368, + 0.19974581598043442, + 0.20232072179317476, + 0.21377399282455445, + 0.21516146430969238, + 0.21110190229415893, + 0.22686960439682008, + 0.2325595742225647, + 0.24689988670349122, + 0.24404268040657043, + 0.23611119108200074, + 0.2391260844707489, + 0.23985210418701172, + 0.2324240131855011, + 0.2288396686077118, + 0.23193279480934142, + 0.2243611490726471, + 0.23026104683876036, + 0.24037028608322145, + 0.23080016889572144, + 0.23589155068397522, + 0.23295164408683777, + 0.23191592471599579, + 0.22750442996025086, + 0.2345900161266327, + 0.23174768257141112, + 0.23177007055282592, + 0.23793732562065126, + 0.23752512764930725, + 0.23960522780418397, + 0.23913600816726685, + 0.24055246658325194, + 0.2414956763267517, + 0.24247259407043456, + 0.2355991590976715, + 0.22831588366031647, + 0.2211950572013855, + 0.2208413278579712, + 0.2200510561466217, + 0.22019002876281737, + 0.21849047474861144, + 0.21867634949684142, + 0.21984363961219788, + 0.21975424647331238, + 0.21953480105400086, + 0.21965661954879762, + 0.2185354926586151, + 0.21819153480529785, + 0.2168803418636322, + 0.21547755289077758, + 0.21544586992263795, + 0.21519091215133668, + 0.215129975605011, + 0.2138353454589844, + 0.21354264924526214, + 0.21305600986480713, + 0.21357592091560365, + 0.21278487405776977, + 0.21309341056346892, + 0.21242028739452362, + 0.21249265823364258, + 0.2121445729970932, + 0.21192386741638183, + 0.2117143608570099, + 0.21159047515392304 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.08390675485134125, + 0.2993828356266022, + 0.37482553720474243, + 0.3876585066318512, + 0.3966418504714966, + 0.3863479495048523, + 0.3938036561012268, + 0.39385986328125 + ], + "perturbation_rho": [ + 0.09506039321422577, + 0.3888479173183441, + 0.42724472284317017, + 0.5000925064086914, + 0.4708487391471863, + 0.47097086906433105, + 0.48436442017555237, + 0.4723408818244934 + ], + "nudging": { + "0.001": [ + -0.0027529560029506683, + -0.0023121805861592293, + -0.0022948652040213346, + -0.0022791987285017967, + -0.0022901692427694798, + -0.0022190851159393787, + -0.0022319701965898275, + -0.002243783324956894 + ], + "0.003": [ + -0.008236072957515717, + -0.006927105598151684, + -0.00687650078907609, + -0.006829372141510248, + -0.006862659007310867, + -0.0066499970853328705, + -0.006688036024570465, + -0.006723873317241669 + ], + "0.01": [ + -0.027181372046470642, + -0.02298363298177719, + -0.02282092720270157, + -0.022664468735456467, + -0.02277727797627449, + -0.02207607962191105, + -0.022199643775820732, + -0.02231789380311966 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L8_s42.json b/results/synth_ladder_v2_hi/synth_a1.0_L8_s42.json new file mode 100644 index 0000000..c5d8746 --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L8_s42.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.3703768091201782, + 0.6740123039245606, + 0.5613458353042603, + 0.5279877727508545, + 0.42555175495147707, + 0.4008464940071106, + 0.3418552673816681, + 0.3169305899143219, + 0.2989230684995651, + 0.22381072659492493, + 0.24954671635627745, + 0.18852242698669433, + 0.17931302828788756, + 0.15236511628627777, + 0.14625489993095397, + 0.08793083952665329, + 0.0944634979724884, + 0.06237407035827637, + 0.10902504413723946, + 0.05045343590974808, + 0.05675933723151684, + 0.030447202077507972, + 0.017234644067287447, + 0.015850160157680513, + 0.020682270124554633, + 0.011260225063562394, + 0.008402103558182716, + 0.006454302641004324, + 0.0056301679342985154, + 0.005158279886841774, + 0.0048245771206915375, + 0.00440153166204691, + 0.004052742725610733, + 0.003818019072525203, + 0.003542347052693367, + 0.003333687162399292, + 0.00319532755613327, + 0.0030527794640511276, + 0.0028776524614542724, + 0.002738851569220424, + 0.002615449556335807, + 0.0024998470187187196, + 0.00237983765527606, + 0.0022845500905066727, + 0.002204404693841934, + 0.002141781159862876, + 0.002064352393895388, + 0.0019999265871942042, + 0.001937351893261075, + 0.0018773890499025584, + 0.0018315334113314747, + 0.0017837765011005104, + 0.0017335505589842796, + 0.0017015570227056742, + 0.0016626481765881181, + 0.0016315237021073698, + 0.001601293208822608, + 0.0015703001253306865, + 0.0015464611501432954, + 0.0015225628331303597, + 0.0015008840339258314, + 0.0014787248853594065, + 0.001461056488007307, + 0.0014460599626414479, + 0.0014304681217297912, + 0.0014166310345754027, + 0.001404330819286406, + 0.001393687280640006, + 0.0013846246616914869, + 0.0013766696255654097, + 0.0013697378845885396, + 0.0013638495333492756, + 0.0013587745733559132, + 0.0013546861404553055, + 0.0013515702040866016, + 0.0013490962450392544, + 0.0013473950270563365, + 0.0013461836755275726, + 0.0013454901657998562, + 0.001345112643018365 + ], + "train_acc": [ + 0.5176, + 0.7374, + 0.7823, + 0.7897, + 0.8383, + 0.8471, + 0.8716, + 0.8776, + 0.8863, + 0.9211, + 0.9088, + 0.935, + 0.9374, + 0.9488, + 0.9488, + 0.976, + 0.9719, + 0.9873, + 0.9681, + 0.9892, + 0.9856, + 0.9951, + 0.9994, + 0.999, + 0.9969, + 0.9998, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.704, + 0.7445, + 0.748, + 0.76, + 0.76, + 0.76, + 0.767, + 0.7675, + 0.7675, + 0.7645, + 0.766, + 0.764, + 0.7615, + 0.7595, + 0.759, + 0.77, + 0.7635, + 0.769, + 0.759, + 0.756, + 0.7615, + 0.7645, + 0.7665, + 0.767, + 0.7615, + 0.768, + 0.7655, + 0.767, + 0.769, + 0.7655, + 0.7645, + 0.7645, + 0.7645, + 0.7645, + 0.766, + 0.766, + 0.764, + 0.765, + 0.7665, + 0.7655, + 0.765, + 0.7635, + 0.765, + 0.764, + 0.763, + 0.764, + 0.7625, + 0.762, + 0.7625, + 0.762, + 0.7635, + 0.7635, + 0.7625, + 0.7635, + 0.764, + 0.764, + 0.764, + 0.762, + 0.7625, + 0.7625, + 0.7635, + 0.7625, + 0.7625, + 0.7625, + 0.763, + 0.763, + 0.7635, + 0.7635, + 0.762, + 0.7625, + 0.763, + 0.7625, + 0.763, + 0.763, + 0.763, + 0.763, + 0.763, + 0.763, + 0.763, + 0.763 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.85625159740448, + 0.8527897596359253, + 0.847720742225647, + 0.8408411145210266, + 0.831807017326355, + 0.8158122301101685, + 0.7960221171379089, + 0.7814224362373352 + ], + "perturbation_rho": [ + 0.999999463558197, + 0.9999992847442627, + 0.9999988079071045, + 0.9999978542327881, + 0.999994695186615, + 0.9999883770942688, + 0.9999692440032959, + 0.9999352693557739 + ], + "nudging": { + "0.001": [ + -0.06596626341342926, + -0.055192336440086365, + -0.04268433526158333, + -0.03002634271979332, + -0.019770411774516106, + -0.012638297863304615, + -0.00813499465584755, + -0.00550876185297966 + ], + "0.003": [ + -0.1898897886276245, + -0.16005799174308777, + -0.12479926645755768, + -0.08847799897193909, + -0.05861322209239006, + -0.03762739524245262, + -0.02428549900650978, + -0.01647210866212845 + ], + "0.01": [ + -0.5478029251098633, + -0.4737934172153473, + -0.3800549805164337, + -0.2769272029399872, + -0.18745023012161255, + -0.12213317304849625, + -0.07957549393177032, + -0.05427805706858635 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.231708497619629, + 1.418635772895813, + 0.943305676651001, + 0.8297181538581848, + 0.7659538966178894, + 0.7355367126464843, + 0.7249059216499328, + 0.7103497696876526, + 0.7056580327033997, + 0.7284941980361939, + 0.7514717527389526, + 0.7495575723648071, + 0.8143573719024658, + 0.7943916882514953, + 0.8353345689773559, + 0.8233354604721069, + 0.8139635746955871, + 0.8670068431854248, + 0.8794054039955139, + 0.8576095231056213, + 0.8653796346664429, + 0.8882027687072754, + 0.882841535949707, + 0.8668330222129822, + 0.9123839077949524, + 0.8965684688568115, + 0.9347959500312805, + 0.9114629460334778, + 1.0174331352233887, + 1.0257655752182007, + 0.9572873649597168, + 0.9571795852661132, + 0.955192239189148, + 0.9428499357223511, + 0.9694318241119385, + 0.9648013277053833, + 0.9437480949401855, + 1.0161491086006165, + 0.9801935592651367, + 1.0127256759643555, + 0.9624169521331787, + 0.9303661527633666, + 0.9537605016708374, + 0.9153729921340943, + 0.9333063995361328, + 0.9985080844879151, + 0.9437879688262939, + 0.9058924737930298, + 0.9471581097126007, + 0.9148890993118286, + 0.9394946533441544, + 0.8862299453735352, + 0.9382994981765747, + 0.8954874497413635, + 0.8906831897735595, + 0.884014150428772, + 0.884524594116211, + 0.8859518936157227, + 0.8956645541667938, + 0.8656166372299194, + 0.8735888675689697, + 0.861944951248169, + 0.8634599599838256, + 0.8558167356491089, + 0.844254759979248, + 0.8468807869911193, + 0.8440567171096802, + 0.84414446849823, + 0.837095554637909, + 0.835498137664795, + 0.8313182315826416, + 0.828638949584961, + 0.8268064447402954, + 0.8259873526573182, + 0.8236354766845703, + 0.8209153217315673, + 0.8198824878692627, + 0.8184344896316529, + 0.8179562203884124, + 0.8174484502792358 + ], + "train_acc": [ + 0.1815, + 0.5159, + 0.651, + 0.6912, + 0.7167, + 0.7262, + 0.7308, + 0.7384, + 0.741, + 0.7376, + 0.7324, + 0.7328, + 0.7159, + 0.7239, + 0.7173, + 0.7224, + 0.7268, + 0.7175, + 0.715, + 0.7155, + 0.7135, + 0.7083, + 0.7079, + 0.7222, + 0.7109, + 0.7127, + 0.705, + 0.7133, + 0.691, + 0.6908, + 0.7041, + 0.7043, + 0.7034, + 0.7046, + 0.6986, + 0.7039, + 0.7053, + 0.6985, + 0.6989, + 0.6932, + 0.7021, + 0.7058, + 0.7036, + 0.7103, + 0.7038, + 0.694, + 0.7059, + 0.7157, + 0.7038, + 0.7053, + 0.6982, + 0.7145, + 0.7049, + 0.7129, + 0.7097, + 0.714, + 0.7158, + 0.7144, + 0.709, + 0.7129, + 0.7151, + 0.718, + 0.7154, + 0.7205, + 0.7183, + 0.7192, + 0.7212, + 0.719, + 0.7204, + 0.7232, + 0.7219, + 0.7235, + 0.7222, + 0.7244, + 0.725, + 0.7229, + 0.7241, + 0.7237, + 0.724, + 0.7242 + ], + "test_acc": [ + 0.37, + 0.5725, + 0.639, + 0.6635, + 0.684, + 0.6775, + 0.7075, + 0.705, + 0.682, + 0.6865, + 0.673, + 0.6715, + 0.661, + 0.652, + 0.679, + 0.6745, + 0.6695, + 0.655, + 0.666, + 0.6525, + 0.6585, + 0.636, + 0.6565, + 0.654, + 0.662, + 0.6365, + 0.641, + 0.6285, + 0.5975, + 0.646, + 0.6565, + 0.65, + 0.649, + 0.6255, + 0.631, + 0.654, + 0.635, + 0.6255, + 0.6485, + 0.6345, + 0.6385, + 0.6355, + 0.628, + 0.6475, + 0.6405, + 0.63, + 0.649, + 0.6375, + 0.656, + 0.6335, + 0.64, + 0.637, + 0.6515, + 0.6585, + 0.6535, + 0.6565, + 0.656, + 0.6415, + 0.658, + 0.6475, + 0.6555, + 0.6595, + 0.651, + 0.6525, + 0.654, + 0.657, + 0.652, + 0.6495, + 0.655, + 0.6595, + 0.656, + 0.656, + 0.652, + 0.658, + 0.656, + 0.658, + 0.658, + 0.658, + 0.6565, + 0.657 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.01574046164751053, + 0.07191511988639832, + 0.043905604630708694, + 0.07308061420917511, + 0.07518148422241211, + 0.026394926011562347, + 0.06854978203773499, + 0.03262286260724068 + ], + "perturbation_rho": [ + -0.02709903195500374, + 0.1010747104883194, + 0.06438975036144257, + 0.07812117040157318, + 0.0766223892569542, + 0.026489075273275375, + 0.09218208491802216, + 0.010375358164310455 + ], + "nudging": { + "0.001": [ + 0.0007142307586036623, + -0.0005231229588389397, + -0.00022074897424317896, + -0.0003081119211856276, + -0.00031572216539643705, + -0.0001395478320773691, + -0.00030396669171750546, + -0.0001277559931622818 + ], + "0.003": [ + 0.002162146382033825, + -0.0015680594369769096, + -0.0006631950382143259, + -0.0009237516205757856, + -0.0009470301447436213, + -0.00041793263517320156, + -0.0009104788769036531, + -0.00038223061710596085 + ], + "0.01": [ + 0.007441862486302853, + -0.0052239359356462955, + -0.0022090799175202847, + -0.003076428547501564, + -0.0031523762736469507, + -0.0013899998739361763, + -0.0030318819917738438, + -0.0012708738213405013 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8269318895339965, + 1.0051976400375366, + 0.7789531414031983, + 0.7320484294891357, + 0.7566996850967407, + 0.8095570373535156, + 0.8494610660552978, + 0.867692116355896, + 0.9100590816497802, + 0.9440827163696289, + 0.9782439228057861, + 0.9932998554229736, + 1.019014867591858, + 1.0342318592071533, + 1.0291874648094177, + 1.0253695629119872, + 1.0212761486053468, + 0.9800823013305664, + 0.9683791316986085, + 0.9785815362930298, + 0.9862299140930175, + 0.996787068939209, + 0.9779501231193543, + 0.9745217691421508, + 0.9691826663970947, + 0.9746626880645752, + 0.9487684160232543, + 0.9371404664993286, + 0.9199271064758301, + 0.9334722229003907, + 0.9503546269416809, + 0.923910745048523, + 0.9474884466171265, + 0.9268602334976196, + 0.9206624788284302, + 0.92753564453125, + 0.9302853199005127, + 0.9186395662307739, + 0.9185600196838379, + 0.9253120166778565, + 0.9207821632385254, + 0.9409901829719544, + 0.9193793958663941, + 0.92328047580719, + 0.9343797274589538, + 0.9142894317626953, + 0.9160927310943604, + 0.9014208396911622, + 0.8922535416603088, + 0.8816746612548828, + 0.875530839920044, + 0.8770241296768189, + 0.8663126466751099, + 0.8592928192138672, + 0.8631654893875123, + 0.8535493013381958, + 0.8564054052352905, + 0.8476457886695862, + 0.8455490423202514, + 0.8474060085296631, + 0.8453507354736328, + 0.8386427994728088, + 0.8379946626663208, + 0.8355536317825317, + 0.8326087244987488, + 0.8301034708023072, + 0.830259226512909, + 0.8299130233764649, + 0.8300449360847473, + 0.8248954859733582, + 0.8260357536315918, + 0.8241482278823853, + 0.8238134614944458, + 0.8230488618850708, + 0.8220901975631714, + 0.8213789791107178, + 0.820764907169342, + 0.8205714824676513, + 0.8203490972518921, + 0.8202249536514282 + ], + "train_acc": [ + 0.3329, + 0.6247, + 0.7097, + 0.7227, + 0.7276, + 0.7099, + 0.6974, + 0.6846, + 0.6714, + 0.6626, + 0.6488, + 0.6489, + 0.6369, + 0.6372, + 0.6319, + 0.632, + 0.6355, + 0.6386, + 0.6513, + 0.6427, + 0.6492, + 0.6472, + 0.6511, + 0.6486, + 0.6528, + 0.6518, + 0.6585, + 0.6669, + 0.6679, + 0.6653, + 0.6613, + 0.6667, + 0.6646, + 0.6671, + 0.6709, + 0.6708, + 0.6729, + 0.6698, + 0.6707, + 0.6667, + 0.6706, + 0.6663, + 0.6722, + 0.6713, + 0.6656, + 0.6721, + 0.6725, + 0.6774, + 0.6753, + 0.6819, + 0.686, + 0.6821, + 0.6868, + 0.687, + 0.6869, + 0.6871, + 0.6879, + 0.6917, + 0.6921, + 0.6905, + 0.6907, + 0.6917, + 0.6916, + 0.6973, + 0.6978, + 0.6964, + 0.6952, + 0.6978, + 0.6953, + 0.6958, + 0.6938, + 0.6957, + 0.6958, + 0.6957, + 0.6977, + 0.6981, + 0.6966, + 0.6975, + 0.6972, + 0.6976 + ], + "test_acc": [ + 0.5265, + 0.678, + 0.71, + 0.7075, + 0.675, + 0.665, + 0.654, + 0.6415, + 0.6275, + 0.6325, + 0.622, + 0.611, + 0.5895, + 0.5935, + 0.5915, + 0.5865, + 0.6105, + 0.6065, + 0.618, + 0.607, + 0.612, + 0.6175, + 0.609, + 0.615, + 0.6155, + 0.617, + 0.619, + 0.626, + 0.6165, + 0.615, + 0.622, + 0.633, + 0.6425, + 0.6285, + 0.6315, + 0.629, + 0.6235, + 0.63, + 0.6265, + 0.633, + 0.6165, + 0.627, + 0.6225, + 0.6145, + 0.6265, + 0.623, + 0.625, + 0.616, + 0.6225, + 0.628, + 0.6305, + 0.6375, + 0.6365, + 0.636, + 0.635, + 0.6425, + 0.6325, + 0.6285, + 0.6305, + 0.6385, + 0.638, + 0.64, + 0.6425, + 0.6405, + 0.644, + 0.646, + 0.6455, + 0.646, + 0.643, + 0.644, + 0.648, + 0.648, + 0.6505, + 0.65, + 0.647, + 0.6485, + 0.648, + 0.6485, + 0.649, + 0.65 + ], + "state_pred_error": [ + 0.7002311863422394, + 0.22084679579734803, + 0.15376953585147857, + 0.1484843623161316, + 0.15982647223472596, + 0.1811715921163559, + 0.1945667941093445, + 0.20176007509231567, + 0.20261625909805298, + 0.19124769098758698, + 0.18218962874412536, + 0.1763947120666504, + 0.17245661504268647, + 0.1630336755514145, + 0.15171641788482665, + 0.14321954603195192, + 0.13387794542312623, + 0.12238948247432709, + 0.11191521211862564, + 0.10725419701337814, + 0.10254445215463638, + 0.09755742149353028, + 0.09333524917364121, + 0.08919921718835831, + 0.08560046610832214, + 0.08166285650730133, + 0.07877540134191513, + 0.07652937555313111, + 0.0737526822566986, + 0.07185606707334519, + 0.07086474553346633, + 0.06932573999166489, + 0.06812271840572358, + 0.06726093112230301, + 0.06480677745938301, + 0.06218134503364563, + 0.06057768109440804, + 0.05787591310143471, + 0.05514800155162811, + 0.05402169469594956, + 0.053021151185035705, + 0.0528799110531807, + 0.05364514610171318, + 0.05383548038005829, + 0.05424729347229004, + 0.052925097239017484, + 0.051881495702266696, + 0.050513546645641325, + 0.05008096670508385, + 0.04856216832399368, + 0.047455233627557755, + 0.0464736877143383, + 0.04560171290636063, + 0.044719690442085264, + 0.04401536261439323, + 0.0430379842877388, + 0.042287754344940184, + 0.04157426287531853, + 0.041074179071187975, + 0.039926473212242124, + 0.03941906256079674, + 0.03929359982609749, + 0.03810683597326279, + 0.03805391449332237, + 0.03690763158798218, + 0.03655427814722061, + 0.0361525127530098, + 0.035647189819812776, + 0.03503355433940888, + 0.03485284671187401, + 0.03406067345738411, + 0.03359544692635536, + 0.0335003142118454, + 0.03281750077009201, + 0.032709699648618695, + 0.03246098607182503, + 0.032299374321103094, + 0.03149260161221027, + 0.03101077135503292, + 0.031075275203585623 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6320836544036865, + 0.4503885507583618, + 0.22882479429244995, + 0.17507168650627136, + 0.15456035733222961, + 0.15327030420303345, + 0.14079461991786957, + 0.1386653482913971 + ], + "perturbation_rho": [ + 0.5491607189178467, + 0.3870346248149872, + 0.23711450397968292, + 0.15141981840133667, + 0.12508505582809448, + 0.15914584696292877, + 0.13365353643894196, + 0.11637556552886963 + ], + "nudging": { + "0.001": [ + -0.02009502425789833, + -0.0022013955749571323, + -0.000710347609128803, + -0.0005365170654840767, + -0.0004632421478163451, + -0.0004581586108542979, + -0.00041777893784455955, + -0.00040680408710613847 + ], + "0.003": [ + -0.05951227992773056, + -0.006594196427613497, + -0.002129881177097559, + -0.0016088619595393538, + -0.0013889807742089033, + -0.0013738160487264395, + -0.0012525597121566534, + -0.001220083562657237 + ], + "0.01": [ + -0.18924641609191895, + -0.02186501771211624, + -0.007085676770657301, + -0.0053551034070551395, + -0.00462403055280447, + -0.004574076272547245, + -0.004170445259660482, + -0.004062457010149956 + ] + }, + "state_pred_error_per_layer": [ + 9406.7255859375, + 1991.255126953125, + 1233.173095703125, + 996.4456787109375, + 824.75537109375, + 800.2864990234375, + 821.3734130859375, + 840.202392578125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.232960743522644, + 1.420582393836975, + 0.9455811813354492, + 0.8257486240386963, + 0.7836144889831543, + 0.7402769828796387, + 0.729928002166748, + 0.7208036253929139, + 0.7297886791229248, + 0.7470350498199463, + 0.7721688493728638, + 0.7637209308624268, + 0.7816214589595795, + 0.7835877867221832, + 0.8151798434257508, + 0.8235684534072876, + 0.8353915449142456, + 0.9103365058898926, + 0.8753420095443726, + 0.8804965543746949, + 0.8581397535324097, + 0.8739657152175904, + 0.9016903800964355, + 0.990748242855072, + 0.9614215970993042, + 0.9776799642562867, + 0.9315557836532593, + 1.0852978912353515, + 1.141357445335388, + 1.0584074115753175, + 1.1172573081970214, + 1.2589679100036621, + 1.2367329082489014, + 1.23497767162323, + 1.190962762260437, + 1.2603005590438843, + 1.3260346855163574, + 1.3029141501426698, + 1.3730133871078491, + 1.389457112121582, + 1.410658281326294, + 1.3981717176437378, + 1.386588328552246, + 1.4026400897979736, + 1.364222408103943, + 1.352792622756958, + 1.3398897926330566, + 1.3449722723007203, + 1.3795583543777465, + 1.3794076923370362, + 1.3593113542556763, + 1.3827865106582642, + 1.4238173538208008, + 1.4441098989486694, + 1.3864106082916259, + 1.3831024318695069, + 1.3302570987701416, + 1.3178522941589355, + 1.3111997756958007, + 1.294492097091675, + 1.2957700435638428, + 1.2821458141326905, + 1.2766342969894409, + 1.270096806907654, + 1.2705438976287842, + 1.2668931608200074, + 1.2661620328903198, + 1.265557067680359, + 1.2638321792602538, + 1.2624110040664673, + 1.2631232545852662, + 1.258963946914673, + 1.2560675323486328, + 1.2551779272079469, + 1.2541378360748292, + 1.2531858157157898, + 1.2520371969223023, + 1.2515714080810547, + 1.251167310333252, + 1.2510119449615478 + ], + "train_acc": [ + 0.182, + 0.5116, + 0.6517, + 0.6921, + 0.708, + 0.7264, + 0.7306, + 0.7382, + 0.7317, + 0.731, + 0.7285, + 0.7313, + 0.7261, + 0.7293, + 0.7186, + 0.722, + 0.7219, + 0.7014, + 0.7063, + 0.7082, + 0.707, + 0.7001, + 0.6881, + 0.6614, + 0.6594, + 0.6525, + 0.6624, + 0.6161, + 0.6072, + 0.6145, + 0.5943, + 0.5501, + 0.554, + 0.5531, + 0.5665, + 0.5428, + 0.5238, + 0.5234, + 0.5168, + 0.5069, + 0.4863, + 0.5042, + 0.5041, + 0.4991, + 0.5112, + 0.5147, + 0.5196, + 0.5155, + 0.5037, + 0.5052, + 0.5158, + 0.5056, + 0.497, + 0.4917, + 0.5062, + 0.5071, + 0.5237, + 0.5225, + 0.5219, + 0.5364, + 0.5279, + 0.5373, + 0.5397, + 0.5403, + 0.5423, + 0.5425, + 0.5422, + 0.5421, + 0.5412, + 0.5445, + 0.5421, + 0.5432, + 0.5468, + 0.5464, + 0.5471, + 0.5477, + 0.548, + 0.5478, + 0.5477, + 0.5484 + ], + "test_acc": [ + 0.3665, + 0.5675, + 0.6405, + 0.6575, + 0.6705, + 0.697, + 0.69, + 0.708, + 0.7, + 0.6855, + 0.6895, + 0.679, + 0.689, + 0.671, + 0.686, + 0.672, + 0.647, + 0.647, + 0.662, + 0.648, + 0.652, + 0.649, + 0.6015, + 0.577, + 0.592, + 0.632, + 0.5725, + 0.4715, + 0.503, + 0.554, + 0.4985, + 0.4535, + 0.4465, + 0.5365, + 0.508, + 0.48, + 0.48, + 0.39, + 0.399, + 0.4295, + 0.417, + 0.4325, + 0.406, + 0.4525, + 0.461, + 0.46, + 0.494, + 0.4075, + 0.429, + 0.484, + 0.4755, + 0.4765, + 0.4635, + 0.4615, + 0.464, + 0.479, + 0.47, + 0.494, + 0.4885, + 0.4925, + 0.4965, + 0.5015, + 0.5045, + 0.51, + 0.4995, + 0.509, + 0.503, + 0.5125, + 0.506, + 0.5165, + 0.512, + 0.507, + 0.511, + 0.514, + 0.511, + 0.5155, + 0.5145, + 0.515, + 0.5165, + 0.5165 + ], + "value_loss": [ + 3.063135040283203, + 0.9178804653167725, + 1.0234842987060546, + 1.1325440734863281, + 1.1635567161560059, + 1.084977388381958, + 0.9335860944747925, + 0.8856829252243043, + 0.9029004842758178, + 0.9281125900268554, + 1.0018171398162843, + 0.9197395215988159, + 0.9605137948989868, + 0.9333957103729248, + 0.9645775228500366, + 1.000026789855957, + 0.9733592803955078, + 1.0830778367042542, + 0.9194553695678711, + 0.917877451992035, + 0.754574672961235, + 0.7473849777221679, + 0.760665825843811, + 0.8724378496170044, + 0.7502632125854493, + 0.8110419334411622, + 0.6086162291526794, + 0.8276397277832032, + 1.0285220121383667, + 0.6005109428405762, + 0.8579624128341675, + 0.8123299127578736, + 0.6401672322273254, + 0.7736768434524536, + 0.6747624232769013, + 0.509700684595108, + 0.6056561064720154, + 0.6021059381961823, + 0.6918458218574524, + 0.7592935428619385, + 0.7403267482757568, + 0.594590943145752, + 0.5076187595367432, + 0.589847268486023, + 0.6413895493507386, + 0.5144407531738281, + 0.4514115423679352, + 0.5254093447685242, + 0.4945307634830475, + 0.49715064158439637, + 0.5229528147697449, + 0.4919383934020996, + 0.5279038127899169, + 0.5955624567031861, + 0.484116339302063, + 0.48801227164268496, + 0.4493190938949585, + 0.4401164185523987, + 0.41058427753448484, + 0.4015273964881897, + 0.38259989376068115, + 0.3977900302886963, + 0.3736837770462036, + 0.38537446489334104, + 0.41789057059288026, + 0.3799989566802979, + 0.4289457809448242, + 0.37526923496723175, + 0.3512410442829132, + 0.3536668284416199, + 0.3485133903503418, + 0.3410946590900421, + 0.353677539396286, + 0.36449949283599853, + 0.35570076990127564, + 0.3507022621154785, + 0.3628367488861084, + 0.3334844871520996, + 0.33962156491279605, + 0.35056146993637083 + ], + "term_loss": [ + 1.7380315342903137, + 0.522208710193634, + 0.7970712635040283, + 0.9268595787048339, + 0.963915803527832, + 0.8737848152160644, + 0.7096522349834442, + 0.6905156551361084, + 0.717272045135498, + 0.7419232294082642, + 0.8111855196475982, + 0.7332462784767151, + 0.7724072788238525, + 0.7451452328681946, + 0.7710176473617554, + 0.8040578945159912, + 0.7748076803684235, + 0.8724104147434235, + 0.7111417359352111, + 0.708936474943161, + 0.5438156430184841, + 0.5117625785827636, + 0.5003676904678345, + 0.5760292330741882, + 0.4542557261943817, + 0.5189919714927673, + 0.3221183834314346, + 0.5177541013717651, + 0.6817261950492859, + 0.3209350066184998, + 0.5049364763259888, + 0.4522950346469879, + 0.32609601502418517, + 0.43547215032577513, + 0.35757653040885923, + 0.21219050855636595, + 0.2881464541435242, + 0.2884611166834831, + 0.3724199409008026, + 0.4170766181945801, + 0.39002414054870604, + 0.2564110339283943, + 0.18429851140975953, + 0.2539124309062958, + 0.30265880492925645, + 0.19822253029346465, + 0.14195171850919724, + 0.20319455585479737, + 0.1759055587053299, + 0.18195768083333969, + 0.20568956186771392, + 0.18406356749534608, + 0.2139556656241417, + 0.27537979845404625, + 0.18222865467071533, + 0.18534576222896576, + 0.1560566021680832, + 0.1466648970603943, + 0.12159120118618011, + 0.11602592898607254, + 0.10063835277557373, + 0.11672715072631835, + 0.09764246659278869, + 0.10889123477935791, + 0.1363328471660614, + 0.10446722288131714, + 0.14478881199359894, + 0.10136622951179743, + 0.08094131415486336, + 0.0810381259918213, + 0.0765758816510439, + 0.07205680896639824, + 0.08189015170931815, + 0.09137738156318664, + 0.08255635949671268, + 0.08009501400589943, + 0.087424889087677, + 0.06630494102239609, + 0.07004760477542878, + 0.0784306697010994 + ], + "bridge_loss": [ + 1.0358692544909136, + 0.13155127784013748, + 0.013771739280223846, + 0.006167022878676653, + 0.010226642233133316, + 0.03349325300455094, + 0.051338992768526076, + 0.025331524658203125, + 0.015777216017246246, + 0.016127415639162063, + 0.016217421828210354, + 0.014605749247968198, + 0.014789033402502537, + 0.016496201342344283, + 0.017412009951472282, + 0.020229191905260086, + 0.0237046923160553, + 0.02550773705840111, + 0.02643321447297931, + 0.02973362688422203, + 0.035443501433730124, + 0.05561487289965153, + 0.07549205500483513, + 0.09634782196283341, + 0.09850893812179566, + 0.09041237454414368, + 0.09321520891189575, + 0.09043479615449905, + 0.11861175520420074, + 0.05878040784597397, + 0.12119050502181053, + 0.10563623140454292, + 0.06031600506305695, + 0.08450027232170106, + 0.06857655513882636, + 0.03640015028715134, + 0.046798882389068604, + 0.0454333637714386, + 0.04170687899589538, + 0.059792518198490144, + 0.06378642410039902, + 0.05276329394876957, + 0.038991385126113894, + 0.04724101865887642, + 0.05553500943779945, + 0.03707851017713547, + 0.03180363908410072, + 0.04299691360294819, + 0.034361545622348784, + 0.03207299547791481, + 0.03789413919746876, + 0.025696152359247208, + 0.02592012819647789, + 0.030018769443035127, + 0.020179891040921213, + 0.021297355365753175, + 0.019295803980529307, + 0.02125145290493965, + 0.018039992034435272, + 0.017231546019017698, + 0.012940341040492059, + 0.01530613884627819, + 0.010978435875475407, + 0.012805462521314622, + 0.018135536977648734, + 0.012616378632187843, + 0.021419661676883698, + 0.01140245101414621, + 0.008457917086780072, + 0.011216394200921059, + 0.01065029435157776, + 0.00871082552820444, + 0.012181823249161243, + 0.013980842983722687, + 0.014248662017285824, + 0.012093166401982307, + 0.01729309495687485, + 0.009371091036498547, + 0.012113781988620759, + 0.0149920065253973 + ], + "tgrad_loss": [ + 0.28923423657417296, + 0.26412047119140625, + 0.21264128952026368, + 0.19951747903823852, + 0.18941426134109496, + 0.17769930906295775, + 0.17259486656188966, + 0.1698357372522354, + 0.16985121915340423, + 0.1700619439125061, + 0.17441420325040818, + 0.17188749091625213, + 0.17331748073101044, + 0.17175427423715592, + 0.1761478721141815, + 0.17573970379829407, + 0.17484690184593202, + 0.18515969462394713, + 0.18188041653633116, + 0.1792073583960533, + 0.17531552555561067, + 0.18000752310752868, + 0.18480607998371124, + 0.2000607961177826, + 0.19749854352474214, + 0.2016375789642334, + 0.19328263318538666, + 0.21945083560943604, + 0.22818406176567077, + 0.22079553413391112, + 0.23183543071746826, + 0.25439864926338196, + 0.2537552054405212, + 0.25370441846847536, + 0.24860933825969697, + 0.26111002612113954, + 0.27071076798439025, + 0.2682114581108093, + 0.2777190034866333, + 0.2824244068145752, + 0.286516183757782, + 0.28541661281585695, + 0.2843288654327393, + 0.28869381036758424, + 0.2831957377195358, + 0.27913971424102785, + 0.27765617990493774, + 0.2792178776741028, + 0.28426365900039674, + 0.2831199683666229, + 0.27936911489963534, + 0.2821786761760712, + 0.2880280209541321, + 0.29016389510631563, + 0.28170779008865354, + 0.28136915550231933, + 0.2739666873455048, + 0.27220006723403933, + 0.270953081035614, + 0.26826992158889773, + 0.26902120203971863, + 0.2657567394733429, + 0.26506287517547605, + 0.2636777688503265, + 0.26342218379974364, + 0.2629153573989868, + 0.2627373068809509, + 0.26250055599212646, + 0.2618418116569519, + 0.2614123071670532, + 0.26128721523284915, + 0.26032702457904816, + 0.25960556111335753, + 0.2591412717103958, + 0.25889574670791626, + 0.2585140820503235, + 0.25811876544952395, + 0.2578084535598755, + 0.25746017999649046, + 0.25713879618644714 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.159218892455101, + 0.41163527965545654, + 0.4353415369987488, + 0.4608742594718933, + 0.46223077178001404, + 0.4579800069332123, + 0.4774817228317261, + 0.48016148805618286 + ], + "perturbation_rho": [ + 0.16694357991218567, + 0.4445253610610962, + 0.4925374388694763, + 0.48059922456741333, + 0.4989780783653259, + 0.5061379075050354, + 0.5181043148040771, + 0.5382387638092041 + ], + "nudging": { + "0.001": [ + -0.0030890656635165215, + -0.00277144368737936, + -0.002747020684182644, + -0.00279785948805511, + -0.0027602596674114466, + -0.002695691306143999, + -0.0027822419069707394, + -0.0027705328539013863 + ], + "0.003": [ + -0.00924670323729515, + -0.00830182246863842, + -0.008229547180235386, + -0.00838212389498949, + -0.0082697793841362, + -0.008075461722910404, + -0.008334919810295105, + -0.00829961895942688 + ], + "0.01": [ + -0.030580628663301468, + -0.027534715831279755, + -0.027298064902424812, + -0.027803048491477966, + -0.027431834489107132, + -0.02679138071835041, + -0.027646536007523537, + -0.02752995677292347 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_hi/synth_a1.0_L8_s456.json b/results/synth_ladder_v2_hi/synth_a1.0_L8_s456.json new file mode 100644 index 0000000..d5471ee --- /dev/null +++ b/results/synth_ladder_v2_hi/synth_a1.0_L8_s456.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.3463441451072693, + 0.656766887664795, + 0.5764270442962647, + 0.5049470205307007, + 0.44764996643066407, + 0.4062515335083008, + 0.3515693604946136, + 0.3206895810842514, + 0.2904161464214325, + 0.24753628358840943, + 0.2321726190328598, + 0.20620288902446626, + 0.14134707186222076, + 0.1381254968047142, + 0.09739616808891297, + 0.10028421921730042, + 0.08100424802601337, + 0.052481980854272844, + 0.03361937362849712, + 0.023064313806593417, + 0.016894574731588365, + 0.018029864579439163, + 0.01246860893368721, + 0.012793298210203648, + 0.009702475392818452, + 0.006933919629454613, + 0.006176107530295849, + 0.0052169317141175274, + 0.004689141265302897, + 0.004294289305061102, + 0.003947792701795697, + 0.0036314275674521924, + 0.0034709502309560776, + 0.0032241559058427812, + 0.0030264573903754353, + 0.002786829589307308, + 0.002691977459192276, + 0.0025502977319061754, + 0.0024069922894239424, + 0.002286381192691624, + 0.0021656719870865346, + 0.0020719593722373247, + 0.0019887995449826123, + 0.0019052102621644736, + 0.0018541046464815737, + 0.0017718917785212397, + 0.0017050478473305702, + 0.0016673840329051019, + 0.001611921975016594, + 0.0015704534363001584, + 0.00152546519190073, + 0.0014810588150285184, + 0.0014405241325497627, + 0.0014093171660788358, + 0.001379680984839797, + 0.0013552363596856594, + 0.0013281732812523842, + 0.0013030338326469064, + 0.0012812643218785525, + 0.0012605276802554726, + 0.0012419982708990573, + 0.0012246737219393253, + 0.0012093606535345316, + 0.0011956781635060905, + 0.0011842453136108816, + 0.0011722337789833546, + 0.0011620491795241833, + 0.0011536349520087242, + 0.001145646565500647, + 0.0011385902153328061, + 0.0011329171873629093, + 0.0011278443921357393, + 0.0011238585330545902, + 0.0011204954175278545, + 0.0011177971672266722, + 0.0011157147269695998, + 0.0011142772480845452, + 0.0011133035955950617, + 0.0011126888004131614, + 0.0011123772541992366 + ], + "train_acc": [ + 0.5307, + 0.7492, + 0.7785, + 0.8079, + 0.8279, + 0.8463, + 0.8668, + 0.8782, + 0.8923, + 0.9096, + 0.9143, + 0.9257, + 0.957, + 0.9551, + 0.9725, + 0.9702, + 0.9764, + 0.9903, + 0.9969, + 0.9996, + 0.9999, + 0.9987, + 0.9999, + 0.9995, + 0.9998, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0, + 1.0 + ], + "test_acc": [ + 0.7115, + 0.7255, + 0.7355, + 0.743, + 0.753, + 0.7475, + 0.755, + 0.7485, + 0.759, + 0.7515, + 0.7545, + 0.752, + 0.758, + 0.7455, + 0.755, + 0.7555, + 0.75, + 0.755, + 0.756, + 0.7595, + 0.7585, + 0.7595, + 0.76, + 0.7545, + 0.754, + 0.754, + 0.756, + 0.7565, + 0.7565, + 0.7595, + 0.756, + 0.7585, + 0.758, + 0.7565, + 0.7565, + 0.7575, + 0.7565, + 0.7555, + 0.757, + 0.754, + 0.756, + 0.7585, + 0.755, + 0.7545, + 0.755, + 0.7565, + 0.7565, + 0.7535, + 0.753, + 0.753, + 0.7535, + 0.754, + 0.7535, + 0.7545, + 0.753, + 0.7525, + 0.7535, + 0.754, + 0.753, + 0.754, + 0.7525, + 0.755, + 0.754, + 0.754, + 0.754, + 0.7545, + 0.755, + 0.7545, + 0.755, + 0.7535, + 0.7535, + 0.753, + 0.753, + 0.7535, + 0.7535, + 0.753, + 0.753, + 0.753, + 0.753, + 0.753 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8814424872398376, + 0.8780966401100159, + 0.8716025352478027, + 0.8659577369689941, + 0.8611791133880615, + 0.8505971431732178, + 0.840730607509613, + 0.8265380859375 + ], + "perturbation_rho": [ + 0.9999989867210388, + 0.9999986886978149, + 0.9999985694885254, + 0.9999977350234985, + 0.9999950528144836, + 0.9999887943267822, + 0.9999659657478333, + 0.9999250173568726 + ], + "nudging": { + "0.001": [ + -0.06260491907596588, + -0.05404583364725113, + -0.043221063911914825, + -0.03131342679262161, + -0.020883938297629356, + -0.013250280171632767, + -0.008379553444683552, + -0.005514292977750301 + ], + "0.003": [ + -0.17761416733264923, + -0.1546051800251007, + -0.1248859316110611, + -0.09147098660469055, + -0.06157959625124931, + -0.03932812437415123, + -0.02497147023677826, + -0.016470596194267273 + ], + "0.01": [ + -0.4892617166042328, + -0.43737056851387024, + -0.36532458662986755, + -0.27772778272628784, + -0.1931857019662857, + -0.12626537680625916, + -0.08131371438503265, + -0.05406741425395012 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2014614141464235, + 1.3978741569519042, + 0.9405525930404663, + 0.818086814880371, + 0.771164631652832, + 0.7745693199157715, + 0.7576864667892456, + 0.7463770871162414, + 0.7722696937561035, + 0.773443956565857, + 0.8196994282722473, + 0.8230226099014282, + 0.7985618083953857, + 0.8092234371185303, + 0.9053948894500733, + 0.862282297706604, + 0.8464451768875122, + 0.8680938564300537, + 0.9213174166679382, + 0.8934836537361145, + 0.8848338569641113, + 1.011159381198883, + 1.0715399806976318, + 0.9774782712936402, + 0.979182135295868, + 0.961297844696045, + 0.985339128112793, + 0.954636875629425, + 1.0366612503051758, + 1.044210665988922, + 0.9580166080474853, + 1.0057565264225006, + 1.0125841614723206, + 1.0388942193984985, + 1.02042639503479, + 0.9954714471817017, + 1.0312650917053223, + 1.0722410326957703, + 1.118370492553711, + 1.0643636600494384, + 1.0855006002426149, + 1.0861762029647828, + 1.0397474521636962, + 1.022234823036194, + 1.0104119994163514, + 1.0270879231452943, + 1.0053070098876953, + 0.9997533004760742, + 1.0271160902023315, + 1.0045647579193115, + 0.9574119953155518, + 0.9848262899398804, + 0.9798704895019531, + 0.9577104959487915, + 0.9448792140960693, + 0.9436322189331054, + 0.983009619140625, + 0.9360240677833557, + 0.9667974452972412, + 0.9391335056304931, + 0.9265738496780396, + 0.9455734071731567, + 0.9335931274414062, + 0.9092183971405029, + 0.9293749851226807, + 0.9204340211868286, + 0.9168742379188538, + 0.908523450088501, + 0.9023038515090942, + 0.9048189876556396, + 0.9040199153900147, + 0.8947954501152039, + 0.8920311195373535, + 0.8919297351837158, + 0.8907344808578491, + 0.8874358827590942, + 0.8880324649810791, + 0.8856353624343872, + 0.8847578605651856, + 0.8844726276397705 + ], + "train_acc": [ + 0.1982, + 0.5183, + 0.6515, + 0.6963, + 0.7146, + 0.7108, + 0.7191, + 0.7239, + 0.7188, + 0.7234, + 0.7114, + 0.7098, + 0.7247, + 0.7248, + 0.7024, + 0.7127, + 0.7225, + 0.7155, + 0.7086, + 0.7142, + 0.7154, + 0.6937, + 0.6873, + 0.7008, + 0.7005, + 0.7018, + 0.6989, + 0.7074, + 0.6935, + 0.6929, + 0.7088, + 0.6987, + 0.6988, + 0.6969, + 0.6981, + 0.6991, + 0.6971, + 0.6895, + 0.6819, + 0.6908, + 0.685, + 0.6889, + 0.6999, + 0.6981, + 0.7011, + 0.699, + 0.7006, + 0.6971, + 0.6944, + 0.6983, + 0.7066, + 0.6988, + 0.7024, + 0.7058, + 0.7113, + 0.7066, + 0.6974, + 0.7131, + 0.7112, + 0.7092, + 0.7148, + 0.7083, + 0.7087, + 0.7134, + 0.7109, + 0.7088, + 0.7134, + 0.7161, + 0.7161, + 0.7095, + 0.7185, + 0.7199, + 0.7198, + 0.7188, + 0.7173, + 0.7194, + 0.7216, + 0.7208, + 0.721, + 0.721 + ], + "test_acc": [ + 0.3525, + 0.593, + 0.6475, + 0.661, + 0.657, + 0.671, + 0.6795, + 0.664, + 0.674, + 0.6325, + 0.6495, + 0.664, + 0.6495, + 0.6235, + 0.6715, + 0.6375, + 0.6435, + 0.6425, + 0.6445, + 0.609, + 0.598, + 0.63, + 0.609, + 0.6375, + 0.6205, + 0.643, + 0.652, + 0.6065, + 0.618, + 0.6445, + 0.6355, + 0.629, + 0.6335, + 0.6225, + 0.6115, + 0.6205, + 0.6125, + 0.6295, + 0.6505, + 0.6245, + 0.5955, + 0.651, + 0.6355, + 0.6145, + 0.6445, + 0.64, + 0.6185, + 0.6395, + 0.633, + 0.6505, + 0.641, + 0.6495, + 0.651, + 0.641, + 0.645, + 0.637, + 0.655, + 0.6335, + 0.65, + 0.6465, + 0.644, + 0.6535, + 0.6595, + 0.661, + 0.648, + 0.657, + 0.6535, + 0.655, + 0.6515, + 0.657, + 0.658, + 0.661, + 0.651, + 0.6545, + 0.6535, + 0.6595, + 0.6555, + 0.6575, + 0.655, + 0.6545 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.025392260402441025, + 0.05978121981024742, + 0.09360896795988083, + 0.06215091794729233, + 0.08870920538902283, + 0.07948237657546997, + 0.10833052545785904, + 0.0900830328464508 + ], + "perturbation_rho": [ + -0.015408031642436981, + 0.08876338601112366, + 0.15722069144248962, + 0.07516318559646606, + 0.12132002413272858, + 0.08764688670635223, + 0.0905974954366684, + 0.06540436297655106 + ], + "nudging": { + "0.001": [ + -0.00034885239438153803, + -0.00048498986870981753, + -0.00045127709745429456, + -0.0002507510653231293, + -0.00043373170774430037, + -0.00040640440420247614, + -0.0004801496979780495, + -0.0003866151091642678 + ], + "0.003": [ + -0.000878344289958477, + -0.0014532352797687054, + -0.0013547346461564302, + -0.000751436804421246, + -0.001299282186664641, + -0.0012171604903414845, + -0.00143907661549747, + -0.0011573632946237922 + ], + "0.01": [ + -0.002068763133138418, + -0.004839141853153706, + -0.004507332108914852, + -0.002498403424397111, + -0.004324691370129585, + -0.004049480427056551, + -0.004787375684827566, + -0.0038477268535643816 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7595297370910645, + 0.9475741659164428, + 0.7447763685226441, + 0.7581909805297852, + 0.811722692489624, + 0.8899791458129883, + 0.9688082956314087, + 0.9621414354324341, + 0.961796886062622, + 0.9538854316711426, + 0.9661616035461426, + 0.950505804157257, + 0.9727196831703186, + 1.0116887701034545, + 1.0205289869308471, + 1.0264416973114014, + 1.0210129734039306, + 0.9992835007667541, + 0.9925045486450196, + 0.9951178996086121, + 1.011065309524536, + 0.9871878826141357, + 1.0031957998275758, + 1.0000246463775635, + 0.9818914362907409, + 1.0051741329193116, + 1.0145561868667603, + 1.0072885568618775, + 0.9990146213531494, + 1.002180821800232, + 1.0145820743560792, + 1.0009088862419129, + 0.987186259841919, + 0.988260524559021, + 1.0006609676361085, + 0.9837818576812745, + 0.980894729423523, + 0.9769309595108032, + 0.9737872982025146, + 0.9583989322662354, + 0.9679641858100891, + 0.9551776586532593, + 0.9422390087127686, + 0.9537172298431397, + 0.9439899353027343, + 0.943521542930603, + 0.9479599548339843, + 0.9455261005401612, + 0.9373712139129639, + 0.9349656831741333, + 0.9430942413330078, + 0.9451345511436462, + 0.9331818491458893, + 0.9223974617004395, + 0.9274687778472901, + 0.9191716623306274, + 0.9255869388580322, + 0.923639429473877, + 0.9151927932739258, + 0.9036617515563965, + 0.912812328338623, + 0.9029623630523682, + 0.8978730960845948, + 0.8989394746780396, + 0.8928214418888092, + 0.8919049097061157, + 0.8924614941596984, + 0.8891196983337403, + 0.8863753658294677, + 0.8851543426513672, + 0.8843002077102661, + 0.8839833070755004, + 0.8812764804840088, + 0.8801170440673828, + 0.8795399000167846, + 0.878050711631775, + 0.8773804382324218, + 0.8769560194015503, + 0.8765291761398315, + 0.8763642075538636 + ], + "train_acc": [ + 0.3558, + 0.6435, + 0.7191, + 0.72, + 0.7119, + 0.6954, + 0.665, + 0.6614, + 0.656, + 0.655, + 0.6515, + 0.6551, + 0.6411, + 0.6336, + 0.6326, + 0.6305, + 0.6287, + 0.6399, + 0.638, + 0.6382, + 0.6419, + 0.6497, + 0.6435, + 0.6474, + 0.646, + 0.6446, + 0.6415, + 0.6454, + 0.6415, + 0.6452, + 0.6418, + 0.6443, + 0.6468, + 0.6466, + 0.6443, + 0.6469, + 0.6513, + 0.6506, + 0.6566, + 0.6594, + 0.6576, + 0.6564, + 0.6626, + 0.6607, + 0.6659, + 0.6638, + 0.6673, + 0.6678, + 0.6662, + 0.6658, + 0.6636, + 0.6657, + 0.6705, + 0.6712, + 0.6726, + 0.674, + 0.6661, + 0.6721, + 0.6726, + 0.6776, + 0.6756, + 0.6779, + 0.6784, + 0.6801, + 0.6808, + 0.6787, + 0.6788, + 0.6814, + 0.6802, + 0.6833, + 0.6825, + 0.6816, + 0.6842, + 0.6843, + 0.6838, + 0.6857, + 0.685, + 0.6865, + 0.6861, + 0.6863 + ], + "test_acc": [ + 0.57, + 0.665, + 0.6875, + 0.6905, + 0.6825, + 0.646, + 0.6395, + 0.6295, + 0.6295, + 0.6195, + 0.629, + 0.618, + 0.614, + 0.596, + 0.608, + 0.5895, + 0.5995, + 0.6025, + 0.604, + 0.6165, + 0.601, + 0.615, + 0.5995, + 0.602, + 0.605, + 0.6055, + 0.5865, + 0.6125, + 0.6165, + 0.602, + 0.6025, + 0.606, + 0.6015, + 0.6085, + 0.6205, + 0.6, + 0.613, + 0.6125, + 0.615, + 0.616, + 0.6095, + 0.6355, + 0.617, + 0.6205, + 0.615, + 0.619, + 0.628, + 0.626, + 0.6285, + 0.6235, + 0.618, + 0.6265, + 0.6245, + 0.6265, + 0.632, + 0.625, + 0.6235, + 0.618, + 0.627, + 0.627, + 0.6195, + 0.6265, + 0.6355, + 0.629, + 0.629, + 0.628, + 0.629, + 0.632, + 0.634, + 0.6305, + 0.632, + 0.633, + 0.6315, + 0.632, + 0.629, + 0.6325, + 0.6315, + 0.6305, + 0.631, + 0.6315 + ], + "state_pred_error": [ + 0.7119821426868439, + 0.2199285702228546, + 0.15159940316677092, + 0.1455048334121704, + 0.16011591622829438, + 0.17240723192691804, + 0.1856574460029602, + 0.19060646598339082, + 0.18461057021617888, + 0.17915196049213408, + 0.16156295392513276, + 0.1458448067188263, + 0.13951418162584306, + 0.1363513420343399, + 0.12588273421525956, + 0.11220355759859085, + 0.0940346223115921, + 0.08044589848518371, + 0.07334359179735184, + 0.06827121561765671, + 0.0638974659562111, + 0.06077894349694252, + 0.05925172871351242, + 0.05808723242282868, + 0.057569033747911454, + 0.05934881684780121, + 0.060563347887992856, + 0.060616958856582644, + 0.05973702830076218, + 0.059038369923830034, + 0.05913116801381111, + 0.06012527327537537, + 0.05976770656704903, + 0.06020231146216393, + 0.05928394560813904, + 0.058542316550016404, + 0.05818368434906006, + 0.05711043501496315, + 0.05610687211751938, + 0.05552056633830071, + 0.05414653058052063, + 0.05291242948770523, + 0.05013820585012436, + 0.048317215740680694, + 0.04606599677205086, + 0.04470588800907135, + 0.0438895072221756, + 0.041934526485204696, + 0.04082408391237259, + 0.03920472621917725, + 0.038452356386184695, + 0.03671333760023117, + 0.035519248223304746, + 0.0345638000369072, + 0.033005472686886785, + 0.03193392164707184, + 0.031188388174772264, + 0.02983923709988594, + 0.028780742260813712, + 0.02811023307144642, + 0.027198891657590867, + 0.026264052698016165, + 0.025608342266082763, + 0.024711268293857575, + 0.024092616820335387, + 0.02376379963159561, + 0.022925849288702012, + 0.022340466144680975, + 0.022190902706980705, + 0.021424786433577536, + 0.02106497337818146, + 0.020676997044682503, + 0.02055346903204918, + 0.020126914477348327, + 0.01972040805220604, + 0.019614314609766006, + 0.019187554389238356, + 0.01890986149609089, + 0.01886671639084816, + 0.018439615397155284 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.6046093106269836, + 0.3773959279060364, + 0.1675240397453308, + 0.13364183902740479, + 0.12548640370368958, + 0.11966440826654434, + 0.11708953976631165, + 0.12762311100959778 + ], + "perturbation_rho": [ + 0.5598001480102539, + 0.35775649547576904, + 0.14680343866348267, + 0.103827565908432, + 0.12472978234291077, + 0.08794894069433212, + 0.12868158519268036, + 0.09175367653369904 + ], + "nudging": { + "0.001": [ + -0.01812632381916046, + -0.0018294029869139194, + -0.0005177915445528924, + -0.00041508491267450154, + -0.00039664041833020747, + -0.00037947000237181783, + -0.0003740444080904126, + -0.0003969752578996122 + ], + "0.003": [ + -0.053716909140348434, + -0.0054817236959934235, + -0.0015528149669989944, + -0.0012443987652659416, + -0.001189632574096322, + -0.0011380251962691545, + -0.0011217063292860985, + -0.0011903976555913687 + ], + "0.01": [ + -0.17137765884399414, + -0.018192056566476822, + -0.005168645642697811, + -0.004143164958804846, + -0.0039602769538760185, + -0.0037884372286498547, + -0.003734107594937086, + -0.00396342109888792 + ] + }, + "state_pred_error_per_layer": [ + 11751.603515625, + 2306.73095703125, + 1321.091796875, + 1033.674560546875, + 973.6993408203125, + 865.9056396484375, + 869.378173828125, + 839.1387329101562 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2008896965026854, + 1.4054584117889404, + 0.9413134895324707, + 0.8322208425521851, + 0.7817444447517395, + 0.766307181072235, + 0.7719230993270874, + 0.7583044151306152, + 0.7602345886230468, + 0.7555905197143554, + 0.7762331862449646, + 0.798689239692688, + 0.8254908643722534, + 0.7902877309799194, + 0.8191847791671752, + 0.843696772480011, + 0.8999226076126099, + 0.8750352613449097, + 0.9063004100799561, + 1.0182397011756896, + 0.8965417966842651, + 0.9666744052886963, + 1.0089512565612793, + 1.007328366470337, + 1.0209112884521485, + 0.9945938415527343, + 1.0325454999923707, + 1.05485934715271, + 1.055373514175415, + 1.0699854314804078, + 1.0986695121765138, + 1.1126045949935912, + 1.1078404700279236, + 1.1185390811920166, + 1.1371925388336181, + 1.201495304107666, + 1.2209324337959289, + 1.1769378370285035, + 1.2876011058807373, + 1.269807508468628, + 1.2512431362152099, + 1.264885738182068, + 1.3760645431518554, + 1.284398963546753, + 1.2944733834266662, + 1.2793049654960633, + 1.279590975379944, + 1.2840878061294556, + 1.3577770275115968, + 1.3355762157440185, + 1.3204743861198425, + 1.3215809940338135, + 1.3097663831710815, + 1.293453282546997, + 1.318989148712158, + 1.2980890903472901, + 1.2837853858947754, + 1.3034196048736573, + 1.291077992630005, + 1.2697135080337525, + 1.276225595855713, + 1.279370401573181, + 1.253262141418457, + 1.2559870906829833, + 1.2534162567138671, + 1.249070475769043, + 1.2483550487518311, + 1.2445100688934325, + 1.2417517505645752, + 1.2406762868881225, + 1.2380864669799805, + 1.2353398445129395, + 1.2340172630310058, + 1.2329429447174072, + 1.231136992263794, + 1.2310544689178466, + 1.2299473683357238, + 1.229686898612976, + 1.229286951828003, + 1.2290444581985474 + ], + "train_acc": [ + 0.2037, + 0.516, + 0.6508, + 0.6907, + 0.7073, + 0.7123, + 0.7153, + 0.7213, + 0.7237, + 0.7267, + 0.726, + 0.7175, + 0.7129, + 0.7276, + 0.7204, + 0.7124, + 0.7065, + 0.7141, + 0.7075, + 0.684, + 0.7014, + 0.6798, + 0.6655, + 0.6582, + 0.6502, + 0.6556, + 0.64, + 0.628, + 0.6218, + 0.6158, + 0.5995, + 0.6016, + 0.5976, + 0.5955, + 0.5876, + 0.5705, + 0.5582, + 0.5704, + 0.5424, + 0.5442, + 0.5503, + 0.5452, + 0.5129, + 0.5399, + 0.5354, + 0.5425, + 0.5361, + 0.5384, + 0.5126, + 0.5154, + 0.5257, + 0.5199, + 0.5272, + 0.5292, + 0.5234, + 0.5312, + 0.5363, + 0.5287, + 0.5283, + 0.542, + 0.5333, + 0.5418, + 0.5433, + 0.5426, + 0.5425, + 0.5443, + 0.5431, + 0.5475, + 0.5473, + 0.5489, + 0.5481, + 0.5491, + 0.546, + 0.5462, + 0.5493, + 0.5477, + 0.5499, + 0.5466, + 0.5488, + 0.5486 + ], + "test_acc": [ + 0.348, + 0.5865, + 0.648, + 0.665, + 0.664, + 0.654, + 0.667, + 0.6655, + 0.6695, + 0.669, + 0.6805, + 0.6465, + 0.675, + 0.646, + 0.665, + 0.6225, + 0.654, + 0.6565, + 0.6365, + 0.6445, + 0.625, + 0.607, + 0.6095, + 0.6025, + 0.6165, + 0.614, + 0.5665, + 0.582, + 0.557, + 0.563, + 0.557, + 0.58, + 0.568, + 0.545, + 0.4575, + 0.484, + 0.534, + 0.473, + 0.4945, + 0.523, + 0.498, + 0.429, + 0.507, + 0.506, + 0.494, + 0.48, + 0.4965, + 0.484, + 0.463, + 0.474, + 0.4995, + 0.5165, + 0.505, + 0.4835, + 0.506, + 0.513, + 0.5, + 0.485, + 0.511, + 0.5185, + 0.5055, + 0.515, + 0.5165, + 0.5225, + 0.5235, + 0.5215, + 0.5255, + 0.523, + 0.526, + 0.523, + 0.5235, + 0.5235, + 0.527, + 0.526, + 0.528, + 0.528, + 0.53, + 0.527, + 0.5285, + 0.5275 + ], + "value_loss": [ + 2.8519159332275392, + 0.943093113040924, + 0.9696953145980834, + 1.0555597288131713, + 1.0231808990478515, + 1.0070185512542724, + 1.0053409986495971, + 1.0034786861419678, + 1.074703646659851, + 1.0331179862976074, + 1.1073360038757325, + 1.1542760429382324, + 1.1737403179168702, + 1.1156317903518678, + 1.1757224494934082, + 1.2075947334289552, + 1.4217233302116394, + 1.2618381538391112, + 1.2358001930236817, + 1.5412270696640014, + 0.985550724029541, + 1.0291227241516114, + 0.9544451610565186, + 0.8837470067977905, + 0.8537702310562134, + 0.7540037113189697, + 0.7435011320114135, + 0.7713030492305756, + 0.7737072071075439, + 0.7703527069091797, + 0.8406762672424316, + 0.9660953598022461, + 0.9581118317604065, + 0.8639301441192627, + 1.131364299106598, + 0.9075398429870606, + 0.7297967605352401, + 0.610801382446289, + 0.7295192481040954, + 0.6998717771530152, + 0.7179642705917358, + 0.5449347291946411, + 0.746469527053833, + 1.1022102794647217, + 0.8994069383621216, + 0.65495665807724, + 0.5736650440216065, + 0.554638107585907, + 0.6279040833473205, + 0.6575304574489593, + 0.5701413901329041, + 0.5867615478515625, + 0.6130897359848022, + 0.5448762645721436, + 0.5473845755577087, + 0.5205927000999451, + 0.5727422311782837, + 0.5688760271072387, + 0.5431896102905274, + 0.5042444682121277, + 0.4872834966659546, + 0.47681626167297364, + 0.48972151465415953, + 0.485532283782959, + 0.4564926029682159, + 0.48419216747283933, + 0.4549050573348999, + 0.4627880736351013, + 0.4412449298858643, + 0.43897649846076964, + 0.439124055480957, + 0.4265758001327515, + 0.41834584236145017, + 0.4291167945861816, + 0.4187319411754608, + 0.4475174812793732, + 0.40432348778247834, + 0.43183891644477845, + 0.4050795471668243, + 0.41436073665618894 + ], + "term_loss": [ + 1.655311958694458, + 0.549731699848175, + 0.7320676593780517, + 0.8351332375526428, + 0.8048139360427856, + 0.7700202879905701, + 0.7471456516265869, + 0.7647736320495605, + 0.8484953968286514, + 0.8139370037078857, + 0.8846953063964844, + 0.9258933193206788, + 0.9378262730121613, + 0.8885055972337723, + 0.9462037200927734, + 0.9678823600769043, + 1.1691513951301575, + 1.0146873613357543, + 0.981622580909729, + 1.2502811630249024, + 0.7126443691253662, + 0.7149904264450073, + 0.6176420908927918, + 0.5500664302825927, + 0.5115062843322754, + 0.44496897649765016, + 0.4283113181114197, + 0.44876509721279145, + 0.3894277139544487, + 0.426357678937912, + 0.46676229720115664, + 0.5529243560791015, + 0.5148136425852775, + 0.4639499371290207, + 0.6982595764636993, + 0.5183709760665893, + 0.36028967921733857, + 0.26226684079170226, + 0.3540671193122864, + 0.32895341753959656, + 0.3412381377100944, + 0.19596993993520737, + 0.358793759059906, + 0.6658679189682006, + 0.4896356201171875, + 0.28445579075813293, + 0.21803204145431518, + 0.20383631246089937, + 0.26368726410865784, + 0.28870824122428895, + 0.21559315396547318, + 0.22728329100608827, + 0.24814829128980637, + 0.18719943115711213, + 0.18591779079437257, + 0.1683158616065979, + 0.2141489410638809, + 0.210011887550354, + 0.19071238458156586, + 0.15903579448461533, + 0.14602340037822722, + 0.13510726680755616, + 0.15042966575622557, + 0.14709542198181152, + 0.12240583802461624, + 0.14543920485973358, + 0.12093815805912018, + 0.1282063971042633, + 0.10907832708358765, + 0.10826493293642998, + 0.10762279661893845, + 0.09866760165691375, + 0.0908609703540802, + 0.09999058279991149, + 0.09174880601167679, + 0.11339596772193909, + 0.08030046239048243, + 0.10032132915854454, + 0.0803849901676178, + 0.08663651337623596 + ], + "bridge_loss": [ + 0.8989060655173758, + 0.11960642929077149, + 0.015411593426018954, + 0.006060963110625744, + 0.00798061602562666, + 0.02676496696472168, + 0.0440154026389122, + 0.02723466747999191, + 0.014392563518881797, + 0.009799828293919564, + 0.009989605707675219, + 0.01066438391804695, + 0.014675824010372162, + 0.015108226895332337, + 0.014537670788168908, + 0.018136680734157563, + 0.021672747790813445, + 0.022625041630864144, + 0.02594750416278839, + 0.04525593014955521, + 0.044533857583999636, + 0.06834359543919563, + 0.0811832171201706, + 0.07807079297304154, + 0.08161697351336479, + 0.05447080357074738, + 0.05201703317463398, + 0.05524468503296375, + 0.11168219794034957, + 0.0641616762161255, + 0.08777698372602463, + 0.12359804570525884, + 0.15617993171811104, + 0.10881609472036362, + 0.13728766435980796, + 0.07868606736660004, + 0.055003388568758964, + 0.04358988349437714, + 0.05062321665287018, + 0.05054847391843796, + 0.055439580523967746, + 0.026933279258012772, + 0.042817439204454424, + 0.10670252997875214, + 0.07675310898423195, + 0.04261072409152985, + 0.028939780139923096, + 0.02048116326034069, + 0.019857217094302177, + 0.02864076868593693, + 0.017677207984775303, + 0.02280512315630913, + 0.031010216677188875, + 0.02628134009242058, + 0.025431732770800592, + 0.019921301141381263, + 0.03013700404167175, + 0.027916390109062196, + 0.022569763624668122, + 0.0205557999253273, + 0.014262732622027397, + 0.014771246069669723, + 0.01809905598759651, + 0.016506473726034164, + 0.013013275938481093, + 0.018298546454310418, + 0.01417785782366991, + 0.015295256960391999, + 0.013428864750266075, + 0.012695570394396782, + 0.013537625922262668, + 0.01115195343196392, + 0.010617554458975793, + 0.012874725475907326, + 0.01128501494526863, + 0.018389357506483794, + 0.008775913769751786, + 0.016407797276228667, + 0.009887954160571099, + 0.013127461233735085 + ], + "tgrad_loss": [ + 0.2976979078292847, + 0.2737549843788147, + 0.22221605656147003, + 0.21436553063392638, + 0.21038635082244872, + 0.21023330702781678, + 0.2141799436569214, + 0.21147037315368652, + 0.21181569137573242, + 0.20938114733695984, + 0.21265108547210693, + 0.21771834297180176, + 0.2212382229089737, + 0.21201796562671663, + 0.2149810601234436, + 0.22157568635940553, + 0.2308991893529892, + 0.22452575006484984, + 0.22823011336326599, + 0.24568997399806977, + 0.22837249422073364, + 0.24578870820999146, + 0.2556198622703552, + 0.2556097867488861, + 0.2606469665288925, + 0.25456393384933473, + 0.2631727811574936, + 0.2672932656288147, + 0.27259729590415954, + 0.27983335461616515, + 0.2861369857311249, + 0.28957296657562254, + 0.287118260717392, + 0.29116410436630247, + 0.29581704835891726, + 0.3104827980041504, + 0.31450369589328764, + 0.30494466242790225, + 0.3248289137840271, + 0.3203698843955994, + 0.32128654470443724, + 0.3220315122127533, + 0.3448583282709122, + 0.3296398288726807, + 0.3330182122707367, + 0.3278901381254196, + 0.32669322395324707, + 0.33032063636779785, + 0.3443595983505249, + 0.3401814471721649, + 0.3368710287094116, + 0.3366731337070465, + 0.33393123569488525, + 0.33139549551010133, + 0.33603504791259764, + 0.33235553741455076, + 0.3284562883377075, + 0.3309477458953857, + 0.3299074633598328, + 0.324652875328064, + 0.32699735922813417, + 0.3269377513885498, + 0.32119279050827027, + 0.32193038778305055, + 0.32107348833084104, + 0.3204544198989868, + 0.3197890423774719, + 0.319286421585083, + 0.31873773612976075, + 0.318015997505188, + 0.31796363191604615, + 0.3167562457561493, + 0.3168673168182373, + 0.31625148630142214, + 0.31569811849594115, + 0.31573215498924256, + 0.3152471107006073, + 0.3151097901344299, + 0.3148066032886505, + 0.3145967625617981 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.1268395036458969, + 0.30569249391555786, + 0.34143707156181335, + 0.3805205225944519, + 0.3833070397377014, + 0.38344305753707886, + 0.3742453455924988, + 0.3805825710296631 + ], + "perturbation_rho": [ + 0.10492167621850967, + 0.4008791148662567, + 0.42003583908081055, + 0.4331238567829132, + 0.4291571080684662, + 0.4853004217147827, + 0.4488537311553955, + 0.46586981415748596 + ], + "nudging": { + "0.001": [ + -0.0026137512177228928, + -0.002321421168744564, + -0.0024553369730710983, + -0.002636931836605072, + -0.0026186201721429825, + -0.0025994605384767056, + -0.0025331785436719656, + -0.0025637689977884293 + ], + "0.003": [ + -0.007821732200682163, + -0.0069553181529045105, + -0.0073580252937972546, + -0.007900664582848549, + -0.007845591753721237, + -0.007788289338350296, + -0.0075891693122684956, + -0.007681208662688732 + ], + "0.01": [ + -0.02585173025727272, + -0.023091215640306473, + -0.0244273878633976, + -0.026221776381134987, + -0.026039035990834236, + -0.025849176570773125, + -0.025189466774463654, + -0.02549329586327076 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/config.json b/results/synth_ladder_v2_lo/config.json new file mode 100644 index 0000000..05347bb --- /dev/null +++ b/results/synth_ladder_v2_lo/config.json @@ -0,0 +1,33 @@ +{ + "alphas": [ + 0.0, + 0.25 + ], + "depths": [ + 2, + 4, + 8, + 12 + ], + "seeds": [ + 42, + 123, + 456 + ], + "d_hidden": 128, + "num_classes": 10, + "n_train": 10000, + "n_test": 2000, + "batch_size": 256, + "epochs": 80, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "gpu": 0, + "output_dir": "results/synth_ladder_v2_lo" +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/summary.json b/results/synth_ladder_v2_lo/summary.json new file mode 100644 index 0000000..4e13fce --- /dev/null +++ b/results/synth_ladder_v2_lo/summary.json @@ -0,0 +1,3590 @@ +{ + "a0.0_L2_s42": { + "bp": { + "test_acc": 0.9185, + "mean_bp_cosine": 0.8935370743274689, + "mean_rho": 0.9999973475933075, + "mean_nudge_001": -0.016880770213901997, + "mean_nudge_003": -0.046150531619787216, + "mean_nudge_01": -0.11240250617265701, + "bp_cosine_per_layer": [ + 0.9016435146331787, + 0.885430634021759 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999956488609314 + ], + "nudge_per_layer": [ + -0.1530623733997345, + -0.07174263894557953 + ] + }, + "dfa": { + "test_acc": 0.842, + "mean_bp_cosine": 0.030407493002712727, + "mean_rho": 0.008977552875876427, + "mean_nudge_001": -0.00023997636890271679, + "mean_nudge_003": -0.0006689573347102851, + "mean_nudge_01": -0.0016241300618276, + "bp_cosine_per_layer": [ + -0.003507068380713463, + 0.06432205438613892 + ], + "rho_per_layer": [ + 0.009520611725747585, + 0.008434494026005268 + ], + "nudge_per_layer": [ + -0.0012172441929578781, + -0.002031015930697322 + ] + }, + "state_bridge": { + "test_acc": 0.825, + "mean_bp_cosine": 0.666242927312851, + "mean_rho": 0.5969350039958954, + "mean_nudge_001": -0.015545505564659834, + "mean_nudge_003": -0.04490915546193719, + "mean_nudge_01": -0.13079415168613195, + "bp_cosine_per_layer": [ + 0.9153801202774048, + 0.4171057343482971 + ], + "rho_per_layer": [ + 0.8286964893341064, + 0.3651735186576843 + ], + "nudge_per_layer": [ + -0.23136131465435028, + -0.030226988717913628 + ], + "state_pred_error_per_layer": [ + 438.86456298828125, + 353.2518310546875 + ], + "mean_state_pred_error": 396.0581970214844 + }, + "credit_bridge": { + "test_acc": 0.6675, + "mean_bp_cosine": 0.16703729704022408, + "mean_rho": 0.26396652311086655, + "mean_nudge_001": -0.00457099755294621, + "mean_nudge_003": -0.013636467512696981, + "mean_nudge_01": -0.04456503316760063, + "bp_cosine_per_layer": [ + 0.1011175885796547, + 0.23295700550079346 + ], + "rho_per_layer": [ + 0.19994769990444183, + 0.32798534631729126 + ], + "nudge_per_layer": [ + -0.07033564895391464, + -0.01879441738128662 + ], + "final_value_loss": 0.5091902822494507, + "final_term_loss": 0.2335890076160431, + "final_bridge_loss": 0.035112081968784334, + "final_tgrad_loss": 0.2404891884803772 + } + }, + "a0.0_L2_s123": { + "bp": { + "test_acc": 0.9205, + "mean_bp_cosine": 0.8566932380199432, + "mean_rho": 0.9999960958957672, + "mean_nudge_001": -0.015286394860595465, + "mean_nudge_003": -0.04188752360641956, + "mean_nudge_01": -0.10229892283678055, + "bp_cosine_per_layer": [ + 0.8634263277053833, + 0.8499601483345032 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999933838844299 + ], + "nudge_per_layer": [ + -0.13922545313835144, + -0.06537239253520966 + ] + }, + "dfa": { + "test_acc": 0.841, + "mean_bp_cosine": 0.08572041988372803, + "mean_rho": 0.10125503316521645, + "mean_nudge_001": -0.001035464447340928, + "mean_nudge_003": -0.0030792844481766224, + "mean_nudge_01": -0.009957430185750127, + "bp_cosine_per_layer": [ + 0.048809632658958435, + 0.12263120710849762 + ], + "rho_per_layer": [ + 0.09689537435770035, + 0.10561469197273254 + ], + "nudge_per_layer": [ + -0.015226385556161404, + -0.00468847481533885 + ] + }, + "state_bridge": { + "test_acc": 0.822, + "mean_bp_cosine": 0.7052022516727448, + "mean_rho": 0.608213409781456, + "mean_nudge_001": -0.014205678016878664, + "mean_nudge_003": -0.04078014753758907, + "mean_nudge_01": -0.11634222697466612, + "bp_cosine_per_layer": [ + 0.9309895038604736, + 0.47941499948501587 + ], + "rho_per_layer": [ + 0.8439192175865173, + 0.37250760197639465 + ], + "nudge_per_layer": [ + -0.2068808674812317, + -0.025803586468100548 + ], + "state_pred_error_per_layer": [ + 436.0709533691406, + 352.44915771484375 + ], + "mean_state_pred_error": 394.2600555419922 + }, + "credit_bridge": { + "test_acc": 0.664, + "mean_bp_cosine": 0.14723356813192368, + "mean_rho": 0.27719707787036896, + "mean_nudge_001": -0.0040612792945466936, + "mean_nudge_003": -0.012125232955440879, + "mean_nudge_01": -0.03972679190337658, + "bp_cosine_per_layer": [ + 0.08253486454486847, + 0.21193227171897888 + ], + "rho_per_layer": [ + 0.16999724507331848, + 0.38439691066741943 + ], + "nudge_per_layer": [ + -0.06126694008708, + -0.018186643719673157 + ], + "final_value_loss": 0.6019191103935242, + "final_term_loss": 0.28414561631679536, + "final_bridge_loss": 0.04602321577072144, + "final_tgrad_loss": 0.27175028200149537 + } + }, + "a0.0_L2_s456": { + "bp": { + "test_acc": 0.9295, + "mean_bp_cosine": 0.870507538318634, + "mean_rho": 0.9999973773956299, + "mean_nudge_001": -0.014503923710435629, + "mean_nudge_003": -0.039223295636475086, + "mean_nudge_01": -0.09240655042231083, + "bp_cosine_per_layer": [ + 0.8826531171798706, + 0.8583619594573975 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999959468841553 + ], + "nudge_per_layer": [ + -0.12340263277292252, + -0.06141046807169914 + ] + }, + "dfa": { + "test_acc": 0.8485, + "mean_bp_cosine": 0.051622094586491585, + "mean_rho": 0.014518704265356064, + "mean_nudge_001": -0.00044165633153170347, + "mean_nudge_003": -0.0013033851282671094, + "mean_nudge_01": -0.0040968600660562515, + "bp_cosine_per_layer": [ + 0.016239378601312637, + 0.08700481057167053 + ], + "rho_per_layer": [ + -0.0633457601070404, + 0.09238316863775253 + ], + "nudge_per_layer": [ + -0.004778302274644375, + -0.003415417857468128 + ] + }, + "state_bridge": { + "test_acc": 0.8285, + "mean_bp_cosine": 0.7213762998580933, + "mean_rho": 0.644424170255661, + "mean_nudge_001": -0.014933469472452998, + "mean_nudge_003": -0.042839838191866875, + "mean_nudge_01": -0.12188584543764591, + "bp_cosine_per_layer": [ + 0.9387110471725464, + 0.5040415525436401 + ], + "rho_per_layer": [ + 0.7997298240661621, + 0.4891185164451599 + ], + "nudge_per_layer": [ + -0.21233828365802765, + -0.031433407217264175 + ], + "state_pred_error_per_layer": [ + 387.8657531738281, + 319.336669921875 + ], + "mean_state_pred_error": 353.60121154785156 + }, + "credit_bridge": { + "test_acc": 0.7115, + "mean_bp_cosine": 0.16614358872175217, + "mean_rho": 0.25560564547777176, + "mean_nudge_001": -0.0032864182721823454, + "mean_nudge_003": -0.009816689416766167, + "mean_nudge_01": -0.03221969399601221, + "bp_cosine_per_layer": [ + 0.08927787840366364, + 0.2430092990398407 + ], + "rho_per_layer": [ + 0.16060538589954376, + 0.35060590505599976 + ], + "nudge_per_layer": [ + -0.047705113887786865, + -0.016734274104237556 + ], + "final_value_loss": 0.31588549439907077, + "final_term_loss": 0.09000624770522117, + "final_bridge_loss": 0.023082720217108728, + "final_tgrad_loss": 0.20279652795791625 + } + }, + "a0.0_L4_s42": { + "bp": { + "test_acc": 0.925, + "mean_bp_cosine": 0.8320528566837311, + "mean_rho": 0.9999772906303406, + "mean_nudge_001": -0.009003315295558423, + "mean_nudge_003": -0.024674441665410995, + "mean_nudge_01": -0.06179796298965812, + "bp_cosine_per_layer": [ + 0.8599773645401001, + 0.8422204256057739, + 0.8250665664672852, + 0.8009470701217651 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999953508377075, + 0.9999807476997375, + 0.9999338984489441 + ], + "nudge_per_layer": [ + -0.12188813835382462, + -0.07056954503059387, + -0.034971628338098526, + -0.019762540236115456 + ] + }, + "dfa": { + "test_acc": 0.856, + "mean_bp_cosine": 0.10417622653767467, + "mean_rho": 0.09206205606460571, + "mean_nudge_001": -0.00045079714618623257, + "mean_nudge_003": -0.0013433840940706432, + "mean_nudge_01": -0.004383910913020372, + "bp_cosine_per_layer": [ + 0.004014266654849052, + 0.16519895195960999, + 0.13244280219078064, + 0.11504888534545898 + ], + "rho_per_layer": [ + 0.042726192623376846, + 0.18379396200180054, + 0.108277827501297, + 0.03345024213194847 + ], + "nudge_per_layer": [ + -0.005573366768658161, + -0.005793239921331406, + -0.003338021691888571, + -0.002831015270203352 + ] + }, + "state_bridge": { + "test_acc": 0.7615, + "mean_bp_cosine": 0.38204737193882465, + "mean_rho": 0.3213508538901806, + "mean_nudge_001": -0.006838726330897771, + "mean_nudge_003": -0.01991741475649178, + "mean_nudge_01": -0.059746103768702596, + "bp_cosine_per_layer": [ + 0.8646283149719238, + 0.4090673327445984, + 0.1404263973236084, + 0.114067442715168 + ], + "rho_per_layer": [ + 0.7375176548957825, + 0.33617356419563293, + 0.14259827136993408, + 0.06911392509937286 + ], + "nudge_per_layer": [ + -0.218303382396698, + -0.013712376356124878, + -0.003879058640450239, + -0.0030895976815372705 + ], + "state_pred_error_per_layer": [ + 6951.521484375, + 6099.5322265625, + 5877.8310546875, + 3832.076416015625 + ], + "mean_state_pred_error": 5690.240295410156 + }, + "credit_bridge": { + "test_acc": 0.6585, + "mean_bp_cosine": 0.10922159999608994, + "mean_rho": 0.21513587795197964, + "mean_nudge_001": -0.00137018840177916, + "mean_nudge_003": -0.004100472666323185, + "mean_nudge_01": -0.013550454750657082, + "bp_cosine_per_layer": [ + 0.049023956060409546, + 0.11911389231681824, + 0.12341275811195374, + 0.14533579349517822 + ], + "rho_per_layer": [ + 0.09633419662714005, + 0.23598268628120422, + 0.24357257783412933, + 0.28465405106544495 + ], + "nudge_per_layer": [ + -0.026128236204385757, + -0.008897590450942516, + -0.009167088195681572, + -0.01000890415161848 + ], + "final_value_loss": 0.5270826056480408, + "final_term_loss": 0.22659661755561827, + "final_bridge_loss": 0.04233165686130524, + "final_tgrad_loss": 0.25815433073043825 + } + }, + "a0.0_L4_s123": { + "bp": { + "test_acc": 0.926, + "mean_bp_cosine": 0.7713210135698318, + "mean_rho": 0.9999768882989883, + "mean_nudge_001": -0.010334675083868206, + "mean_nudge_003": -0.028318932512775064, + "mean_nudge_01": -0.06953301187604666, + "bp_cosine_per_layer": [ + 0.808335542678833, + 0.780368447303772, + 0.7579712271690369, + 0.7386088371276855 + ], + "rho_per_layer": [ + 0.9999986886978149, + 0.999996542930603, + 0.9999827146530151, + 0.9999296069145203 + ], + "nudge_per_layer": [ + -0.13544964790344238, + -0.08136264234781265, + -0.039826083928346634, + -0.02149367332458496 + ] + }, + "dfa": { + "test_acc": 0.8375, + "mean_bp_cosine": 0.1401939271017909, + "mean_rho": 0.11219900287687778, + "mean_nudge_001": -0.000286264817987103, + "mean_nudge_003": -0.0008422381652053446, + "mean_nudge_01": -0.0026496590580791235, + "bp_cosine_per_layer": [ + -0.028116505593061447, + 0.29581546783447266, + 0.170908123254776, + 0.12216862291097641 + ], + "rho_per_layer": [ + -0.07312458753585815, + 0.3015226125717163, + 0.09657395631074905, + 0.12382403016090393 + ], + "nudge_per_layer": [ + 0.0038727924693375826, + -0.007415304891765118, + -0.0039948043413460255, + -0.0030613194685429335 + ] + }, + "state_bridge": { + "test_acc": 0.788, + "mean_bp_cosine": 0.3973395489156246, + "mean_rho": 0.36834993585944176, + "mean_nudge_001": -0.006569715158548206, + "mean_nudge_003": -0.019017601298401132, + "mean_nudge_01": -0.055994155758526176, + "bp_cosine_per_layer": [ + 0.8812471032142639, + 0.4430118799209595, + 0.14485391974449158, + 0.12024529278278351 + ], + "rho_per_layer": [ + 0.803270697593689, + 0.4108988642692566, + 0.12428833544254303, + 0.13494184613227844 + ], + "nudge_per_layer": [ + -0.20551547408103943, + -0.01310029998421669, + -0.0029572518542408943, + -0.0024035971146076918 + ], + "state_pred_error_per_layer": [ + 6307.859375, + 4221.2177734375, + 3825.8369140625, + 3284.16064453125 + ], + "mean_state_pred_error": 4409.7686767578125 + }, + "credit_bridge": { + "test_acc": 0.7305, + "mean_bp_cosine": 0.10989296156913042, + "mean_rho": 0.18325010500848293, + "mean_nudge_001": -0.0012505464837886393, + "mean_nudge_003": -0.00373545300681144, + "mean_nudge_01": -0.012258320581167936, + "bp_cosine_per_layer": [ + 0.03434538468718529, + 0.12379913777112961, + 0.1433446854352951, + 0.13808263838291168 + ], + "rho_per_layer": [ + 0.03924814611673355, + 0.21971622109413147, + 0.26409071683883667, + 0.20994533598423004 + ], + "nudge_per_layer": [ + -0.020018436014652252, + -0.00925234891474247, + -0.010285570286214352, + -0.009476927109062672 + ], + "final_value_loss": 0.454630423784256, + "final_term_loss": 0.185297670173645, + "final_bridge_loss": 0.03432008520960808, + "final_tgrad_loss": 0.2350126650452614 + } + }, + "a0.0_L4_s456": { + "bp": { + "test_acc": 0.9285, + "mean_bp_cosine": 0.7884698659181595, + "mean_rho": 0.999981090426445, + "mean_nudge_001": -0.01117145799798891, + "mean_nudge_003": -0.030768739874474704, + "mean_nudge_01": -0.07730476558208466, + "bp_cosine_per_layer": [ + 0.8268355131149292, + 0.7960893511772156, + 0.7726784944534302, + 0.758276104927063 + ], + "rho_per_layer": [ + 0.9999993443489075, + 0.999996542930603, + 0.999983549118042, + 0.9999449253082275 + ], + "nudge_per_layer": [ + -0.15056422352790833, + -0.08916378021240234, + -0.04451071470975876, + -0.024980343878269196 + ] + }, + "dfa": { + "test_acc": 0.8655, + "mean_bp_cosine": 0.06126724602654576, + "mean_rho": 0.09146236767992377, + "mean_nudge_001": -0.00023738171148579568, + "mean_nudge_003": -0.0006991284317336977, + "mean_nudge_01": -0.0021681145881302655, + "bp_cosine_per_layer": [ + -0.012256121262907982, + 0.07949584722518921, + 0.0787847638130188, + 0.09904449433088303 + ], + "rho_per_layer": [ + -0.003950485959649086, + 0.06165219843387604, + 0.14469987154006958, + 0.16344788670539856 + ], + "nudge_per_layer": [ + 0.002696676878258586, + -0.005506287328898907, + -0.0027312645688652992, + -0.003131583333015442 + ] + }, + "state_bridge": { + "test_acc": 0.7455, + "mean_bp_cosine": 0.4014641270041466, + "mean_rho": 0.3732803575694561, + "mean_nudge_001": -0.007542004925198853, + "mean_nudge_003": -0.022030926978914067, + "mean_nudge_01": -0.06684440147364512, + "bp_cosine_per_layer": [ + 0.8436356782913208, + 0.46039146184921265, + 0.16277557611465454, + 0.13905379176139832 + ], + "rho_per_layer": [ + 0.7277628183364868, + 0.48849108815193176, + 0.1771586537361145, + 0.09970887005329132 + ], + "nudge_per_layer": [ + -0.2401106357574463, + -0.018598388880491257, + -0.004775169305503368, + -0.0038934119511395693 + ], + "state_pred_error_per_layer": [ + 3442.556884765625, + 2195.27490234375, + 2035.546875, + 2293.3291015625 + ], + "mean_state_pred_error": 2491.6769409179688 + }, + "credit_bridge": { + "test_acc": 0.644, + "mean_bp_cosine": 0.1536249229684472, + "mean_rho": 0.26861424930393696, + "mean_nudge_001": -0.0018619927868712693, + "mean_nudge_003": -0.005573431379161775, + "mean_nudge_01": -0.018431853968650103, + "bp_cosine_per_layer": [ + 0.053475264459848404, + 0.17959368228912354, + 0.19590041041374207, + 0.18553033471107483 + ], + "rho_per_layer": [ + 0.04320300370454788, + 0.30398592352867126, + 0.35316282510757446, + 0.3741052448749542 + ], + "nudge_per_layer": [ + -0.027841825038194656, + -0.015361151657998562, + -0.015351004898548126, + -0.015173434279859066 + ], + "final_value_loss": 0.7469501955509186, + "final_term_loss": 0.4142983556270599, + "final_bridge_loss": 0.05541581681370735, + "final_tgrad_loss": 0.2772360302686691 + } + }, + "a0.0_L8_s42": { + "bp": { + "test_acc": 0.906, + "mean_bp_cosine": 0.8584278598427773, + "mean_rho": 0.9999460652470589, + "mean_nudge_001": -0.008581212867284194, + "mean_nudge_003": -0.02450006199069321, + "mean_nudge_01": -0.06902276305481791, + "bp_cosine_per_layer": [ + 0.8854324817657471, + 0.8737501502037048, + 0.8630377054214478, + 0.8562113046646118, + 0.8509326577186584, + 0.8481521606445312, + 0.84560626745224, + 0.8443001508712769 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999963045120239, + 0.9999881386756897, + 0.9999630451202393, + 0.9999364614486694, + 0.9999151825904846, + 0.9998926520347595, + 0.9998775720596313 + ], + "nudge_per_layer": [ + -0.21767401695251465, + -0.12408202886581421, + -0.06762672960758209, + -0.04208396375179291, + -0.031123068183660507, + -0.025745777413249016, + -0.022784877568483353, + -0.021061642095446587 + ] + }, + "dfa": { + "test_acc": 0.8325, + "mean_bp_cosine": 0.0621855678036809, + "mean_rho": 0.08102096850052476, + "mean_nudge_001": 7.459322478098329e-05, + "mean_nudge_003": 0.00026162770882365294, + "mean_nudge_01": 0.0013351911620702595, + "bp_cosine_per_layer": [ + -0.02968163788318634, + 0.08609121292829514, + 0.09377065300941467, + 0.10205866396427155, + 0.08807726949453354, + 0.053033627569675446, + 0.056919872760772705, + 0.04721488058567047 + ], + "rho_per_layer": [ + -0.09032663702964783, + 0.17043988406658173, + 0.18389353156089783, + 0.16770029067993164, + 0.1504741907119751, + 0.05179755389690399, + 0.050898581743240356, + -0.03670964762568474 + ], + "nudge_per_layer": [ + 0.028243789449334145, + -0.00520662497729063, + -0.0028999613132327795, + -0.002869710559025407, + -0.0023996694944798946, + -0.0015899656573310494, + -0.0014181910082697868, + -0.0011781371431425214 + ] + }, + "state_bridge": { + "test_acc": 0.726, + "mean_bp_cosine": 0.26912851445376873, + "mean_rho": 0.2629122715443373, + "mean_nudge_001": -0.0034038230442092754, + "mean_nudge_003": -0.010012732280301861, + "mean_nudge_01": -0.0311450962908566, + "bp_cosine_per_layer": [ + 0.8151727914810181, + 0.4042307734489441, + 0.16176781058311462, + 0.1698867678642273, + 0.14891386032104492, + 0.1726662963628769, + 0.1322125643491745, + 0.14817725121974945 + ], + "rho_per_layer": [ + 0.7261759042739868, + 0.36915943026542664, + 0.17840053141117096, + 0.16105638444423676, + 0.14931628108024597, + 0.15696927905082703, + 0.17820878326892853, + 0.1840115785598755 + ], + "nudge_per_layer": [ + -0.21425020694732666, + -0.011446774937212467, + -0.004181142896413803, + -0.004114024806767702, + -0.0038589704781770706, + -0.00422251783311367, + -0.003358659567311406, + -0.003728472860530019 + ], + "state_pred_error_per_layer": [ + 7398.20849609375, + 5242.7607421875, + 3768.9609375, + 3258.12548828125, + 3060.2021484375, + 2786.609619140625, + 3211.44921875, + 2939.81005859375 + ], + "mean_state_pred_error": 3958.265838623047 + }, + "credit_bridge": { + "test_acc": 0.64, + "mean_bp_cosine": 0.09559969999827445, + "mean_rho": 0.20091960858553648, + "mean_nudge_001": -0.0007423463721352164, + "mean_nudge_003": -0.0022244660067372024, + "mean_nudge_01": -0.007368246268015355, + "bp_cosine_per_layer": [ + 0.010387556627392769, + 0.06787668168544769, + 0.11108389496803284, + 0.11367877572774887, + 0.11491300165653229, + 0.1093105673789978, + 0.11488444358110428, + 0.12266267836093903 + ], + "rho_per_layer": [ + 0.0504305437207222, + 0.11780044436454773, + 0.23789767920970917, + 0.24238067865371704, + 0.22429296374320984, + 0.25153419375419617, + 0.25647929310798645, + 0.22654107213020325 + ], + "nudge_per_layer": [ + -0.003928218502551317, + -0.0057389335706830025, + -0.007835019379854202, + -0.008116443641483784, + -0.0081653306260705, + -0.00813683308660984, + -0.008312376216053963, + -0.00871281512081623 + ], + "final_value_loss": 0.6615465266227722, + "final_term_loss": 0.43013124598264696, + "final_bridge_loss": 0.0357342723429203, + "final_tgrad_loss": 0.19568100452423096 + } + }, + "a0.0_L8_s123": { + "bp": { + "test_acc": 0.913, + "mean_bp_cosine": 0.8645070418715477, + "mean_rho": 0.999944381415844, + "mean_nudge_001": -0.007505885470891371, + "mean_nudge_003": -0.021483065967913717, + "mean_nudge_01": -0.06040166970342398, + "bp_cosine_per_layer": [ + 0.9087610840797424, + 0.8890509605407715, + 0.8756387233734131, + 0.860000729560852, + 0.8513467311859131, + 0.8465403914451599, + 0.8431664705276489, + 0.8415512442588806 + ], + "rho_per_layer": [ + 0.9999994039535522, + 0.9999971389770508, + 0.9999857544898987, + 0.9999687671661377, + 0.9999316930770874, + 0.9999115467071533, + 0.9998936653137207, + 0.9998670816421509 + ], + "nudge_per_layer": [ + -0.19297254085540771, + -0.10940254479646683, + -0.05867426097393036, + -0.03609157353639603, + -0.026526644825935364, + -0.02192458137869835, + -0.019491419196128845, + -0.01812979206442833 + ] + }, + "dfa": { + "test_acc": 0.849, + "mean_bp_cosine": 0.07409168453887105, + "mean_rho": 0.0943274952005595, + "mean_nudge_001": -6.366873094520997e-06, + "mean_nudge_003": -1.1956191883655265e-05, + "mean_nudge_01": 5.2888659411109984e-05, + "bp_cosine_per_layer": [ + -0.02848462387919426, + 0.15189720690250397, + 0.09141203761100769, + 0.07272940874099731, + 0.09136377274990082, + 0.0857112780213356, + 0.044680722057819366, + 0.0834236741065979 + ], + "rho_per_layer": [ + 0.03057212010025978, + 0.16072696447372437, + 0.13512857258319855, + 0.0885201245546341, + 0.1377822607755661, + 0.04239961504936218, + 0.0035119224339723587, + 0.15597838163375854 + ], + "nudge_per_layer": [ + 0.015482441522181034, + -0.004561400040984154, + -0.0020816801115870476, + -0.0015152986161410809, + -0.0019329312490299344, + -0.002064004773274064, + -0.001068722689524293, + -0.0018352947663515806 + ] + }, + "state_bridge": { + "test_acc": 0.7725, + "mean_bp_cosine": 0.2933046016842127, + "mean_rho": 0.25743963569402695, + "mean_nudge_001": -0.0033750918046280276, + "mean_nudge_003": -0.009846233486314304, + "mean_nudge_01": -0.02971906404127367, + "bp_cosine_per_layer": [ + 0.8679102659225464, + 0.46438825130462646, + 0.22033852338790894, + 0.1893446445465088, + 0.16738475859165192, + 0.14945879578590393, + 0.1267041563987732, + 0.16090741753578186 + ], + "rho_per_layer": [ + 0.6897462606430054, + 0.42848390340805054, + 0.19369670748710632, + 0.19582855701446533, + 0.14048044383525848, + 0.12853404879570007, + 0.09809397161006927, + 0.18465319275856018 + ], + "nudge_per_layer": [ + -0.2050759196281433, + -0.01248687319457531, + -0.004478689283132553, + -0.003817938268184662, + -0.00330835347995162, + -0.002980519086122513, + -0.002494834130629897, + -0.003109385259449482 + ], + "state_pred_error_per_layer": [ + 7121.279296875, + 6133.4482421875, + 3940.991943359375, + 2496.587646484375, + 2560.85595703125, + 2498.587890625, + 3539.93115234375, + 2449.22607421875 + ], + "mean_state_pred_error": 3842.613525390625 + }, + "credit_bridge": { + "test_acc": 0.656, + "mean_bp_cosine": 0.092392878344981, + "mean_rho": 0.17488694936037064, + "mean_nudge_001": -0.0007325447659241036, + "mean_nudge_003": -0.002192195039242506, + "mean_nudge_01": -0.0072501768881920725, + "bp_cosine_per_layer": [ + 0.001700198045000434, + 0.04125010222196579, + 0.1112770289182663, + 0.11907510459423065, + 0.11768756806850433, + 0.11733907461166382, + 0.11329221725463867, + 0.117521733045578 + ], + "rho_per_layer": [ + 0.043069981038570404, + 0.1044735386967659, + 0.23828034102916718, + 0.18111932277679443, + 0.19782572984695435, + 0.1971191018819809, + 0.20729684829711914, + 0.2299107313156128 + ], + "nudge_per_layer": [ + -0.006082434207201004, + -0.003400696674361825, + -0.007903593592345715, + -0.008138573728501797, + -0.008289994671940804, + -0.007994470186531544, + -0.00807441771030426, + -0.008117234334349632 + ], + "final_value_loss": 0.5009399848937989, + "final_term_loss": 0.26505257573127744, + "final_bridge_loss": 0.027039055764675142, + "final_tgrad_loss": 0.20884835484027864 + } + }, + "a0.0_L8_s456": { + "bp": { + "test_acc": 0.8965, + "mean_bp_cosine": 0.8864798843860626, + "mean_rho": 0.9999493733048439, + "mean_nudge_001": -0.007212058277218603, + "mean_nudge_003": -0.02048966591246426, + "mean_nudge_01": -0.05707334354519844, + "bp_cosine_per_layer": [ + 0.9283311367034912, + 0.9162832498550415, + 0.8925424814224243, + 0.8799441456794739, + 0.8746041655540466, + 0.8698863983154297, + 0.8666130304336548, + 0.863634467124939 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.9999967217445374, + 0.9999891519546509, + 0.9999651908874512, + 0.9999410510063171, + 0.9999043941497803, + 0.9998966455459595, + 0.9999027252197266 + ], + "nudge_per_layer": [ + -0.17811693251132965, + -0.10346511751413345, + -0.05678309500217438, + -0.035222865641117096, + -0.025761041790246964, + -0.021198198199272156, + -0.01872769370675087, + -0.017311803996562958 + ] + }, + "dfa": { + "test_acc": 0.833, + "mean_bp_cosine": 0.10069436486810446, + "mean_rho": 0.11729028820991516, + "mean_nudge_001": -0.00045204991511127446, + "mean_nudge_003": -0.0013379494193941355, + "mean_nudge_01": -0.004276915889931843, + "bp_cosine_per_layer": [ + 0.020978286862373352, + 0.16464680433273315, + 0.15073026716709137, + 0.08116275072097778, + 0.08070477098226547, + 0.0867747962474823, + 0.10854049026966095, + 0.11201675236225128 + ], + "rho_per_layer": [ + 0.032643549144268036, + 0.2071959227323532, + 0.2057623416185379, + 0.09326457977294922, + 0.06205561012029648, + 0.1389445811510086, + 0.11340519785881042, + 0.08505052328109741 + ], + "nudge_per_layer": [ + -0.012655803002417088, + -0.005697320215404034, + -0.004094945732504129, + -0.0018561023753136396, + -0.0020380420610308647, + -0.0022426587529480457, + -0.002856952603906393, + -0.0027735023759305477 + ] + }, + "state_bridge": { + "test_acc": 0.7495, + "mean_bp_cosine": 0.246165806427598, + "mean_rho": 0.20948901865631342, + "mean_nudge_001": -0.0035059251604252495, + "mean_nudge_003": -0.010245608449622523, + "mean_nudge_01": -0.03114599542459473, + "bp_cosine_per_layer": [ + 0.8467778563499451, + 0.3549606502056122, + 0.1711018681526184, + 0.12375819683074951, + 0.1153455525636673, + 0.12219913303852081, + 0.12895643711090088, + 0.10622675716876984 + ], + "rho_per_layer": [ + 0.7416437268257141, + 0.2796669900417328, + 0.14060860872268677, + 0.09820520132780075, + 0.10454020649194717, + 0.08740514516830444, + 0.10375625640153885, + 0.12008601427078247 + ], + "nudge_per_layer": [ + -0.2212277054786682, + -0.010068328119814396, + -0.00393392750993371, + -0.002955838106572628, + -0.0027290289290249348, + -0.0028208147268742323, + -0.002979037119075656, + -0.002453283406794071 + ], + "state_pred_error_per_layer": [ + 10942.7939453125, + 10293.740234375, + 7482.4482421875, + 5008.9619140625, + 4863.818359375, + 4492.451171875, + 3565.2744140625, + 3837.47998046875 + ], + "mean_state_pred_error": 6310.871032714844 + }, + "credit_bridge": { + "test_acc": 0.617, + "mean_bp_cosine": 0.09351247036829591, + "mean_rho": 0.15350601403042674, + "mean_nudge_001": -0.0010894104561884888, + "mean_nudge_003": -0.0032592675706837326, + "mean_nudge_01": -0.010775732051115483, + "bp_cosine_per_layer": [ + 0.03283574804663658, + 0.05836774408817291, + 0.11590129137039185, + 0.10100162029266357, + 0.1079024076461792, + 0.10276803374290466, + 0.11581481993198395, + 0.11350809782743454 + ], + "rho_per_layer": [ + 0.06095704063773155, + 0.13836193084716797, + 0.1803440898656845, + 0.1439131498336792, + 0.14064353704452515, + 0.15858328342437744, + 0.22606094181537628, + 0.17918413877487183 + ], + "nudge_per_layer": [ + -0.023668643087148666, + -0.006166210863739252, + -0.009575091302394867, + -0.00891521479934454, + -0.00932026281952858, + -0.008899858221411705, + -0.009868312627077103, + -0.009792262688279152 + ], + "final_value_loss": 1.2871107803344726, + "final_term_loss": 0.9274139808654785, + "final_bridge_loss": 0.0815536917924881, + "final_tgrad_loss": 0.2781431001186371 + } + }, + "a0.0_L12_s42": { + "bp": { + "test_acc": 0.9135, + "mean_bp_cosine": 0.8262566576401392, + "mean_rho": 0.9998530795176824, + "mean_nudge_001": -0.005460524485291292, + "mean_nudge_003": -0.015294013021048158, + "mean_nudge_01": -0.04075813665986061, + "bp_cosine_per_layer": [ + 0.8936765193939209, + 0.875713586807251, + 0.8523612022399902, + 0.835299551486969, + 0.8243429064750671, + 0.8148068189620972, + 0.809612512588501, + 0.8055970668792725, + 0.8028815984725952, + 0.8011909127235413, + 0.8001247644424438, + 0.799472451210022 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.999997615814209, + 0.9999872446060181, + 0.9999661445617676, + 0.9999244213104248, + 0.9998762011528015, + 0.9998204708099365, + 0.9997811317443848, + 0.9997683167457581, + 0.9997478723526001, + 0.9997052550315857, + 0.9996634721755981 + ], + "nudge_per_layer": [ + -0.15880361199378967, + -0.10216463357210159, + -0.058997806161642075, + -0.0368044376373291, + -0.02622675709426403, + -0.02074911817908287, + -0.017529264092445374, + -0.015481802634894848, + -0.014148212037980556, + -0.013247357681393623, + -0.012655021622776985, + -0.012289617210626602 + ] + }, + "dfa": { + "test_acc": 0.8405, + "mean_bp_cosine": 0.06366231696059306, + "mean_rho": 0.0974447913467884, + "mean_nudge_001": -0.00019441865091115082, + "mean_nudge_003": -0.0005761026429051223, + "mean_nudge_01": -0.001826463839582478, + "bp_cosine_per_layer": [ + 0.022819485515356064, + 0.10611869394779205, + 0.08763782680034637, + 0.06361521780490875, + 0.08818645775318146, + 0.07573625445365906, + 0.07574683427810669, + 0.025106821209192276, + 0.029594242572784424, + 0.09018446505069733, + 0.04191981628537178, + 0.05728168785572052 + ], + "rho_per_layer": [ + -0.0498071163892746, + 0.18554872274398804, + 0.19663047790527344, + 0.14150168001651764, + 0.06663499772548676, + 0.12039551883935928, + 0.12434913218021393, + 0.05157296732068062, + 0.09405694901943207, + 0.07376686483621597, + 0.061272408813238144, + 0.10341489315032959 + ], + "nudge_per_layer": [ + 0.000284646637737751, + -0.005279931705445051, + -0.002400151453912258, + -0.0017087131273001432, + -0.0019207102013751864, + -0.0020927595905959606, + -0.0017691099783405662, + -0.0008208724320866168, + -0.0012333606136962771, + -0.0026537002995610237, + -0.0007275568204931915, + -0.0015953464899212122 + ] + }, + "state_bridge": { + "test_acc": 0.675, + "mean_bp_cosine": 0.16806975565850735, + "mean_rho": 0.14302178906897703, + "mean_nudge_001": -0.0021900876042006225, + "mean_nudge_003": -0.006470390944741666, + "mean_nudge_01": -0.020386384644856054, + "bp_cosine_per_layer": [ + 0.7431880235671997, + 0.2796655595302582, + 0.13151727616786957, + 0.09881292283535004, + 0.0924338698387146, + 0.10159576684236526, + 0.09764175117015839, + 0.09642879664897919, + 0.09804226458072662, + 0.09603762626647949, + 0.09261822700500488, + 0.08885498344898224 + ], + "rho_per_layer": [ + 0.611870527267456, + 0.24307268857955933, + 0.10120554268360138, + 0.09459854662418365, + 0.09521515667438507, + 0.07265714555978775, + 0.07570740580558777, + 0.0650622695684433, + 0.07738275825977325, + 0.11346932500600815, + 0.08958262950181961, + 0.07643747329711914 + ], + "nudge_per_layer": [ + -0.20912763476371765, + -0.00893338117748499, + -0.0035844063386321068, + -0.0027289288118481636, + -0.0024399380199611187, + -0.0026743747293949127, + -0.0025294050574302673, + -0.002557961270213127, + -0.0026802942156791687, + -0.002547960262745619, + -0.002460954710841179, + -0.0023713763803243637 + ], + "state_pred_error_per_layer": [ + 20223.798828125, + 14219.4013671875, + 11048.2333984375, + 10263.419921875, + 8570.201171875, + 7224.33740234375, + 7281.2197265625, + 8034.87548828125, + 6686.9033203125, + 6885.98291015625, + 6667.048828125, + 6627.78125 + ], + "mean_state_pred_error": 9477.766967773438 + }, + "credit_bridge": { + "test_acc": 0.6635, + "mean_bp_cosine": 0.07870348079207663, + "mean_rho": 0.1263093726399044, + "mean_nudge_001": -0.000519128576949394, + "mean_nudge_003": -0.0015524110640399158, + "mean_nudge_01": -0.005132454059397181, + "bp_cosine_per_layer": [ + 9.498395957052708e-05, + 0.029415149241685867, + 0.062070880085229874, + 0.07393385469913483, + 0.07970248907804489, + 0.08624569326639175, + 0.10002343356609344, + 0.10488344728946686, + 0.10920242965221405, + 0.10451158881187439, + 0.09929930418729782, + 0.09505851566791534 + ], + "rho_per_layer": [ + 0.025425152853131294, + 0.0574759915471077, + 0.13417154550552368, + 0.10034967213869095, + 0.17468321323394775, + 0.17164339125156403, + 0.15925100445747375, + 0.08668951690196991, + 0.1521437168121338, + 0.14672580361366272, + 0.1825145184993744, + 0.12463894486427307 + ], + "nudge_per_layer": [ + 0.001420565415173769, + -0.0026360084302723408, + -0.00476992130279541, + -0.005131378769874573, + -0.005615689791738987, + -0.006001932080835104, + -0.006417973432689905, + -0.006630052346736193, + -0.006984136067330837, + -0.0066003259271383286, + -0.00623705331236124, + -0.005985542666167021 + ], + "final_value_loss": 0.9863593735218048, + "final_term_loss": 0.7168336891174316, + "final_bridge_loss": 0.05245816183909774, + "final_tgrad_loss": 0.21706753172874452 + } + }, + "a0.0_L12_s123": { + "bp": { + "test_acc": 0.9145, + "mean_bp_cosine": 0.7868696798880895, + "mean_rho": 0.9998756001393, + "mean_nudge_001": -0.005259950548255195, + "mean_nudge_003": -0.014897353908357521, + "mean_nudge_01": -0.04119087569415569, + "bp_cosine_per_layer": [ + 0.832116425037384, + 0.8141677379608154, + 0.8023761510848999, + 0.7934653759002686, + 0.7857377529144287, + 0.7797414064407349, + 0.7767306566238403, + 0.7744640111923218, + 0.7725205421447754, + 0.7711977958679199, + 0.7703278064727783, + 0.7695904970169067 + ], + "rho_per_layer": [ + 0.9999991655349731, + 0.9999972581863403, + 0.9999898672103882, + 0.999970555305481, + 0.9999305009841919, + 0.9999109506607056, + 0.9998676180839539, + 0.999832808971405, + 0.9997924566268921, + 0.9997202754020691, + 0.9997268319129944, + 0.9997689127922058 + ], + "nudge_per_layer": [ + -0.17892791330814362, + -0.10439710319042206, + -0.05659153312444687, + -0.034265220165252686, + -0.02416030317544937, + -0.01895919442176819, + -0.015955276787281036, + -0.01404004916548729, + -0.01277724839746952, + -0.011922692880034447, + -0.011335920542478561, + -0.010958053171634674 + ] + }, + "dfa": { + "test_acc": 0.841, + "mean_bp_cosine": 0.10045036673545837, + "mean_rho": 0.06510928040370345, + "mean_nudge_001": -0.000200933368432743, + "mean_nudge_003": -0.000600688594810587, + "mean_nudge_01": -0.001976225830730982, + "bp_cosine_per_layer": [ + 0.009534038603305817, + 0.2771005630493164, + 0.12846891582012177, + 0.12727834284305573, + 0.09264838695526123, + 0.08494879305362701, + 0.1454543173313141, + 0.07647830247879028, + 0.055110231041908264, + 0.08491981029510498, + 0.054209403693675995, + 0.06925329566001892 + ], + "rho_per_layer": [ + -0.030354971066117287, + 0.19958093762397766, + 0.10430362075567245, + 0.06749340891838074, + 0.08917459845542908, + 0.06985980272293091, + 0.08990536630153656, + -0.0003178045153617859, + -0.05352415516972542, + 0.12398940324783325, + 0.05844062566757202, + 0.06276053190231323 + ], + "nudge_per_layer": [ + 0.0008368014823645353, + -0.00641840323805809, + -0.0027151124086230993, + -0.002792379120364785, + -0.0018645611125975847, + -0.0017843465320765972, + -0.002957880962640047, + -0.0012784524587914348, + -0.0007560949889011681, + -0.0015581869520246983, + -0.0010259757982566953, + -0.0014001178788021207 + ] + }, + "state_bridge": { + "test_acc": 0.675, + "mean_bp_cosine": 0.21027903320888677, + "mean_rho": 0.16716737858951092, + "mean_nudge_001": -0.002424063318661259, + "mean_nudge_003": -0.007164865601225756, + "mean_nudge_01": -0.02264038595603779, + "bp_cosine_per_layer": [ + 0.7589784860610962, + 0.34465640783309937, + 0.20695620775222778, + 0.15412747859954834, + 0.14041899144649506, + 0.152847021818161, + 0.1464981734752655, + 0.13855373859405518, + 0.13026131689548492, + 0.11798880249261856, + 0.11249798536300659, + 0.11956378817558289 + ], + "rho_per_layer": [ + 0.6762608289718628, + 0.29351934790611267, + 0.15623700618743896, + 0.07772233337163925, + 0.09808109700679779, + 0.14218339323997498, + 0.09985582530498505, + 0.07779418677091599, + 0.10923020541667938, + 0.10118008404970169, + 0.08211226016283035, + 0.09183197468519211 + ], + "nudge_per_layer": [ + -0.22324970364570618, + -0.01123635284602642, + -0.0056420015171170235, + -0.0040974924340844154, + -0.0037027131766080856, + -0.003983458504080772, + -0.0038626876194030046, + -0.0036268262192606926, + -0.003363188588991761, + -0.0030670221894979477, + -0.0028224957641214132, + -0.0030306889675557613 + ], + "state_pred_error_per_layer": [ + 10215.58203125, + 8926.0654296875, + 5285.6044921875, + 5192.0830078125, + 4575.35791015625, + 4063.82666015625, + 4966.6884765625, + 5378.6435546875, + 4702.37890625, + 4026.143310546875, + 3985.35595703125, + 3780.156494140625 + ], + "mean_state_pred_error": 5424.8238525390625 + }, + "credit_bridge": { + "test_acc": 0.721, + "mean_bp_cosine": 0.020079606105961528, + "mean_rho": 0.0501531979146724, + "mean_nudge_001": -0.00015450727914867457, + "mean_nudge_003": -0.0004599024711448389, + "mean_nudge_01": -0.001498352525231894, + "bp_cosine_per_layer": [ + -0.0035465662367641926, + -0.001160490675829351, + 0.00486466521397233, + 0.012821277603507042, + 0.012568866834044456, + 0.019143100827932358, + 0.022381767630577087, + 0.024246837943792343, + 0.027966029942035675, + 0.03333558514714241, + 0.04247187077999115, + 0.04586232826113701 + ], + "rho_per_layer": [ + 0.01447216235101223, + -0.01648387312889099, + 0.027175014838576317, + 0.03045208379626274, + 0.05211577191948891, + -0.0074118818156421185, + 0.0508866012096405, + 0.01983593963086605, + 0.03707783669233322, + 0.12354743480682373, + 0.16596439480781555, + 0.10420688986778259 + ], + "nudge_per_layer": [ + 0.002342540305107832, + -0.0004765552293974906, + -0.0007624666905030608, + -0.0012423819862306118, + -0.0012568822130560875, + -0.0016762344166636467, + -0.0018269497668370605, + -0.0020500137470662594, + -0.0022837575525045395, + -0.0026187507901340723, + -0.0029940432868897915, + -0.0031347349286079407 + ], + "final_value_loss": 0.37253577736616134, + "final_term_loss": 0.18445234730243684, + "final_bridge_loss": 0.0251624245762825, + "final_tgrad_loss": 0.16292100727558137 + } + }, + "a0.0_L12_s456": { + "bp": { + "test_acc": 0.9115, + "mean_bp_cosine": 0.7958964506785074, + "mean_rho": 0.9998697290817896, + "mean_nudge_001": -0.0046546936306792, + "mean_nudge_003": -0.013125322526320815, + "mean_nudge_01": -0.03561708889901638, + "bp_cosine_per_layer": [ + 0.841245174407959, + 0.830803632736206, + 0.8195754885673523, + 0.8066799640655518, + 0.7983194589614868, + 0.7908304929733276, + 0.7860588431358337, + 0.7811387777328491, + 0.7771316170692444, + 0.7744728326797485, + 0.7727954983711243, + 0.7717056274414062 + ], + "rho_per_layer": [ + 0.9999991059303284, + 0.9999973177909851, + 0.9999889731407166, + 0.9999734163284302, + 0.9999427795410156, + 0.9998763799667358, + 0.9998629093170166, + 0.9998323321342468, + 0.9997599720954895, + 0.9997479319572449, + 0.9997410774230957, + 0.9997145533561707 + ], + "nudge_per_layer": [ + -0.1470111906528473, + -0.09042022377252579, + -0.050197783857584, + -0.030754856765270233, + -0.021816428750753403, + -0.017199307680130005, + -0.014493460766971111, + -0.012762569822371006, + -0.01160583458840847, + -0.010828070342540741, + -0.010316012427210808, + -0.00999932736158371 + ] + }, + "dfa": { + "test_acc": 0.8275, + "mean_bp_cosine": 0.109907116740942, + "mean_rho": 0.10316232999321073, + "mean_nudge_001": -0.00034242031688336283, + "mean_nudge_003": -0.001020948082441464, + "mean_nudge_01": -0.0033549320845243833, + "bp_cosine_per_layer": [ + 0.0384417325258255, + 0.27492010593414307, + 0.17608770728111267, + 0.12729278206825256, + 0.09575799107551575, + 0.13158489763736725, + 0.07343505322933197, + 0.08012130856513977, + 0.08938327431678772, + 0.09414967149496078, + 0.06517850607633591, + 0.07253237068653107 + ], + "rho_per_layer": [ + -0.00336202559992671, + 0.18004602193832397, + 0.18598641455173492, + 0.15388232469558716, + 0.058810293674468994, + 0.14123386144638062, + 0.05320374667644501, + 0.10196533054113388, + 0.09802494943141937, + 0.10918877273797989, + 0.09344048798084259, + 0.0655277818441391 + ], + "nudge_per_layer": [ + -0.010087584145367146, + -0.006617182400077581, + -0.004152917303144932, + -0.0031182561069726944, + -0.0022262579295784235, + -0.0028664623387157917, + -0.0016081882640719414, + -0.0017378728371113539, + -0.0020772137213498354, + -0.002457245485857129, + -0.0015545324422419071, + -0.0017554720398038626 + ] + }, + "state_bridge": { + "test_acc": 0.684, + "mean_bp_cosine": 0.21628577137986818, + "mean_rho": 0.17074896084765592, + "mean_nudge_001": -0.0019644595328524397, + "mean_nudge_003": -0.0058011185271122185, + "mean_nudge_01": -0.018295541075834382, + "bp_cosine_per_layer": [ + 0.7363088726997375, + 0.32443851232528687, + 0.21702790260314941, + 0.21007081866264343, + 0.16975754499435425, + 0.1722516119480133, + 0.16474759578704834, + 0.12138545513153076, + 0.1178494393825531, + 0.13036376237869263, + 0.11493153870105743, + 0.1162962019443512 + ], + "rho_per_layer": [ + 0.6429969072341919, + 0.2531689405441284, + 0.22036504745483398, + 0.17542049288749695, + 0.15819020569324493, + 0.14438438415527344, + 0.07042165100574493, + 0.11963094770908356, + 0.1070300042629242, + 0.07622774690389633, + 0.035559043288230896, + 0.045592159032821655 + ], + "nudge_per_layer": [ + -0.1725819855928421, + -0.009430286474525928, + -0.0054127369076013565, + -0.005186344031244516, + -0.004062540829181671, + -0.0039931111969053745, + -0.003901706077158451, + -0.003083862829953432, + -0.002966922242194414, + -0.0033692335709929466, + -0.002796228276565671, + -0.002761534880846739 + ], + "state_pred_error_per_layer": [ + 8107.484375, + 6015.64697265625, + 3272.651123046875, + 3025.219970703125, + 3498.379150390625, + 2962.442626953125, + 2732.457275390625, + 3394.069091796875, + 3050.444091796875, + 3397.53271484375, + 3068.22607421875, + 3145.807373046875 + ], + "mean_state_pred_error": 3805.8634033203125 + }, + "credit_bridge": { + "test_acc": 0.669, + "mean_bp_cosine": 0.048155296875241525, + "mean_rho": 0.07334851861620943, + "mean_nudge_001": -0.00035685058537637815, + "mean_nudge_003": -0.0010696607399343823, + "mean_nudge_01": -0.0035326933624067656, + "bp_cosine_per_layer": [ + 0.0015124600613489747, + 0.020085982978343964, + 0.03127610310912132, + 0.03517032414674759, + 0.042219605296850204, + 0.05027471110224724, + 0.05683741718530655, + 0.057938531041145325, + 0.06581299006938934, + 0.06761687994003296, + 0.07107532024383545, + 0.07804323732852936 + ], + "rho_per_layer": [ + 0.03147998824715614, + -0.015333062037825584, + 0.020876668393611908, + 0.07304719090461731, + 0.0599740669131279, + 0.08874240517616272, + 0.05341971293091774, + 0.07721589505672455, + 0.08801877498626709, + 0.10527393221855164, + 0.16833831369876862, + 0.1291283369064331 + ], + "nudge_per_layer": [ + -0.004048495087772608, + -0.0012588155223056674, + -0.0019918864127248526, + -0.002725755563005805, + -0.0028244066052138805, + -0.003425109200179577, + -0.0036919033154845238, + -0.003999053034931421, + -0.0042928787879645824, + -0.004538967739790678, + -0.004742524586617947, + -0.004852524492889643 + ], + "final_value_loss": 0.8257113872528076, + "final_term_loss": 0.5509136886596679, + "final_bridge_loss": 0.049323998257517813, + "final_tgrad_loss": 0.22547370266914368 + } + }, + "a0.25_L2_s42": { + "bp": { + "test_acc": 0.908, + "mean_bp_cosine": 0.8980661034584045, + "mean_rho": 0.9999964535236359, + "mean_nudge_001": -0.01618960639461875, + "mean_nudge_003": -0.04483883548527956, + "mean_nudge_01": -0.11487101018428802, + "bp_cosine_per_layer": [ + 0.9068200588226318, + 0.8893121480941772 + ], + "rho_per_layer": [ + 0.9999985098838806, + 0.9999943971633911 + ], + "nudge_per_layer": [ + -0.15680165588855743, + -0.07294036448001862 + ] + }, + "dfa": { + "test_acc": 0.847, + "mean_bp_cosine": 0.026606750674545765, + "mean_rho": -0.0022891219705343246, + "mean_nudge_001": -2.3714659619145095e-05, + "mean_nudge_003": -1.6182020772248507e-05, + "mean_nudge_01": 0.0005980018759146333, + "bp_cosine_per_layer": [ + -0.008382977917790413, + 0.06159647926688194 + ], + "rho_per_layer": [ + -0.022914212197065353, + 0.018335968255996704 + ], + "nudge_per_layer": [ + 0.0033093439415097237, + -0.002113340189680457 + ] + }, + "state_bridge": { + "test_acc": 0.827, + "mean_bp_cosine": 0.6775506436824799, + "mean_rho": 0.6271905303001404, + "mean_nudge_001": -0.015066297259181738, + "mean_nudge_003": -0.04329914692789316, + "mean_nudge_01": -0.12377128005027771, + "bp_cosine_per_layer": [ + 0.9188902378082275, + 0.4362110495567322 + ], + "rho_per_layer": [ + 0.8401009440422058, + 0.41428011655807495 + ], + "nudge_per_layer": [ + -0.21947401762008667, + -0.02806854248046875 + ], + "state_pred_error_per_layer": [ + 753.1610107421875, + 333.87890625 + ], + "mean_state_pred_error": 543.5199584960938 + }, + "credit_bridge": { + "test_acc": 0.6455, + "mean_bp_cosine": 0.15288914740085602, + "mean_rho": 0.2540942281484604, + "mean_nudge_001": -0.003834493225440383, + "mean_nudge_003": -0.011456333566457033, + "mean_nudge_01": -0.03762407600879669, + "bp_cosine_per_layer": [ + 0.07500731945037842, + 0.23077097535133362 + ], + "rho_per_layer": [ + 0.12894567847251892, + 0.37924277782440186 + ], + "nudge_per_layer": [ + -0.05425257235765457, + -0.020995579659938812 + ], + "final_value_loss": 0.5630231554031372, + "final_term_loss": 0.2533654543399811, + "final_bridge_loss": 0.03314736911058426, + "final_tgrad_loss": 0.27651033034324646 + } + }, + "a0.25_L2_s123": { + "bp": { + "test_acc": 0.92, + "mean_bp_cosine": 0.8535160422325134, + "mean_rho": 0.9999972283840179, + "mean_nudge_001": -0.01451590727083385, + "mean_nudge_003": -0.03988213837146759, + "mean_nudge_01": -0.09831684827804565, + "bp_cosine_per_layer": [ + 0.8569881916046143, + 0.8500438928604126 + ], + "rho_per_layer": [ + 0.9999989867210388, + 0.9999954700469971 + ], + "nudge_per_layer": [ + -0.13159069418907166, + -0.06504300236701965 + ] + }, + "dfa": { + "test_acc": 0.853, + "mean_bp_cosine": 0.0877363346517086, + "mean_rho": 0.0626654140651226, + "mean_nudge_001": -0.0009488673531450331, + "mean_nudge_003": -0.0028224033303558826, + "mean_nudge_01": -0.009134252090007067, + "bp_cosine_per_layer": [ + 0.05345926433801651, + 0.1220134049654007 + ], + "rho_per_layer": [ + 0.09254007041454315, + 0.03279075771570206 + ], + "nudge_per_layer": [ + -0.0142319705337286, + -0.004036533646285534 + ] + }, + "state_bridge": { + "test_acc": 0.834, + "mean_bp_cosine": 0.6950189173221588, + "mean_rho": 0.5849489569664001, + "mean_nudge_001": -0.012975628254935145, + "mean_nudge_003": -0.03723907680250704, + "mean_nudge_01": -0.10619704332202673, + "bp_cosine_per_layer": [ + 0.9177796840667725, + 0.47225815057754517 + ], + "rho_per_layer": [ + 0.7912815809249878, + 0.3786163330078125 + ], + "nudge_per_layer": [ + -0.187799870967865, + -0.02459421567618847 + ], + "state_pred_error_per_layer": [ + 654.3871459960938, + 278.6759338378906 + ], + "mean_state_pred_error": 466.5315399169922 + }, + "credit_bridge": { + "test_acc": 0.638, + "mean_bp_cosine": 0.18947000801563263, + "mean_rho": 0.3388983681797981, + "mean_nudge_001": -0.004155236994847655, + "mean_nudge_003": -0.012411902891471982, + "mean_nudge_01": -0.04074052348732948, + "bp_cosine_per_layer": [ + 0.09752383828163147, + 0.2814161777496338 + ], + "rho_per_layer": [ + 0.2172888070344925, + 0.46050792932510376 + ], + "nudge_per_layer": [ + -0.05797416716814041, + -0.023506879806518555 + ], + "final_value_loss": 0.6248516966819763, + "final_term_loss": 0.2734043194293976, + "final_bridge_loss": 0.04374015842676163, + "final_tgrad_loss": 0.3077072183132172 + } + }, + "a0.25_L2_s456": { + "bp": { + "test_acc": 0.914, + "mean_bp_cosine": 0.8777631521224976, + "mean_rho": 0.9999973177909851, + "mean_nudge_001": -0.017619559541344643, + "mean_nudge_003": -0.04847448691725731, + "mean_nudge_01": -0.1200898252427578, + "bp_cosine_per_layer": [ + 0.8855119943618774, + 0.8700143098831177 + ], + "rho_per_layer": [ + 0.9999988079071045, + 0.9999958276748657 + ], + "nudge_per_layer": [ + -0.16111940145492554, + -0.07906024903059006 + ] + }, + "dfa": { + "test_acc": 0.842, + "mean_bp_cosine": 0.049672482535243034, + "mean_rho": 0.03196176886558533, + "mean_nudge_001": -0.0005511407216545194, + "mean_nudge_003": -0.0016261094715446234, + "mean_nudge_01": -0.0050985191483050585, + "bp_cosine_per_layer": [ + 0.015632983297109604, + 0.08371198177337646 + ], + "rho_per_layer": [ + -0.06864285469055176, + 0.1325663924217224 + ], + "nudge_per_layer": [ + -0.006782663054764271, + -0.003414375241845846 + ] + }, + "state_bridge": { + "test_acc": 0.817, + "mean_bp_cosine": 0.7210330367088318, + "mean_rho": 0.6920621693134308, + "mean_nudge_001": -0.01618554489687085, + "mean_nudge_003": -0.04673728672787547, + "mean_nudge_01": -0.13591178134083748, + "bp_cosine_per_layer": [ + 0.9367842674255371, + 0.5052818059921265 + ], + "rho_per_layer": [ + 0.846778392791748, + 0.5373459458351135 + ], + "nudge_per_layer": [ + -0.23458413779735565, + -0.037239424884319305 + ], + "state_pred_error_per_layer": [ + 626.5816650390625, + 277.74237060546875 + ], + "mean_state_pred_error": 452.1620178222656 + }, + "credit_bridge": { + "test_acc": 0.6685, + "mean_bp_cosine": 0.21126148104667664, + "mean_rho": 0.3547997772693634, + "mean_nudge_001": -0.004930314142256975, + "mean_nudge_003": -0.014735064469277859, + "mean_nudge_01": -0.048451079055666924, + "bp_cosine_per_layer": [ + 0.13380715250968933, + 0.28871580958366394 + ], + "rho_per_layer": [ + 0.2647465467453003, + 0.4448530077934265 + ], + "nudge_per_layer": [ + -0.07276535779237747, + -0.024136800318956375 + ], + "final_value_loss": 0.4186974630832672, + "final_term_loss": 0.13192469900846482, + "final_bridge_loss": 0.02328252377510071, + "final_tgrad_loss": 0.2634902417182922 + } + }, + "a0.25_L4_s42": { + "bp": { + "test_acc": 0.911, + "mean_bp_cosine": 0.841001495718956, + "mean_rho": 0.9999824017286301, + "mean_nudge_001": -0.012893156963400543, + "mean_nudge_003": -0.035831862362101674, + "mean_nudge_01": -0.09177740290760994, + "bp_cosine_per_layer": [ + 0.868922770023346, + 0.8429951667785645, + 0.8289605379104614, + 0.8231275081634521 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999972581863403, + 0.9999882578849792, + 0.9999451637268066 + ], + "nudge_per_layer": [ + -0.17674864828586578, + -0.10683682560920715, + -0.05415143817663193, + -0.029372699558734894 + ] + }, + "dfa": { + "test_acc": 0.8515, + "mean_bp_cosine": 0.0922011851798743, + "mean_rho": 0.09930456057190895, + "mean_nudge_001": -0.0006074781995266676, + "mean_nudge_003": -0.001813438575481996, + "mean_nudge_01": -0.005950940365437418, + "bp_cosine_per_layer": [ + 0.006489354185760021, + 0.12851163744926453, + 0.11991241574287415, + 0.11389133334159851 + ], + "rho_per_layer": [ + 0.029786743223667145, + 0.18639126420021057, + 0.11502038687467575, + 0.06601984798908234 + ], + "nudge_per_layer": [ + -0.01056693121790886, + -0.006519604474306107, + -0.003515135496854782, + -0.003202090272679925 + ] + }, + "state_bridge": { + "test_acc": 0.738, + "mean_bp_cosine": 0.3966497778892517, + "mean_rho": 0.33668526262044907, + "mean_nudge_001": -0.006818186957389116, + "mean_nudge_003": -0.020020907453726977, + "mean_nudge_01": -0.0618970247451216, + "bp_cosine_per_layer": [ + 0.8448630571365356, + 0.4407959580421448, + 0.15707260370254517, + 0.14386749267578125 + ], + "rho_per_layer": [ + 0.7033247947692871, + 0.34020179510116577, + 0.13395404815673828, + 0.1692604124546051 + ], + "nudge_per_layer": [ + -0.2203540802001953, + -0.01797248050570488, + -0.004883656278252602, + -0.004377881996333599 + ], + "state_pred_error_per_layer": [ + 3192.55322265625, + 2613.6337890625, + 1881.11669921875, + 2102.51953125 + ], + "mean_state_pred_error": 2447.455810546875 + }, + "credit_bridge": { + "test_acc": 0.662, + "mean_bp_cosine": 0.1593644004315138, + "mean_rho": 0.2909943610429764, + "mean_nudge_001": -0.0019232924096286297, + "mean_nudge_003": -0.005755707039497793, + "mean_nudge_01": -0.019015976693481207, + "bp_cosine_per_layer": [ + 0.07093458622694016, + 0.19623729586601257, + 0.18378585577011108, + 0.18649986386299133 + ], + "rho_per_layer": [ + 0.14815130829811096, + 0.336488276720047, + 0.35506749153137207, + 0.3242703676223755 + ], + "nudge_per_layer": [ + -0.033366985619068146, + -0.015239425003528595, + -0.013842864893376827, + -0.01361463125795126 + ], + "final_value_loss": 0.5039997359514237, + "final_term_loss": 0.20441836426854135, + "final_bridge_loss": 0.03893857387006283, + "final_tgrad_loss": 0.26064279942512514 + } + }, + "a0.25_L4_s123": { + "bp": { + "test_acc": 0.917, + "mean_bp_cosine": 0.7935318648815155, + "mean_rho": 0.9999762326478958, + "mean_nudge_001": -0.01081152242841199, + "mean_nudge_003": -0.029669071780517697, + "mean_nudge_01": -0.0743116931989789, + "bp_cosine_per_layer": [ + 0.8279672861099243, + 0.8114954233169556, + 0.7863935232162476, + 0.7482712268829346 + ], + "rho_per_layer": [ + 0.9999987483024597, + 0.9999956488609314, + 0.999983012676239, + 0.9999275207519531 + ], + "nudge_per_layer": [ + -0.14138484001159668, + -0.08725307881832123, + -0.04476301744580269, + -0.023845836520195007 + ] + }, + "dfa": { + "test_acc": 0.824, + "mean_bp_cosine": 0.1441014357842505, + "mean_rho": 0.14396781660616398, + "mean_nudge_001": -0.0003178600236424245, + "mean_nudge_003": -0.0009397821850143373, + "mean_nudge_01": -0.0029927556752227247, + "bp_cosine_per_layer": [ + -0.030194921419024467, + 0.3003618121147156, + 0.18209302425384521, + 0.12414582818746567 + ], + "rho_per_layer": [ + -0.038011275231838226, + 0.29912513494491577, + 0.1735759675502777, + 0.14118143916130066 + ], + "nudge_per_layer": [ + 0.005076530389487743, + -0.00841662660241127, + -0.005011391825973988, + -0.0036195346619933844 + ] + }, + "state_bridge": { + "test_acc": 0.733, + "mean_bp_cosine": 0.3913041353225708, + "mean_rho": 0.3523585610091686, + "mean_nudge_001": -0.0061569800454890355, + "mean_nudge_003": -0.01808436232386157, + "mean_nudge_01": -0.055880151805467904, + "bp_cosine_per_layer": [ + 0.821143627166748, + 0.36722686886787415, + 0.20176959037780762, + 0.1750764548778534 + ], + "rho_per_layer": [ + 0.6905952095985413, + 0.36183467507362366, + 0.19890159368515015, + 0.15810276567935944 + ], + "nudge_per_layer": [ + -0.1973220407962799, + -0.013631552457809448, + -0.0068134344182908535, + -0.0057535795494914055 + ], + "state_pred_error_per_layer": [ + 3017.568359375, + 2069.30517578125, + 2103.28662109375, + 1370.3270263671875 + ], + "mean_state_pred_error": 2140.121795654297 + }, + "credit_bridge": { + "test_acc": 0.7085, + "mean_bp_cosine": 0.11074696853756905, + "mean_rho": 0.20390365412458777, + "mean_nudge_001": -0.0010930995340459049, + "mean_nudge_003": -0.0032710169325582683, + "mean_nudge_01": -0.010791003005579114, + "bp_cosine_per_layer": [ + 0.021101564168930054, + 0.1092284768819809, + 0.14931762218475342, + 0.16334021091461182 + ], + "rho_per_layer": [ + 0.026919251307845116, + 0.23688018321990967, + 0.28421375155448914, + 0.2676014304161072 + ], + "nudge_per_layer": [ + -0.008425744250416756, + -0.009595570154488087, + -0.012630455195903778, + -0.012512242421507835 + ], + "final_value_loss": 0.44552071504592894, + "final_term_loss": 0.1639193995475769, + "final_bridge_loss": 0.022096455523371698, + "final_tgrad_loss": 0.2595048580646515 + } + }, + "a0.25_L4_s456": { + "bp": { + "test_acc": 0.9185, + "mean_bp_cosine": 0.7816510498523712, + "mean_rho": 0.9999814331531525, + "mean_nudge_001": -0.01180829742224887, + "mean_nudge_003": -0.032709411811083555, + "mean_nudge_01": -0.08326426614075899, + "bp_cosine_per_layer": [ + 0.8029586672782898, + 0.7900986075401306, + 0.7753629684448242, + 0.7581839561462402 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999964237213135, + 0.999983549118042, + 0.9999468326568604 + ], + "nudge_per_layer": [ + -0.15638579428195953, + -0.09745092689990997, + -0.05102477967739105, + -0.028195563703775406 + ] + }, + "dfa": { + "test_acc": 0.8515, + "mean_bp_cosine": 0.06627230579033494, + "mean_rho": 0.10299420775845647, + "mean_nudge_001": -0.000254730271990411, + "mean_nudge_003": -0.0007513021846534684, + "mean_nudge_01": -0.0023495194036513567, + "bp_cosine_per_layer": [ + -0.014162426814436913, + 0.0798005759716034, + 0.09311279654502869, + 0.10633827745914459 + ], + "rho_per_layer": [ + 0.041398823261260986, + 0.02247910387814045, + 0.1714327037334442, + 0.17666620016098022 + ], + "nudge_per_layer": [ + 0.002492401283234358, + -0.005343085154891014, + -0.0033098761923611164, + -0.003237517550587654 + ] + }, + "state_bridge": { + "test_acc": 0.7085, + "mean_bp_cosine": 0.37615348026156425, + "mean_rho": 0.3445914164185524, + "mean_nudge_001": -0.00598156735941302, + "mean_nudge_003": -0.017677294556051493, + "mean_nudge_01": -0.055878938641399145, + "bp_cosine_per_layer": [ + 0.8312708735466003, + 0.37615716457366943, + 0.14436809718608856, + 0.15281778573989868 + ], + "rho_per_layer": [ + 0.7588610649108887, + 0.34236449003219604, + 0.14024245738983154, + 0.13689765334129333 + ], + "nudge_per_layer": [ + -0.19714727997779846, + -0.01597677543759346, + -0.004914070479571819, + -0.005477628670632839 + ], + "state_pred_error_per_layer": [ + 2233.37158203125, + 1546.82080078125, + 996.9107666015625, + 942.33251953125 + ], + "mean_state_pred_error": 1429.8589172363281 + }, + "credit_bridge": { + "test_acc": 0.6185, + "mean_bp_cosine": 0.1528007835149765, + "mean_rho": 0.2638061139732599, + "mean_nudge_001": -0.0015675137401558459, + "mean_nudge_003": -0.004692548653110862, + "mean_nudge_01": -0.015524385962635279, + "bp_cosine_per_layer": [ + 0.048861026763916016, + 0.17950567603111267, + 0.17905107140541077, + 0.20378535985946655 + ], + "rho_per_layer": [ + 0.07314518839120865, + 0.3309200406074524, + 0.2789418697357178, + 0.3722173571586609 + ], + "nudge_per_layer": [ + -0.017692390829324722, + -0.014619983732700348, + -0.014469930902123451, + -0.015315238386392593 + ], + "final_value_loss": 0.64283842253685, + "final_term_loss": 0.27786159224510193, + "final_bridge_loss": 0.049283357608318326, + "final_tgrad_loss": 0.31569347660541536 + } + }, + "a0.25_L8_s42": { + "bp": { + "test_acc": 0.8955, + "mean_bp_cosine": 0.8411818519234657, + "mean_rho": 0.999948225915432, + "mean_nudge_001": -0.008358085062354803, + "mean_nudge_003": -0.023856630141381174, + "mean_nudge_01": -0.06703015509992838, + "bp_cosine_per_layer": [ + 0.8706932663917542, + 0.8596300482749939, + 0.8512309789657593, + 0.842391848564148, + 0.8334972858428955, + 0.8275372385978699, + 0.823634147644043, + 0.8208400011062622 + ], + "rho_per_layer": [ + 0.9999992847442627, + 0.9999973773956299, + 0.9999889731407166, + 0.9999737739562988, + 0.999952495098114, + 0.9999229311943054, + 0.9998778104782104, + 0.999873161315918 + ], + "nudge_per_layer": [ + -0.19971789419651031, + -0.12236367166042328, + -0.07083894312381744, + -0.044348303228616714, + -0.031799670308828354, + -0.02545534446835518, + -0.02191336825489998, + -0.01980404555797577 + ] + }, + "dfa": { + "test_acc": 0.835, + "mean_bp_cosine": 0.06675009592436254, + "mean_rho": 0.0799849673639983, + "mean_nudge_001": -6.642583684879355e-06, + "mean_nudge_003": -9.95869777398184e-06, + "mean_nudge_01": 0.00010420403850730509, + "bp_cosine_per_layer": [ + -0.029614916071295738, + 0.08655504137277603, + 0.09347832202911377, + 0.10665939003229141, + 0.10298001766204834, + 0.055703092366456985, + 0.06406168639659882, + 0.054178133606910706 + ], + "rho_per_layer": [ + -0.10576558113098145, + 0.13653026521205902, + 0.13744692504405975, + 0.169493168592453, + 0.1142939031124115, + 0.09325758367776871, + 0.1042378693819046, + -0.00961439497768879 + ], + "nudge_per_layer": [ + 0.021624702960252762, + -0.006033358629792929, + -0.003085250034928322, + -0.0032903538085520267, + -0.0030274176970124245, + -0.0016871094703674316, + -0.0020643905736505985, + -0.0016031904378905892 + ] + }, + "state_bridge": { + "test_acc": 0.7705, + "mean_bp_cosine": 0.2720195781439543, + "mean_rho": 0.24409680720418692, + "mean_nudge_001": -0.0037333294421841856, + "mean_nudge_003": -0.01090175670105964, + "mean_nudge_01": -0.03293398043024354, + "bp_cosine_per_layer": [ + 0.8497925996780396, + 0.4692588150501251, + 0.1727459728717804, + 0.1467132717370987, + 0.13944602012634277, + 0.1262509524822235, + 0.13373470306396484, + 0.13821429014205933 + ], + "rho_per_layer": [ + 0.7623768448829651, + 0.4223487377166748, + 0.18194836378097534, + 0.12129966914653778, + 0.11680327355861664, + 0.15588274598121643, + 0.1260674148797989, + 0.06604740768671036 + ], + "nudge_per_layer": [ + -0.23203837871551514, + -0.013907128013670444, + -0.0036564678885042667, + -0.0029728016816079617, + -0.0027978671714663506, + -0.0026036568451672792, + -0.002694307826459408, + -0.0028012352995574474 + ], + "state_pred_error_per_layer": [ + 10530.408203125, + 8501.392578125, + 5819.005859375, + 4775.642578125, + 4112.55224609375, + 3853.83984375, + 4342.64697265625, + 3851.865478515625 + ], + "mean_state_pred_error": 5723.419219970703 + }, + "credit_bridge": { + "test_acc": 0.616, + "mean_bp_cosine": 0.11742978217080235, + "mean_rho": 0.20278298296034336, + "mean_nudge_001": -0.000763369575906836, + "mean_nudge_003": -0.0022864671773277223, + "mean_nudge_01": -0.007572929258458316, + "bp_cosine_per_layer": [ + 0.0006081201136112213, + 0.13602128624916077, + 0.1264307200908661, + 0.13147516548633575, + 0.14721693098545074, + 0.1274956315755844, + 0.13849349319934845, + 0.1316969096660614 + ], + "rho_per_layer": [ + 0.0121258944272995, + 0.21904222667217255, + 0.23992177844047546, + 0.23384322226047516, + 0.24397125840187073, + 0.24230614304542542, + 0.23810306191444397, + 0.1929502785205841 + ], + "nudge_per_layer": [ + 0.0015163691714406013, + -0.009462166577577591, + -0.008223006501793861, + -0.008610539138317108, + -0.009565019980072975, + -0.00855704490095377, + -0.008995135314762592, + -0.008686890825629234 + ], + "final_value_loss": 0.5891867377281189, + "final_term_loss": 0.3338063308954239, + "final_bridge_loss": 0.026477533173561097, + "final_tgrad_loss": 0.2289028725862503 + } + }, + "a0.25_L8_s123": { + "bp": { + "test_acc": 0.896, + "mean_bp_cosine": 0.8579939901828766, + "mean_rho": 0.9999475553631783, + "mean_nudge_001": -0.008832237246679142, + "mean_nudge_003": -0.02530999999726191, + "mean_nudge_01": -0.07218505791388452, + "bp_cosine_per_layer": [ + 0.8995364308357239, + 0.8806806802749634, + 0.8653636574745178, + 0.852218508720398, + 0.8451849222183228, + 0.8416627645492554, + 0.8401176333427429, + 0.8391873240470886 + ], + "rho_per_layer": [ + 0.9999992251396179, + 0.9999973773956299, + 0.9999878406524658, + 0.9999729990959167, + 0.9999438524246216, + 0.9999128580093384, + 0.9999063611030579, + 0.9998599290847778 + ], + "nudge_per_layer": [ + -0.2192329615354538, + -0.13158643245697021, + -0.07524827122688293, + -0.04681030660867691, + -0.03351406753063202, + -0.026811176910996437, + -0.02318240888416767, + -0.02109483815729618 + ] + }, + "dfa": { + "test_acc": 0.833, + "mean_bp_cosine": 0.07527017407119274, + "mean_rho": 0.08970394870266318, + "mean_nudge_001": -3.044791992579121e-05, + "mean_nudge_003": -8.396412886213511e-05, + "mean_nudge_01": -0.00019736881949938834, + "bp_cosine_per_layer": [ + -0.030230171978473663, + 0.1515132635831833, + 0.08784028142690659, + 0.07231537997722626, + 0.09554086625576019, + 0.09082843363285065, + 0.05412551760673523, + 0.0802278220653534 + ], + "rho_per_layer": [ + 0.04074572026729584, + 0.1662997603416443, + 0.08309999853372574, + 0.07389070093631744, + 0.14882703125476837, + 0.04519672691822052, + 0.0252661295235157, + 0.13430552184581757 + ], + "nudge_per_layer": [ + 0.013973418623209, + -0.0047885943204164505, + -0.0020089128520339727, + -0.0015227446565404534, + -0.002120924647897482, + -0.0020366935059428215, + -0.001262089004740119, + -0.0018124101916328073 + ] + }, + "state_bridge": { + "test_acc": 0.753, + "mean_bp_cosine": 0.26880230009555817, + "mean_rho": 0.23677901271730661, + "mean_nudge_001": -0.0032272498192469357, + "mean_nudge_003": -0.009375294612254947, + "mean_nudge_01": -0.027950568503001705, + "bp_cosine_per_layer": [ + 0.8559742569923401, + 0.48324936628341675, + 0.20313377678394318, + 0.15002062916755676, + 0.13207414746284485, + 0.11473802477121353, + 0.10703189671039581, + 0.10419630259275436 + ], + "rho_per_layer": [ + 0.712527871131897, + 0.4307812452316284, + 0.20181137323379517, + 0.13881561160087585, + 0.15075963735580444, + 0.09288278967142105, + 0.0890430212020874, + 0.0776105523109436 + ], + "nudge_per_layer": [ + -0.19413721561431885, + -0.013532894663512707, + -0.004060069564729929, + -0.0029658200219273567, + -0.00256463885307312, + -0.0022291922941803932, + -0.00204793200828135, + -0.002066785003989935 + ], + "state_pred_error_per_layer": [ + 8381.830078125, + 6536.470703125, + 4195.43359375, + 3240.16162109375, + 3085.78857421875, + 3078.50390625, + 3156.81787109375, + 3267.9345703125 + ], + "mean_state_pred_error": 4367.867614746094 + }, + "credit_bridge": { + "test_acc": 0.651, + "mean_bp_cosine": 0.131322234403342, + "mean_rho": 0.19494653795845807, + "mean_nudge_001": -0.0009437191256438382, + "mean_nudge_003": -0.002826296287821606, + "mean_nudge_01": -0.009364197961986065, + "bp_cosine_per_layer": [ + 0.021486874669790268, + 0.13597777485847473, + 0.14020901918411255, + 0.16125136613845825, + 0.15609152615070343, + 0.1541982889175415, + 0.14447104930877686, + 0.13689197599887848 + ], + "rho_per_layer": [ + 0.021052071824669838, + 0.17873916029930115, + 0.25896143913269043, + 0.18253415822982788, + 0.20761561393737793, + 0.24419330060482025, + 0.21560567617416382, + 0.25087088346481323 + ], + "nudge_per_layer": [ + -0.006693178787827492, + -0.009655885398387909, + -0.009345939382910728, + -0.010369300842285156, + -0.010154420509934425, + -0.010046296752989292, + -0.009472687728703022, + -0.009175874292850494 + ], + "final_value_loss": 0.41045001599788666, + "final_term_loss": 0.17502211028933526, + "final_bridge_loss": 0.01536440534889698, + "final_tgrad_loss": 0.2200635038137436 + } + }, + "a0.25_L8_s456": { + "bp": { + "test_acc": 0.8915, + "mean_bp_cosine": 0.8808343783020973, + "mean_rho": 0.9999449253082275, + "mean_nudge_001": -0.00886416298453696, + "mean_nudge_003": -0.025221005314961076, + "mean_nudge_01": -0.07025118661113083, + "bp_cosine_per_layer": [ + 0.9125592708587646, + 0.9000785946846008, + 0.8909372687339783, + 0.8829550743103027, + 0.8725745677947998, + 0.8661020994186401, + 0.8620940446853638, + 0.8593741059303284 + ], + "rho_per_layer": [ + 0.999998927116394, + 0.9999973177909851, + 0.9999907612800598, + 0.9999756813049316, + 0.9999436140060425, + 0.9999102354049683, + 0.9998818635940552, + 0.9998610019683838 + ], + "nudge_per_layer": [ + -0.20531992614269257, + -0.12906500697135925, + -0.07575342804193497, + -0.04753156006336212, + -0.033830925822257996, + -0.02684028074145317, + -0.02297976426780224, + -0.020688600838184357 + ] + }, + "dfa": { + "test_acc": 0.8165, + "mean_bp_cosine": 0.1053345538675785, + "mean_rho": 0.1329206523951143, + "mean_nudge_001": -0.0005203891905694036, + "mean_nudge_003": -0.0015467511984752491, + "mean_nudge_01": -0.0049866703047882766, + "bp_cosine_per_layer": [ + 0.023487910628318787, + 0.16097302734851837, + 0.15321409702301025, + 0.08171598613262177, + 0.09132305532693863, + 0.0943714827299118, + 0.12134475260972977, + 0.11624611914157867 + ], + "rho_per_layer": [ + 0.006953349336981773, + 0.2090909481048584, + 0.23601846396923065, + 0.09328415989875793, + 0.10916170477867126, + 0.12872634828090668, + 0.15839380025863647, + 0.12173644453287125 + ], + "nudge_per_layer": [ + -0.013351024128496647, + -0.0065501369535923, + -0.004914519842714071, + -0.002402292797341943, + -0.002674146555364132, + -0.0028969072736799717, + -0.0036479653790593147, + -0.0034563695080578327 + ] + }, + "state_bridge": { + "test_acc": 0.765, + "mean_bp_cosine": 0.24095587618649006, + "mean_rho": 0.20889087952673435, + "mean_nudge_001": -0.0035492044535203604, + "mean_nudge_003": -0.01036601059968234, + "mean_nudge_01": -0.03139855920744594, + "bp_cosine_per_layer": [ + 0.8715300559997559, + 0.44268321990966797, + 0.14538408815860748, + 0.1153520941734314, + 0.09680549800395966, + 0.08768410980701447, + 0.08654746413230896, + 0.08166047930717468 + ], + "rho_per_layer": [ + 0.7710200548171997, + 0.4253605008125305, + 0.09275925159454346, + 0.09712537378072739, + 0.11123719066381454, + 0.028249293565750122, + 0.05002531409263611, + 0.09535005688667297 + ], + "nudge_per_layer": [ + -0.22555799782276154, + -0.012845459394156933, + -0.003021553158760071, + -0.0024172987323254347, + -0.002025863155722618, + -0.0018953735707327724, + -0.0018195084994658828, + -0.0016054193256422877 + ], + "state_pred_error_per_layer": [ + 7857.92041015625, + 7327.2666015625, + 4158.3056640625, + 3231.240234375, + 3079.712890625, + 2843.65966796875, + 3014.824951171875, + 2904.82080078125 + ], + "mean_state_pred_error": 4302.218902587891 + }, + "credit_bridge": { + "test_acc": 0.6845, + "mean_bp_cosine": 0.08619831164833158, + "mean_rho": 0.20396122278179973, + "mean_nudge_001": -0.0008905812101147603, + "mean_nudge_003": -0.0026642234588507563, + "mean_nudge_01": -0.008798376395134255, + "bp_cosine_per_layer": [ + -0.005484581924974918, + 0.03739434853196144, + 0.0736197978258133, + 0.10366753488779068, + 0.11266068369150162, + 0.12653732299804688, + 0.11692580580711365, + 0.12426558136940002 + ], + "rho_per_layer": [ + -0.0015162499621510506, + 0.12250564247369766, + 0.22542724013328552, + 0.204342320561409, + 0.2217923402786255, + 0.28867796063423157, + 0.33211782574653625, + 0.23834270238876343 + ], + "nudge_per_layer": [ + 0.0002549269702285528, + -0.006913396995514631, + -0.008808376267552376, + -0.010325662791728973, + -0.010591026395559311, + -0.011654841713607311, + -0.010967787355184555, + -0.011380846612155437 + ], + "final_value_loss": 0.966836922454834, + "final_term_loss": 0.6684003219604492, + "final_bridge_loss": 0.09051647346019745, + "final_tgrad_loss": 0.20792012577056884 + } + }, + "a0.25_L12_s42": { + "bp": { + "test_acc": 0.897, + "mean_bp_cosine": 0.826698362827301, + "mean_rho": 0.9998699675003687, + "mean_nudge_001": -0.006519351474707946, + "mean_nudge_003": -0.0185935211678346, + "mean_nudge_01": -0.05259064872128268, + "bp_cosine_per_layer": [ + 0.8824102282524109, + 0.865839958190918, + 0.8526839017868042, + 0.839972198009491, + 0.826134204864502, + 0.8190910220146179, + 0.8134430646896362, + 0.8095068335533142, + 0.8061133027076721, + 0.8034266233444214, + 0.8016149997711182, + 0.8001440167427063 + ], + "rho_per_layer": [ + 0.9999990463256836, + 0.9999975562095642, + 0.9999887347221375, + 0.9999736547470093, + 0.9999515414237976, + 0.9999052882194519, + 0.9998592138290405, + 0.999845027923584, + 0.99979567527771, + 0.9997392892837524, + 0.999713659286499, + 0.9996709227561951 + ], + "nudge_per_layer": [ + -0.21559840440750122, + -0.13125374913215637, + -0.0758625715970993, + -0.04728776216506958, + -0.03328181058168411, + -0.025909576565027237, + -0.021545151248574257, + -0.01875336468219757, + -0.016917269676923752, + -0.015656160190701485, + -0.014799138531088829, + -0.01422282587736845 + ] + }, + "dfa": { + "test_acc": 0.8165, + "mean_bp_cosine": 0.06692749153201778, + "mean_rho": 0.09511666395701468, + "mean_nudge_001": -0.0003660954941248444, + "mean_nudge_003": -0.0010870555027698476, + "mean_nudge_01": -0.003503491034886489, + "bp_cosine_per_layer": [ + 0.02035588026046753, + 0.09721152484416962, + 0.10017214715480804, + 0.06879279017448425, + 0.0898706465959549, + 0.0775061622262001, + 0.0738426148891449, + 0.022470442578196526, + 0.03698011115193367, + 0.09759337455034256, + 0.05344103276729584, + 0.06489317119121552 + ], + "rho_per_layer": [ + -0.041805852204561234, + 0.14336195588111877, + 0.21263040602207184, + 0.15326815843582153, + 0.04533267021179199, + 0.07981619238853455, + 0.08665720373392105, + 0.004602088592946529, + 0.0780038833618164, + 0.11769488453865051, + 0.1415681391954422, + 0.12027023732662201 + ], + "nudge_per_layer": [ + -0.007749770302325487, + -0.008321389555931091, + -0.003876405069604516, + -0.0026999912224709988, + -0.0026630363427102566, + -0.0033310302533209324, + -0.0026011697482317686, + -0.0011158722918480635, + -0.0018408913165330887, + -0.0036767907440662384, + -0.0019704087171703577, + -0.0021951368544250727 + ] + }, + "state_bridge": { + "test_acc": 0.687, + "mean_bp_cosine": 0.1969081535935402, + "mean_rho": 0.18958334562679133, + "mean_nudge_001": -0.0026059118196523436, + "mean_nudge_003": -0.007709211970601852, + "mean_nudge_01": -0.02444164449116215, + "bp_cosine_per_layer": [ + 0.7618155479431152, + 0.3189862072467804, + 0.20356883108615875, + 0.1471748650074005, + 0.14541830122470856, + 0.13144558668136597, + 0.11054451763629913, + 0.12045299261808395, + 0.11467338353395462, + 0.1017053946852684, + 0.10614258050918579, + 0.10096963495016098 + ], + "rho_per_layer": [ + 0.6406711339950562, + 0.31470298767089844, + 0.1861359179019928, + 0.17725443840026855, + 0.11286133527755737, + 0.1387007087469101, + 0.07976903766393661, + 0.11419158428907394, + 0.13525697588920593, + 0.13865813612937927, + 0.10792528837919235, + 0.1288726031780243 + ], + "nudge_per_layer": [ + -0.24276113510131836, + -0.011681582778692245, + -0.006372842937707901, + -0.004580066539347172, + -0.004361784551292658, + -0.004005158320069313, + -0.0033329487778246403, + -0.003609130624681711, + -0.003437052248045802, + -0.003070915350690484, + -0.0031537071336060762, + -0.0029334095306694508 + ], + "state_pred_error_per_layer": [ + 13069.6103515625, + 12902.267578125, + 5325.7177734375, + 4598.6796875, + 4871.38818359375, + 4525.17333984375, + 4230.712890625, + 4117.212890625, + 3694.05078125, + 3737.547607421875, + 3966.26025390625, + 4157.70654296875 + ], + "mean_state_pred_error": 5766.360656738281 + }, + "credit_bridge": { + "test_acc": 0.6145, + "mean_bp_cosine": 0.07906571677691925, + "mean_rho": 0.138323282978187, + "mean_nudge_001": -0.000623912480174719, + "mean_nudge_003": -0.0018697016639634967, + "mean_nudge_01": -0.006201692313576738, + "bp_cosine_per_layer": [ + -0.00034100248012691736, + 0.04912012815475464, + 0.07342620939016342, + 0.08266763389110565, + 0.08488726615905762, + 0.08897420018911362, + 0.09187051653862, + 0.09561659395694733, + 0.09157264232635498, + 0.0947732925415039, + 0.09517554938793182, + 0.10104557126760483 + ], + "rho_per_layer": [ + 0.03049650974571705, + 0.10809889435768127, + 0.08979646861553192, + 0.17959633469581604, + 0.1275440901517868, + 0.17255432903766632, + 0.16415373980998993, + 0.11534757167100906, + 0.17073199152946472, + 0.15983673930168152, + 0.15877583622932434, + 0.18294689059257507 + ], + "nudge_per_layer": [ + -0.003660556860268116, + -0.004647519439458847, + -0.005617665126919746, + -0.006360755302011967, + -0.006202561780810356, + -0.006613034754991531, + -0.006794797722250223, + -0.006956290453672409, + -0.006790010258555412, + -0.006838815752416849, + -0.006875438615679741, + -0.007062861695885658 + ], + "final_value_loss": 0.5342490439891815, + "final_term_loss": 0.2775654150247574, + "final_bridge_loss": 0.01819542294666171, + "final_tgrad_loss": 0.2384882021665573 + } + }, + "a0.25_L12_s123": { + "bp": { + "test_acc": 0.902, + "mean_bp_cosine": 0.7854474087556204, + "mean_rho": 0.9998569438854853, + "mean_nudge_001": -0.005986864319614445, + "mean_nudge_003": -0.01699222985189408, + "mean_nudge_01": -0.04738136318822702, + "bp_cosine_per_layer": [ + 0.8318638801574707, + 0.8205357789993286, + 0.8115277886390686, + 0.8032979965209961, + 0.7886118292808533, + 0.7801527976989746, + 0.7755030393600464, + 0.769822359085083, + 0.7656118869781494, + 0.7624454498291016, + 0.7592873573303223, + 0.7567087411880493 + ], + "rho_per_layer": [ + 0.9999992251396179, + 0.9999969005584717, + 0.9999886155128479, + 0.9999699592590332, + 0.9999390244483948, + 0.9998932480812073, + 0.9998554587364197, + 0.9998190999031067, + 0.9997619986534119, + 0.9997045397758484, + 0.9997037649154663, + 0.9996514916419983 + ], + "nudge_per_layer": [ + -0.19001588225364685, + -0.1191760003566742, + -0.0696173831820488, + -0.04359997808933258, + -0.030619269236922264, + -0.023702502250671387, + -0.019644131883978844, + -0.01702706888318062, + -0.015273808501660824, + -0.014067228883504868, + -0.01321301981806755, + -0.012620084919035435 + ] + }, + "dfa": { + "test_acc": 0.8475, + "mean_bp_cosine": 0.08017303561791778, + "mean_rho": 0.06949969536314408, + "mean_nudge_001": -0.00017117233619501349, + "mean_nudge_003": -0.0005107432225486264, + "mean_nudge_01": -0.0016712878035226215, + "bp_cosine_per_layer": [ + 0.007017737254500389, + 0.1750856339931488, + 0.09811605513095856, + 0.09870222210884094, + 0.06923168152570724, + 0.07072796672582626, + 0.1299426257610321, + 0.06372487545013428, + 0.05202930420637131, + 0.07090489566326141, + 0.04892899468541145, + 0.07766443490982056 + ], + "rho_per_layer": [ + -0.05082311853766441, + 0.15127798914909363, + 0.10723739117383957, + 0.1141807958483696, + 0.10590988397598267, + 0.05159565061330795, + 0.11685939878225327, + 0.06997300684452057, + 0.00848393514752388, + 0.09840574860572815, + 0.04575839638710022, + 0.015137266367673874 + ], + "nudge_per_layer": [ + -9.43206250667572e-05, + -0.004689650610089302, + -0.0020264536142349243, + -0.0020407852716743946, + -0.0012656663311645389, + -0.0012923413887619972, + -0.0026080894749611616, + -0.0013762509915977716, + -0.0008721412159502506, + -0.0014046088326722383, + -0.0009981195908039808, + -0.0013870256952941418 + ] + }, + "state_bridge": { + "test_acc": 0.653, + "mean_bp_cosine": 0.212141719336311, + "mean_rho": 0.16903599786261717, + "mean_nudge_001": -0.002121228181446592, + "mean_nudge_003": -0.006256894756612989, + "mean_nudge_01": -0.019624086019272607, + "bp_cosine_per_layer": [ + 0.7411977648735046, + 0.3599514067173004, + 0.24466437101364136, + 0.18324854969978333, + 0.1438049077987671, + 0.1288401186466217, + 0.12390943616628647, + 0.11832019686698914, + 0.1285572201013565, + 0.12467152625322342, + 0.12941977381706238, + 0.11911536008119583 + ], + "rho_per_layer": [ + 0.637965977191925, + 0.3033628761768341, + 0.22177954018115997, + 0.1946793794631958, + 0.08981841057538986, + 0.07293770462274551, + 0.06646254658699036, + 0.08072252571582794, + 0.1001453697681427, + 0.10873826593160629, + 0.08548736572265625, + 0.06633201241493225 + ], + "nudge_per_layer": [ + -0.19135718047618866, + -0.010539980605244637, + -0.006164146587252617, + -0.004623022396117449, + -0.003351652529090643, + -0.002855603815987706, + -0.002745934296399355, + -0.0025949627161026, + -0.002952038776129484, + -0.002784580923616886, + -0.002810355508700013, + -0.0027095736004412174 + ], + "state_pred_error_per_layer": [ + 11398.169921875, + 8994.236328125, + 6843.07958984375, + 5338.4423828125, + 5392.61279296875, + 5254.96435546875, + 5057.08544921875, + 3968.3759765625, + 3609.97021484375, + 3456.01708984375, + 3801.56005859375, + 3800.938232421875 + ], + "mean_state_pred_error": 5576.287699381511 + }, + "credit_bridge": { + "test_acc": 0.6165, + "mean_bp_cosine": 0.062155287557592, + "mean_rho": 0.1365320294474562, + "mean_nudge_001": -0.0005568450481708472, + "mean_nudge_003": -0.001666992757236585, + "mean_nudge_01": -0.005523480668974419, + "bp_cosine_per_layer": [ + 0.022855455055832863, + 0.05216163024306297, + 0.06243491545319557, + 0.06105152890086174, + 0.04914259910583496, + 0.0686616599559784, + 0.07184358686208725, + 0.06793813407421112, + 0.07173632830381393, + 0.07284142076969147, + 0.07256414741277695, + 0.07263204455375671 + ], + "rho_per_layer": [ + 0.035705771297216415, + 0.06484436988830566, + 0.15210987627506256, + 0.16708198189735413, + 0.14389753341674805, + 0.17870034277439117, + 0.1870872974395752, + 0.1476944386959076, + 0.15697413682937622, + 0.11093902587890625, + 0.14925891160964966, + 0.1440906673669815 + ], + "nudge_per_layer": [ + -0.010396174155175686, + -0.0040237451903522015, + -0.004916047677397728, + -0.004709047265350819, + -0.003890307154506445, + -0.005256335251033306, + -0.00541608827188611, + -0.005244302563369274, + -0.005511538591235876, + -0.005561722908169031, + -0.005636853165924549, + -0.0057196058332920074 + ], + "final_value_loss": 0.7472030250549316, + "final_term_loss": 0.48659993648529054, + "final_bridge_loss": 0.02176231173723936, + "final_tgrad_loss": 0.23884078254699706 + } + }, + "a0.25_L12_s456": { + "bp": { + "test_acc": 0.899, + "mean_bp_cosine": 0.7671962430079778, + "mean_rho": 0.9998593876759211, + "mean_nudge_001": -0.004748132584306101, + "mean_nudge_003": -0.013334368025728812, + "mean_nudge_01": -0.03616663611804446, + "bp_cosine_per_layer": [ + 0.8408721685409546, + 0.8110387921333313, + 0.7906323671340942, + 0.7719681262969971, + 0.7599710822105408, + 0.7539124488830566, + 0.7502779364585876, + 0.7483201026916504, + 0.7469743490219116, + 0.7455896139144897, + 0.7440224885940552, + 0.7427754402160645 + ], + "rho_per_layer": [ + 0.9999985694885254, + 0.9999968409538269, + 0.9999892711639404, + 0.9999746680259705, + 0.9999452233314514, + 0.9998985528945923, + 0.999815821647644, + 0.9998071789741516, + 0.9997591972351074, + 0.9997697472572327, + 0.9996993541717529, + 0.9996582269668579 + ], + "nudge_per_layer": [ + -0.1375543624162674, + -0.0896252989768982, + -0.05422336980700493, + -0.034489020705223083, + -0.024439619854092598, + -0.019029833376407623, + -0.015829749405384064, + -0.013777680695056915, + -0.012396320700645447, + -0.011455517262220383, + -0.01080663874745369, + -0.01037222146987915 + ] + }, + "dfa": { + "test_acc": 0.8205, + "mean_bp_cosine": 0.11264437561233838, + "mean_rho": 0.10325007668385904, + "mean_nudge_001": -0.0003942390236867747, + "mean_nudge_003": -0.001173070602817461, + "mean_nudge_01": -0.003865133059055855, + "bp_cosine_per_layer": [ + 0.03703948110342026, + 0.2760871648788452, + 0.18428769707679749, + 0.1331849992275238, + 0.09719057381153107, + 0.1258918195962906, + 0.0748991146683693, + 0.08436713367700577, + 0.09110807627439499, + 0.10076140612363815, + 0.06335102021694183, + 0.08356402069330215 + ], + "rho_per_layer": [ + 0.048133689910173416, + 0.19754433631896973, + 0.16992174088954926, + 0.13566580414772034, + 0.05106702446937561, + 0.13118207454681396, + 0.057789772748947144, + 0.09156530350446701, + 0.05846566706895828, + 0.07805749773979187, + 0.11393842101097107, + 0.10566958785057068 + ], + "nudge_per_layer": [ + -0.010506195947527885, + -0.007814407348632812, + -0.005055932328104973, + -0.003603969234973192, + -0.0024205115623772144, + -0.0030835624784231186, + -0.0020989018958061934, + -0.002160410862416029, + -0.0025065483059734106, + -0.0029421483632177114, + -0.0018882867880165577, + -0.0023007215932011604 + ] + }, + "state_bridge": { + "test_acc": 0.645, + "mean_bp_cosine": 0.17685540641347566, + "mean_rho": 0.14925638431062302, + "mean_nudge_001": -0.001906786697266701, + "mean_nudge_003": -0.005651665274247837, + "mean_nudge_01": -0.018038961667722713, + "bp_cosine_per_layer": [ + 0.7252062559127808, + 0.29899632930755615, + 0.17116883397102356, + 0.13035137951374054, + 0.11515486240386963, + 0.09652335941791534, + 0.0831163302063942, + 0.08587749302387238, + 0.1138496845960617, + 0.09370164573192596, + 0.10970423370599747, + 0.09861446917057037 + ], + "rho_per_layer": [ + 0.5776556730270386, + 0.24244043231010437, + 0.15723995864391327, + 0.11212021112442017, + 0.13527166843414307, + 0.09345141798257828, + 0.05218992009758949, + 0.09958191215991974, + 0.09601333737373352, + 0.05242425203323364, + 0.08741243183612823, + 0.08527539670467377 + ], + "nudge_per_layer": [ + -0.1766481101512909, + -0.00916180107742548, + -0.004768161568790674, + -0.00345130218192935, + -0.0031899111345410347, + -0.002747050253674388, + -0.002392321825027466, + -0.0024352066684514284, + -0.0032566720619797707, + -0.0024684183299541473, + -0.003083357820287347, + -0.0028652269393205643 + ], + "state_pred_error_per_layer": [ + 14567.1396484375, + 8843.26171875, + 5969.56787109375, + 5045.4873046875, + 4699.3388671875, + 4805.94287109375, + 4535.58935546875, + 4793.4423828125, + 4549.9345703125, + 4690.251953125, + 4812.1875, + 4947.22509765625 + ], + "mean_state_pred_error": 6021.614095052083 + }, + "credit_bridge": { + "test_acc": 0.5665, + "mean_bp_cosine": 0.0795192973067363, + "mean_rho": 0.11809263161073129, + "mean_nudge_001": -0.0007323032235338663, + "mean_nudge_003": -0.002197402771950389, + "mean_nudge_01": -0.007294998116170366, + "bp_cosine_per_layer": [ + 0.0279831662774086, + 0.034206733107566833, + 0.06341560930013657, + 0.0695083886384964, + 0.09047738462686539, + 0.09644618630409241, + 0.1011449545621872, + 0.09714356064796448, + 0.09739723801612854, + 0.09588810801506042, + 0.09328337758779526, + 0.08733686059713364 + ], + "rho_per_layer": [ + -0.01078212633728981, + 0.08389643579721451, + 0.09591226279735565, + 0.09822964668273926, + 0.15539337694644928, + 0.077084481716156, + 0.18135306239128113, + 0.13923753798007965, + 0.15523496270179749, + 0.1566530466079712, + 0.16011789441108704, + 0.12478099763393402 + ], + "nudge_per_layer": [ + -0.014675050042569637, + -0.0035726604983210564, + -0.005193591117858887, + -0.005878218449652195, + -0.007073326967656612, + -0.007276617921888828, + -0.0072667524218559265, + -0.007385652512311935, + -0.00723686721175909, + -0.007413622923195362, + -0.0073149921372532845, + -0.007252625189721584 + ], + "final_value_loss": 0.8463798692464829, + "final_term_loss": 0.5014169258773327, + "final_bridge_loss": 0.03549532132707536, + "final_tgrad_loss": 0.3094676312446594 + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L12_s123.json b/results/synth_ladder_v2_lo/synth_a0.0_L12_s123.json new file mode 100644 index 0000000..6c23585 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L12_s123.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0067736080646514, + 0.5260489372253419, + 0.4133770223617554, + 0.4122163911819458, + 0.40281385097503664, + 0.36370011711120603, + 0.33828531596660616, + 0.29866596674919127, + 0.333806049990654, + 0.2945868176460266, + 0.323841304898262, + 0.2685866693496704, + 0.3298992721319199, + 0.25060330071449277, + 0.25327417068481445, + 0.2714337857246399, + 0.29294549844264983, + 0.21931176762580873, + 0.2727045719623566, + 0.20682705554962158, + 0.2116490536928177, + 0.21470289249420166, + 0.2009852997303009, + 0.1929733597636223, + 0.18818628187179565, + 0.1860898569047451, + 0.16704004918932916, + 0.16348838634490967, + 0.23760174412727356, + 0.1993864372253418, + 0.28539346175193786, + 0.21175305500030517, + 0.20074062764644623, + 0.17021721827983857, + 0.17064657579660417, + 0.15043421156406403, + 0.16111934831142424, + 0.14164673606455325, + 0.12837897226810455, + 0.12804475803375245, + 0.13920657671391964, + 0.11750857322216034, + 0.11461956782341004, + 0.12064324700832367, + 0.12140779693126678, + 0.10785262448787689, + 0.11697521369457245, + 0.11477361053824425, + 0.10196099520921707, + 0.10024751018285752, + 0.10045197930335999, + 0.11292316007614135, + 0.13151926128268243, + 0.09808630378246308, + 0.10186688977479935, + 0.09669416191577912, + 0.09587533710598946, + 0.08454020006656647, + 0.08168289212062955, + 0.07666999014616012, + 0.08046016120910644, + 0.08711373453140259, + 0.08040154814720153, + 0.07493037286698818, + 0.07147429277896881, + 0.07314489345550537, + 0.07231674332618714, + 0.06915788714289665, + 0.0673254727602005, + 0.06822554222345352, + 0.06570249862521887, + 0.06449803622961044, + 0.06389484124183654, + 0.0637645405292511, + 0.06311032083034515, + 0.06264074442386627, + 0.062277248072624206, + 0.06212917380332947, + 0.06193282167315483, + 0.06185461490154266 + ], + "train_acc": [ + 0.6301, + 0.7973, + 0.8351, + 0.8363, + 0.8453, + 0.8538, + 0.8636, + 0.885, + 0.8718, + 0.8834, + 0.8689, + 0.8876, + 0.8709, + 0.896, + 0.9007, + 0.8928, + 0.8871, + 0.9143, + 0.8958, + 0.9193, + 0.9172, + 0.9153, + 0.9212, + 0.9237, + 0.9254, + 0.9249, + 0.9337, + 0.9366, + 0.9097, + 0.9214, + 0.8924, + 0.9129, + 0.9176, + 0.9332, + 0.9307, + 0.9394, + 0.9357, + 0.9463, + 0.9531, + 0.9528, + 0.9459, + 0.9566, + 0.9606, + 0.9562, + 0.9554, + 0.9626, + 0.9547, + 0.9582, + 0.9655, + 0.9634, + 0.9647, + 0.9563, + 0.9502, + 0.9658, + 0.9642, + 0.9654, + 0.9653, + 0.9742, + 0.976, + 0.9777, + 0.976, + 0.9715, + 0.9751, + 0.9801, + 0.9825, + 0.9803, + 0.9819, + 0.9835, + 0.9849, + 0.9832, + 0.9854, + 0.9859, + 0.987, + 0.9868, + 0.9871, + 0.9874, + 0.9876, + 0.9873, + 0.9877, + 0.9879 + ], + "test_acc": [ + 0.77, + 0.785, + 0.841, + 0.8315, + 0.8475, + 0.8605, + 0.8405, + 0.8505, + 0.8555, + 0.8665, + 0.8515, + 0.8665, + 0.868, + 0.878, + 0.882, + 0.873, + 0.878, + 0.889, + 0.8825, + 0.8825, + 0.8785, + 0.8805, + 0.897, + 0.8855, + 0.891, + 0.892, + 0.891, + 0.885, + 0.8925, + 0.887, + 0.8695, + 0.891, + 0.894, + 0.895, + 0.897, + 0.8935, + 0.907, + 0.909, + 0.8995, + 0.899, + 0.9045, + 0.9035, + 0.911, + 0.902, + 0.9095, + 0.903, + 0.9095, + 0.9125, + 0.909, + 0.9075, + 0.9095, + 0.9055, + 0.9045, + 0.916, + 0.9145, + 0.908, + 0.9105, + 0.9125, + 0.9185, + 0.917, + 0.9155, + 0.915, + 0.917, + 0.9165, + 0.9155, + 0.916, + 0.915, + 0.915, + 0.9165, + 0.9155, + 0.916, + 0.915, + 0.9155, + 0.9165, + 0.915, + 0.9145, + 0.914, + 0.914, + 0.9145, + 0.9145 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.832116425037384, + 0.8141677379608154, + 0.8023761510848999, + 0.7934653759002686, + 0.7857377529144287, + 0.7797414064407349, + 0.7767306566238403, + 0.7744640111923218, + 0.7725205421447754, + 0.7711977958679199, + 0.7703278064727783, + 0.7695904970169067 + ], + "perturbation_rho": [ + 0.9999991655349731, + 0.9999972581863403, + 0.9999898672103882, + 0.999970555305481, + 0.9999305009841919, + 0.9999109506607056, + 0.9998676180839539, + 0.999832808971405, + 0.9997924566268921, + 0.9997202754020691, + 0.9997268319129944, + 0.9997689127922058 + ], + "nudging": { + "0.001": [ + -0.028135288506746292, + -0.012758657336235046, + -0.006248572841286659, + -0.0036318942438811064, + -0.0025165460538119078, + -0.0019575022161006927, + -0.0016390127129852772, + -0.001437678001821041, + -0.0013056336902081966, + -0.0012165943626314402, + -0.0011555720120668411, + -0.0011164546012878418 + ], + "0.003": [ + -0.07627765089273453, + -0.03659018874168396, + -0.018335573375225067, + -0.010755512863397598, + -0.007481487933546305, + -0.005830957554280758, + -0.004887878894805908, + -0.004290360026061535, + -0.00389806367456913, + -0.00363331800326705, + -0.0034519662149250507, + -0.0033352887257933617 + ], + "0.01": [ + -0.17892791330814362, + -0.10439710319042206, + -0.05659153312444687, + -0.034265220165252686, + -0.02416030317544937, + -0.01895919442176819, + -0.015955276787281036, + -0.01404004916548729, + -0.01277724839746952, + -0.011922692880034447, + -0.011335920542478561, + -0.010958053171634674 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.0924509696960447, + 1.03269632396698, + 0.7241468557357789, + 0.6072907946586609, + 0.5515357565402985, + 0.5621125034332275, + 0.4907495887756348, + 0.5219814170837402, + 0.5708751871109009, + 0.5191205244064331, + 0.5519021101236343, + 0.544450197315216, + 0.61959801902771, + 0.5679715090274811, + 0.6162963458061218, + 0.6608567100048065, + 0.5779239411354065, + 0.5276209714889526, + 1.01328331489563, + 0.519946471786499, + 0.8604830993652344, + 0.9144351811885834, + 1.1253784037590027, + 0.9372499645233154, + 0.8480413142204285, + 0.5914154142379761, + 0.640305153465271, + 0.5981941318511963, + 1.135121632194519, + 0.6362483476638794, + 0.5418768036842346, + 0.9402659358978271, + 1.0797846031188965, + 0.7645710904121399, + 1.2322801650047301, + 0.7908753656864166, + 0.7349962800979615, + 0.7140366114616394, + 0.8069758752822876, + 0.6646730958938598, + 0.9489161729097366, + 0.582535719871521, + 0.6260909730911255, + 0.698049334526062, + 0.6176723531961441, + 0.6726475171089172, + 0.5952546514511109, + 0.7433469331741333, + 0.5916723924636841, + 0.6389080200195313, + 0.5947137939929962, + 0.5748984836578369, + 0.7570524696826935, + 0.44153712167739867, + 0.44736578378677366, + 0.5139478639602661, + 0.4778360952377319, + 0.4288335760116577, + 0.4595722749233246, + 0.4253603402137756, + 0.42853148097991944, + 0.42120102367401124, + 0.4038095116376877, + 0.3923453485250473, + 0.4267167915344238, + 0.40038953356742857, + 0.36469351987838744, + 0.3733260186672211, + 0.35249682779312136, + 0.3941283622741699, + 0.34860973496437075, + 0.33470872814655306, + 0.3397274105072021, + 0.342729074048996, + 0.33137304639816284, + 0.33342387351989744, + 0.3293384352207184, + 0.32710764508247375, + 0.32727917928695677, + 0.32547602846622464 + ], + "train_acc": [ + 0.2403, + 0.6217, + 0.7314, + 0.777, + 0.7934, + 0.7883, + 0.8173, + 0.81, + 0.8007, + 0.8185, + 0.8119, + 0.8107, + 0.7957, + 0.8153, + 0.8048, + 0.7935, + 0.8084, + 0.8208, + 0.7284, + 0.8177, + 0.7633, + 0.7409, + 0.7108, + 0.7466, + 0.7492, + 0.8055, + 0.7943, + 0.7997, + 0.7105, + 0.7922, + 0.8115, + 0.7389, + 0.7191, + 0.77, + 0.696, + 0.7666, + 0.7733, + 0.7799, + 0.7683, + 0.7917, + 0.7586, + 0.8071, + 0.7992, + 0.7877, + 0.8068, + 0.7913, + 0.8053, + 0.7778, + 0.808, + 0.8032, + 0.803, + 0.812, + 0.7775, + 0.845, + 0.8439, + 0.8279, + 0.8362, + 0.8495, + 0.8413, + 0.8497, + 0.8436, + 0.8522, + 0.8533, + 0.853, + 0.8501, + 0.8533, + 0.8681, + 0.8617, + 0.8716, + 0.8595, + 0.8705, + 0.8761, + 0.8748, + 0.8724, + 0.8778, + 0.8759, + 0.8782, + 0.8797, + 0.8794, + 0.8799 + ], + "test_acc": [ + 0.5005, + 0.673, + 0.7145, + 0.727, + 0.743, + 0.7505, + 0.71, + 0.7185, + 0.703, + 0.689, + 0.745, + 0.7005, + 0.7235, + 0.7795, + 0.64, + 0.7805, + 0.7205, + 0.518, + 0.762, + 0.7215, + 0.5445, + 0.483, + 0.6085, + 0.591, + 0.659, + 0.6965, + 0.746, + 0.5735, + 0.7155, + 0.7325, + 0.5895, + 0.6945, + 0.653, + 0.5595, + 0.671, + 0.68, + 0.702, + 0.6095, + 0.722, + 0.6895, + 0.681, + 0.747, + 0.6935, + 0.6485, + 0.7315, + 0.687, + 0.666, + 0.699, + 0.698, + 0.667, + 0.656, + 0.6015, + 0.732, + 0.7635, + 0.7205, + 0.7695, + 0.762, + 0.7965, + 0.8045, + 0.7785, + 0.779, + 0.77, + 0.8045, + 0.8215, + 0.812, + 0.8345, + 0.8125, + 0.8345, + 0.807, + 0.8265, + 0.8345, + 0.8335, + 0.829, + 0.8375, + 0.836, + 0.838, + 0.8425, + 0.843, + 0.8425, + 0.841 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.009534038603305817, + 0.2771005630493164, + 0.12846891582012177, + 0.12727834284305573, + 0.09264838695526123, + 0.08494879305362701, + 0.1454543173313141, + 0.07647830247879028, + 0.055110231041908264, + 0.08491981029510498, + 0.054209403693675995, + 0.06925329566001892 + ], + "perturbation_rho": [ + -0.030354971066117287, + 0.19958093762397766, + 0.10430362075567245, + 0.06749340891838074, + 0.08917459845542908, + 0.06985980272293091, + 0.08990536630153656, + -0.0003178045153617859, + -0.05352415516972542, + 0.12398940324783325, + 0.05844062566757202, + 0.06276053190231323 + ], + "nudging": { + "0.001": [ + 5.0953527534147725e-05, + -0.0006460470613092184, + -0.0002715848677325994, + -0.00028075071168132126, + -0.00018533585534896702, + -0.00017889743321575224, + -0.00029740406898781657, + -0.0001274347014259547, + -7.406625081785023e-05, + -0.0001561331155244261, + -0.0001032993895933032, + -0.00014120049308985472 + ], + "0.003": [ + 0.00016943782975431532, + -0.0019340584985911846, + -0.0008146192994900048, + -0.0008385812398046255, + -0.0005608047358691692, + -0.0005349678685888648, + -0.0008904121932573617, + -0.00038351857801899314, + -0.00022607628488913178, + -0.00046768866013735533, + -0.0003058650763705373, + -0.0004211085324641317 + ], + "0.01": [ + 0.0008368014823645353, + -0.00641840323805809, + -0.0027151124086230993, + -0.002792379120364785, + -0.0018645611125975847, + -0.0017843465320765972, + -0.002957880962640047, + -0.0012784524587914348, + -0.0007560949889011681, + -0.0015581869520246983, + -0.0010259757982566953, + -0.0014001178788021207 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8275699935913086, + 1.3385464324951173, + 1.037378346633911, + 1.002308666419983, + 1.0388273836135864, + 1.0882213558197023, + 1.1394051094055175, + 1.1788917055130006, + 1.2267918197631835, + 1.2478832811355591, + 1.2316707176208497, + 1.287934114074707, + 1.2420732460021973, + 1.2143509733200073, + 1.229138567352295, + 1.259750719833374, + 1.1612068832397462, + 1.149783327293396, + 1.1361305335998535, + 1.1167785579681397, + 1.1316240934371948, + 1.1020189935684204, + 1.0256468997955321, + 1.0201313499450684, + 0.9847993452072143, + 0.9970695999145508, + 1.0227494039535523, + 1.1330445571899415, + 1.2469683200836181, + 1.1566339334487914, + 1.107145287322998, + 1.110690570449829, + 1.0532963357925416, + 1.0852850601196289, + 1.0935607889175416, + 1.0834732231140136, + 1.0420629257202147, + 1.0830944820404054, + 1.0634357900619507, + 1.0303276639938355, + 0.9689252651214599, + 1.0131777705192566, + 1.0103633685112, + 1.002309990501404, + 1.0113068084716796, + 0.9995921211242675, + 1.0161544053077698, + 0.9966502132415771, + 1.0186468648910523, + 1.0372472515106201, + 0.9930810668945312, + 0.9901977378845215, + 0.988507303237915, + 0.9591489524841309, + 0.935456734085083, + 0.9176784860610961, + 0.8929200078964233, + 0.8777516023635864, + 0.8699161693572998, + 0.8663567218780518, + 0.855108270072937, + 0.8465001301765442, + 0.848315406036377, + 0.8377359997272491, + 0.830757266998291, + 0.831167548942566, + 0.8265859796524048, + 0.819621584033966, + 0.8219145364761352, + 0.8136607124328613, + 0.8122711290359497, + 0.8106639209747315, + 0.8065893723487854, + 0.8030635206222534, + 0.8029474701881408, + 0.8009245029449463, + 0.8000903869628906, + 0.79931964969635, + 0.7988908242225647, + 0.7986321613311768 + ], + "train_acc": [ + 0.3739, + 0.5487, + 0.6322, + 0.6501, + 0.6387, + 0.6203, + 0.615, + 0.6129, + 0.5974, + 0.5921, + 0.5918, + 0.5772, + 0.5826, + 0.5914, + 0.5855, + 0.5734, + 0.6028, + 0.6044, + 0.6072, + 0.6171, + 0.6172, + 0.6223, + 0.6371, + 0.6377, + 0.6495, + 0.6412, + 0.6326, + 0.6082, + 0.5968, + 0.619, + 0.6391, + 0.6371, + 0.6521, + 0.6487, + 0.646, + 0.6521, + 0.6558, + 0.6525, + 0.6501, + 0.6609, + 0.6693, + 0.6536, + 0.6586, + 0.6603, + 0.6543, + 0.6585, + 0.6599, + 0.6665, + 0.6666, + 0.6712, + 0.6763, + 0.6816, + 0.6819, + 0.6887, + 0.6966, + 0.6988, + 0.7027, + 0.705, + 0.7072, + 0.7108, + 0.7089, + 0.7167, + 0.711, + 0.715, + 0.7173, + 0.7164, + 0.7205, + 0.722, + 0.7179, + 0.7223, + 0.7237, + 0.7214, + 0.7216, + 0.7228, + 0.7234, + 0.7226, + 0.7229, + 0.7229, + 0.7233, + 0.7239 + ], + "test_acc": [ + 0.5075, + 0.5705, + 0.6225, + 0.6155, + 0.5905, + 0.588, + 0.567, + 0.568, + 0.543, + 0.5535, + 0.479, + 0.5455, + 0.5425, + 0.5415, + 0.5135, + 0.564, + 0.57, + 0.521, + 0.534, + 0.547, + 0.5265, + 0.5945, + 0.557, + 0.581, + 0.591, + 0.5685, + 0.589, + 0.519, + 0.548, + 0.5655, + 0.5655, + 0.611, + 0.589, + 0.613, + 0.605, + 0.605, + 0.5675, + 0.616, + 0.592, + 0.6325, + 0.6195, + 0.602, + 0.6085, + 0.602, + 0.5995, + 0.623, + 0.628, + 0.6295, + 0.6315, + 0.634, + 0.6305, + 0.628, + 0.638, + 0.6505, + 0.6515, + 0.654, + 0.65, + 0.6515, + 0.656, + 0.6505, + 0.6615, + 0.6595, + 0.658, + 0.666, + 0.6655, + 0.663, + 0.661, + 0.6675, + 0.6715, + 0.6735, + 0.667, + 0.669, + 0.6765, + 0.6755, + 0.677, + 0.677, + 0.677, + 0.6755, + 0.675, + 0.675 + ], + "state_pred_error": [ + 0.6583093455791473, + 0.2847297016143799, + 0.22077271904945373, + 0.21189437193870544, + 0.1841041277885437, + 0.17305933623313904, + 0.17701434428691865, + 0.18802506301403046, + 0.17837908656597137, + 0.14958413000106813, + 0.13064928512573243, + 0.1284900181055069, + 0.13219893939495087, + 0.13047706623077393, + 0.12345472877025604, + 0.10324463622570038, + 0.09139569116830826, + 0.07699145336151123, + 0.06765981405973434, + 0.07321135756969452, + 0.07089905383586884, + 0.06882416786551475, + 0.05610226457118988, + 0.043682216036319735, + 0.035003681576251985, + 0.02870281513929367, + 0.02616107567548752, + 0.0247726686835289, + 0.023823431384563446, + 0.024860127294063568, + 0.02640067371726036, + 0.02769387246966362, + 0.028516952562332155, + 0.02941493996977806, + 0.029591170537471772, + 0.028317847082018854, + 0.027129681679606436, + 0.026555932518839837, + 0.026938045769929884, + 0.027426798117160797, + 0.029536254298686983, + 0.03211808215379715, + 0.03510575920939445, + 0.03469557763338089, + 0.03365132007598877, + 0.03368182533979416, + 0.03552556530237198, + 0.038989124006032945, + 0.04195216841697693, + 0.043111143064498904, + 0.044202814984321596, + 0.045387097096443174, + 0.04451717386841774, + 0.04319920334815979, + 0.042182978856563566, + 0.041060500395298, + 0.0400146517932415, + 0.03966583462953568, + 0.03924502938389778, + 0.03796827178895473, + 0.03660108530521393, + 0.03574252983927727, + 0.03452657175064087, + 0.03394979124069214, + 0.0328981254786253, + 0.031669361919164654, + 0.030848443555831908, + 0.029799468955397607, + 0.028912526750564577, + 0.028214104449748992, + 0.027432609269022943, + 0.026476147815585136, + 0.02564660669863224, + 0.024992754793167114, + 0.024431089624762536, + 0.023907900010049343, + 0.023127568793296815, + 0.02265733232498169, + 0.022044888520240783, + 0.021540785717964174 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7589784860610962, + 0.34465640783309937, + 0.20695620775222778, + 0.15412747859954834, + 0.14041899144649506, + 0.152847021818161, + 0.1464981734752655, + 0.13855373859405518, + 0.13026131689548492, + 0.11798880249261856, + 0.11249798536300659, + 0.11956378817558289 + ], + "perturbation_rho": [ + 0.6762608289718628, + 0.29351934790611267, + 0.15623700618743896, + 0.07772233337163925, + 0.09808109700679779, + 0.14218339323997498, + 0.09985582530498505, + 0.07779418677091599, + 0.10923020541667938, + 0.10118008404970169, + 0.08211226016283035, + 0.09183197468519211 + ], + "nudging": { + "0.001": [ + -0.024234283715486526, + -0.0011283548083156347, + -0.0005652708932757378, + -0.00041053639142774045, + -0.00037075550062581897, + -0.00039911235217005014, + -0.0003868499770760536, + -0.00036323058884590864, + -0.00033692887518554926, + -0.000307242211420089, + -0.0002827422576956451, + -0.00030345225241035223 + ], + "0.003": [ + -0.07142189145088196, + -0.0033810725435614586, + -0.0016954769380390644, + -0.0012313042534515262, + -0.0011121997376903892, + -0.0011966262245550752, + -0.0011605183826759458, + -0.0010896101593971252, + -0.0010103486711159348, + -0.0009211936267092824, + -0.000847844872623682, + -0.0009103003540076315 + ], + "0.01": [ + -0.22324970364570618, + -0.01123635284602642, + -0.0056420015171170235, + -0.0040974924340844154, + -0.0037027131766080856, + -0.003983458504080772, + -0.0038626876194030046, + -0.0036268262192606926, + -0.003363188588991761, + -0.0030670221894979477, + -0.0028224957641214132, + -0.0030306889675557613 + ] + }, + "state_pred_error_per_layer": [ + 10215.58203125, + 8926.0654296875, + 5285.6044921875, + 5192.0830078125, + 4575.35791015625, + 4063.82666015625, + 4966.6884765625, + 5378.6435546875, + 4702.37890625, + 4026.143310546875, + 3985.35595703125, + 3780.156494140625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.093309115028381, + 1.032017181968689, + 0.7077153354644775, + 0.5732980075836182, + 0.5402240601539612, + 0.5183043882369995, + 0.5319672570228576, + 0.5359590018749237, + 0.5482052456855774, + 0.5222824983596802, + 0.6027764239311219, + 0.49652273721694945, + 0.5368509518623352, + 0.566478079509735, + 0.6263480365753173, + 0.7491202196836472, + 0.6788468971252442, + 0.7347880103588105, + 0.8662578244686127, + 0.678591609096527, + 0.8630354214191437, + 0.712297385597229, + 0.7786388912200928, + 0.7855329002380371, + 0.8845748617887497, + 0.8085215629577637, + 0.7420635931015015, + 0.7875441513061523, + 0.7688868448257447, + 0.7473984729766846, + 1.0297006687164307, + 0.8987462726593017, + 0.9227742693901062, + 0.9423508636474609, + 0.7886569627761841, + 0.8662117418289185, + 1.0016330226898194, + 0.922345392036438, + 0.8514365245819092, + 0.8499950613498688, + 0.8536573698043823, + 0.8536672010421753, + 0.837739602279663, + 0.9626629913330078, + 0.8708203351974487, + 0.9226528865814209, + 0.886489924621582, + 0.884385742521286, + 0.8640118010520935, + 0.9462248080253601, + 0.9388958973884582, + 0.9003979402542114, + 0.8771900144577026, + 0.8063458614349365, + 0.7585287186145783, + 0.7785314264297485, + 0.7583562124252319, + 0.7231489379882813, + 0.7116691125869751, + 0.7012166356563568, + 0.6967055747032166, + 0.6990642721176148, + 0.7341344322204589, + 0.7070941570281982, + 0.717008107471466, + 0.7219762700080872, + 0.7167341491699218, + 0.7061620636940003, + 0.7071943338394165, + 0.6979920616149903, + 0.696011471939087, + 0.6982332837104798, + 0.6905044673919678, + 0.690191311454773, + 0.6926393260002136, + 0.6883825535297394, + 0.6852098932266235, + 0.6849852310180664, + 0.6831081211090088, + 0.6824430053234101 + ], + "train_acc": [ + 0.2427, + 0.6203, + 0.7378, + 0.7896, + 0.7939, + 0.805, + 0.8035, + 0.8076, + 0.8018, + 0.8194, + 0.8027, + 0.8223, + 0.8124, + 0.8119, + 0.8022, + 0.7784, + 0.791, + 0.7844, + 0.7596, + 0.7915, + 0.7527, + 0.774, + 0.7627, + 0.7535, + 0.7315, + 0.7344, + 0.7496, + 0.7405, + 0.7384, + 0.7403, + 0.6992, + 0.7114, + 0.709, + 0.7067, + 0.7358, + 0.7261, + 0.712, + 0.7299, + 0.7476, + 0.7511, + 0.7532, + 0.7552, + 0.7561, + 0.7327, + 0.7464, + 0.734, + 0.7416, + 0.7412, + 0.743, + 0.7265, + 0.7276, + 0.7301, + 0.7357, + 0.7407, + 0.7519, + 0.7433, + 0.7493, + 0.7556, + 0.7553, + 0.758, + 0.7592, + 0.761, + 0.7445, + 0.7562, + 0.7549, + 0.7515, + 0.7516, + 0.7555, + 0.7569, + 0.7587, + 0.7586, + 0.7565, + 0.7596, + 0.7617, + 0.7564, + 0.7595, + 0.7618, + 0.7621, + 0.7611, + 0.7614 + ], + "test_acc": [ + 0.5025, + 0.6865, + 0.7425, + 0.7505, + 0.74, + 0.7655, + 0.755, + 0.7195, + 0.7695, + 0.7425, + 0.757, + 0.74, + 0.7145, + 0.657, + 0.61, + 0.6675, + 0.6895, + 0.691, + 0.6775, + 0.6985, + 0.693, + 0.678, + 0.6795, + 0.6445, + 0.6355, + 0.6535, + 0.676, + 0.646, + 0.68, + 0.5935, + 0.603, + 0.6625, + 0.604, + 0.725, + 0.6155, + 0.6425, + 0.715, + 0.6955, + 0.7035, + 0.686, + 0.667, + 0.709, + 0.683, + 0.715, + 0.6905, + 0.716, + 0.709, + 0.6965, + 0.688, + 0.66, + 0.685, + 0.664, + 0.7035, + 0.7035, + 0.6935, + 0.6825, + 0.6795, + 0.7065, + 0.697, + 0.7135, + 0.7185, + 0.705, + 0.7205, + 0.7035, + 0.6945, + 0.714, + 0.7205, + 0.709, + 0.7085, + 0.7195, + 0.7175, + 0.72, + 0.714, + 0.72, + 0.7195, + 0.72, + 0.7185, + 0.7185, + 0.721, + 0.721 + ], + "value_loss": [ + 2.895308603286743, + 1.0838360973358154, + 0.8661615056991577, + 0.7228779357194901, + 0.6979825808525085, + 0.654473484325409, + 0.7223839604854584, + 0.8182331377506256, + 0.8379502923965454, + 0.8138473363876343, + 1.1507868383049964, + 0.7328620315790176, + 0.8565217294692993, + 1.0016156348228455, + 1.277318878364563, + 1.7167091186523438, + 1.3837544082641602, + 1.6866768316745757, + 2.521582665491104, + 1.798458749961853, + 2.762005415582657, + 1.7501773468017578, + 2.065952481651306, + 1.7661181676864623, + 2.237529104137421, + 1.6968138498306276, + 1.5028521341323853, + 1.4401282972335816, + 1.5227922265052796, + 1.3540578876495362, + 2.2935845052957533, + 1.8538220872879028, + 1.921490113067627, + 1.8531652376174927, + 1.2972030296325683, + 1.6667764266967773, + 2.4392109436035154, + 2.1221363357543943, + 1.9600661560058594, + 2.1009968710660933, + 2.162639275550842, + 1.8537513482332229, + 1.9440034482955932, + 1.821842461013794, + 1.9722608186721802, + 1.6478357261657715, + 1.5106155110836028, + 1.482781691980362, + 1.3237692507743835, + 1.3403249841690064, + 1.2857119444847107, + 1.2022730991363526, + 0.9818777618408203, + 0.8647946514129639, + 0.6914702701568604, + 0.7234345043182373, + 0.7077870290756225, + 0.6724249305725097, + 0.6462549682617188, + 0.584807029056549, + 0.5510385043144226, + 0.5364630532741547, + 0.5645569776535034, + 0.552950176525116, + 0.49300712423324583, + 0.5377466377735138, + 0.502735111618042, + 0.5176207973480225, + 0.46474625415802, + 0.4454069378852844, + 0.44403015842437743, + 0.4113505308389664, + 0.40353398851156236, + 0.42983919105529783, + 0.419776428937912, + 0.4019131669998169, + 0.38927605810165405, + 0.39006197519302366, + 0.3755714391708374, + 0.37253577736616134 + ], + "term_loss": [ + 1.7315585552215575, + 0.8666729364395142, + 0.7229979902267456, + 0.596312265253067, + 0.5545540596961975, + 0.5088294490814209, + 0.5825292092323303, + 0.6813051890134811, + 0.7038109269142151, + 0.6887646074295044, + 1.0119939782977103, + 0.6134444280862809, + 0.7291853536605835, + 0.8673401327610016, + 1.1276171969413757, + 1.5555007932901384, + 1.2286012786865235, + 1.513133518087864, + 2.2361230753183365, + 1.5198300567150116, + 2.3595263324260713, + 1.4453560852050782, + 1.7648071206092835, + 1.5087391733169555, + 1.882237844824791, + 1.3722010416030883, + 1.2332301671981811, + 1.113333308649063, + 1.2077602449655533, + 1.0543692749023437, + 1.915369022846222, + 1.5654558784484864, + 1.5864534119606017, + 1.561221913743019, + 1.0531947800636292, + 1.3718099038124085, + 2.127058590698242, + 1.779372572517395, + 1.6149614444255829, + 1.7391510653555393, + 1.844177998828888, + 1.5599529803752898, + 1.665471398806572, + 1.48765220746994, + 1.592831818151474, + 1.3742333667755127, + 1.2108251216828823, + 1.1529828948736192, + 0.9720637693166733, + 1.0287326244413852, + 0.9365793524742126, + 0.889251443862915, + 0.7040525654792785, + 0.5985294085502625, + 0.4618072083234787, + 0.47211782517433165, + 0.46372374649047854, + 0.4095201286315918, + 0.396888076210022, + 0.3395151155948639, + 0.32013212871551516, + 0.31056776316165924, + 0.332690350818634, + 0.32696542110443116, + 0.2811112231254578, + 0.3146396808505058, + 0.2787236780166626, + 0.30104646191596984, + 0.26121058802604674, + 0.24297695212364198, + 0.24487788009643555, + 0.21334869912862778, + 0.21118227637484668, + 0.23297631640434266, + 0.2227356671333313, + 0.20269683571159838, + 0.19634508168697357, + 0.19681874605417252, + 0.18710794867277145, + 0.18445234730243684 + ], + "bridge_loss": [ + 0.8910756826514378, + 0.03931298022270203, + 0.005479304197430611, + 0.008322687608003617, + 0.026911671420931815, + 0.031393191632628444, + 0.020954727735370396, + 0.017316379761695862, + 0.013768722853064536, + 0.010478140366077424, + 0.01041390485316515, + 0.006281406325101852, + 0.00699371280670166, + 0.00916883425116539, + 0.01326431538015604, + 0.011463350397348403, + 0.012470959171652795, + 0.021742843547463416, + 0.10813169282078743, + 0.13266532423496247, + 0.22559858589172363, + 0.1508849209487438, + 0.13424171340465546, + 0.08663208992481232, + 0.1692257175862789, + 0.14401090178489684, + 0.09763954291343689, + 0.14743438252806665, + 0.1390697629928589, + 0.12534118332862854, + 0.16236012780070305, + 0.09478195638656617, + 0.13880339596271515, + 0.0893877745948732, + 0.060379807114601135, + 0.09944173128604888, + 0.10493364100456237, + 0.15071102497577668, + 0.16545130755901336, + 0.1862475948754698, + 0.13735291347503661, + 0.11587412934750319, + 0.10125242130011321, + 0.13694310559034348, + 0.19478518126010894, + 0.08310441122055054, + 0.11459392108917237, + 0.14490415418148042, + 0.16996705425977707, + 0.11792534888982772, + 0.1546827676296234, + 0.12324597455859185, + 0.09212502805590629, + 0.08768177535533905, + 0.05900698439478874, + 0.07211811376214028, + 0.07296420599222184, + 0.09570572891235352, + 0.08214142266511917, + 0.08104119520187378, + 0.06706379449367524, + 0.061731532573699954, + 0.05951230276823044, + 0.05904238046109676, + 0.04439769803881645, + 0.052698305994272235, + 0.05405294654369354, + 0.04950189056396485, + 0.036288917183876036, + 0.036671600222587586, + 0.033586744678020475, + 0.03112454196512699, + 0.027874897088855505, + 0.03210000774860382, + 0.03222285799980164, + 0.034796000942587856, + 0.02962491188645363, + 0.02967825172841549, + 0.025359011243283748, + 0.0251624245762825 + ], + "tgrad_loss": [ + 0.2726743935823441, + 0.1778501721382141, + 0.13768420703411102, + 0.1182429804623127, + 0.11651685256958008, + 0.11425084311962128, + 0.11890002069473267, + 0.11961156708002091, + 0.12037064489126205, + 0.1146045907497406, + 0.1283789484590292, + 0.11313620157241822, + 0.1203426679611206, + 0.12510666944980622, + 0.13643737218379975, + 0.14974497756958008, + 0.14268217465877533, + 0.15180046949386597, + 0.17732788567543029, + 0.14596336963176726, + 0.17688049802184105, + 0.1539363568544388, + 0.16690364735126495, + 0.17074689378738403, + 0.18606554128527641, + 0.18060191497802736, + 0.17198242325782775, + 0.17936062285900117, + 0.17596222264766692, + 0.17434742822647095, + 0.2158553662776947, + 0.19358424880504607, + 0.1962333065032959, + 0.20255555391311644, + 0.18362843871116638, + 0.19552478518486022, + 0.2072187364578247, + 0.19205274913311005, + 0.17965343070030212, + 0.17559819491207598, + 0.181108380818367, + 0.1779242508649826, + 0.1772796312212944, + 0.1972471403121948, + 0.1846438142299652, + 0.19049793491363526, + 0.18519648184776305, + 0.1848946546435356, + 0.18173843351602553, + 0.19366701731681824, + 0.1944498215675354, + 0.1897756907939911, + 0.18570017099380492, + 0.17858346576690673, + 0.17065607466697694, + 0.17919855782985689, + 0.17109907450675965, + 0.1671990744113922, + 0.16722547005414962, + 0.1642507126569748, + 0.16384257422685622, + 0.16416375482082368, + 0.17235432732105255, + 0.16694237639904022, + 0.16749820382595063, + 0.17040865378379821, + 0.16995848925113677, + 0.16707244870662688, + 0.1672467480659485, + 0.16575838651657104, + 0.1655655403137207, + 0.1668772896051407, + 0.16447681208848952, + 0.16476286969184875, + 0.16481790508031846, + 0.16442033001184464, + 0.16330606236457826, + 0.1635649757742882, + 0.16310447854995727, + 0.16292100727558137 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.0035465662367641926, + -0.001160490675829351, + 0.00486466521397233, + 0.012821277603507042, + 0.012568866834044456, + 0.019143100827932358, + 0.022381767630577087, + 0.024246837943792343, + 0.027966029942035675, + 0.03333558514714241, + 0.04247187077999115, + 0.04586232826113701 + ], + "perturbation_rho": [ + 0.01447216235101223, + -0.01648387312889099, + 0.027175014838576317, + 0.03045208379626274, + 0.05211577191948891, + -0.0074118818156421185, + 0.0508866012096405, + 0.01983593963086605, + 0.03707783669233322, + 0.12354743480682373, + 0.16596439480781555, + 0.10420688986778259 + ], + "nudging": { + "0.001": [ + 0.00018672729493118823, + -4.912609438179061e-05, + -7.719603308942169e-05, + -0.00012457264529075474, + -0.0001271502551389858, + -0.0001674975355854258, + -0.0001832679263316095, + -0.00020593422232195735, + -0.0002297492028446868, + -0.00026241032173857093, + -0.00029993863427080214, + -0.0003139717737212777 + ], + "0.003": [ + 0.0005920766270719469, + -0.00014469146844930947, + -0.00023059282102622092, + -0.00037341262213885784, + -0.00037795325624756515, + -0.0005033073830418289, + -0.0005485712317749858, + -0.000615192111581564, + -0.0006871747900731862, + -0.0007873581489548087, + -0.0009002696024253964, + -0.0009423828450962901 + ], + "0.01": [ + 0.002342540305107832, + -0.0004765552293974906, + -0.0007624666905030608, + -0.0012423819862306118, + -0.0012568822130560875, + -0.0016762344166636467, + -0.0018269497668370605, + -0.0020500137470662594, + -0.0022837575525045395, + -0.0026187507901340723, + -0.0029940432868897915, + -0.0031347349286079407 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L12_s42.json b/results/synth_ladder_v2_lo/synth_a0.0_L12_s42.json new file mode 100644 index 0000000..b02cb6c --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L12_s42.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 0.9691492250442505, + 0.5541921775817871, + 0.5057802117824555, + 0.3705566248893738, + 0.38152624435424803, + 0.4184226482987404, + 0.32005277891159056, + 0.3379063062667847, + 0.32360546998977663, + 0.30641096782684324, + 0.32992204971313477, + 0.3234290994644165, + 0.2892835647583008, + 0.27116408772468564, + 0.25336739110946654, + 0.26921175379753115, + 0.2770581937789917, + 0.2615867853164673, + 0.29473981132507326, + 0.29788853192329406, + 0.22695203926563262, + 0.21405179328918458, + 0.22035713307857513, + 0.18809561533927918, + 0.22268259687423705, + 0.22361898727416993, + 0.2335181351661682, + 0.22086384482383728, + 0.20982224086523055, + 0.16931071857213975, + 0.16913503708839417, + 0.17825531432628633, + 0.1811700684905052, + 0.15162764992713929, + 0.15718278613090514, + 0.21250098304748535, + 0.19473938479423522, + 0.18452690076828002, + 0.143575802898407, + 0.1587403874397278, + 0.18108075993061065, + 0.14308705676496028, + 0.12316284523010254, + 0.12980578224658967, + 0.13384961998462677, + 0.12410676991939544, + 0.13440781029462814, + 0.12151769155859947, + 0.110893037545681, + 0.10822025581598282, + 0.10422320003509522, + 0.10408455009460449, + 0.10522357710003853, + 0.09913086289763451, + 0.09440416249632835, + 0.0924928415775299, + 0.10758058831691741, + 0.09329749217033387, + 0.09131886911988259, + 0.08834524278640747, + 0.08724276800155639, + 0.09795933984518052, + 0.08578420240879059, + 0.08392888104915619, + 0.08338507117033005, + 0.07894570019841195, + 0.07729433171749114, + 0.07803093535900116, + 0.0760855792760849, + 0.0740779890447855, + 0.07295384521484374, + 0.07261191159486771, + 0.07193484778404236, + 0.07130219305753707, + 0.07076054784059524, + 0.07032060540914535, + 0.07007708017826081, + 0.06981839218139649, + 0.06965371253490447, + 0.06955726127624512 + ], + "train_acc": [ + 0.6449, + 0.7847, + 0.8076, + 0.8517, + 0.8456, + 0.8355, + 0.8739, + 0.8646, + 0.8696, + 0.877, + 0.8727, + 0.8717, + 0.8838, + 0.8874, + 0.8988, + 0.8932, + 0.89, + 0.8946, + 0.8868, + 0.8843, + 0.908, + 0.913, + 0.912, + 0.9236, + 0.9124, + 0.9094, + 0.9042, + 0.9092, + 0.9156, + 0.9327, + 0.9341, + 0.9292, + 0.9273, + 0.9418, + 0.9392, + 0.9196, + 0.9237, + 0.9267, + 0.9448, + 0.9393, + 0.9299, + 0.9445, + 0.9559, + 0.9506, + 0.9499, + 0.9523, + 0.9464, + 0.9558, + 0.96, + 0.9615, + 0.9641, + 0.9626, + 0.9646, + 0.9651, + 0.971, + 0.9701, + 0.9608, + 0.9673, + 0.9699, + 0.9703, + 0.9728, + 0.9674, + 0.9725, + 0.974, + 0.9729, + 0.9769, + 0.9787, + 0.9789, + 0.9802, + 0.9813, + 0.9817, + 0.9819, + 0.9818, + 0.9833, + 0.9839, + 0.9838, + 0.9836, + 0.9837, + 0.9838, + 0.9841 + ], + "test_acc": [ + 0.7685, + 0.807, + 0.8325, + 0.843, + 0.831, + 0.8405, + 0.8685, + 0.8405, + 0.867, + 0.864, + 0.852, + 0.8645, + 0.86, + 0.874, + 0.8745, + 0.86, + 0.879, + 0.887, + 0.868, + 0.879, + 0.877, + 0.882, + 0.8865, + 0.883, + 0.8925, + 0.8885, + 0.879, + 0.8895, + 0.896, + 0.9, + 0.9005, + 0.8915, + 0.901, + 0.9035, + 0.9035, + 0.892, + 0.8955, + 0.903, + 0.9075, + 0.9035, + 0.8935, + 0.9035, + 0.911, + 0.9085, + 0.911, + 0.904, + 0.9005, + 0.915, + 0.91, + 0.914, + 0.913, + 0.911, + 0.916, + 0.908, + 0.9145, + 0.9095, + 0.9135, + 0.917, + 0.915, + 0.912, + 0.9105, + 0.9115, + 0.912, + 0.9135, + 0.915, + 0.912, + 0.9115, + 0.9135, + 0.914, + 0.912, + 0.915, + 0.916, + 0.915, + 0.914, + 0.9155, + 0.9155, + 0.914, + 0.9145, + 0.914, + 0.9135 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8936765193939209, + 0.875713586807251, + 0.8523612022399902, + 0.835299551486969, + 0.8243429064750671, + 0.8148068189620972, + 0.809612512588501, + 0.8055970668792725, + 0.8028815984725952, + 0.8011909127235413, + 0.8001247644424438, + 0.799472451210022 + ], + "perturbation_rho": [ + 0.9999988079071045, + 0.999997615814209, + 0.9999872446060181, + 0.9999661445617676, + 0.9999244213104248, + 0.9998762011528015, + 0.9998204708099365, + 0.9997811317443848, + 0.9997683167457581, + 0.9997478723526001, + 0.9997052550315857, + 0.9996634721755981 + ], + "nudging": { + "0.001": [ + -0.02805091254413128, + -0.013208158314228058, + -0.0066702282056212425, + -0.003945831675082445, + -0.002750034909695387, + -0.002152357716113329, + -0.0018071717349812388, + -0.0015899442369118333, + -0.0014494031202048063, + -0.0013547888956964016, + -0.0012928021606057882, + -0.0012546603102236986 + ], + "0.003": [ + -0.07421690225601196, + -0.03749680891633034, + -0.019483720883727074, + -0.011658146977424622, + -0.008164399303495884, + -0.006405050866305828, + -0.0053850943222641945, + -0.004741774406284094, + -0.004324971232563257, + -0.004044387489557266, + -0.003860148834064603, + -0.0037467507645487785 + ], + "0.01": [ + -0.15880361199378967, + -0.10216463357210159, + -0.058997806161642075, + -0.0368044376373291, + -0.02622675709426403, + -0.02074911817908287, + -0.017529264092445374, + -0.015481802634894848, + -0.014148212037980556, + -0.013247357681393623, + -0.012655021622776985, + -0.012289617210626602 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.062218222427368, + 1.0111772974014281, + 0.7069105566978454, + 0.5894367267131806, + 0.5519145173072815, + 0.5328701040267945, + 0.5143702904701233, + 0.5037649742126464, + 0.5267402291297912, + 0.5362862730979919, + 0.5706932378292083, + 0.5366109603404999, + 0.5748039415359497, + 0.6984620532989502, + 0.6995907222032547, + 0.6355872257232666, + 0.5994791854858399, + 0.6105069580078125, + 0.755839087486267, + 0.7219365031242371, + 0.7605537420272828, + 0.7302447261810303, + 0.7689904579162598, + 0.6884315003395081, + 0.6808914300203324, + 0.6728718101501465, + 0.7055298049449921, + 0.6493824725151062, + 0.6272500898987055, + 0.5995918445706367, + 0.5774760694503784, + 0.6369666585922241, + 0.6621656682491303, + 0.6987312582492828, + 0.7215407601356506, + 0.7177485369443893, + 0.6749118590354919, + 0.7748493107795715, + 0.6226130012512207, + 0.59164186668396, + 0.8793521818518638, + 0.5344610214710236, + 0.6223686878204345, + 0.5742042091012001, + 0.6648194321632386, + 0.6924330261230469, + 0.6171909283161163, + 0.6225832930564881, + 0.5864963626980781, + 0.5502301546096802, + 0.6340892565965652, + 0.5290304160118103, + 0.593668369102478, + 0.5533372339248657, + 0.6408262311697006, + 0.4738055535316467, + 0.5309371071815491, + 0.4636679154396057, + 0.5358815372467041, + 0.45992880697250366, + 0.458472611618042, + 0.46539330711364746, + 0.47984019027948377, + 0.44190584735870364, + 0.45413577545881273, + 0.43303393692970277, + 0.4372877141952515, + 0.45334326210021975, + 0.4221468412399292, + 0.4217998252868652, + 0.4122497503757477, + 0.4124288455963135, + 0.4077335179507732, + 0.3989184023857117, + 0.3986554427713156, + 0.39380938061475756, + 0.39323648450374604, + 0.39136115703582763, + 0.39004903059005736, + 0.38944205143451693 + ], + "train_acc": [ + 0.2526, + 0.628, + 0.7334, + 0.7835, + 0.7903, + 0.7999, + 0.8125, + 0.8145, + 0.8116, + 0.8155, + 0.8113, + 0.8242, + 0.8189, + 0.7977, + 0.7993, + 0.8201, + 0.8267, + 0.8299, + 0.8104, + 0.8145, + 0.8077, + 0.818, + 0.8117, + 0.8259, + 0.8297, + 0.8323, + 0.8296, + 0.8424, + 0.8483, + 0.8508, + 0.8527, + 0.8463, + 0.842, + 0.8346, + 0.8304, + 0.8329, + 0.8415, + 0.8272, + 0.8528, + 0.8517, + 0.8201, + 0.8663, + 0.8515, + 0.8582, + 0.8449, + 0.8462, + 0.8551, + 0.8533, + 0.8555, + 0.8652, + 0.8528, + 0.8688, + 0.8578, + 0.8656, + 0.8516, + 0.8779, + 0.8655, + 0.8768, + 0.8643, + 0.8772, + 0.8783, + 0.8791, + 0.8749, + 0.8827, + 0.8802, + 0.8822, + 0.8846, + 0.8819, + 0.8855, + 0.8854, + 0.8897, + 0.8892, + 0.8904, + 0.893, + 0.8915, + 0.8936, + 0.8923, + 0.8933, + 0.8942, + 0.8943 + ], + "test_acc": [ + 0.496, + 0.674, + 0.718, + 0.7275, + 0.701, + 0.768, + 0.757, + 0.771, + 0.765, + 0.653, + 0.771, + 0.7435, + 0.7445, + 0.73, + 0.716, + 0.759, + 0.774, + 0.7065, + 0.726, + 0.741, + 0.7765, + 0.7795, + 0.736, + 0.75, + 0.7835, + 0.762, + 0.7935, + 0.7395, + 0.7585, + 0.7765, + 0.75, + 0.786, + 0.722, + 0.807, + 0.7605, + 0.7365, + 0.782, + 0.7935, + 0.7915, + 0.7045, + 0.803, + 0.803, + 0.7895, + 0.7795, + 0.7665, + 0.795, + 0.771, + 0.82, + 0.799, + 0.8235, + 0.809, + 0.8115, + 0.808, + 0.815, + 0.823, + 0.8165, + 0.8285, + 0.8075, + 0.837, + 0.8315, + 0.8305, + 0.821, + 0.8325, + 0.8325, + 0.841, + 0.835, + 0.8295, + 0.843, + 0.838, + 0.8405, + 0.8355, + 0.839, + 0.843, + 0.842, + 0.842, + 0.841, + 0.8415, + 0.8405, + 0.8415, + 0.8405 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.022819485515356064, + 0.10611869394779205, + 0.08763782680034637, + 0.06361521780490875, + 0.08818645775318146, + 0.07573625445365906, + 0.07574683427810669, + 0.025106821209192276, + 0.029594242572784424, + 0.09018446505069733, + 0.04191981628537178, + 0.05728168785572052 + ], + "perturbation_rho": [ + -0.0498071163892746, + 0.18554872274398804, + 0.19663047790527344, + 0.14150168001651764, + 0.06663499772548676, + 0.12039551883935928, + 0.12434913218021393, + 0.05157296732068062, + 0.09405694901943207, + 0.07376686483621597, + 0.061272408813238144, + 0.10341489315032959 + ], + "nudging": { + "0.001": [ + -0.00011285400250926614, + -0.0005286485538817942, + -0.00023863595561124384, + -0.0001699515269137919, + -0.00019242128473706543, + -0.00020841028890572488, + -0.00017818620835896581, + -8.221696771215647e-05, + -0.00012262666132301092, + -0.0002659684687387198, + -7.3433002398815e-05, + -0.00015967088984325528 + ], + "0.003": [ + -0.00024241290520876646, + -0.0015879659913480282, + -0.0007213138160295784, + -0.0005122334696352482, + -0.0005765345995314419, + -0.0006294770864769816, + -0.0005317657487466931, + -0.0002465004217810929, + -0.000370893714716658, + -0.0007963281823322177, + -0.00021844575530849397, + -0.00047936002374626696 + ], + "0.01": [ + 0.000284646637737751, + -0.005279931705445051, + -0.002400151453912258, + -0.0017087131273001432, + -0.0019207102013751864, + -0.0020927595905959606, + -0.0017691099783405662, + -0.0008208724320866168, + -0.0012333606136962771, + -0.0026537002995610237, + -0.0007275568204931915, + -0.0015953464899212122 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.9170144527435302, + 1.3574325843811035, + 1.0219036561965942, + 1.0417006726264955, + 1.1545506413459778, + 1.0443228019714355, + 1.069793510723114, + 1.1563185817718507, + 1.2034203029632569, + 1.2093300688743591, + 1.2421297967910767, + 1.2121269897460938, + 1.2421570183753967, + 1.227959622001648, + 1.2875715705871582, + 1.2968539279937745, + 1.2598994022369385, + 1.2438384927749633, + 1.257016632270813, + 1.3526598268508911, + 1.3369555353164673, + 1.2425631269454955, + 1.1589678699493409, + 1.1722875375747681, + 1.196830919456482, + 1.2976784371376038, + 1.4418400695800782, + 1.5240311195373535, + 1.3321481491088867, + 1.1875362323760987, + 1.1509679439544678, + 1.137692106437683, + 1.0400111068725586, + 1.0969075414657592, + 1.0011995708465575, + 1.0474750366210936, + 1.0674565059661865, + 1.0524237518310546, + 1.0477498797416687, + 1.0017159150123596, + 1.0123031642913818, + 1.032210140323639, + 0.9697861175537109, + 0.9672701766967774, + 0.9756033916473389, + 0.9363939442634582, + 0.9666579208374023, + 0.9819006387710572, + 0.9768954681396484, + 0.9663044677734375, + 0.9702695720672607, + 0.942413935470581, + 0.9659700645446777, + 0.9314608770370484, + 0.9171806238174438, + 0.9250450847625732, + 0.9110939646720886, + 0.909934245300293, + 0.8979906294822693, + 0.8799821901321411, + 0.8749663389205933, + 0.8692678067207337, + 0.861733264541626, + 0.8568462301254273, + 0.8578854080200196, + 0.8505663597106934, + 0.8482229557037354, + 0.8452105672836304, + 0.8483084865570069, + 0.8421358110427857, + 0.8392665149688721, + 0.8388012510299683, + 0.8370298583984375, + 0.8364136636734009, + 0.8345022481918335, + 0.8332059104919434, + 0.831232413482666, + 0.830617018032074, + 0.830040982055664, + 0.8296857852935791 + ], + "train_acc": [ + 0.3517, + 0.5406, + 0.637, + 0.6539, + 0.642, + 0.649, + 0.6309, + 0.6125, + 0.5943, + 0.585, + 0.5871, + 0.5969, + 0.581, + 0.5812, + 0.5714, + 0.5742, + 0.5815, + 0.5852, + 0.6003, + 0.5856, + 0.5956, + 0.6059, + 0.6156, + 0.6163, + 0.6124, + 0.6008, + 0.5782, + 0.5726, + 0.6073, + 0.6195, + 0.6281, + 0.6301, + 0.6442, + 0.6423, + 0.6638, + 0.6437, + 0.6416, + 0.6452, + 0.642, + 0.654, + 0.6567, + 0.6568, + 0.6646, + 0.6658, + 0.663, + 0.6761, + 0.6684, + 0.6674, + 0.6674, + 0.674, + 0.6749, + 0.6792, + 0.6738, + 0.6805, + 0.686, + 0.6842, + 0.6903, + 0.6848, + 0.6934, + 0.6995, + 0.6987, + 0.7028, + 0.7012, + 0.7035, + 0.7027, + 0.7097, + 0.7091, + 0.712, + 0.7104, + 0.7087, + 0.7106, + 0.7127, + 0.7098, + 0.711, + 0.714, + 0.7122, + 0.7127, + 0.7147, + 0.7143, + 0.7145 + ], + "test_acc": [ + 0.4755, + 0.5345, + 0.6515, + 0.6045, + 0.6325, + 0.614, + 0.575, + 0.583, + 0.576, + 0.551, + 0.5735, + 0.5495, + 0.5625, + 0.5185, + 0.516, + 0.5475, + 0.561, + 0.5915, + 0.4995, + 0.493, + 0.539, + 0.6, + 0.5995, + 0.58, + 0.554, + 0.5895, + 0.486, + 0.5515, + 0.5825, + 0.5845, + 0.5545, + 0.6015, + 0.599, + 0.623, + 0.6035, + 0.6035, + 0.61, + 0.6105, + 0.6025, + 0.6305, + 0.6195, + 0.6255, + 0.635, + 0.6365, + 0.636, + 0.628, + 0.64, + 0.6165, + 0.6255, + 0.633, + 0.641, + 0.641, + 0.65, + 0.6545, + 0.654, + 0.66, + 0.6605, + 0.6605, + 0.66, + 0.6655, + 0.66, + 0.659, + 0.6705, + 0.668, + 0.6625, + 0.663, + 0.667, + 0.671, + 0.674, + 0.6765, + 0.68, + 0.6735, + 0.677, + 0.6735, + 0.675, + 0.6755, + 0.6745, + 0.6745, + 0.675, + 0.675 + ], + "state_pred_error": [ + 0.6493651579856873, + 0.29575768976211547, + 0.23103001885414123, + 0.2334385880947113, + 0.23548452725410463, + 0.19967564697265625, + 0.18518944029808043, + 0.16725214145183565, + 0.1649368047952652, + 0.16571793246269226, + 0.17572792928218842, + 0.1743344892501831, + 0.15893575103282928, + 0.14322838592529297, + 0.13594432392120362, + 0.14049444479942322, + 0.14633379299640656, + 0.13476813054084777, + 0.11506632614135742, + 0.09945053409337998, + 0.0853865048646927, + 0.07948669990301133, + 0.07776896188259125, + 0.07093840420246124, + 0.0676786900997162, + 0.07071898134946823, + 0.0722231029510498, + 0.06867871108055115, + 0.06268749744296073, + 0.05706663088798523, + 0.05825891577005386, + 0.0631956821680069, + 0.06554845556020737, + 0.06385076906085015, + 0.059801281118392946, + 0.056304640930891034, + 0.051978501677513125, + 0.0483906120300293, + 0.04619176578521728, + 0.04515855231881142, + 0.043788279366493224, + 0.042852709513902666, + 0.04160206508040428, + 0.04094642661809921, + 0.03986684157252312, + 0.03952786195278168, + 0.03936737617254257, + 0.04014009275436401, + 0.04107310829758644, + 0.04151235276460648, + 0.04251271829605102, + 0.042470853394269946, + 0.04116504163742066, + 0.039731386798620226, + 0.03882245666384697, + 0.03727775193452835, + 0.035602553805708884, + 0.03460706757307053, + 0.03363208696842194, + 0.0326178902387619, + 0.03211134424805641, + 0.03151855516433716, + 0.03118992812037468, + 0.030708241164684295, + 0.029781148672103883, + 0.02953700419664383, + 0.028982311296463014, + 0.028379172378778458, + 0.02792458461225033, + 0.027120157611370085, + 0.026746750193834306, + 0.0262485995978117, + 0.025594802010059356, + 0.02498560943007469, + 0.024488566598296166, + 0.02415746918618679, + 0.023551164603233338, + 0.023047770342230798, + 0.02238947468996048, + 0.02236259917318821 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7431880235671997, + 0.2796655595302582, + 0.13151727616786957, + 0.09881292283535004, + 0.0924338698387146, + 0.10159576684236526, + 0.09764175117015839, + 0.09642879664897919, + 0.09804226458072662, + 0.09603762626647949, + 0.09261822700500488, + 0.08885498344898224 + ], + "perturbation_rho": [ + 0.611870527267456, + 0.24307268857955933, + 0.10120554268360138, + 0.09459854662418365, + 0.09521515667438507, + 0.07265714555978775, + 0.07570740580558777, + 0.0650622695684433, + 0.07738275825977325, + 0.11346932500600815, + 0.08958262950181961, + 0.07643747329711914 + ], + "nudging": { + "0.001": [ + -0.022723916918039322, + -0.0008963837753981352, + -0.0003589537227526307, + -0.0002731546701397747, + -0.0002443054981995374, + -0.0002676681033335626, + -0.0002532715443521738, + -0.0002561286382842809, + -0.00026835669996216893, + -0.00025519070914015174, + -0.00024644829682074487, + -0.00023727267398498952 + ], + "0.003": [ + -0.06697431951761246, + -0.0026875482872128487, + -0.001076806103810668, + -0.0008197093848139048, + -0.0007331351516768336, + -0.0008034107740968466, + -0.0007598516531288624, + -0.000768211844842881, + -0.0008050791220739484, + -0.0007651542546227574, + -0.000739292532671243, + -0.0007121727103367448 + ], + "0.01": [ + -0.20912763476371765, + -0.00893338117748499, + -0.0035844063386321068, + -0.0027289288118481636, + -0.0024399380199611187, + -0.0026743747293949127, + -0.0025294050574302673, + -0.002557961270213127, + -0.0026802942156791687, + -0.002547960262745619, + -0.002460954710841179, + -0.0023713763803243637 + ] + }, + "state_pred_error_per_layer": [ + 20223.798828125, + 14219.4013671875, + 11048.2333984375, + 10263.419921875, + 8570.201171875, + 7224.33740234375, + 7281.2197265625, + 8034.87548828125, + 6686.9033203125, + 6885.98291015625, + 6667.048828125, + 6627.78125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.0764933771133425, + 1.0333355437278748, + 0.7067635051727295, + 0.5858699575424194, + 0.5356992348194123, + 0.5212211735248565, + 0.5239047775268555, + 0.5818343393325806, + 0.6053238994598389, + 0.5796063490390777, + 0.5091782062530518, + 0.6705454446792602, + 0.5421884929656983, + 0.6353844381332397, + 0.6657565035820008, + 0.6767716047048569, + 0.6167357039451599, + 0.6938248710155487, + 0.8726231457233429, + 0.8884702047348022, + 0.9432406356811524, + 1.090025691795349, + 0.968264564704895, + 1.0746012533664704, + 1.1493414950847625, + 1.1367902378082275, + 1.3055742527008056, + 1.1653732303619384, + 1.1293184537887573, + 1.334260126066208, + 1.2707585639953614, + 1.4581013576507569, + 1.4308010631561279, + 1.285036499786377, + 1.8279240913391113, + 1.8119590299606323, + 2.283292189025879, + 1.6382048044204711, + 1.4503440219879151, + 1.7393564136505126, + 1.6293182621002198, + 1.4443016117095948, + 1.2811944095611572, + 1.21372008228302, + 1.1024506355285644, + 1.2282759926795959, + 1.2983571229934692, + 1.3142110950469972, + 1.323133878517151, + 1.3581235847473145, + 1.2896308329582213, + 1.284184308242798, + 1.2349051277160645, + 1.3431798957824708, + 1.1847218454360962, + 1.1301065828323364, + 1.1214371286392213, + 1.0846952264785767, + 1.0839066341400148, + 1.097983945274353, + 1.0511162779808045, + 1.0496550798416138, + 1.0508357788085938, + 1.0465448284626007, + 1.0507531276702882, + 1.0591266249656677, + 1.0550554061889648, + 1.0550357730865478, + 1.0820843217849732, + 1.0595227965354919, + 1.065673966217041, + 1.0613273656845092, + 1.0590686019897462, + 1.0599220966339111, + 1.0588614574432373, + 1.0581368492126464, + 1.0541149351119996, + 1.0519661378860474, + 1.0514939740180969, + 1.0511556272506715 + ], + "train_acc": [ + 0.2452, + 0.6221, + 0.7343, + 0.784, + 0.801, + 0.805, + 0.8066, + 0.7899, + 0.7896, + 0.8047, + 0.8283, + 0.7988, + 0.8245, + 0.8083, + 0.8112, + 0.8115, + 0.8284, + 0.8143, + 0.7943, + 0.7885, + 0.7858, + 0.7695, + 0.7757, + 0.7569, + 0.7501, + 0.7476, + 0.7172, + 0.7332, + 0.7408, + 0.7223, + 0.7292, + 0.694, + 0.6746, + 0.6863, + 0.6085, + 0.6042, + 0.5516, + 0.6079, + 0.614, + 0.5877, + 0.5988, + 0.6126, + 0.6327, + 0.648, + 0.6703, + 0.6493, + 0.6395, + 0.6404, + 0.6402, + 0.6375, + 0.6505, + 0.6503, + 0.6588, + 0.636, + 0.6598, + 0.6677, + 0.6697, + 0.6766, + 0.6791, + 0.6715, + 0.6827, + 0.6841, + 0.6788, + 0.6811, + 0.6818, + 0.6793, + 0.6794, + 0.6814, + 0.6722, + 0.6808, + 0.6791, + 0.6816, + 0.6826, + 0.681, + 0.6824, + 0.6812, + 0.6834, + 0.6838, + 0.6841, + 0.6839 + ], + "test_acc": [ + 0.487, + 0.667, + 0.72, + 0.7295, + 0.754, + 0.7085, + 0.725, + 0.7445, + 0.7405, + 0.743, + 0.685, + 0.7675, + 0.7645, + 0.73, + 0.759, + 0.7505, + 0.731, + 0.6945, + 0.729, + 0.7415, + 0.6975, + 0.7285, + 0.7145, + 0.712, + 0.673, + 0.6825, + 0.635, + 0.6405, + 0.672, + 0.654, + 0.649, + 0.5795, + 0.682, + 0.5525, + 0.5845, + 0.3575, + 0.5085, + 0.5355, + 0.5015, + 0.49, + 0.5295, + 0.5085, + 0.585, + 0.6325, + 0.6295, + 0.531, + 0.5645, + 0.58, + 0.5825, + 0.604, + 0.6035, + 0.608, + 0.552, + 0.579, + 0.6445, + 0.633, + 0.643, + 0.6575, + 0.6475, + 0.651, + 0.664, + 0.6545, + 0.66, + 0.6625, + 0.663, + 0.66, + 0.663, + 0.662, + 0.6645, + 0.6635, + 0.663, + 0.6685, + 0.67, + 0.6675, + 0.6585, + 0.667, + 0.665, + 0.666, + 0.664, + 0.6635 + ], + "value_loss": [ + 2.8549158838272093, + 1.161496125793457, + 0.903598198890686, + 0.7632983952522278, + 0.6835939199686051, + 0.6766883213043213, + 0.7091717009544373, + 0.9754714385986328, + 1.08224688205719, + 1.062293195784092, + 0.9092092826843262, + 1.4716599861145019, + 1.038246541786194, + 1.4234249837160111, + 1.664121393585205, + 1.6125931749343871, + 1.4978518940925598, + 1.7518914916992188, + 2.72013060503006, + 3.1416282855987547, + 3.455105680847168, + 4.676465829467773, + 3.303184397125244, + 3.646682159423828, + 4.276524467420578, + 4.3695808753967285, + 5.563025414466858, + 4.5929090194702145, + 4.1187556289672855, + 5.53759754114151, + 6.174367126464844, + 5.94762811126709, + 4.872971316528321, + 3.637530991744995, + 5.705263479614258, + 6.351236457061767, + 8.093695210266114, + 4.504659541511535, + 2.6615619094848633, + 5.09617506980896, + 3.5259002746582033, + 2.7192329330444336, + 2.638924031639099, + 1.6318247977256775, + 1.3823803621292114, + 1.951340493106842, + 2.216556364059448, + 2.1964007709503175, + 2.5811822102546693, + 2.1051325965881347, + 1.8404160772800446, + 1.9780693883895875, + 1.718860918045044, + 1.983682257080078, + 1.9515350111961365, + 1.2874729948043824, + 1.3900933967590332, + 1.2211145097732543, + 1.3988167335510253, + 1.2648169076919555, + 1.1056289435863496, + 0.9794681151866913, + 1.0225543155670167, + 1.0772494400978088, + 0.9853854091644287, + 0.9633722298145294, + 0.9995410033226013, + 1.0373240133285522, + 1.104611580657959, + 1.0151097399234772, + 1.0281483087539673, + 0.969052958202362, + 0.9510830691337585, + 0.9537978723526, + 0.8950119636535645, + 0.8671914636135102, + 0.9178054649353027, + 0.9064536457061767, + 0.8821513331413269, + 0.9863593735218048 + ], + "term_loss": [ + 1.682755407524109, + 0.9349195198059082, + 0.7577797178268433, + 0.6367232304573059, + 0.5474753088951111, + 0.5284061282157898, + 0.5641642443656921, + 0.8194823429107666, + 0.9324796360015869, + 0.912509532225132, + 0.7826824951171875, + 1.319875775718689, + 0.9083852030277252, + 1.281417071583867, + 1.5178388681411743, + 1.4628825843811035, + 1.3601782407283782, + 1.590202610015869, + 2.46570823032856, + 2.7377664497375487, + 2.9881096405029295, + 4.093345769119263, + 2.8418840057373047, + 3.1584136568069456, + 3.727611806821823, + 3.8350956407547, + 4.957208102893829, + 3.993870001220703, + 3.628015086746216, + 4.997284079122544, + 5.491623828125, + 5.350730059623718, + 4.29666678314209, + 3.107940061569214, + 4.910516096496582, + 5.609202164840698, + 7.328441577911377, + 3.92153433303833, + 2.2080428680419923, + 4.370297067832947, + 3.0111737335205078, + 2.2708549232959747, + 2.1683303813934325, + 1.2954999471187592, + 1.0790472076416016, + 1.5998526191234588, + 1.8377661813259125, + 1.8053871860504151, + 2.1328504148960112, + 1.717490065574646, + 1.4750218168020248, + 1.6484625193595885, + 1.4090114224433898, + 1.6390713775634767, + 1.6058604949712754, + 1.0051573803424836, + 1.102199532008171, + 0.9493986696243286, + 1.0932330482721329, + 0.9720278540134429, + 0.8383463484048843, + 0.7234356563329697, + 0.7596620301246643, + 0.8095307093143463, + 0.7318540607452393, + 0.7117131633043289, + 0.7411717020988464, + 0.76621328125, + 0.8340190933227539, + 0.7561145126342773, + 0.7697270512580872, + 0.7089268949508667, + 0.6988980655670166, + 0.7010336683273315, + 0.6438103723526001, + 0.6179502298414707, + 0.6598036010742188, + 0.6499435122966767, + 0.626848087978363, + 0.7168336891174316 + ], + "bridge_loss": [ + 0.896014222253242, + 0.04517395571172238, + 0.006593965370953083, + 0.0034440495952963827, + 0.018616770416498184, + 0.030837100231647492, + 0.024734814091026784, + 0.02389179002046585, + 0.01787433380782604, + 0.018077380554378034, + 0.010488519954681396, + 0.015156167778372765, + 0.010538265505433082, + 0.012908530953526497, + 0.01322974010705948, + 0.016209473606944084, + 0.015149136707186699, + 0.025635590088367462, + 0.09975660238265992, + 0.24363938935995103, + 0.30326125044822694, + 0.4093769493103027, + 0.2900644659996033, + 0.30407776420712473, + 0.36139686872959137, + 0.3478179151058197, + 0.3997144910812378, + 0.4011154135465622, + 0.2988287874698639, + 0.32996571643352507, + 0.48100315761566165, + 0.37056637697219846, + 0.3436944869041443, + 0.3004012752532959, + 0.5041740354537964, + 0.44999724850654604, + 0.4296209671974182, + 0.3023332357406616, + 0.18253318367004395, + 0.4315898947238922, + 0.23118360629081727, + 0.18129249473810197, + 0.22337257357835769, + 0.09488131734728814, + 0.07875844204425812, + 0.11123235714435577, + 0.12893191225528716, + 0.13899659600257874, + 0.19428774079680441, + 0.13162928407192231, + 0.1163264914393425, + 0.0801027453839779, + 0.06760505118966102, + 0.08564049925804139, + 0.10703954181075095, + 0.05367120292782784, + 0.058458478817343715, + 0.04750625167787075, + 0.08299656238555908, + 0.06785187515616417, + 0.05007092701196671, + 0.03860371837019921, + 0.04493570284247398, + 0.05130842483341694, + 0.036386512249708174, + 0.033535686874389646, + 0.04093419628441334, + 0.05317574837207794, + 0.0473568382024765, + 0.04034040171802044, + 0.0394649936914444, + 0.0410647492647171, + 0.03395739138126373, + 0.03392591526508331, + 0.033935180634260174, + 0.030197322559356688, + 0.04014543912410736, + 0.039191885554790494, + 0.03813223616480827, + 0.05245816183909774 + ], + "tgrad_loss": [ + 0.27614626688957217, + 0.1814026545524597, + 0.13922452120780945, + 0.12313111693859101, + 0.11750183961391449, + 0.1174450924873352, + 0.12027264575958252, + 0.13209730380773543, + 0.13189289898872375, + 0.13170627192556858, + 0.1160382707118988, + 0.13662804961204528, + 0.11932307603359223, + 0.12909939237833024, + 0.13305279737710954, + 0.1335011120378971, + 0.12252451281547547, + 0.13605329816937448, + 0.15466575002670288, + 0.16022245128154755, + 0.16373479413986206, + 0.1737431848526001, + 0.17123591811656952, + 0.18419077730178832, + 0.18751578764915466, + 0.18666732320785523, + 0.2061028514146805, + 0.19792364330291748, + 0.19191175360679627, + 0.21034778068065643, + 0.20174010210037233, + 0.22633177161216736, + 0.23261008365154268, + 0.2291896457672119, + 0.2905733513832092, + 0.29203712682724, + 0.33563268880844116, + 0.2807919749736786, + 0.27098584852218627, + 0.29428816595077517, + 0.2835429540157318, + 0.2670855068206787, + 0.24722108142375945, + 0.24144353773593902, + 0.22457472248077393, + 0.24025552184581755, + 0.24985827751159667, + 0.2520169780254364, + 0.2540440467596054, + 0.2560132534980774, + 0.2490677748680115, + 0.24950413098335267, + 0.24224443774223328, + 0.258970384645462, + 0.2386349895954132, + 0.22864441821575165, + 0.22943539001941682, + 0.224209578537941, + 0.22258712384700774, + 0.2249371839284897, + 0.21721167531013488, + 0.21742874386310576, + 0.21795658111572266, + 0.21641030756235122, + 0.21714482364654542, + 0.2181233823299408, + 0.21743510699272156, + 0.21793499126434326, + 0.22323566336631775, + 0.2186548171043396, + 0.21895627632141113, + 0.2190613217353821, + 0.21822762320041655, + 0.21883828949928283, + 0.21726641387939452, + 0.21904391651153565, + 0.2178564251422882, + 0.21731825175285338, + 0.2171710154533386, + 0.21706753172874452 + ] + }, + "diagnostics": { + "bp_cosine": [ + 9.498395957052708e-05, + 0.029415149241685867, + 0.062070880085229874, + 0.07393385469913483, + 0.07970248907804489, + 0.08624569326639175, + 0.10002343356609344, + 0.10488344728946686, + 0.10920242965221405, + 0.10451158881187439, + 0.09929930418729782, + 0.09505851566791534 + ], + "perturbation_rho": [ + 0.025425152853131294, + 0.0574759915471077, + 0.13417154550552368, + 0.10034967213869095, + 0.17468321323394775, + 0.17164339125156403, + 0.15925100445747375, + 0.08668951690196991, + 0.1521437168121338, + 0.14672580361366272, + 0.1825145184993744, + 0.12463894486427307 + ], + "nudging": { + "0.001": [ + 9.352347115054727e-05, + -0.0002647446817718446, + -0.00047820506733842194, + -0.0005149872158654034, + -0.0005640805466100574, + -0.0006015360122546554, + -0.0006438379641622305, + -0.0006649883580394089, + -0.0007019470212981105, + -0.0006623220397159457, + -0.0006254295585677028, + -0.0006009879289194942 + ], + "0.003": [ + 0.0003153950092382729, + -0.0007944293902255595, + -0.0014327235985547304, + -0.0015408566687256098, + -0.0016878837486729026, + -0.0018035313114523888, + -0.0019295630045235157, + -0.0019936237949877977, + -0.0020997454412281513, + -0.0019858325831592083, + -0.001876077032648027, + -0.0018000612035393715 + ], + "0.01": [ + 0.001420565415173769, + -0.0026360084302723408, + -0.00476992130279541, + -0.005131378769874573, + -0.005615689791738987, + -0.006001932080835104, + -0.006417973432689905, + -0.006630052346736193, + -0.006984136067330837, + -0.0066003259271383286, + -0.00623705331236124, + -0.005985542666167021 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L12_s456.json b/results/synth_ladder_v2_lo/synth_a0.0_L12_s456.json new file mode 100644 index 0000000..1368dc3 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L12_s456.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 0.969122644329071, + 0.5920969530105591, + 0.4555384733200073, + 0.42013895292282105, + 0.3577242928504944, + 0.37090972731113436, + 0.3204999417304993, + 0.3792783494949341, + 0.3393013801574707, + 0.3097765709400177, + 0.33500295226573945, + 0.2910071131706238, + 0.29785395264625547, + 0.283798801279068, + 0.2583663343429565, + 0.27849551072120665, + 0.2531052485704422, + 0.23891032192707062, + 0.2196098397731781, + 0.2663255609512329, + 0.260848161315918, + 0.2927300401687622, + 0.30502517681121827, + 0.2855231747150421, + 0.21818343462944031, + 0.19386887674331665, + 0.2458417517900467, + 0.19182274364233018, + 0.17297324039936066, + 0.19739589419364928, + 0.1834898106098175, + 0.1994040518283844, + 0.20876692607402803, + 0.15818328301906587, + 0.1655046018600464, + 0.18371486501693726, + 0.18603038516044618, + 0.16989948571324348, + 0.14640453379154206, + 0.16136881852149965, + 0.18090535459518434, + 0.16096133246421815, + 0.17648028812408448, + 0.19660544855594636, + 0.1483273560643196, + 0.1228380591392517, + 0.139758788728714, + 0.1273645007133484, + 0.1370752555370331, + 0.1313122305870056, + 0.12541208545863627, + 0.10699837379455567, + 0.11257837036848069, + 0.10080176743865013, + 0.0961822389125824, + 0.10998678052425384, + 0.10155456811189652, + 0.09173920025825501, + 0.09425398440361023, + 0.0889471257686615, + 0.08973454808592796, + 0.08506661486625672, + 0.0839197184562683, + 0.08141958972215653, + 0.081237429189682, + 0.08236398327350616, + 0.0800594212770462, + 0.07829977524876594, + 0.0759517749786377, + 0.0762132091999054, + 0.0748500356912613, + 0.07403571516871452, + 0.07296141183376312, + 0.07267795407772064, + 0.07197105139493942, + 0.07171081202030181, + 0.07135244336128235, + 0.07104146628379822, + 0.0708903494656086, + 0.07079571675658226 + ], + "train_acc": [ + 0.6424, + 0.7776, + 0.8193, + 0.8339, + 0.8565, + 0.8537, + 0.8696, + 0.852, + 0.863, + 0.8761, + 0.8654, + 0.8834, + 0.8805, + 0.8895, + 0.8965, + 0.8924, + 0.9028, + 0.9009, + 0.9098, + 0.902, + 0.8968, + 0.8843, + 0.8793, + 0.8855, + 0.9128, + 0.9232, + 0.9032, + 0.9231, + 0.9326, + 0.9229, + 0.9256, + 0.9166, + 0.9155, + 0.9371, + 0.9368, + 0.9301, + 0.9236, + 0.9306, + 0.9446, + 0.9353, + 0.9262, + 0.9369, + 0.9296, + 0.9221, + 0.9433, + 0.9533, + 0.945, + 0.9519, + 0.9451, + 0.948, + 0.9534, + 0.9643, + 0.9598, + 0.9675, + 0.9698, + 0.9634, + 0.9653, + 0.9733, + 0.9713, + 0.9731, + 0.9744, + 0.9758, + 0.9773, + 0.9788, + 0.9798, + 0.9776, + 0.9795, + 0.9801, + 0.9815, + 0.9821, + 0.9825, + 0.9839, + 0.9848, + 0.9837, + 0.9844, + 0.9846, + 0.9847, + 0.9852, + 0.9852, + 0.9853 + ], + "test_acc": [ + 0.775, + 0.7965, + 0.823, + 0.8375, + 0.838, + 0.838, + 0.8475, + 0.84, + 0.8545, + 0.858, + 0.847, + 0.866, + 0.873, + 0.8685, + 0.868, + 0.8605, + 0.866, + 0.871, + 0.8765, + 0.8585, + 0.8675, + 0.862, + 0.868, + 0.8685, + 0.879, + 0.886, + 0.8755, + 0.8865, + 0.8925, + 0.8825, + 0.879, + 0.896, + 0.884, + 0.8835, + 0.886, + 0.895, + 0.8825, + 0.893, + 0.8905, + 0.8975, + 0.896, + 0.8955, + 0.8845, + 0.8825, + 0.901, + 0.896, + 0.902, + 0.9055, + 0.906, + 0.8995, + 0.908, + 0.907, + 0.907, + 0.908, + 0.9025, + 0.9005, + 0.905, + 0.9005, + 0.909, + 0.9025, + 0.9055, + 0.913, + 0.908, + 0.91, + 0.911, + 0.911, + 0.9125, + 0.9125, + 0.9115, + 0.9125, + 0.912, + 0.9115, + 0.91, + 0.9085, + 0.91, + 0.911, + 0.9115, + 0.9115, + 0.9115, + 0.9115 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.841245174407959, + 0.830803632736206, + 0.8195754885673523, + 0.8066799640655518, + 0.7983194589614868, + 0.7908304929733276, + 0.7860588431358337, + 0.7811387777328491, + 0.7771316170692444, + 0.7744728326797485, + 0.7727954983711243, + 0.7717056274414062 + ], + "perturbation_rho": [ + 0.9999991059303284, + 0.9999973177909851, + 0.9999889731407166, + 0.9999734163284302, + 0.9999427795410156, + 0.9998763799667358, + 0.9998629093170166, + 0.9998323321342468, + 0.9997599720954895, + 0.9997479319572449, + 0.9997410774230957, + 0.9997145533561707 + ], + "nudging": { + "0.001": [ + -0.024454854428768158, + -0.011305858381092548, + -0.00559408962726593, + -0.0032756051514297724, + -0.0022792830131947994, + -0.001779809594154358, + -0.0014915994834154844, + -0.0013089049607515335, + -0.0011874620104208589, + -0.0011061741970479488, + -0.00105283223092556, + -0.0010198504896834493 + ], + "0.003": [ + -0.06566837430000305, + -0.03229808062314987, + -0.016386456787586212, + -0.00969094317406416, + -0.0067720417864620686, + -0.0052991146221756935, + -0.004446372855454683, + -0.0039047286845743656, + -0.0035444353707134724, + -0.0033029273618012667, + -0.003144192509353161, + -0.003046202240511775 + ], + "0.01": [ + -0.1470111906528473, + -0.09042022377252579, + -0.050197783857584, + -0.030754856765270233, + -0.021816428750753403, + -0.017199307680130005, + -0.014493460766971111, + -0.012762569822371006, + -0.01160583458840847, + -0.010828070342540741, + -0.010316012427210808, + -0.00999932736158371 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.0898007585525513, + 1.1015719889640807, + 0.7905141721725464, + 0.6718451899528504, + 0.6203681846618653, + 0.6325145021438598, + 0.6236261308193207, + 0.6393312355041504, + 0.6374612313747406, + 0.6430461730480194, + 0.5502225688934326, + 0.8417456014633179, + 0.7175684427261353, + 1.0312082330226897, + 0.8398658451080322, + 0.8481408470153808, + 0.6183168939113617, + 0.937887061214447, + 0.8483327810287475, + 1.0181842102050782, + 0.7333554124832153, + 1.3151530385017396, + 1.102606842803955, + 0.8690633714675904, + 0.9178138070106506, + 1.0159898044586182, + 3.232203116989136, + 1.3720880279541015, + 0.6449793176651001, + 0.8210637205123902, + 0.9120081573486328, + 1.1590281297683716, + 0.855452324104309, + 0.7272457509994507, + 0.8923147548675537, + 0.7562281994819641, + 0.680691127204895, + 0.6434698450565338, + 0.723854674911499, + 0.8917708801269532, + 0.703606390953064, + 0.6779194925308227, + 0.6525233362197876, + 1.1295996128082275, + 0.8972809474945068, + 0.5784100801467895, + 0.6937777447223663, + 0.7719525880813599, + 0.6017424495697021, + 0.7032140111923217, + 0.515312993812561, + 0.5384840083122253, + 0.5088662053585052, + 0.4816106027841568, + 0.5108573516845704, + 0.5119831256866455, + 0.6042850525379181, + 0.4791012176513672, + 0.5760747453689575, + 0.45199957361221316, + 0.395004202580452, + 0.43196895809173586, + 0.4245094624042511, + 0.3937124969959259, + 0.4062374726772308, + 0.38945438613891603, + 0.3935444291114807, + 0.37236739473342895, + 0.4024800674438477, + 0.37810999517440796, + 0.3714436505317688, + 0.35974656147956846, + 0.36245792179107666, + 0.35358601045608523, + 0.3556142600655556, + 0.34317912871837614, + 0.34346320304870603, + 0.3412538662314415, + 0.33999497032165527, + 0.3392112380981445 + ], + "train_acc": [ + 0.242, + 0.6061, + 0.7059, + 0.7544, + 0.7711, + 0.7653, + 0.7685, + 0.7636, + 0.7644, + 0.7713, + 0.7934, + 0.7077, + 0.7412, + 0.6984, + 0.7215, + 0.7161, + 0.7733, + 0.7014, + 0.7168, + 0.6967, + 0.7423, + 0.6917, + 0.712, + 0.7198, + 0.707, + 0.6952, + 0.5487, + 0.6802, + 0.7747, + 0.7323, + 0.7125, + 0.6785, + 0.7421, + 0.7598, + 0.7335, + 0.7576, + 0.768, + 0.7791, + 0.7621, + 0.7386, + 0.7683, + 0.7724, + 0.7795, + 0.7106, + 0.7384, + 0.8012, + 0.7775, + 0.7554, + 0.7943, + 0.784, + 0.8146, + 0.8054, + 0.8234, + 0.8261, + 0.8169, + 0.8192, + 0.8006, + 0.8264, + 0.8009, + 0.8317, + 0.8518, + 0.8421, + 0.8454, + 0.8499, + 0.8472, + 0.8525, + 0.8469, + 0.8542, + 0.8459, + 0.8574, + 0.856, + 0.8652, + 0.8609, + 0.8635, + 0.865, + 0.866, + 0.8665, + 0.8678, + 0.868, + 0.8685 + ], + "test_acc": [ + 0.478, + 0.66, + 0.7125, + 0.665, + 0.634, + 0.693, + 0.689, + 0.642, + 0.584, + 0.708, + 0.656, + 0.6605, + 0.559, + 0.6505, + 0.606, + 0.6635, + 0.566, + 0.6175, + 0.478, + 0.6495, + 0.433, + 0.5855, + 0.5385, + 0.645, + 0.6835, + 0.401, + 0.5985, + 0.6675, + 0.6025, + 0.6285, + 0.5105, + 0.565, + 0.662, + 0.6695, + 0.6665, + 0.648, + 0.6885, + 0.667, + 0.4995, + 0.671, + 0.7005, + 0.621, + 0.6685, + 0.6735, + 0.6925, + 0.662, + 0.6445, + 0.696, + 0.6395, + 0.7555, + 0.687, + 0.7115, + 0.7375, + 0.7585, + 0.742, + 0.695, + 0.7735, + 0.719, + 0.735, + 0.792, + 0.7645, + 0.752, + 0.801, + 0.768, + 0.7955, + 0.784, + 0.8105, + 0.7885, + 0.808, + 0.817, + 0.809, + 0.8145, + 0.822, + 0.82, + 0.8185, + 0.817, + 0.824, + 0.8255, + 0.827, + 0.8275 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0384417325258255, + 0.27492010593414307, + 0.17608770728111267, + 0.12729278206825256, + 0.09575799107551575, + 0.13158489763736725, + 0.07343505322933197, + 0.08012130856513977, + 0.08938327431678772, + 0.09414967149496078, + 0.06517850607633591, + 0.07253237068653107 + ], + "perturbation_rho": [ + -0.00336202559992671, + 0.18004602193832397, + 0.18598641455173492, + 0.15388232469558716, + 0.058810293674468994, + 0.14123386144638062, + 0.05320374667644501, + 0.10196533054113388, + 0.09802494943141937, + 0.10918877273797989, + 0.09344048798084259, + 0.0655277818441391 + ], + "nudging": { + "0.001": [ + -0.001064171316102147, + -0.0006666459375992417, + -0.0004184156423434615, + -0.000315168930683285, + -0.00022096859174780548, + -0.0002887723676394671, + -0.00016212352784350514, + -0.00017708796076476574, + -0.00021025452588219196, + -0.00024805153952911496, + -0.00015850270574446768, + -0.00017888075672090054 + ], + "0.003": [ + -0.0031536915339529514, + -0.0019956310279667377, + -0.00125154631678015, + -0.000938912620767951, + -0.0006729550659656525, + -0.0008644282352179289, + -0.0004864725051447749, + -0.0005231637042015791, + -0.0006273322505876422, + -0.0007397128501906991, + -0.0004687863402068615, + -0.0005287445383146405 + ], + "0.01": [ + -0.010087584145367146, + -0.006617182400077581, + -0.004152917303144932, + -0.0031182561069726944, + -0.0022262579295784235, + -0.0028664623387157917, + -0.0016081882640719414, + -0.0017378728371113539, + -0.0020772137213498354, + -0.002457245485857129, + -0.0015545324422419071, + -0.0017554720398038626 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.9577019836425782, + 1.367190316581726, + 1.1470114725112914, + 1.0665275047302245, + 1.1731505100250244, + 1.2525334920883178, + 1.3311169979095459, + 1.5198530440330504, + 1.3418273334503175, + 1.3490344924926758, + 1.3042446374893188, + 1.2384788623809815, + 1.2332912294387817, + 1.216872233581543, + 1.2361593342781068, + 1.1900994968414307, + 1.220567015838623, + 1.2757856309890747, + 1.2281171096801757, + 1.161736725616455, + 1.1808231119155883, + 1.1178058204650878, + 1.1057362071037293, + 1.185501344013214, + 1.136134003829956, + 1.1250077436447143, + 1.098593546295166, + 1.1006900829315185, + 1.092524215221405, + 1.0361322803497315, + 1.0446809569358826, + 1.0481329538345336, + 1.053780317878723, + 1.0705591835021973, + 1.1286329881668091, + 1.1078846117973327, + 1.1074383437156676, + 1.083875510597229, + 1.054987931394577, + 1.042312901210785, + 1.0332075857162475, + 1.0004530704498291, + 0.9915621906280517, + 0.9539300963401794, + 0.9578770606994629, + 0.9117126565933228, + 0.8960798753738404, + 0.8623609913825989, + 0.8706058340072632, + 0.8639619729995728, + 0.8503742446899414, + 0.8467240323066711, + 0.8390994773864746, + 0.8202853441238404, + 0.820123230457306, + 0.8141281935691833, + 0.792419764328003, + 0.7936320905208588, + 0.7901265294551849, + 0.7891995994567871, + 0.7945449181556702, + 0.7905005366325378, + 0.7813621898651123, + 0.7853380561828613, + 0.7846485383987427, + 0.7863743240356446, + 0.7899072016716003, + 0.7869116140365601, + 0.7873675743103027, + 0.7921814329147339, + 0.7928447710990906, + 0.7956968950271607, + 0.7953850835800171, + 0.7970634747505188, + 0.7977744478225708, + 0.7989712644577026, + 0.7980876712799072, + 0.7980577057838439, + 0.797688978767395, + 0.797543062210083 + ], + "train_acc": [ + 0.3543, + 0.5319, + 0.5908, + 0.6146, + 0.592, + 0.578, + 0.5808, + 0.5464, + 0.5774, + 0.5876, + 0.5817, + 0.5923, + 0.5941, + 0.5988, + 0.608, + 0.6113, + 0.61, + 0.6043, + 0.6128, + 0.6209, + 0.6127, + 0.6245, + 0.6261, + 0.6088, + 0.6229, + 0.6272, + 0.6305, + 0.6276, + 0.6363, + 0.6424, + 0.6415, + 0.6418, + 0.6443, + 0.6398, + 0.6277, + 0.6338, + 0.6352, + 0.6373, + 0.6486, + 0.651, + 0.6508, + 0.6554, + 0.6575, + 0.6666, + 0.6627, + 0.6796, + 0.6857, + 0.6914, + 0.6914, + 0.6926, + 0.7, + 0.7, + 0.6987, + 0.7024, + 0.7016, + 0.7041, + 0.7115, + 0.7135, + 0.7104, + 0.7115, + 0.7099, + 0.715, + 0.7162, + 0.7163, + 0.7166, + 0.7173, + 0.7123, + 0.7213, + 0.7146, + 0.7148, + 0.718, + 0.7155, + 0.714, + 0.7128, + 0.7152, + 0.7148, + 0.7146, + 0.7138, + 0.7152, + 0.7153 + ], + "test_acc": [ + 0.495, + 0.5595, + 0.5795, + 0.574, + 0.5465, + 0.5705, + 0.5295, + 0.532, + 0.5555, + 0.541, + 0.5535, + 0.5705, + 0.558, + 0.581, + 0.5955, + 0.582, + 0.57, + 0.5665, + 0.572, + 0.5885, + 0.576, + 0.586, + 0.552, + 0.5675, + 0.5705, + 0.59, + 0.5705, + 0.5785, + 0.6125, + 0.607, + 0.6175, + 0.632, + 0.598, + 0.6025, + 0.5915, + 0.6025, + 0.6125, + 0.6225, + 0.641, + 0.617, + 0.6225, + 0.623, + 0.6415, + 0.631, + 0.641, + 0.646, + 0.6585, + 0.643, + 0.665, + 0.6675, + 0.659, + 0.6665, + 0.6545, + 0.679, + 0.671, + 0.683, + 0.676, + 0.6775, + 0.6935, + 0.6895, + 0.698, + 0.698, + 0.684, + 0.69, + 0.6835, + 0.69, + 0.6935, + 0.6845, + 0.6865, + 0.6905, + 0.6845, + 0.685, + 0.688, + 0.6855, + 0.6825, + 0.685, + 0.683, + 0.683, + 0.6835, + 0.684 + ], + "state_pred_error": [ + 0.6557525987625122, + 0.2581627747535706, + 0.2180150511264801, + 0.19771510035991668, + 0.17691524381637574, + 0.21782165381908417, + 0.19984715962409974, + 0.20151861963272094, + 0.22002407603263854, + 0.22233803098201751, + 0.1950549049139023, + 0.18242949080467225, + 0.1731606459379196, + 0.16580520544052124, + 0.15936565225124358, + 0.15244879407882692, + 0.1435310169696808, + 0.1339448815703392, + 0.12139209755659103, + 0.10519540898799896, + 0.09373599338531494, + 0.08733212774991989, + 0.08062151061296463, + 0.07534996691942215, + 0.07384048416614533, + 0.07770671141147613, + 0.07913587466478347, + 0.07108985353708268, + 0.06537577290534974, + 0.06072714284658432, + 0.05709798917174339, + 0.057688245034217836, + 0.05891312641501427, + 0.061041689145565035, + 0.059126829808950426, + 0.05346322001814842, + 0.052376105165481565, + 0.05078197082877159, + 0.04823381187915802, + 0.045614832776784894, + 0.043012580084800724, + 0.03774388888478279, + 0.032903633427619934, + 0.028299692285060882, + 0.02640610886514187, + 0.027187307637929918, + 0.028776719480752944, + 0.030680300956964494, + 0.03148365080356598, + 0.03091398191154003, + 0.029518017873167993, + 0.026383623799681663, + 0.02372063409090042, + 0.02179983432292938, + 0.02020930643975735, + 0.01886237643659115, + 0.018010195726156236, + 0.017387488079071044, + 0.016838955014944076, + 0.016470046550035478, + 0.01637252227962017, + 0.01600538874566555, + 0.015849738636612893, + 0.015769525337219238, + 0.01577099280208349, + 0.015590812629461288, + 0.015244143217802047, + 0.015246101871132851, + 0.0149916733071208, + 0.01488443463742733, + 0.014857900011539459, + 0.014476912885904311, + 0.014302368466556073, + 0.013730039289593697, + 0.01368503429889679, + 0.013323678565025329, + 0.013020070712268352, + 0.012987913605570793, + 0.012227315375208854, + 0.012032101236283779 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7363088726997375, + 0.32443851232528687, + 0.21702790260314941, + 0.21007081866264343, + 0.16975754499435425, + 0.1722516119480133, + 0.16474759578704834, + 0.12138545513153076, + 0.1178494393825531, + 0.13036376237869263, + 0.11493153870105743, + 0.1162962019443512 + ], + "perturbation_rho": [ + 0.6429969072341919, + 0.2531689405441284, + 0.22036504745483398, + 0.17542049288749695, + 0.15819020569324493, + 0.14438438415527344, + 0.07042165100574493, + 0.11963094770908356, + 0.1070300042629242, + 0.07622774690389633, + 0.035559043288230896, + 0.045592159032821655 + ], + "nudging": { + "0.001": [ + -0.01886601373553276, + -0.0009471861412748694, + -0.0005426729912869632, + -0.0005197790451347828, + -0.00040702728438191116, + -0.00039994364487938583, + -0.0003908725338988006, + -0.0003088848025072366, + -0.0002972484799101949, + -0.00033751194132491946, + -0.0002799705835059285, + -0.00027640321059152484 + ], + "0.003": [ + -0.05549539998173714, + -0.002838960848748684, + -0.0016271104104816914, + -0.0015591384144499898, + -0.001220998470671475, + -0.0011997417313978076, + -0.0011723506031557918, + -0.0009265473927371204, + -0.000891170755494386, + -0.0010123227257281542, + -0.0008400253136642277, + -0.0008296556770801544 + ], + "0.01": [ + -0.1725819855928421, + -0.009430286474525928, + -0.0054127369076013565, + -0.005186344031244516, + -0.004062540829181671, + -0.0039931111969053745, + -0.003901706077158451, + -0.003083862829953432, + -0.002966922242194414, + -0.0033692335709929466, + -0.002796228276565671, + -0.002761534880846739 + ] + }, + "state_pred_error_per_layer": [ + 8107.484375, + 6015.64697265625, + 3272.651123046875, + 3025.219970703125, + 3498.379150390625, + 2962.442626953125, + 2732.457275390625, + 3394.069091796875, + 3050.444091796875, + 3397.53271484375, + 3068.22607421875, + 3145.807373046875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.092706339263916, + 1.0952877737998963, + 0.7729337105751037, + 0.6789219863891601, + 0.6241036960601807, + 0.6100845262527466, + 0.594813515996933, + 0.7195955331802368, + 0.6677259072303772, + 0.6198010721206665, + 0.6374922561645507, + 0.7701140362739562, + 0.69171789560318, + 0.708719236278534, + 0.6036844366073608, + 0.8205160137176514, + 0.9806505244255066, + 0.7954677212715149, + 0.7861951595306397, + 0.823767824935913, + 0.6428154012203217, + 0.7191776779174804, + 0.8116244506835938, + 0.753524228477478, + 0.8249499505996704, + 0.7682834581375122, + 0.7208644798278808, + 0.759485391998291, + 1.042400759124756, + 1.547001088142395, + 1.1331607871055602, + 1.0703241619110107, + 0.8603198796749115, + 0.8971985034942627, + 1.0760511143684388, + 1.152393785381317, + 1.4280963862895966, + 1.5006843608856202, + 1.3100523867607117, + 1.1282628120422362, + 1.2173214994430541, + 1.0435792781829833, + 1.2676011086463927, + 1.2351581176757813, + 1.246204901123047, + 1.2180886367797852, + 1.3540986360549927, + 1.219435647392273, + 1.2538528778076172, + 1.1500556253433227, + 1.055687839126587, + 1.1929910972595215, + 1.3931519176483154, + 1.4715053829193114, + 1.6093412540435792, + 1.7281322120666505, + 1.7611547931671143, + 1.7229496166229248, + 1.5543313556671143, + 1.409035835647583, + 1.281838191986084, + 1.210691173553467, + 1.1457153511047364, + 1.1038917953491212, + 1.1368809636592865, + 1.0750537950515746, + 1.078484614944458, + 1.0653290471553802, + 1.043406178855896, + 1.029171966934204, + 1.0249553047180175, + 1.0062125328063964, + 0.9868852173805237, + 0.980598240661621, + 0.9800201850891114, + 0.9732961756706238, + 0.9715418921470642, + 0.9726413438796997, + 0.9694333058834076, + 0.9690543773651124 + ], + "train_acc": [ + 0.2472, + 0.6098, + 0.7158, + 0.7471, + 0.7633, + 0.775, + 0.7733, + 0.7387, + 0.7635, + 0.765, + 0.7685, + 0.7314, + 0.7553, + 0.7495, + 0.7784, + 0.7204, + 0.6933, + 0.7259, + 0.7279, + 0.7282, + 0.7687, + 0.7487, + 0.7313, + 0.7414, + 0.7313, + 0.7547, + 0.7595, + 0.7644, + 0.7269, + 0.6914, + 0.7377, + 0.7329, + 0.7555, + 0.7575, + 0.7373, + 0.7285, + 0.7163, + 0.6928, + 0.7033, + 0.7168, + 0.6899, + 0.7089, + 0.6715, + 0.6694, + 0.6696, + 0.6666, + 0.649, + 0.6656, + 0.6545, + 0.6709, + 0.686, + 0.6767, + 0.648, + 0.6469, + 0.6339, + 0.6281, + 0.6347, + 0.6376, + 0.6473, + 0.6607, + 0.669, + 0.6811, + 0.6873, + 0.6898, + 0.6811, + 0.6921, + 0.6948, + 0.6904, + 0.6949, + 0.695, + 0.6913, + 0.6975, + 0.7004, + 0.6993, + 0.6993, + 0.7, + 0.6991, + 0.6994, + 0.7022, + 0.7017 + ], + "test_acc": [ + 0.49, + 0.659, + 0.701, + 0.7205, + 0.721, + 0.6975, + 0.708, + 0.6605, + 0.7245, + 0.6645, + 0.6145, + 0.6515, + 0.5925, + 0.6665, + 0.561, + 0.472, + 0.637, + 0.66, + 0.5885, + 0.6525, + 0.657, + 0.521, + 0.5985, + 0.5795, + 0.6475, + 0.669, + 0.6665, + 0.5875, + 0.6335, + 0.7045, + 0.633, + 0.6845, + 0.6295, + 0.6315, + 0.7015, + 0.6905, + 0.5995, + 0.6185, + 0.6335, + 0.585, + 0.652, + 0.513, + 0.5615, + 0.5745, + 0.5725, + 0.555, + 0.613, + 0.5315, + 0.6245, + 0.6495, + 0.6425, + 0.6055, + 0.611, + 0.637, + 0.582, + 0.582, + 0.587, + 0.614, + 0.6315, + 0.631, + 0.6295, + 0.644, + 0.6635, + 0.634, + 0.664, + 0.656, + 0.664, + 0.665, + 0.664, + 0.661, + 0.6635, + 0.664, + 0.6665, + 0.671, + 0.671, + 0.6655, + 0.6635, + 0.6695, + 0.6685, + 0.669 + ], + "value_loss": [ + 2.756714974594116, + 1.0699842605590821, + 0.772724876499176, + 0.7186811010360717, + 0.7039346227645874, + 0.7089841152191162, + 0.7045547727584839, + 1.0278774134635926, + 1.0351098167419435, + 0.79849758310318, + 0.8763475816726685, + 1.2047807735443115, + 1.027970889377594, + 1.0575392370224, + 0.7888917721748352, + 1.2805246074676513, + 2.225238763809204, + 1.0823904124736785, + 1.1905035690307617, + 1.642304021835327, + 0.9129455471992493, + 1.2949172660827637, + 1.9253954372406006, + 1.5692272598266601, + 2.174523571395874, + 1.989169766139984, + 1.3499937854766846, + 1.7908005687713624, + 3.913453258514404, + 8.14511700668335, + 5.840194707679749, + 4.497665633392334, + 3.1302750116348266, + 3.5435767040252686, + 4.556240005493164, + 5.435755169677734, + 9.532537229919434, + 9.881556200408935, + 6.2278411382198335, + 4.9383210889816285, + 4.416168696212768, + 3.3235662673950195, + 5.057485938262939, + 3.643429838180542, + 3.272873913192749, + 2.747176977729797, + 3.895003358268738, + 2.62603823928833, + 2.462896474838257, + 2.229940517234802, + 2.081709727478027, + 2.7063279764175414, + 3.1426480583190917, + 3.744391917037964, + 3.7624966133117677, + 3.801296794509888, + 4.549085423660278, + 4.737994041442871, + 3.6686552688598635, + 2.8817406677246096, + 2.1652517974853516, + 2.257669227409363, + 1.8863371967315674, + 1.753921750640869, + 1.704151694869995, + 1.605138656806946, + 1.366706605911255, + 1.3500237414360046, + 1.4022936582565309, + 1.1546042854309082, + 1.143458882522583, + 1.030033224105835, + 0.9880966281175614, + 0.9858702459335327, + 1.0123830188751222, + 0.8727149436950684, + 0.8251452196121216, + 0.8818260744094849, + 0.8404904095649719, + 0.8257113872528076 + ], + "term_loss": [ + 1.6504224247932433, + 0.8375917286872864, + 0.6154087921142578, + 0.5532272914409637, + 0.5395434478759765, + 0.5454418560981751, + 0.548071176624298, + 0.8495948793888092, + 0.871022064948082, + 0.6399660477638245, + 0.7113209009170532, + 1.0140180881977081, + 0.8458488144636154, + 0.8732069333314896, + 0.6247593785524368, + 1.064120747566223, + 1.9725029928207398, + 0.8703572043895721, + 0.9687161136627197, + 1.3335205810546875, + 0.6815592967748642, + 0.9841544357299805, + 1.4630473113059999, + 1.1648006004333495, + 1.6974185828447341, + 1.585868435716629, + 1.086215167760849, + 1.4794144651412964, + 3.383740266418457, + 6.938124223327637, + 5.274092036437988, + 3.881667746925354, + 2.553757908630371, + 2.978989521408081, + 3.82173573884964, + 4.520999314308167, + 8.147785523223877, + 8.00288946609497, + 5.000799319529533, + 4.125068738365173, + 3.5042172052383425, + 2.699850891304016, + 4.425766694641113, + 3.1604889556884768, + 2.7477581281661987, + 2.2315157468795777, + 3.2700717025756836, + 2.140160263442993, + 2.0445699644088746, + 1.8384040803909303, + 1.7394722784042358, + 2.334256193733215, + 2.7318620399475098, + 3.210952592277527, + 3.1114013697624205, + 3.125122370147705, + 3.922404075050354, + 4.07079298210144, + 3.0838204498291018, + 2.4635134841918944, + 1.74991473236084, + 1.8150607773780822, + 1.5140642840385437, + 1.4030307838439942, + 1.390348579788208, + 1.2754892768859862, + 1.0548970350265503, + 1.0442349720954895, + 1.079941069793701, + 0.869195331954956, + 0.8486155418395996, + 0.7500218649864197, + 0.7166386909261346, + 0.7068471017837524, + 0.7262772275924683, + 0.6089376243591309, + 0.565191646194458, + 0.6097024906158447, + 0.5746593361854553, + 0.5509136886596679 + ], + "bridge_loss": [ + 0.8274208247567294, + 0.04628952074944973, + 0.005470760084688663, + 0.022114072570204736, + 0.02619350514113903, + 0.02462219797000289, + 0.016575153788924216, + 0.012172694252431393, + 0.008306282567977906, + 0.007131045020371676, + 0.006602350142598152, + 0.007133904299885034, + 0.00889486790150404, + 0.007033539731428027, + 0.007029886939749121, + 0.016358042316138743, + 0.020663128697872162, + 0.010306563833355903, + 0.020879663941264153, + 0.10206406505107879, + 0.06092094658613205, + 0.1235328954577446, + 0.260770632982254, + 0.20950047061443328, + 0.26373723001480104, + 0.20571331169605256, + 0.07498671305179595, + 0.12556591314077378, + 0.2968582089275122, + 0.9360601034164429, + 0.34663937301635744, + 0.39642132375240324, + 0.38016364483833315, + 0.36436182782649995, + 0.5179255735874176, + 0.6902249323606491, + 1.1416879810333251, + 1.6240587829351425, + 0.9814537258118391, + 0.5799458844184876, + 0.659208872383833, + 0.39408149279356003, + 0.3656025336742401, + 0.22205486388206483, + 0.2630800589323044, + 0.25402860095500945, + 0.3471872593641281, + 0.2257408608198166, + 0.1474910190463066, + 0.13604351500570774, + 0.09966603577136994, + 0.11529678661227226, + 0.12656707118153573, + 0.24201848303973675, + 0.34999929159879684, + 0.3684466096520424, + 0.32107353453636167, + 0.36825179790854456, + 0.2991718190073967, + 0.14634431777000428, + 0.15489137840270997, + 0.19152780306339265, + 0.1264393635749817, + 0.110255957955122, + 0.06583732250332833, + 0.09188482095599175, + 0.07512128737568856, + 0.06769476855397225, + 0.08805738928318024, + 0.052597072744369505, + 0.061042466819286344, + 0.049813730967044834, + 0.043870848792791364, + 0.051897744873166084, + 0.05865620729923248, + 0.03764229657351971, + 0.03385210290849209, + 0.04558607372045517, + 0.04050549000203609, + 0.049323998257517813 + ], + "tgrad_loss": [ + 0.27887171220779416, + 0.18610301048755645, + 0.15184532343149185, + 0.143339737200737, + 0.13819767172336578, + 0.1389200611591339, + 0.1399084441423416, + 0.16610983300209045, + 0.15578146158456802, + 0.15140049700737, + 0.15842433052062987, + 0.18362878961563112, + 0.17322721722126008, + 0.17729875540733336, + 0.1571024955034256, + 0.20004582180976868, + 0.23207265706062316, + 0.2017266354560852, + 0.20090780715942383, + 0.20671938235759735, + 0.17046530573368074, + 0.18722992515563966, + 0.20157747678756713, + 0.19492619981765746, + 0.21336774530410765, + 0.19758802919387816, + 0.1887919110774994, + 0.18582018871307374, + 0.2328547879219055, + 0.2709327209472656, + 0.21946332993507386, + 0.21957662334442138, + 0.1963534575819969, + 0.20022535383701323, + 0.21657870807647706, + 0.22453099676370622, + 0.24306369013786316, + 0.2546080108642578, + 0.24558807609081268, + 0.23330649132728576, + 0.25274263796806334, + 0.2296339340209961, + 0.2661167623519897, + 0.2608860526561737, + 0.26203568353652956, + 0.2616326283454895, + 0.27774441232681274, + 0.2601371428012848, + 0.2708354802131653, + 0.25549290828704835, + 0.24257140054702758, + 0.2567750201940536, + 0.2842189628124237, + 0.29142085790634153, + 0.30109593143463137, + 0.3077278130531311, + 0.3056078572273254, + 0.29894922952651976, + 0.2856630270242691, + 0.2718828806877136, + 0.26044571537971495, + 0.25108065757751463, + 0.24583355770111084, + 0.24063498420715332, + 0.2479657948255539, + 0.2377645515680313, + 0.2366882876396179, + 0.2380939986228943, + 0.2342951997756958, + 0.2328118751525879, + 0.23380087866783142, + 0.23019764132499695, + 0.22758708037137984, + 0.2271253991127014, + 0.22744957551956177, + 0.22613502042293548, + 0.2261014585018158, + 0.2265375138759613, + 0.2253255781173706, + 0.22547370266914368 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0015124600613489747, + 0.020085982978343964, + 0.03127610310912132, + 0.03517032414674759, + 0.042219605296850204, + 0.05027471110224724, + 0.05683741718530655, + 0.057938531041145325, + 0.06581299006938934, + 0.06761687994003296, + 0.07107532024383545, + 0.07804323732852936 + ], + "perturbation_rho": [ + 0.03147998824715614, + -0.015333062037825584, + 0.020876668393611908, + 0.07304719090461731, + 0.0599740669131279, + 0.08874240517616272, + 0.05341971293091774, + 0.07721589505672455, + 0.08801877498626709, + 0.10527393221855164, + 0.16833831369876862, + 0.1291283369064331 + ], + "nudging": { + "0.001": [ + -0.00044463935773819685, + -0.00012659450294449925, + -0.0001986775896511972, + -0.0002730795240495354, + -0.0002829947043210268, + -0.00034303159918636084, + -0.0003691607271321118, + -0.00040001055458560586, + -0.00042912771459668875, + -0.00045504042645916343, + -0.00047524512046948075, + -0.0004846052033826709 + ], + "0.003": [ + -0.0013053687289357185, + -0.00038041931111365557, + -0.0005985662573948503, + -0.0008211880922317505, + -0.0008477486553601921, + -0.001032006461173296, + -0.0011103888973593712, + -0.0012022369774058461, + -0.0012896620901301503, + -0.00136495940387249, + -0.0014261011965572834, + -0.0014572828076779842 + ], + "0.01": [ + -0.004048495087772608, + -0.0012588155223056674, + -0.0019918864127248526, + -0.002725755563005805, + -0.0028244066052138805, + -0.003425109200179577, + -0.0036919033154845238, + -0.003999053034931421, + -0.0042928787879645824, + -0.004538967739790678, + -0.004742524586617947, + -0.004852524492889643 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L2_s123.json b/results/synth_ladder_v2_lo/synth_a0.0_L2_s123.json new file mode 100644 index 0000000..09aec16 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L2_s123.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7207277019500733, + 0.7790515207290649, + 0.45965238094329836, + 0.344505589389801, + 0.305948727107048, + 0.265342556476593, + 0.25686684017181394, + 0.24114981298446655, + 0.22925823230743408, + 0.23424035305976867, + 0.21124905035495758, + 0.19400378139019012, + 0.18992817602157594, + 0.20065753853321075, + 0.1758887457370758, + 0.18987385909557342, + 0.1766733213186264, + 0.17402569117546082, + 0.16750437734127044, + 0.1609703923225403, + 0.1667053633213043, + 0.15978011922836305, + 0.16382880132198333, + 0.15408793671131135, + 0.1573232760667801, + 0.15904042587280273, + 0.16996713733673097, + 0.16745088925361634, + 0.1407752888917923, + 0.1437982935667038, + 0.1288691416501999, + 0.13675620369911193, + 0.1404436342716217, + 0.1322325788140297, + 0.1205964973449707, + 0.12338397283554077, + 0.11539463124275208, + 0.11405454754829407, + 0.11564468727111817, + 0.11277760289907456, + 0.10829375276565552, + 0.10773034353256225, + 0.10590754004120827, + 0.10246410021781921, + 0.10704636499881745, + 0.10346804196238518, + 0.09824472286701202, + 0.09875981305241585, + 0.09532992283701897, + 0.09478073754310608, + 0.09963924968242645, + 0.09461190940141678, + 0.09311110566854477, + 0.09307761950492859, + 0.09144059424400329, + 0.09472406225204467, + 0.09397407406568527, + 0.08954561126232147, + 0.08714181256294251, + 0.08698110367059708, + 0.0848695909947157, + 0.08321986048221588, + 0.08306121920347213, + 0.0825563444018364, + 0.0815550530552864, + 0.08082753023505211, + 0.08034503507614135, + 0.07994237960577011, + 0.07942863342761994, + 0.07910665745735168, + 0.0787971821308136, + 0.0786789097070694, + 0.078331869161129, + 0.07799442697763442, + 0.07777877117395401, + 0.07760189070105553, + 0.07745174323320389, + 0.07733372535705567, + 0.0772703528702259, + 0.07722830307483673 + ], + "train_acc": [ + 0.4324, + 0.7882, + 0.875, + 0.9066, + 0.9012, + 0.9149, + 0.9096, + 0.9135, + 0.9191, + 0.9118, + 0.9244, + 0.9294, + 0.9321, + 0.9245, + 0.9372, + 0.9291, + 0.932, + 0.937, + 0.9356, + 0.9412, + 0.9378, + 0.9412, + 0.9395, + 0.9424, + 0.9405, + 0.9422, + 0.9318, + 0.9324, + 0.95, + 0.9485, + 0.9534, + 0.9511, + 0.9495, + 0.9511, + 0.9588, + 0.9603, + 0.9626, + 0.9636, + 0.9609, + 0.9649, + 0.9659, + 0.9662, + 0.9662, + 0.9694, + 0.9661, + 0.9688, + 0.9715, + 0.9703, + 0.9743, + 0.974, + 0.9705, + 0.9722, + 0.974, + 0.9737, + 0.9759, + 0.9726, + 0.975, + 0.9765, + 0.9784, + 0.9791, + 0.9809, + 0.9814, + 0.9807, + 0.9816, + 0.9824, + 0.9836, + 0.9833, + 0.9834, + 0.9835, + 0.9838, + 0.9846, + 0.9842, + 0.9848, + 0.9848, + 0.9846, + 0.9848, + 0.9852, + 0.9851, + 0.9852, + 0.9853 + ], + "test_acc": [ + 0.669, + 0.8435, + 0.8705, + 0.879, + 0.874, + 0.8965, + 0.899, + 0.89, + 0.8975, + 0.8895, + 0.896, + 0.903, + 0.9, + 0.902, + 0.9035, + 0.907, + 0.907, + 0.897, + 0.907, + 0.9025, + 0.9065, + 0.905, + 0.904, + 0.9025, + 0.903, + 0.906, + 0.9055, + 0.9035, + 0.919, + 0.905, + 0.9065, + 0.9085, + 0.9075, + 0.9085, + 0.911, + 0.9135, + 0.906, + 0.91, + 0.917, + 0.9215, + 0.915, + 0.9145, + 0.915, + 0.916, + 0.9155, + 0.912, + 0.916, + 0.9135, + 0.9155, + 0.9185, + 0.917, + 0.918, + 0.9215, + 0.92, + 0.9165, + 0.915, + 0.9155, + 0.917, + 0.9145, + 0.919, + 0.9165, + 0.914, + 0.9155, + 0.914, + 0.916, + 0.917, + 0.918, + 0.9185, + 0.9195, + 0.9195, + 0.9195, + 0.92, + 0.92, + 0.9205, + 0.92, + 0.9205, + 0.9195, + 0.92, + 0.9205, + 0.9205 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8634263277053833, + 0.8499601483345032 + ], + "perturbation_rho": [ + 0.9999988079071045, + 0.9999933838844299 + ], + "nudging": { + "0.001": [ + -0.022913530468940735, + -0.0076592592522501945 + ], + "0.003": [ + -0.06158487871289253, + -0.022190168499946594 + ], + "0.01": [ + -0.13922545313835144, + -0.06537239253520966 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2145429794311524, + 1.4832333190917968, + 0.8427700979232788, + 0.5642387649536132, + 0.44259997854232785, + 0.3797396701812744, + 0.36115866856575013, + 0.3420704277038574, + 0.34744873743057253, + 0.35834124784469606, + 0.34505550694465636, + 0.37205679273605347, + 0.36223536982536314, + 0.3897885517209768, + 0.3661109811067581, + 0.3905520539283752, + 0.3873382499694824, + 0.4310034593820572, + 0.379075954246521, + 0.3956090630054474, + 0.41010830894708633, + 0.3871167766094208, + 0.4128729253053665, + 0.37673398666381835, + 0.4386045214653015, + 0.4175387234687805, + 0.5163568344116211, + 0.41816404705047605, + 0.3691399229049683, + 0.3856747570514679, + 0.3798481074810028, + 0.3966631019592285, + 0.4648309063076973, + 0.3615638767376542, + 0.35468427698612215, + 0.38685988901853563, + 0.3459345358610153, + 0.3860490513801575, + 0.40029369468688963, + 0.3782256749629974, + 0.35560350346565245, + 0.3603634602546692, + 0.3720236937999725, + 0.379230254983902, + 0.3613779128074646, + 0.3320357777953148, + 0.3244936734318733, + 0.3268082529783249, + 0.316782475566864, + 0.3409638210296631, + 0.34503824408650396, + 0.31332876653671266, + 0.3428362133741379, + 0.32030015414953233, + 0.31090027656555175, + 0.3185324101924896, + 0.3263511387348175, + 0.30935111100673673, + 0.30104202661514284, + 0.30687724331617355, + 0.29393203148841857, + 0.2826761653423309, + 0.28839151701927185, + 0.2897114434480667, + 0.2847494943141937, + 0.28069971054792403, + 0.27908870706558225, + 0.2764286852836609, + 0.2836688223004341, + 0.27157128534317015, + 0.2719319869995117, + 0.27284973291158676, + 0.2693837205886841, + 0.2679568641424179, + 0.26705331959724427, + 0.26758628270626067, + 0.2656683373451233, + 0.2651437629699707, + 0.26474326791763303, + 0.26457467867136003 + ], + "train_acc": [ + 0.1934, + 0.5051, + 0.7204, + 0.8027, + 0.8378, + 0.855, + 0.8574, + 0.8678, + 0.867, + 0.8666, + 0.8729, + 0.868, + 0.8718, + 0.8671, + 0.8734, + 0.8663, + 0.8653, + 0.862, + 0.8727, + 0.8701, + 0.8711, + 0.8743, + 0.8727, + 0.8771, + 0.8627, + 0.8671, + 0.8467, + 0.8678, + 0.881, + 0.8785, + 0.8742, + 0.871, + 0.8619, + 0.8833, + 0.8836, + 0.8765, + 0.887, + 0.8747, + 0.8724, + 0.8812, + 0.8841, + 0.8831, + 0.8812, + 0.8799, + 0.8799, + 0.8887, + 0.8908, + 0.8877, + 0.8959, + 0.8881, + 0.8856, + 0.8951, + 0.8854, + 0.8905, + 0.892, + 0.892, + 0.8897, + 0.894, + 0.8976, + 0.8963, + 0.8993, + 0.9014, + 0.9001, + 0.8995, + 0.9015, + 0.9031, + 0.9016, + 0.9033, + 0.9009, + 0.9056, + 0.9043, + 0.9036, + 0.9049, + 0.9055, + 0.9051, + 0.9051, + 0.9057, + 0.9055, + 0.9061, + 0.9063 + ], + "test_acc": [ + 0.355, + 0.6045, + 0.7335, + 0.7805, + 0.8005, + 0.805, + 0.813, + 0.826, + 0.826, + 0.8285, + 0.816, + 0.821, + 0.815, + 0.828, + 0.8065, + 0.827, + 0.797, + 0.826, + 0.797, + 0.792, + 0.82, + 0.812, + 0.817, + 0.8115, + 0.806, + 0.8075, + 0.804, + 0.831, + 0.8235, + 0.827, + 0.805, + 0.8145, + 0.821, + 0.8315, + 0.813, + 0.8245, + 0.8245, + 0.8145, + 0.815, + 0.8255, + 0.8275, + 0.821, + 0.8175, + 0.8095, + 0.8385, + 0.835, + 0.8395, + 0.8305, + 0.8305, + 0.8365, + 0.826, + 0.835, + 0.834, + 0.82, + 0.8245, + 0.8285, + 0.821, + 0.836, + 0.837, + 0.833, + 0.8415, + 0.832, + 0.84, + 0.8435, + 0.8405, + 0.8465, + 0.839, + 0.849, + 0.843, + 0.8425, + 0.8395, + 0.843, + 0.8395, + 0.845, + 0.84, + 0.841, + 0.8415, + 0.841, + 0.841, + 0.841 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.048809632658958435, + 0.12263120710849762 + ], + "perturbation_rho": [ + 0.09689537435770035, + 0.10561469197273254 + ], + "nudging": { + "0.001": [ + -0.001597832073457539, + -0.00047309682122431695 + ], + "0.003": [ + -0.004742181394249201, + -0.001416387502104044 + ], + "0.01": [ + -0.015226385556161404, + -0.00468847481533885 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0100293533325195, + 1.0204413017272949, + 0.54354176902771, + 0.39702820897102353, + 0.3586913129806519, + 0.3554326295375824, + 0.361624427986145, + 0.36465097951889036, + 0.3603580026626587, + 0.3543916482686996, + 0.3507106711387634, + 0.35224332275390624, + 0.3475004379510879, + 0.3553124601364136, + 0.37312231225967407, + 0.37028597445487976, + 0.3665724731683731, + 0.37034252033233644, + 0.38506430788040164, + 0.4009858402252197, + 0.41984470853805544, + 0.4130363565444946, + 0.4252812045574188, + 0.43580607299804686, + 0.466691482257843, + 0.4120105969429016, + 0.4388778105735779, + 0.418408594417572, + 0.42251289710998535, + 0.42326131315231325, + 0.41453264694213865, + 0.4108378723144531, + 0.42514692809581756, + 0.41193596658706666, + 0.4172293882369995, + 0.4110143481254578, + 0.3909164998292923, + 0.38413406591415405, + 0.38740381708145144, + 0.38655886726379396, + 0.38635201063156127, + 0.3766866379261017, + 0.3757282977819443, + 0.37710726108551024, + 0.3712064995765686, + 0.37017061100006105, + 0.3811788000822067, + 0.3592162804841995, + 0.368729523897171, + 0.38313820214271543, + 0.3553819965362549, + 0.38453965463638307, + 0.352666961979866, + 0.35594648966789244, + 0.35147202444076536, + 0.3434806545257568, + 0.350411687374115, + 0.3472837806224823, + 0.34532749392986295, + 0.34017591814994813, + 0.33683158864974977, + 0.3410106474876404, + 0.3374420499801636, + 0.3345813477516174, + 0.33512692725658416, + 0.33064404239654543, + 0.3299761538028717, + 0.32880062866806986, + 0.3271276932477951, + 0.3273114435195923, + 0.32523203148841856, + 0.32425895788669584, + 0.32357494492530825, + 0.3230543273448944, + 0.32268554170131686, + 0.32191982040405276, + 0.32155804014205935, + 0.32106889061927796, + 0.3208657922267914, + 0.3206909418106079 + ], + "train_acc": [ + 0.2879, + 0.6675, + 0.8151, + 0.8582, + 0.8655, + 0.8656, + 0.8608, + 0.8595, + 0.8647, + 0.8689, + 0.8684, + 0.8684, + 0.8691, + 0.8643, + 0.8616, + 0.8616, + 0.8673, + 0.8624, + 0.8547, + 0.8522, + 0.8427, + 0.8437, + 0.8419, + 0.8374, + 0.8276, + 0.8474, + 0.8357, + 0.843, + 0.842, + 0.8394, + 0.8435, + 0.8439, + 0.8437, + 0.8477, + 0.8473, + 0.8446, + 0.8546, + 0.8604, + 0.8586, + 0.8571, + 0.8605, + 0.8645, + 0.8609, + 0.8647, + 0.8645, + 0.8668, + 0.8617, + 0.8685, + 0.8675, + 0.861, + 0.8705, + 0.8656, + 0.8723, + 0.8709, + 0.8723, + 0.8763, + 0.8751, + 0.8766, + 0.8715, + 0.8758, + 0.8782, + 0.8767, + 0.8801, + 0.8774, + 0.8801, + 0.8824, + 0.8806, + 0.8808, + 0.8815, + 0.8819, + 0.8825, + 0.8823, + 0.8819, + 0.883, + 0.8819, + 0.8831, + 0.8823, + 0.8828, + 0.8826, + 0.8828 + ], + "test_acc": [ + 0.5255, + 0.7235, + 0.7935, + 0.8195, + 0.8155, + 0.818, + 0.8185, + 0.8195, + 0.819, + 0.8235, + 0.8145, + 0.8175, + 0.822, + 0.8115, + 0.8185, + 0.809, + 0.809, + 0.806, + 0.7985, + 0.789, + 0.802, + 0.795, + 0.7785, + 0.767, + 0.782, + 0.7785, + 0.793, + 0.7765, + 0.798, + 0.7875, + 0.8025, + 0.799, + 0.808, + 0.794, + 0.81, + 0.8045, + 0.8135, + 0.8065, + 0.8235, + 0.8165, + 0.819, + 0.8085, + 0.8145, + 0.8115, + 0.8125, + 0.815, + 0.819, + 0.812, + 0.8155, + 0.8175, + 0.8125, + 0.811, + 0.8125, + 0.8235, + 0.8155, + 0.8145, + 0.8215, + 0.816, + 0.818, + 0.8225, + 0.825, + 0.8205, + 0.818, + 0.818, + 0.8235, + 0.824, + 0.8185, + 0.8175, + 0.821, + 0.818, + 0.8195, + 0.822, + 0.8185, + 0.8205, + 0.82, + 0.8195, + 0.8205, + 0.82, + 0.822, + 0.822 + ], + "state_pred_error": [ + 0.7962929263591766, + 0.331514656496048, + 0.19661902210712434, + 0.16503102767467498, + 0.14755443301200866, + 0.12628681234121322, + 0.10449981281757355, + 0.08584924747943878, + 0.0699757203578949, + 0.05582202136516571, + 0.04389634461402893, + 0.036387173852324484, + 0.03049680006802082, + 0.02591462894678116, + 0.02221634505391121, + 0.019373500156402587, + 0.017665761670470237, + 0.0157645114377141, + 0.014524527588486671, + 0.013737535402178765, + 0.012687528398633003, + 0.011898116055130959, + 0.011640684556961059, + 0.010859360812604427, + 0.010485637862980365, + 0.009991707500815392, + 0.009739254067838193, + 0.008777845013141631, + 0.00828778415173292, + 0.008094209410250188, + 0.007691447506099939, + 0.007422742694616318, + 0.007276442471146584, + 0.006999653156101703, + 0.0067770635947585105, + 0.006470148958265781, + 0.006286166054010391, + 0.00604953683167696, + 0.006004941011965275, + 0.005863147027045488, + 0.005500460632890463, + 0.005411263838410377, + 0.005238449747860432, + 0.005156481459736824, + 0.004926877556741238, + 0.004763428920507431, + 0.004753794524073601, + 0.004590867299586535, + 0.004666488307341933, + 0.004403108169138432, + 0.004165763948857784, + 0.00412739000916481, + 0.0041623744465410705, + 0.004234333600848913, + 0.004279930933192373, + 0.00375170355848968, + 0.003802278782427311, + 0.0036928312376141546, + 0.0036528290495276452, + 0.0038295471183955668, + 0.003527464033663273, + 0.0033376181811094283, + 0.003297599468007684, + 0.0033206129163503646, + 0.003547699999809265, + 0.0032429821506142617, + 0.0031518954910337927, + 0.003168932900391519, + 0.002991512390971184, + 0.0029735447630286215, + 0.0029666012093424797, + 0.0029554983984678984, + 0.002873803383857012, + 0.002869913595914841, + 0.00284024139046669, + 0.0029223025660961867, + 0.0027367467910051346, + 0.0027474096663296223, + 0.0026910540357232096, + 0.0027065009888261556 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9309895038604736, + 0.47941499948501587 + ], + "perturbation_rho": [ + 0.8439192175865173, + 0.37250760197639465 + ], + "nudging": { + "0.001": [ + -0.0257757268846035, + -0.0026356291491538286 + ], + "0.003": [ + -0.07368925958871841, + -0.007871035486459732 + ], + "0.01": [ + -0.2068808674812317, + -0.025803586468100548 + ] + }, + "state_pred_error_per_layer": [ + 436.0709533691406, + 352.44915771484375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2166633338928223, + 1.4822776604652406, + 0.8527356213569641, + 0.5706128049373627, + 0.43896263313293454, + 0.38758574914932253, + 0.3662052785873413, + 0.35315943990945814, + 0.3356183546543121, + 0.3451760648012161, + 0.35537444372177124, + 0.3936114372730255, + 0.35565873963832856, + 0.3649965980768204, + 0.37292858068943024, + 0.3939949078083038, + 0.39196848384141925, + 0.39390314302444457, + 0.42576994676589963, + 0.4276782782554627, + 0.49126899070739743, + 0.5104124393463135, + 0.5060470756292343, + 0.5146438408851624, + 0.5792045258522034, + 0.58794528465271, + 0.6390262460947037, + 0.6486665966033935, + 0.6689690710544586, + 0.7052691784381866, + 0.7274600021362305, + 0.7133333879470826, + 0.7636545959472656, + 0.7814437804698944, + 0.7844102795600891, + 0.775709469127655, + 0.8138838304996491, + 0.8132558471679687, + 0.8678097775459289, + 0.8119752780914307, + 0.8714342193603516, + 0.9063542318344117, + 0.925028806400299, + 0.8863205076217652, + 0.9204323357582093, + 0.9434663917541504, + 0.9461792286872863, + 0.9343688268661499, + 0.9500316833496094, + 0.9462117325782776, + 0.9365047801971436, + 0.935371301651001, + 0.9619980144500733, + 0.9775615167617798, + 0.9611524658203126, + 0.9673760023117065, + 0.9664952352523803, + 0.9738808612823486, + 0.9750494892120362, + 0.997103341293335, + 0.9816123373031617, + 0.9958496462821961, + 1.0000357272148133, + 0.9956781629562378, + 1.0005756943702697, + 1.0038517833709717, + 1.0042228302001952, + 1.0025716598510743, + 1.002968798828125, + 1.0022998886108399, + 1.0010733880996705, + 0.9982695043563843, + 0.9950118174552918, + 0.9933666072845458, + 0.9921276975631714, + 0.990613134765625, + 0.9894881931304932, + 0.9888591194152831, + 0.9883952844619751, + 0.9880848827362061 + ], + "train_acc": [ + 0.1912, + 0.5078, + 0.712, + 0.8031, + 0.8345, + 0.8512, + 0.8565, + 0.8636, + 0.8719, + 0.8714, + 0.8708, + 0.8646, + 0.8746, + 0.8757, + 0.8688, + 0.866, + 0.867, + 0.8694, + 0.8589, + 0.8607, + 0.8507, + 0.8413, + 0.8457, + 0.8431, + 0.8284, + 0.822, + 0.8066, + 0.8036, + 0.7986, + 0.7888, + 0.7845, + 0.7843, + 0.7753, + 0.764, + 0.7626, + 0.7606, + 0.7499, + 0.7428, + 0.7326, + 0.738, + 0.7238, + 0.7095, + 0.7052, + 0.7201, + 0.7072, + 0.7003, + 0.6995, + 0.6979, + 0.699, + 0.6974, + 0.701, + 0.6997, + 0.6946, + 0.6889, + 0.6945, + 0.6899, + 0.6912, + 0.6881, + 0.6871, + 0.6842, + 0.6865, + 0.6847, + 0.6883, + 0.6848, + 0.6851, + 0.6841, + 0.6878, + 0.6856, + 0.6872, + 0.6879, + 0.686, + 0.6866, + 0.6869, + 0.6855, + 0.6881, + 0.6875, + 0.688, + 0.6885, + 0.6881, + 0.6881 + ], + "test_acc": [ + 0.348, + 0.5945, + 0.728, + 0.782, + 0.7995, + 0.811, + 0.8105, + 0.818, + 0.825, + 0.8175, + 0.811, + 0.8265, + 0.824, + 0.821, + 0.821, + 0.8255, + 0.8055, + 0.827, + 0.814, + 0.77, + 0.795, + 0.789, + 0.788, + 0.783, + 0.764, + 0.7615, + 0.7575, + 0.7545, + 0.734, + 0.735, + 0.728, + 0.7295, + 0.718, + 0.721, + 0.7195, + 0.709, + 0.687, + 0.661, + 0.671, + 0.6885, + 0.6745, + 0.6765, + 0.6655, + 0.6745, + 0.657, + 0.675, + 0.6705, + 0.6505, + 0.6705, + 0.673, + 0.6785, + 0.666, + 0.6705, + 0.6695, + 0.669, + 0.6715, + 0.672, + 0.666, + 0.6715, + 0.6685, + 0.674, + 0.6665, + 0.6655, + 0.6695, + 0.6565, + 0.6595, + 0.6655, + 0.6545, + 0.6655, + 0.6625, + 0.6615, + 0.6615, + 0.6645, + 0.666, + 0.6625, + 0.664, + 0.6635, + 0.6635, + 0.6635, + 0.664 + ], + "value_loss": [ + 2.862312266921997, + 0.7870045631408692, + 0.5866680012226104, + 0.487851585483551, + 0.42467003531455993, + 0.42933752834796907, + 0.4517250923156738, + 0.49036711559295654, + 0.5370833713054657, + 0.5225693160533905, + 0.5723625789642334, + 0.6810438357830048, + 0.6196456489801407, + 0.6161580103397369, + 0.6767898920059204, + 0.6839942785263061, + 0.7228468099951744, + 0.731743062210083, + 0.8153413344562054, + 0.8487729335784913, + 1.1239148555755616, + 1.111784733581543, + 1.0937595278739929, + 1.1393394327163697, + 1.3184698207855226, + 1.2240205763816834, + 1.281676392173767, + 1.3282772884368896, + 1.277956589794159, + 1.3837186878204346, + 1.3530437088012695, + 1.1659054378509521, + 1.209618302154541, + 1.0256237523555756, + 0.9905264866828919, + 0.8770509265899659, + 0.9170616325616836, + 0.8460413787841797, + 0.978120857000351, + 0.7710761907577515, + 0.7819046745300293, + 0.8031992895126343, + 0.8599374737739564, + 0.7989227243423462, + 0.8483824888706207, + 0.838105262184143, + 0.831775927734375, + 0.8010647817611695, + 0.7901058013916016, + 0.7647614275455474, + 0.764328832244873, + 0.7659363707542419, + 0.7591242840766906, + 0.793391801738739, + 0.774118152999878, + 0.6988259189605713, + 0.7934306571006775, + 0.754872838139534, + 0.7264098434448242, + 0.7199796464920044, + 0.7088566905021667, + 0.7621092021942139, + 0.7465033507347107, + 0.7402997331619263, + 0.697352447605133, + 0.722913084411621, + 0.7380389479637146, + 0.6805807943344117, + 0.6974307493209839, + 0.6769652221679687, + 0.6623517539978028, + 0.6548144243717193, + 0.6477350507736206, + 0.6379247413635254, + 0.6550224852561951, + 0.6673833505630493, + 0.6371668090820313, + 0.6245359985351563, + 0.6310369262695312, + 0.6019191103935242 + ], + "term_loss": [ + 1.6362721346855165, + 0.37781597232818603, + 0.35956392331123355, + 0.30113453228473663, + 0.2540520797491074, + 0.26107953673601153, + 0.28645103769302366, + 0.33103201488256456, + 0.3847377519249916, + 0.369207483792305, + 0.41831262006759645, + 0.5161090086460114, + 0.4692179684817791, + 0.4602657828330994, + 0.5237038430452347, + 0.5198972980499268, + 0.5641665159583091, + 0.5718718901395797, + 0.6431136459127068, + 0.677467121887207, + 0.9314209022521973, + 0.9112024291992188, + 0.8943795773983002, + 0.9359503910779953, + 1.0914871151924133, + 0.9879622640609741, + 1.026415785932541, + 1.078644213104248, + 1.0273881074905395, + 1.1246179870605468, + 1.085285704421997, + 0.8998660541534423, + 0.9242175249814987, + 0.7358711883544922, + 0.6963623027563095, + 0.5854673199653625, + 0.6217934660077095, + 0.5570110441207886, + 0.6709790559053421, + 0.4901563432216644, + 0.4858744155883789, + 0.4959319089889526, + 0.5449313802719116, + 0.4945675350189209, + 0.5295222800731659, + 0.5174280918598175, + 0.5047948003768921, + 0.4674406248092651, + 0.4568398364067078, + 0.4325192159175873, + 0.4349327120780945, + 0.4375899739265442, + 0.42619164731502535, + 0.45259529867172243, + 0.4362746577501297, + 0.36338143222332003, + 0.4524987346172333, + 0.4116030908584595, + 0.38697444515228274, + 0.3790359831929207, + 0.3727722673654556, + 0.41500336648225783, + 0.4030157947540283, + 0.39471385617256166, + 0.35684009437263015, + 0.37995485734939577, + 0.3932207664966583, + 0.3434924767494202, + 0.3561821739196777, + 0.33800402256250384, + 0.32919570360183714, + 0.32527549781799314, + 0.32046796481013295, + 0.3076671746253967, + 0.32101710920333865, + 0.329897655916214, + 0.3110539279192686, + 0.289623655128479, + 0.30524736881256104, + 0.28414561631679536 + ], + "bridge_loss": [ + 0.9257246531827085, + 0.11931550175547599, + 0.019036986203491688, + 0.009200494468957186, + 0.01670405386686325, + 0.022144653449952603, + 0.02092598076760769, + 0.017403891210258007, + 0.014749217769503593, + 0.014875961096584797, + 0.012387205076217652, + 0.013591324252635241, + 0.01249192453622818, + 0.015692542472481728, + 0.011785203318297863, + 0.014191117997467518, + 0.012356174829602242, + 0.015679762499034404, + 0.018022386149317025, + 0.018556285762786864, + 0.025691469037532805, + 0.027234909960627555, + 0.026883753621578216, + 0.02885721744298935, + 0.036984953236579896, + 0.042136997365951535, + 0.04648944373428822, + 0.0383615080177784, + 0.03299343649148941, + 0.036316176214814186, + 0.037490837126970294, + 0.03762312990427017, + 0.04573201023340225, + 0.04586766301393509, + 0.05017340140193701, + 0.048964026015996934, + 0.044927955681830646, + 0.03785374255180359, + 0.0429724424123764, + 0.028634057849645615, + 0.032143977612257006, + 0.03326438666582108, + 0.038441793063282964, + 0.03851528071463108, + 0.04538965437486768, + 0.041940523386001585, + 0.04745692467689514, + 0.05371042605638504, + 0.053415575397014615, + 0.053903627383708956, + 0.05321261163949966, + 0.053114770835638044, + 0.0531739701628685, + 0.057856653088331225, + 0.059756802570819854, + 0.05648564575314522, + 0.06359097779989242, + 0.06458331343829632, + 0.060640481400489804, + 0.05943436603546143, + 0.058031611156463624, + 0.06803198567032814, + 0.06276154099106789, + 0.06635524654388428, + 0.06129389543533325, + 0.06432680562734604, + 0.06636923305988311, + 0.059899713945388795, + 0.0640624837398529, + 0.062204831221699716, + 0.057054962158203125, + 0.054482452845573424, + 0.05312725995779038, + 0.05630911908447742, + 0.06101996395587921, + 0.06387735533714295, + 0.0534395126581192, + 0.0628511904478073, + 0.0538769678235054, + 0.04602321577072144 + ], + "tgrad_loss": [ + 0.3003154767036438, + 0.2898730874300003, + 0.20806708674430846, + 0.17751656254529952, + 0.15391390190124513, + 0.14611333754062653, + 0.14434807376861572, + 0.14193120997697115, + 0.13759640024900435, + 0.13848587619662284, + 0.14166275129318237, + 0.15134349975585937, + 0.13793575568199157, + 0.14019968309402467, + 0.14130084238052368, + 0.14990585656166078, + 0.1463241186618805, + 0.14419140665531158, + 0.1542052926674485, + 0.1527495301246643, + 0.1668024854183197, + 0.17334739017486572, + 0.17249620418548584, + 0.17453181505203247, + 0.18999774327278138, + 0.1939213035583496, + 0.2087711593389511, + 0.2112715651512146, + 0.21757504351139068, + 0.22278451583385467, + 0.23026716661453248, + 0.2284162474632263, + 0.23966876842975615, + 0.24388489694595336, + 0.24399078636169433, + 0.24261958465576172, + 0.25034020925164224, + 0.2511765937805176, + 0.2641693664073944, + 0.2522857914686203, + 0.2638862795829773, + 0.2740029864311218, + 0.2765643033981323, + 0.2658399072170258, + 0.2734705581665039, + 0.27873664593696595, + 0.27952420189380645, + 0.2799137293815613, + 0.279850385761261, + 0.2783385745048523, + 0.27618350377082823, + 0.27523162972927095, + 0.2797586728334427, + 0.28293985466957094, + 0.2780866926670075, + 0.2789588441610336, + 0.27734094581604, + 0.27868643355369566, + 0.27879491510391236, + 0.2815093013763428, + 0.2780528148651123, + 0.2790738520145416, + 0.2807260126113892, + 0.27923062591552733, + 0.2792184523820877, + 0.2786314179420471, + 0.27844894323349, + 0.2771886028289795, + 0.2771860946416855, + 0.2767563671588898, + 0.2761010935783386, + 0.2750564743757248, + 0.2741398271083832, + 0.27394844496250154, + 0.2729854103088379, + 0.2736083378314972, + 0.2726733682632446, + 0.27206115741729736, + 0.2719125874519348, + 0.27175028200149537 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.08253486454486847, + 0.21193227171897888 + ], + "perturbation_rho": [ + 0.16999724507331848, + 0.38439691066741943 + ], + "nudging": { + "0.001": [ + -0.006295680068433285, + -0.0018268785206601024 + ], + "0.003": [ + -0.01877513900399208, + -0.005475326906889677 + ], + "0.01": [ + -0.06126694008708, + -0.018186643719673157 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L2_s42.json b/results/synth_ladder_v2_lo/synth_a0.0_L2_s42.json new file mode 100644 index 0000000..45cc27d --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L2_s42.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7469921964645385, + 0.7762492984771728, + 0.4454891031265259, + 0.3439776607513428, + 0.30045424115657804, + 0.26611735553741456, + 0.2505315256118774, + 0.24360769803524018, + 0.22747097635269165, + 0.21351920757293702, + 0.22532537747621537, + 0.19045140881538392, + 0.21200945961475373, + 0.18350264816284179, + 0.19344435539245605, + 0.19839551146030426, + 0.18061033978462218, + 0.18738391342163085, + 0.18450877788066863, + 0.1632273875951767, + 0.16299721558094024, + 0.16514803619384766, + 0.1703759162902832, + 0.15658577971458434, + 0.14988700304031372, + 0.15264777562618256, + 0.14738776090145111, + 0.13500966317653657, + 0.1457256983742118, + 0.13223446586132048, + 0.13609031571149827, + 0.13583973288536072, + 0.1469111985206604, + 0.13777201886177062, + 0.13065203895568847, + 0.12617083721160888, + 0.1321597861289978, + 0.12395665965080262, + 0.11719741675853729, + 0.11553976912498475, + 0.11449888982772827, + 0.11582267075777054, + 0.11140473079681397, + 0.11012234913110733, + 0.10696516524553298, + 0.10496284217834473, + 0.10164717164635659, + 0.09967014385461807, + 0.09949336104393006, + 0.09992695951461791, + 0.09878557796478271, + 0.0970326550245285, + 0.09741161692142486, + 0.09751687405109405, + 0.09623571313023567, + 0.09284615292549134, + 0.0957500367641449, + 0.09338720336854457, + 0.09024579298496246, + 0.08942505007982254, + 0.08785170428752899, + 0.08733722891807556, + 0.08688130040168762, + 0.08673911666870117, + 0.08548909291028976, + 0.08519326827526093, + 0.08429346961975098, + 0.08352354682683945, + 0.08309621875286102, + 0.08272465426325798, + 0.08228744316101075, + 0.08209771162867546, + 0.08182088244557381, + 0.08152369939088822, + 0.08132276413440705, + 0.08110721132159233, + 0.08096936017274857, + 0.08085654984712601, + 0.08079161962270737, + 0.08074765578508378 + ], + "train_acc": [ + 0.4186, + 0.794, + 0.8784, + 0.8999, + 0.9031, + 0.9152, + 0.9146, + 0.9133, + 0.921, + 0.9255, + 0.915, + 0.9361, + 0.9218, + 0.9335, + 0.9261, + 0.9272, + 0.9335, + 0.932, + 0.9311, + 0.9429, + 0.9413, + 0.9402, + 0.9383, + 0.9425, + 0.9462, + 0.9424, + 0.9487, + 0.9543, + 0.9483, + 0.9555, + 0.9531, + 0.9531, + 0.9454, + 0.9526, + 0.9564, + 0.9572, + 0.9548, + 0.9578, + 0.9611, + 0.9644, + 0.9644, + 0.9634, + 0.966, + 0.9664, + 0.9675, + 0.9682, + 0.9708, + 0.9716, + 0.9738, + 0.9711, + 0.974, + 0.9742, + 0.9739, + 0.9723, + 0.9728, + 0.9778, + 0.9738, + 0.9747, + 0.9771, + 0.9784, + 0.9793, + 0.9797, + 0.9803, + 0.9807, + 0.9809, + 0.981, + 0.9813, + 0.9821, + 0.9822, + 0.9821, + 0.9822, + 0.9832, + 0.983, + 0.9833, + 0.9833, + 0.9832, + 0.9836, + 0.9838, + 0.9839, + 0.9841 + ], + "test_acc": [ + 0.674, + 0.8355, + 0.8645, + 0.8825, + 0.874, + 0.878, + 0.886, + 0.8895, + 0.889, + 0.8865, + 0.89, + 0.8995, + 0.894, + 0.8955, + 0.891, + 0.893, + 0.896, + 0.898, + 0.9015, + 0.901, + 0.903, + 0.91, + 0.906, + 0.9105, + 0.901, + 0.9105, + 0.9095, + 0.908, + 0.9015, + 0.911, + 0.909, + 0.9075, + 0.9065, + 0.901, + 0.9065, + 0.908, + 0.9095, + 0.913, + 0.9125, + 0.9155, + 0.9155, + 0.9125, + 0.9165, + 0.9105, + 0.914, + 0.9155, + 0.9155, + 0.9155, + 0.921, + 0.918, + 0.9145, + 0.9185, + 0.9185, + 0.9195, + 0.917, + 0.9185, + 0.9165, + 0.9155, + 0.916, + 0.916, + 0.9175, + 0.9175, + 0.9165, + 0.9175, + 0.918, + 0.9205, + 0.9185, + 0.9195, + 0.9195, + 0.9185, + 0.919, + 0.92, + 0.9195, + 0.9185, + 0.918, + 0.918, + 0.9185, + 0.9185, + 0.9185, + 0.9185 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9016435146331787, + 0.885430634021759 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999956488609314 + ], + "nudging": { + "0.001": [ + -0.025333665311336517, + -0.008427875116467476 + ], + "0.003": [ + -0.06789667904376984, + -0.024404384195804596 + ], + "0.01": [ + -0.1530623733997345, + -0.07174263894557953 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2672516973495482, + 1.5406763599395752, + 0.8734839607238769, + 0.5719744925498962, + 0.43795060081481935, + 0.3796915352344513, + 0.3515102066040039, + 0.34363653602600097, + 0.346579896068573, + 0.3523189636230469, + 0.36527162773907185, + 0.354346701669693, + 0.36580664479769764, + 0.3704022624015808, + 0.38606751427650454, + 0.39586514394283295, + 0.39508123254776, + 0.3993864247083664, + 0.37308432426452637, + 0.37541835613250735, + 0.39490375390052795, + 0.41886737365722654, + 0.42669332542419436, + 0.4329951783180237, + 0.41213310742378234, + 0.41604060430526735, + 0.439035751914978, + 0.4203595119476318, + 0.4442571120105684, + 0.3852801851511002, + 0.4143046700000763, + 0.40898334140777587, + 0.4385781176567078, + 0.4152657918930054, + 0.3895705045700073, + 0.37223660364151, + 0.44713057374954224, + 0.39130793590545654, + 0.4226909558773041, + 0.40002760217189787, + 0.40161972694396975, + 0.40211384024620056, + 0.35893915023803713, + 0.3810792253375053, + 0.3602697286605835, + 0.39281459631919863, + 0.36947657871246337, + 0.35637855994701384, + 0.3324590299606323, + 0.3467387020111084, + 0.36033435146808623, + 0.33432699961662293, + 0.34486105864048006, + 0.33717776260375976, + 0.3389194183349609, + 0.33332413997650145, + 0.3654030384540558, + 0.33450953476428985, + 0.3124741755962372, + 0.318544306409359, + 0.30823197283744813, + 0.3136479189872742, + 0.31080177907943723, + 0.3169054593086243, + 0.3074277029514313, + 0.30450149250030517, + 0.30927493453025817, + 0.3046170944571495, + 0.2992845245361328, + 0.3026343915730715, + 0.29540148811340333, + 0.29762721849679946, + 0.29338113285303113, + 0.29300176270604134, + 0.2912304340839386, + 0.2921901733696461, + 0.29031082172393796, + 0.2895033945083618, + 0.2892534152030945, + 0.2889680833816528 + ], + "train_acc": [ + 0.1707, + 0.4868, + 0.6988, + 0.7929, + 0.8367, + 0.8555, + 0.866, + 0.873, + 0.8721, + 0.8736, + 0.8709, + 0.8743, + 0.8744, + 0.8735, + 0.8726, + 0.873, + 0.8759, + 0.8706, + 0.8758, + 0.879, + 0.8741, + 0.8645, + 0.8702, + 0.8677, + 0.8714, + 0.8741, + 0.8644, + 0.8692, + 0.8643, + 0.8824, + 0.8701, + 0.8755, + 0.8675, + 0.8737, + 0.8813, + 0.8809, + 0.8657, + 0.8804, + 0.8722, + 0.8754, + 0.8757, + 0.8753, + 0.8879, + 0.8822, + 0.8884, + 0.8823, + 0.8806, + 0.8855, + 0.8935, + 0.893, + 0.8867, + 0.8912, + 0.8868, + 0.8913, + 0.8911, + 0.8926, + 0.8844, + 0.8921, + 0.8996, + 0.8933, + 0.8985, + 0.8971, + 0.8978, + 0.8939, + 0.9007, + 0.9005, + 0.8987, + 0.8986, + 0.9016, + 0.9009, + 0.9022, + 0.9008, + 0.9041, + 0.9027, + 0.9035, + 0.9042, + 0.9041, + 0.9038, + 0.9039, + 0.9041 + ], + "test_acc": [ + 0.3125, + 0.5955, + 0.726, + 0.775, + 0.7965, + 0.8115, + 0.8185, + 0.823, + 0.814, + 0.8095, + 0.8235, + 0.818, + 0.8225, + 0.802, + 0.8155, + 0.8165, + 0.8145, + 0.8135, + 0.826, + 0.8315, + 0.8215, + 0.817, + 0.8075, + 0.7745, + 0.8085, + 0.817, + 0.8235, + 0.7995, + 0.821, + 0.795, + 0.8085, + 0.822, + 0.8145, + 0.8365, + 0.8175, + 0.8085, + 0.8175, + 0.804, + 0.8235, + 0.8135, + 0.818, + 0.812, + 0.8305, + 0.827, + 0.827, + 0.822, + 0.8145, + 0.8365, + 0.8235, + 0.8325, + 0.8365, + 0.83, + 0.8215, + 0.816, + 0.8315, + 0.835, + 0.838, + 0.8415, + 0.839, + 0.834, + 0.841, + 0.8325, + 0.8355, + 0.837, + 0.8425, + 0.8445, + 0.8355, + 0.8385, + 0.8435, + 0.8375, + 0.8405, + 0.8425, + 0.8415, + 0.8435, + 0.842, + 0.8425, + 0.842, + 0.844, + 0.842, + 0.842 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.003507068380713463, + 0.06432205438613892 + ], + "perturbation_rho": [ + 0.009520611725747585, + 0.008434494026005268 + ], + "nudging": { + "0.001": [ + -0.0002756889152806252, + -0.00020426382252480835 + ], + "0.003": [ + -0.0007265026797540486, + -0.0006114119896665215 + ], + "0.01": [ + -0.0012172441929578781, + -0.002031015930697322 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.035005982208252, + 1.0625006386756897, + 0.5681396248340607, + 0.40292615756988526, + 0.35494276213645937, + 0.35367286462783815, + 0.3522244266748428, + 0.3483129674911499, + 0.3471846503138542, + 0.339002624130249, + 0.3345070185661316, + 0.32301185145378114, + 0.33057213478088376, + 0.32907251510620117, + 0.3413796614646912, + 0.3397313566684723, + 0.34876382074356077, + 0.37978848781585695, + 0.3638390887260437, + 0.38385889353752134, + 0.37183677554130556, + 0.3724878916740417, + 0.37140159249305726, + 0.36678935465812684, + 0.39441064119338987, + 0.3975552704811096, + 0.37753898453712464, + 0.3906581982135773, + 0.37475493841171265, + 0.37576223373413087, + 0.3782484645366669, + 0.37623033885359763, + 0.36558109712600706, + 0.3910276884615421, + 0.3600040744304657, + 0.36322228198051454, + 0.3801977564573288, + 0.36730438537597654, + 0.3575902397632599, + 0.37418701705932617, + 0.3590826825141907, + 0.3950372566223144, + 0.36714599866867065, + 0.3721199869632721, + 0.3592522024154663, + 0.35940034481287003, + 0.34905432891845706, + 0.3683148382663727, + 0.3443241489171982, + 0.3423384827136993, + 0.3531889009475708, + 0.34689038696289065, + 0.35813456788063047, + 0.35032057762145996, + 0.3468820187568665, + 0.3417310636520386, + 0.3436132889151573, + 0.3363162727832794, + 0.33885444416999816, + 0.3382028401374817, + 0.3337278725862503, + 0.32967933921813963, + 0.33579480311870574, + 0.3290024467945099, + 0.32965006504058836, + 0.32792007284164426, + 0.32932969875335694, + 0.3255772262096405, + 0.3246876961708069, + 0.3239794743061066, + 0.32336828413009644, + 0.32233704478740693, + 0.32169947628974915, + 0.3200554334640503, + 0.3199539676547051, + 0.31967375645637514, + 0.3195785717487335, + 0.318930774641037, + 0.3186777819395065, + 0.3185241099357605 + ], + "train_acc": [ + 0.2702, + 0.6491, + 0.8061, + 0.8554, + 0.8668, + 0.8634, + 0.8662, + 0.8688, + 0.8671, + 0.8702, + 0.8729, + 0.8782, + 0.8732, + 0.8719, + 0.8673, + 0.8678, + 0.8671, + 0.8563, + 0.8596, + 0.854, + 0.8605, + 0.8572, + 0.8592, + 0.8646, + 0.8541, + 0.8505, + 0.8577, + 0.8555, + 0.8621, + 0.8601, + 0.863, + 0.8583, + 0.8668, + 0.8577, + 0.8657, + 0.862, + 0.8547, + 0.8652, + 0.8667, + 0.8618, + 0.867, + 0.8564, + 0.8662, + 0.8633, + 0.8686, + 0.8658, + 0.8734, + 0.8632, + 0.8724, + 0.8748, + 0.8728, + 0.8697, + 0.8659, + 0.8727, + 0.8756, + 0.8783, + 0.8745, + 0.8766, + 0.8747, + 0.8767, + 0.8764, + 0.8802, + 0.8779, + 0.879, + 0.8787, + 0.8781, + 0.8788, + 0.8802, + 0.8798, + 0.88, + 0.8814, + 0.8811, + 0.8817, + 0.8829, + 0.8819, + 0.8821, + 0.8827, + 0.8825, + 0.8824, + 0.8825 + ], + "test_acc": [ + 0.503, + 0.7255, + 0.797, + 0.817, + 0.8245, + 0.8205, + 0.825, + 0.824, + 0.8225, + 0.8195, + 0.819, + 0.804, + 0.815, + 0.803, + 0.812, + 0.806, + 0.805, + 0.787, + 0.788, + 0.7925, + 0.7975, + 0.787, + 0.7985, + 0.7925, + 0.794, + 0.7845, + 0.788, + 0.8, + 0.809, + 0.7955, + 0.79, + 0.804, + 0.7995, + 0.8195, + 0.802, + 0.8105, + 0.805, + 0.807, + 0.788, + 0.8005, + 0.799, + 0.805, + 0.8055, + 0.812, + 0.8145, + 0.8125, + 0.81, + 0.816, + 0.814, + 0.811, + 0.8095, + 0.807, + 0.815, + 0.8165, + 0.8155, + 0.822, + 0.8125, + 0.816, + 0.824, + 0.818, + 0.8225, + 0.8235, + 0.8225, + 0.8235, + 0.822, + 0.823, + 0.826, + 0.8225, + 0.8245, + 0.825, + 0.8305, + 0.8265, + 0.8245, + 0.825, + 0.8245, + 0.8255, + 0.8255, + 0.8245, + 0.825, + 0.825 + ], + "state_pred_error": [ + 0.7930344770431519, + 0.33453584871292114, + 0.20085580315589904, + 0.1662054708957672, + 0.1484192388534546, + 0.12706449398994446, + 0.1051150745511055, + 0.0862806459903717, + 0.07003339284062386, + 0.056576034367084506, + 0.04550816717147827, + 0.037443365716934206, + 0.03156180031001568, + 0.026521402359008787, + 0.024098804253339767, + 0.020684491539001464, + 0.018775052654743194, + 0.016968464668095113, + 0.015761400666832924, + 0.0148261524528265, + 0.013772383904457092, + 0.012841872078180314, + 0.01212171582430601, + 0.011358869352936745, + 0.010760826092958451, + 0.010395293319225311, + 0.009721535283327103, + 0.009380436344444751, + 0.008714642544090748, + 0.00832201651930809, + 0.007944079050421715, + 0.007537899447977543, + 0.007203187400847673, + 0.006980897760391235, + 0.0067270153641700746, + 0.006773905930668116, + 0.006287054452300072, + 0.006013905717432499, + 0.005785777585208416, + 0.00562433947250247, + 0.005380938850343227, + 0.005262843784689903, + 0.005085598437488079, + 0.00498003980666399, + 0.004932753546535969, + 0.005003796426951885, + 0.004590760344266891, + 0.004599673649668693, + 0.00439439031817019, + 0.00423201487660408, + 0.004100750351697206, + 0.004011376547813416, + 0.003973590862005949, + 0.004097817398235202, + 0.0037751846626400947, + 0.0036597197454422714, + 0.003587385104969144, + 0.0035407144874334334, + 0.003462031126394868, + 0.0033322377867996693, + 0.0033507585413753986, + 0.003264742435514927, + 0.003270072665065527, + 0.0031124879892915486, + 0.003089210972934961, + 0.003064330695942044, + 0.0030382187522947786, + 0.002925222585350275, + 0.003029374345391989, + 0.0030071801479905846, + 0.0029380858182907104, + 0.002891799750179052, + 0.0028872372664511202, + 0.0027601104773581028, + 0.002647246193885803, + 0.003206372195482254, + 0.002585273112356663, + 0.0026350405309349297, + 0.0025491194140166043, + 0.002513679987192154 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9153801202774048, + 0.4171057343482971 + ], + "perturbation_rho": [ + 0.8286964893341064, + 0.3651735186576843 + ], + "nudging": { + "0.001": [ + -0.028001569211483, + -0.003089441917836666 + ], + "0.003": [ + -0.08059416711330414, + -0.00922414381057024 + ], + "0.01": [ + -0.23136131465435028, + -0.030226988717913628 + ] + }, + "state_pred_error_per_layer": [ + 438.86456298828125, + 353.2518310546875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2677657585144044, + 1.5392805450439453, + 0.8744732268333435, + 0.568014195728302, + 0.4398987528085709, + 0.3760902978897095, + 0.3541576505661011, + 0.3411660843849182, + 0.34918038940429685, + 0.3663975031852722, + 0.35367102298736575, + 0.3754954501867294, + 0.36713659081459044, + 0.38618344717025754, + 0.3743376718521118, + 0.40900271940231325, + 0.393092963218689, + 0.40236372089385986, + 0.40079734888076785, + 0.4382667214393616, + 0.45539406690597534, + 0.482037882232666, + 0.48538611330986026, + 0.5342730137348175, + 0.5415242199420929, + 0.5768073871612549, + 0.6066906931877136, + 0.5891243501663208, + 0.6048513441085815, + 0.6677637449264526, + 0.6201698928833008, + 0.6366922058105469, + 0.6642072593688965, + 0.6999521923065185, + 0.6945115597724915, + 0.6664895143508911, + 0.7284628839492798, + 0.6817547720909118, + 0.6409681924819947, + 0.6730700984954834, + 0.7049953090667724, + 0.6589361456871032, + 0.6752442480087281, + 0.7031260248184205, + 0.697934859085083, + 0.7272751848220825, + 0.7606932877540589, + 0.7395933769226074, + 0.7341751010894776, + 0.7405285339355469, + 0.733946765422821, + 0.7636806823730469, + 0.7857295166015625, + 0.7889110160827637, + 0.7920944040298462, + 0.7986338794708252, + 0.8144829880714417, + 0.8125959665298462, + 0.8262598834991455, + 0.8528658538818359, + 0.8327025209903717, + 0.838051769399643, + 0.8450202142715454, + 0.8672424634933472, + 0.8608419931411743, + 0.8575022724151611, + 0.8643195161819458, + 0.8576637521743774, + 0.8549348508834839, + 0.8627238691329956, + 0.8602130598068237, + 0.8596111630439758, + 0.8598717666625977, + 0.8593405214309693, + 0.8577193733215333, + 0.8576152732849122, + 0.8567814826011658, + 0.8552138454437256, + 0.8546268630981445, + 0.8542516090393066 + ], + "train_acc": [ + 0.1687, + 0.482, + 0.6983, + 0.7931, + 0.8356, + 0.8575, + 0.8634, + 0.8707, + 0.8712, + 0.8677, + 0.8761, + 0.8715, + 0.8803, + 0.874, + 0.8744, + 0.8687, + 0.8705, + 0.8714, + 0.8688, + 0.8601, + 0.854, + 0.8454, + 0.8436, + 0.8243, + 0.8256, + 0.8162, + 0.8066, + 0.8109, + 0.8025, + 0.7834, + 0.794, + 0.7832, + 0.7798, + 0.7623, + 0.7665, + 0.768, + 0.7548, + 0.7635, + 0.7693, + 0.7596, + 0.7519, + 0.7585, + 0.7591, + 0.7516, + 0.7492, + 0.7504, + 0.7421, + 0.744, + 0.7436, + 0.7452, + 0.7458, + 0.7377, + 0.7331, + 0.7333, + 0.7298, + 0.7316, + 0.7319, + 0.7304, + 0.7251, + 0.7211, + 0.7276, + 0.7256, + 0.7235, + 0.7199, + 0.7224, + 0.7196, + 0.7167, + 0.7208, + 0.7206, + 0.7152, + 0.7204, + 0.7213, + 0.7205, + 0.7207, + 0.7194, + 0.7214, + 0.7189, + 0.7189, + 0.72, + 0.7203 + ], + "test_acc": [ + 0.3165, + 0.585, + 0.732, + 0.777, + 0.8045, + 0.8135, + 0.8195, + 0.815, + 0.812, + 0.8215, + 0.81, + 0.823, + 0.8185, + 0.83, + 0.814, + 0.8175, + 0.8005, + 0.8195, + 0.8085, + 0.7935, + 0.7795, + 0.792, + 0.762, + 0.755, + 0.761, + 0.752, + 0.7535, + 0.739, + 0.731, + 0.7295, + 0.7245, + 0.7105, + 0.7015, + 0.6825, + 0.705, + 0.705, + 0.713, + 0.707, + 0.708, + 0.693, + 0.709, + 0.706, + 0.6945, + 0.681, + 0.6865, + 0.671, + 0.684, + 0.6535, + 0.688, + 0.69, + 0.6805, + 0.6705, + 0.6685, + 0.6865, + 0.674, + 0.671, + 0.676, + 0.668, + 0.673, + 0.6765, + 0.675, + 0.67, + 0.666, + 0.661, + 0.6725, + 0.6655, + 0.6725, + 0.6685, + 0.666, + 0.6645, + 0.666, + 0.671, + 0.6695, + 0.6665, + 0.6705, + 0.666, + 0.6685, + 0.6705, + 0.6675, + 0.6675 + ], + "value_loss": [ + 2.905167144203186, + 0.7669180957794189, + 0.6147705508232116, + 0.5460843969345093, + 0.49546599617004394, + 0.4756456241607666, + 0.49797406158447266, + 0.5252212357997894, + 0.5387117910385132, + 0.6003822177171707, + 0.5737031475782395, + 0.653786695432663, + 0.6151383343935013, + 0.6694676952362061, + 0.6386722043037415, + 0.7662193554401397, + 0.7467729004859924, + 0.7038962652206421, + 0.6815459918498993, + 0.8039541248321533, + 0.8136287561416626, + 0.8644815028190613, + 0.8639612847328186, + 0.957852701663971, + 0.9195338849067688, + 0.9657894494056701, + 0.9908361279964447, + 0.9199113003730774, + 0.8898286704063415, + 0.9735244311332703, + 0.8156944500446319, + 0.7673966148376464, + 0.8238904671669006, + 0.7150344722747802, + 0.7092076916694641, + 0.5518315614700318, + 0.6911849412918091, + 0.5676486842632293, + 0.49137882578372954, + 0.47492049646377565, + 0.5294659261226654, + 0.48027371821403503, + 0.44395333375930784, + 0.4657917083263397, + 0.4749296194553375, + 0.525708182144165, + 0.5745783069372177, + 0.5165858255386353, + 0.49307253487110136, + 0.5070521484375, + 0.5017346429347992, + 0.49205484499931335, + 0.5560474545955658, + 0.6022055298805237, + 0.5778612011909485, + 0.5518968848228455, + 0.6285089484214783, + 0.5622078717708587, + 0.5958783441543579, + 0.6478308411598206, + 0.6241149466991425, + 0.5775983124256134, + 0.6079863901615142, + 0.6766130451202392, + 0.6386424642562866, + 0.5859615839004516, + 0.5853579979896545, + 0.609243207168579, + 0.5789407480239868, + 0.5828682322502137, + 0.5751972764015197, + 0.566095032453537, + 0.5679136329650879, + 0.541389085483551, + 0.5323089897155762, + 0.5463050646781922, + 0.5233067933321, + 0.539995517539978, + 0.5501079843044281, + 0.5091902822494507 + ], + "term_loss": [ + 1.6733786989212036, + 0.35953630895614624, + 0.3810900314331055, + 0.3640085501432419, + 0.3260841584324837, + 0.3077553846359253, + 0.3324718035697937, + 0.367346294260025, + 0.3859865920186043, + 0.45301228156089784, + 0.43512448742985727, + 0.5114166520357132, + 0.4755927606105804, + 0.5224317581176757, + 0.4974579632759094, + 0.6170232265353203, + 0.6003770110368729, + 0.5554250373840331, + 0.5345663616418839, + 0.6390543521881104, + 0.6454430676460267, + 0.6881791119873524, + 0.6889909839630127, + 0.7676727800190449, + 0.7288528527259827, + 0.7648732300281524, + 0.7703499612808228, + 0.702520156121254, + 0.6705087103843689, + 0.7275943111419678, + 0.5834438146114349, + 0.5341563625752926, + 0.5786461258172989, + 0.4691500406265259, + 0.46397005558013915, + 0.3172274461269379, + 0.4181660563707352, + 0.32323681541234256, + 0.2588549638271332, + 0.24302781400680543, + 0.2924638859629631, + 0.24494203708171844, + 0.2152600380897522, + 0.22989102821350096, + 0.2353773395419121, + 0.28108422079086304, + 0.31342148925065993, + 0.27359422492980956, + 0.25125429936647414, + 0.257268256187439, + 0.2591492292642593, + 0.23964913494586945, + 0.29251497268676757, + 0.3298768766343594, + 0.3039268769741058, + 0.2792709235191345, + 0.33827268505096436, + 0.28002805522680285, + 0.3018962340831757, + 0.3368746694564819, + 0.32222775983810426, + 0.2843563482582569, + 0.30906297858953474, + 0.3611741382598877, + 0.33170013012886046, + 0.2902149326324463, + 0.28840259952545166, + 0.31378483290672304, + 0.2902891281366348, + 0.2919290991783142, + 0.28340531673431396, + 0.278327653375268, + 0.27732584218978884, + 0.25806645315587523, + 0.25701560287475583, + 0.2673572342649102, + 0.2432628269404173, + 0.2552922504991293, + 0.2640775308728218, + 0.2335890076160431 + ], + "bridge_loss": [ + 0.9043548678459716, + 0.1099991770863533, + 0.0185405650511384, + 0.006047719717770815, + 0.016022920724749565, + 0.028978378069400786, + 0.031905842757225036, + 0.029302026838064193, + 0.023079814870655538, + 0.016131247261166572, + 0.012949446664750576, + 0.013754056148231029, + 0.015889972979575395, + 0.018446111026406288, + 0.01638760406896472, + 0.017992716232687236, + 0.019003601244091988, + 0.020746660566329955, + 0.01826081564426422, + 0.02830883066356182, + 0.024853757178783416, + 0.024344006457924842, + 0.023935870000720023, + 0.02609362450838089, + 0.025477111788839102, + 0.02811358508467674, + 0.037432029013335706, + 0.04066388768851757, + 0.03775561413168907, + 0.045691771799325945, + 0.04316586040407419, + 0.03629823230803013, + 0.044383459562063216, + 0.03235162799358368, + 0.0325787200063467, + 0.027550594240427016, + 0.053535217493772505, + 0.035429628413915636, + 0.031108605259656905, + 0.023855108603835107, + 0.02121337473988533, + 0.02979328683614731, + 0.020273821192979814, + 0.020139847481250764, + 0.025227140033245086, + 0.025450278180837633, + 0.03434615105986595, + 0.02146386271119118, + 0.02109189542680979, + 0.02925411523580551, + 0.02310084878951311, + 0.02616748433560133, + 0.03327374953627586, + 0.04235334511995315, + 0.041773559814691545, + 0.03985991308093071, + 0.05651662215590477, + 0.04745835790634155, + 0.055931367576122284, + 0.06850977175235748, + 0.0639593681037426, + 0.05509283916950226, + 0.05903308473825455, + 0.07053237849473953, + 0.06470432556271553, + 0.0535823705971241, + 0.051599254608154295, + 0.05326937973499298, + 0.047149808438122276, + 0.046959778106212616, + 0.04897745460271835, + 0.04479330514669418, + 0.04897215344905853, + 0.040769342416524884, + 0.03437164931297302, + 0.03721886334717274, + 0.03824560036659241, + 0.04369500883221626, + 0.04542522546350956, + 0.035112081968784334 + ], + "tgrad_loss": [ + 0.3274335751533508, + 0.29738261065483096, + 0.2151399471282959, + 0.17602813131809233, + 0.15335891692638398, + 0.13891186106204986, + 0.13359641733169555, + 0.12857291507720947, + 0.12964537999629974, + 0.13123868188858032, + 0.125629212808609, + 0.12861598132550717, + 0.12365560574531555, + 0.1285898279428482, + 0.1248266352891922, + 0.13120342084169387, + 0.1273922846198082, + 0.12772456929683684, + 0.12871881544589997, + 0.13659093623161317, + 0.14333192269802095, + 0.151958393907547, + 0.1510344393968582, + 0.16408629912137984, + 0.1652039253950119, + 0.1728026305437088, + 0.18305413188934327, + 0.1767272587299347, + 0.18156433925628662, + 0.20023834683895111, + 0.18908477582931518, + 0.19694202189445495, + 0.20086088314056397, + 0.21353280200958252, + 0.21265892071723938, + 0.20705352492332457, + 0.21948367331027985, + 0.20898223748207093, + 0.20141525354385376, + 0.20803757467269898, + 0.21578866653442383, + 0.2055383932828903, + 0.20841947269439698, + 0.21576083455085754, + 0.21432514040470124, + 0.21917368249893188, + 0.22681067111492156, + 0.22152773485183716, + 0.22072633769512176, + 0.22052977714538574, + 0.21948456611633302, + 0.22623822565078736, + 0.2302587287902832, + 0.22997530328035354, + 0.2321607629299164, + 0.2327660462141037, + 0.23371964123249053, + 0.2347214570045471, + 0.23805074806213378, + 0.24244639527797698, + 0.23792780854701995, + 0.23814912319183348, + 0.23989032588005066, + 0.2449065265893936, + 0.2422380124092102, + 0.24216427443027497, + 0.24535614709854126, + 0.24218899645805358, + 0.24150181224346162, + 0.24397935581207275, + 0.24281450612545014, + 0.24297407388687134, + 0.24161563982963563, + 0.24255329012870788, + 0.2409217383861542, + 0.24172897021770479, + 0.24179836411476135, + 0.24100825939178466, + 0.2406052262067795, + 0.2404891884803772 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.1011175885796547, + 0.23295700550079346 + ], + "perturbation_rho": [ + 0.19994769990444183, + 0.32798534631729126 + ], + "nudging": { + "0.001": [ + -0.00725348386913538, + -0.00188851123675704 + ], + "0.003": [ + -0.021614037454128265, + -0.0056588975712656975 + ], + "0.01": [ + -0.07033564895391464, + -0.01879441738128662 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L2_s456.json b/results/synth_ladder_v2_lo/synth_a0.0_L2_s456.json new file mode 100644 index 0000000..3f357b8 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L2_s456.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7540335287094115, + 0.7887995930671692, + 0.45601481485366824, + 0.3563029076099396, + 0.3058449071407318, + 0.27814644107818604, + 0.256092844247818, + 0.2486086864233017, + 0.2273713537454605, + 0.22320388717651368, + 0.22591865739822387, + 0.21023976492881774, + 0.21006116704940797, + 0.2019081612110138, + 0.19240621073246003, + 0.17767472962141037, + 0.17261487174034118, + 0.18222670216560363, + 0.18264247782230378, + 0.16773689975738526, + 0.18042192044258118, + 0.17836842503547667, + 0.17410975818634034, + 0.17574358505010604, + 0.15518579416275025, + 0.14563439567089081, + 0.14957009754180908, + 0.16893083366155626, + 0.14229146575927734, + 0.1370330379009247, + 0.1540110511779785, + 0.16346854424476623, + 0.13422132856845856, + 0.12666763162612915, + 0.12608725222349168, + 0.12264905602931976, + 0.1324379847049713, + 0.13239208903312683, + 0.1317316207408905, + 0.12270301322340965, + 0.11590332639217377, + 0.11994003572463989, + 0.11405094165802002, + 0.1112155341386795, + 0.10668404247760772, + 0.10974465991258621, + 0.1068548722743988, + 0.10398986601829528, + 0.10589976058006287, + 0.1045347521185875, + 0.09930369100570678, + 0.09925224586725236, + 0.10005474714636803, + 0.09637348690032958, + 0.09619558620452881, + 0.09599231715202332, + 0.09453698312044144, + 0.09238649787902832, + 0.09135240658521653, + 0.09056207950115204, + 0.0904913359284401, + 0.08896962072849274, + 0.08807550078630447, + 0.08736293792724609, + 0.0872790049791336, + 0.08682763931751251, + 0.0863328184247017, + 0.08547967915534974, + 0.08507368334531784, + 0.08477922387123107, + 0.08439313389062882, + 0.08397663788795472, + 0.08362844693660736, + 0.08331081527471543, + 0.0830932537317276, + 0.08289919497966766, + 0.08278876669406891, + 0.0826721666097641, + 0.08259252429008485, + 0.08254909700155258 + ], + "train_acc": [ + 0.4207, + 0.7857, + 0.8773, + 0.894, + 0.8987, + 0.9076, + 0.9143, + 0.9122, + 0.9185, + 0.9164, + 0.9167, + 0.9216, + 0.9235, + 0.9238, + 0.93, + 0.9363, + 0.9374, + 0.9328, + 0.9317, + 0.9368, + 0.9311, + 0.9307, + 0.9329, + 0.9344, + 0.9447, + 0.946, + 0.9452, + 0.937, + 0.9509, + 0.9534, + 0.9455, + 0.9371, + 0.9516, + 0.9572, + 0.9578, + 0.9583, + 0.9521, + 0.953, + 0.9548, + 0.9569, + 0.9621, + 0.9563, + 0.963, + 0.9664, + 0.9689, + 0.967, + 0.967, + 0.9678, + 0.9681, + 0.9689, + 0.9727, + 0.9735, + 0.9715, + 0.9752, + 0.974, + 0.9752, + 0.975, + 0.9778, + 0.9781, + 0.9787, + 0.9785, + 0.9787, + 0.9804, + 0.9802, + 0.9801, + 0.9803, + 0.9816, + 0.9826, + 0.9823, + 0.9821, + 0.9823, + 0.9826, + 0.9829, + 0.983, + 0.9833, + 0.9833, + 0.9832, + 0.9838, + 0.9839, + 0.9839 + ], + "test_acc": [ + 0.6795, + 0.8435, + 0.8735, + 0.887, + 0.887, + 0.904, + 0.908, + 0.9, + 0.9045, + 0.9015, + 0.903, + 0.906, + 0.9035, + 0.9135, + 0.9175, + 0.9075, + 0.9125, + 0.913, + 0.908, + 0.913, + 0.906, + 0.911, + 0.914, + 0.9145, + 0.921, + 0.9215, + 0.92, + 0.915, + 0.923, + 0.923, + 0.916, + 0.917, + 0.9285, + 0.921, + 0.921, + 0.9275, + 0.919, + 0.927, + 0.924, + 0.9265, + 0.928, + 0.9215, + 0.923, + 0.9205, + 0.928, + 0.9235, + 0.93, + 0.927, + 0.931, + 0.929, + 0.9305, + 0.9275, + 0.927, + 0.93, + 0.932, + 0.9305, + 0.9305, + 0.932, + 0.9295, + 0.9305, + 0.9305, + 0.929, + 0.93, + 0.9325, + 0.93, + 0.9285, + 0.9325, + 0.9295, + 0.929, + 0.929, + 0.931, + 0.931, + 0.93, + 0.93, + 0.929, + 0.93, + 0.9295, + 0.9295, + 0.9295, + 0.9295 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8826531171798706, + 0.8583619594573975 + ], + "perturbation_rho": [ + 0.9999988079071045, + 0.9999959468841553 + ], + "nudging": { + "0.001": [ + -0.021625827997922897, + -0.0073820194229483604 + ], + "0.003": [ + -0.0571812242269516, + -0.021265367045998573 + ], + "0.01": [ + -0.12340263277292252, + -0.06141046807169914 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2789152168273925, + 1.5198317989349366, + 0.864434551525116, + 0.5843122736930847, + 0.45720995845794676, + 0.4017148985385895, + 0.3776179392337799, + 0.37144901649951934, + 0.3685629499435425, + 0.37063308811187745, + 0.37334213446378706, + 0.3977362024307251, + 0.3849859349250793, + 0.3885465118408203, + 0.4121596324086189, + 0.4142354433834553, + 0.41292374534606935, + 0.4443123857498169, + 0.44203310720920563, + 0.42226147565841676, + 0.4249496959686279, + 0.4256349886894226, + 0.43858823890686033, + 0.4887267217159271, + 0.4046924789428711, + 0.44023080163002015, + 0.4586866247177124, + 0.47388719167709353, + 0.4657478348731995, + 0.4368759090423584, + 0.49420316143035886, + 0.455893372297287, + 0.43190188279151914, + 0.4301922942638397, + 0.4683740642309189, + 0.41559304761886595, + 0.4515250599861145, + 0.44344369277954104, + 0.5267878504753113, + 0.44394594959020617, + 0.4324127757668495, + 0.40358923535346986, + 0.4648085826396942, + 0.4322748986721039, + 0.3977247392654419, + 0.4430144777774811, + 0.4182663669586182, + 0.4156523362159729, + 0.41285320320129393, + 0.4263911725178361, + 0.3818113656997681, + 0.40127683003544806, + 0.38001128873825074, + 0.395466704750061, + 0.37924830303192136, + 0.39582441291809084, + 0.38846483197212217, + 0.3674187141418457, + 0.37231723667383193, + 0.3590473205566406, + 0.3668627885401249, + 0.35952253170013426, + 0.3661739505529404, + 0.35552182607650756, + 0.35606588587760923, + 0.3480822557926178, + 0.3466999515578151, + 0.3430781412124634, + 0.3444066115856171, + 0.34685713081359865, + 0.3389283345222473, + 0.3368847903251648, + 0.33722841114997865, + 0.3348792476654053, + 0.335844083404541, + 0.33308425464630126, + 0.33272774691581725, + 0.33165184540748593, + 0.3310907633304596, + 0.3308901508331299 + ], + "train_acc": [ + 0.159, + 0.4941, + 0.7011, + 0.7898, + 0.8315, + 0.85, + 0.8575, + 0.8576, + 0.8634, + 0.8631, + 0.8649, + 0.8574, + 0.8654, + 0.8661, + 0.8592, + 0.8603, + 0.8626, + 0.8547, + 0.856, + 0.8636, + 0.8584, + 0.8637, + 0.8627, + 0.8485, + 0.8733, + 0.8618, + 0.8621, + 0.859, + 0.8585, + 0.8637, + 0.8544, + 0.8631, + 0.868, + 0.8694, + 0.8606, + 0.873, + 0.8584, + 0.8689, + 0.856, + 0.8702, + 0.871, + 0.8764, + 0.8614, + 0.8719, + 0.8793, + 0.8682, + 0.8713, + 0.8756, + 0.8757, + 0.8733, + 0.8849, + 0.8772, + 0.8819, + 0.8792, + 0.8835, + 0.8813, + 0.8817, + 0.8863, + 0.8835, + 0.8858, + 0.8857, + 0.8845, + 0.8833, + 0.886, + 0.8875, + 0.8875, + 0.8927, + 0.8909, + 0.891, + 0.8876, + 0.891, + 0.892, + 0.8939, + 0.8924, + 0.8919, + 0.8912, + 0.8928, + 0.8941, + 0.8947, + 0.8946 + ], + "test_acc": [ + 0.323, + 0.6025, + 0.745, + 0.7805, + 0.8, + 0.8155, + 0.806, + 0.8185, + 0.819, + 0.8075, + 0.8195, + 0.8265, + 0.8285, + 0.814, + 0.814, + 0.8155, + 0.8205, + 0.813, + 0.825, + 0.8265, + 0.809, + 0.83, + 0.8195, + 0.839, + 0.8095, + 0.8245, + 0.81, + 0.8155, + 0.835, + 0.8135, + 0.8325, + 0.8325, + 0.834, + 0.813, + 0.836, + 0.842, + 0.81, + 0.8265, + 0.834, + 0.82, + 0.833, + 0.832, + 0.8315, + 0.8425, + 0.824, + 0.8375, + 0.8375, + 0.823, + 0.824, + 0.8375, + 0.8415, + 0.842, + 0.842, + 0.8365, + 0.8405, + 0.8435, + 0.841, + 0.85, + 0.8425, + 0.848, + 0.844, + 0.847, + 0.849, + 0.845, + 0.8465, + 0.846, + 0.8445, + 0.85, + 0.8455, + 0.8485, + 0.847, + 0.8475, + 0.847, + 0.848, + 0.847, + 0.8485, + 0.851, + 0.8495, + 0.8485, + 0.8485 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.016239378601312637, + 0.08700481057167053 + ], + "perturbation_rho": [ + -0.0633457601070404, + 0.09238316863775253 + ], + "nudging": { + "0.001": [ + -0.0005403641844168305, + -0.0003429484786465764 + ], + "0.003": [ + -0.0015787126030772924, + -0.0010280576534569263 + ], + "0.01": [ + -0.004778302274644375, + -0.003415417857468128 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.03510007686615, + 1.077442472267151, + 0.609830850982666, + 0.4300918912887573, + 0.3839862449645996, + 0.3708487091064453, + 0.36614356565475464, + 0.3628130876541138, + 0.36194450925588606, + 0.3576546109199524, + 0.3619418657779694, + 0.3517365313529968, + 0.34097144956588743, + 0.35138510484695434, + 0.3435681216239929, + 0.352434642791748, + 0.3715478811264038, + 0.3778843415737152, + 0.3998612182617188, + 0.3988710145950317, + 0.41688702239990233, + 0.4265467617034912, + 0.4248304518222809, + 0.40923274965286255, + 0.3897163356781006, + 0.3885489140033722, + 0.3746957459449768, + 0.3795012855529785, + 0.3912307156085968, + 0.38832212753295897, + 0.39127745122909546, + 0.4051106197834015, + 0.4201839946746826, + 0.4025802077293396, + 0.413509761428833, + 0.4256944602966309, + 0.4097448627471924, + 0.4372278747558594, + 0.4230543599128723, + 0.4329932454109192, + 0.4262246448993683, + 0.4197934967517853, + 0.4233694318771362, + 0.4268952363014221, + 0.41731767301559447, + 0.416495183467865, + 0.4137693079948425, + 0.42386709623336793, + 0.40960294895172117, + 0.40348369274139406, + 0.4084292630195618, + 0.393343914270401, + 0.39545347409248355, + 0.391191748046875, + 0.3969509807109833, + 0.3895566881656647, + 0.3817503587841988, + 0.37462963981628417, + 0.3790303818464279, + 0.3720798149585724, + 0.37286534557342527, + 0.37294170576334, + 0.3663740547180176, + 0.36788779735565186, + 0.3682312522411346, + 0.36158624505996706, + 0.362826536655426, + 0.35837330026626585, + 0.35764170565605163, + 0.3563748463153839, + 0.3544979793548584, + 0.35291474685668944, + 0.3523685070037842, + 0.351926808154583, + 0.3506764990568161, + 0.3501978385448456, + 0.3497668510437012, + 0.3495366275787353, + 0.3492322545051575, + 0.3491422838926315 + ], + "train_acc": [ + 0.2744, + 0.6311, + 0.7872, + 0.8484, + 0.8554, + 0.8602, + 0.8602, + 0.8633, + 0.8637, + 0.8656, + 0.8633, + 0.8667, + 0.8716, + 0.8655, + 0.8699, + 0.8666, + 0.8529, + 0.8537, + 0.8501, + 0.848, + 0.8471, + 0.8413, + 0.8409, + 0.8409, + 0.8532, + 0.8535, + 0.8604, + 0.858, + 0.8543, + 0.857, + 0.8538, + 0.8501, + 0.8501, + 0.8543, + 0.8504, + 0.8482, + 0.8537, + 0.8499, + 0.8539, + 0.848, + 0.8512, + 0.856, + 0.8522, + 0.8492, + 0.8551, + 0.8557, + 0.8557, + 0.8555, + 0.8581, + 0.862, + 0.859, + 0.8629, + 0.8608, + 0.8622, + 0.8617, + 0.8624, + 0.8643, + 0.8697, + 0.8672, + 0.8676, + 0.8683, + 0.8667, + 0.8679, + 0.8667, + 0.866, + 0.8722, + 0.8701, + 0.8718, + 0.872, + 0.8713, + 0.8714, + 0.8731, + 0.8729, + 0.873, + 0.8724, + 0.873, + 0.8736, + 0.8731, + 0.8733, + 0.8734 + ], + "test_acc": [ + 0.525, + 0.726, + 0.7975, + 0.8225, + 0.8235, + 0.825, + 0.8225, + 0.8235, + 0.8195, + 0.827, + 0.8265, + 0.8295, + 0.835, + 0.8375, + 0.8315, + 0.83, + 0.824, + 0.8095, + 0.809, + 0.8125, + 0.799, + 0.8075, + 0.8115, + 0.812, + 0.812, + 0.817, + 0.812, + 0.812, + 0.8065, + 0.815, + 0.815, + 0.81, + 0.805, + 0.817, + 0.808, + 0.823, + 0.8045, + 0.8, + 0.801, + 0.8115, + 0.82, + 0.814, + 0.812, + 0.8155, + 0.8105, + 0.8175, + 0.8065, + 0.817, + 0.8135, + 0.8205, + 0.824, + 0.8145, + 0.8215, + 0.812, + 0.8215, + 0.819, + 0.8195, + 0.815, + 0.8225, + 0.8205, + 0.8225, + 0.823, + 0.8175, + 0.8265, + 0.8225, + 0.829, + 0.8255, + 0.8255, + 0.8265, + 0.8255, + 0.8285, + 0.8265, + 0.8285, + 0.828, + 0.829, + 0.8275, + 0.8275, + 0.829, + 0.8285, + 0.8285 + ], + "state_pred_error": [ + 0.7936658924102783, + 0.33496607384681704, + 0.20223751559257508, + 0.16735892939567565, + 0.14485984333753585, + 0.11955849848985672, + 0.09462791703939438, + 0.07538449263572693, + 0.05961660117506981, + 0.04735348780155182, + 0.038567446672916415, + 0.03213091719150543, + 0.028004648900032042, + 0.024515093371272088, + 0.022012931832671164, + 0.020446427571773527, + 0.018394847139716147, + 0.016773300230503083, + 0.015448834140598774, + 0.014468847262859344, + 0.013597128289937973, + 0.012880013291537762, + 0.012064755845069886, + 0.011425680384039879, + 0.010745641595125198, + 0.010167037642002106, + 0.0096464214771986, + 0.009187596023082733, + 0.008730744183063507, + 0.008276390147954225, + 0.007866678546369075, + 0.00768265388160944, + 0.007270389303565025, + 0.007174727764725685, + 0.0070541538849473, + 0.0067812193542718885, + 0.006654527989774942, + 0.00636177619099617, + 0.006175523652881384, + 0.006045299311727285, + 0.005936238116025925, + 0.005970760487020016, + 0.005785428526252508, + 0.005630842386931181, + 0.005440417719632387, + 0.005434160755574703, + 0.005252558408677578, + 0.005300074205547571, + 0.005076368814706802, + 0.005021050906181336, + 0.004854675306379795, + 0.004958594182133675, + 0.004614286011457443, + 0.004535953061282635, + 0.004470928203314543, + 0.004415199124440551, + 0.0042777580007910725, + 0.004198400410264731, + 0.004141696321219206, + 0.004083840855211019, + 0.004052111233770847, + 0.003930420187115669, + 0.003949926514923573, + 0.0037584460385143756, + 0.0037061349514871836, + 0.003612276028469205, + 0.0035469237841665746, + 0.0035739093132317067, + 0.0034136051505804063, + 0.0034378198258578777, + 0.003333174591511488, + 0.0032446157082915306, + 0.003214318350702524, + 0.0031311317443847657, + 0.003078432670608163, + 0.003057278237864375, + 0.0029395090855658056, + 0.003017135479673743, + 0.0030766903996467592, + 0.0030378309611231087 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9387110471725464, + 0.5040415525436401 + ], + "perturbation_rho": [ + 0.7997298240661621, + 0.4891185164451599 + ], + "nudging": { + "0.001": [ + -0.02664007619023323, + -0.0032268627546727657 + ], + "0.003": [ + -0.07605530321598053, + -0.00962437316775322 + ], + "0.01": [ + -0.21233828365802765, + -0.031433407217264175 + ] + }, + "state_pred_error_per_layer": [ + 387.8657531738281, + 319.336669921875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2791277053833006, + 1.5271975772857667, + 0.8674576456069947, + 0.587049162864685, + 0.4626688796043396, + 0.4040388158321381, + 0.37643657150268556, + 0.37468256072998046, + 0.3784513481616974, + 0.3786823602676392, + 0.37917218251228335, + 0.38788830342292785, + 0.3958303390264511, + 0.393599364900589, + 0.39977145621776583, + 0.40370213751792905, + 0.4120421281814575, + 0.45399587993621826, + 0.4687366197824478, + 0.4652291350364685, + 0.5005440378189087, + 0.5234059304714203, + 0.5221618666172028, + 0.5542463368415832, + 0.5820084628105163, + 0.5705709765195847, + 0.5702225286483764, + 0.5786975580215454, + 0.6307714500427246, + 0.6665315362930297, + 0.6137196712493896, + 0.6527844795227051, + 0.690822039604187, + 0.7107784267425538, + 0.7316474711418152, + 0.718277031326294, + 0.7050886112213135, + 0.708720292520523, + 0.7131800124168396, + 0.7192850646018982, + 0.7119332159996032, + 0.7151562330245972, + 0.7151052355766296, + 0.7357472681999206, + 0.7336779589653015, + 0.7310818168640136, + 0.7227139064788818, + 0.7629635635375976, + 0.7363060358047485, + 0.7154419450759888, + 0.7398526870727539, + 0.7556214105606079, + 0.7158489876747132, + 0.7164914712905884, + 0.7232932413101196, + 0.720790207862854, + 0.7382160652160644, + 0.7421017236709595, + 0.7198905362606048, + 0.7215996326446533, + 0.713732839012146, + 0.7260521041870117, + 0.7214395964860916, + 0.7165161167144776, + 0.718010532951355, + 0.7195493728637695, + 0.7165915153503418, + 0.7138662039756775, + 0.7102315483093262, + 0.7073148555755615, + 0.7073911678314209, + 0.7052887998104096, + 0.7047561235427856, + 0.7036817129135132, + 0.7020157369613648, + 0.7008753277301788, + 0.7001741619110108, + 0.6988817626953125, + 0.6988485893249512, + 0.6985764275550842 + ], + "train_acc": [ + 0.1601, + 0.491, + 0.7022, + 0.7916, + 0.8288, + 0.8486, + 0.8581, + 0.8577, + 0.8589, + 0.8612, + 0.8592, + 0.8631, + 0.8628, + 0.8636, + 0.8657, + 0.8659, + 0.8624, + 0.8518, + 0.8531, + 0.8528, + 0.8367, + 0.8354, + 0.8307, + 0.8247, + 0.8166, + 0.8139, + 0.8134, + 0.8052, + 0.793, + 0.7851, + 0.7952, + 0.7803, + 0.7699, + 0.7628, + 0.7577, + 0.7532, + 0.7604, + 0.7578, + 0.7536, + 0.7537, + 0.7561, + 0.7468, + 0.7497, + 0.7416, + 0.7428, + 0.7422, + 0.7463, + 0.7339, + 0.7393, + 0.7454, + 0.7379, + 0.7354, + 0.7424, + 0.7436, + 0.7415, + 0.7443, + 0.7379, + 0.7353, + 0.743, + 0.7401, + 0.744, + 0.7405, + 0.7417, + 0.7408, + 0.7428, + 0.7408, + 0.7425, + 0.7423, + 0.742, + 0.7447, + 0.7421, + 0.7443, + 0.7463, + 0.745, + 0.7458, + 0.7467, + 0.7485, + 0.747, + 0.7475, + 0.7478 + ], + "test_acc": [ + 0.3225, + 0.6005, + 0.735, + 0.7835, + 0.799, + 0.8105, + 0.813, + 0.8105, + 0.815, + 0.8275, + 0.816, + 0.8135, + 0.8275, + 0.8225, + 0.8215, + 0.819, + 0.809, + 0.812, + 0.8025, + 0.8145, + 0.804, + 0.7925, + 0.7875, + 0.7805, + 0.771, + 0.7595, + 0.7835, + 0.761, + 0.756, + 0.7445, + 0.7525, + 0.733, + 0.722, + 0.7035, + 0.718, + 0.7215, + 0.724, + 0.722, + 0.718, + 0.716, + 0.7085, + 0.7115, + 0.7125, + 0.704, + 0.705, + 0.711, + 0.6985, + 0.696, + 0.719, + 0.703, + 0.6875, + 0.708, + 0.706, + 0.708, + 0.7035, + 0.695, + 0.6985, + 0.6985, + 0.702, + 0.7065, + 0.706, + 0.713, + 0.71, + 0.7165, + 0.705, + 0.711, + 0.7115, + 0.708, + 0.709, + 0.7055, + 0.707, + 0.7125, + 0.7065, + 0.7095, + 0.7125, + 0.711, + 0.7115, + 0.7115, + 0.7115, + 0.7115 + ], + "value_loss": [ + 3.1635106006622316, + 0.7740020160675048, + 0.6276501627922058, + 0.5707134353637695, + 0.5015447573661804, + 0.4983567372083664, + 0.5175379848480225, + 0.547992883682251, + 0.5898804153442383, + 0.6042054812431336, + 0.6014190244197846, + 0.6637537957787514, + 0.6845919721126557, + 0.6927346345424652, + 0.7124938590049744, + 0.7445667055130005, + 0.7623097400665283, + 0.8733150297164917, + 0.9832132648468017, + 0.8608565040588378, + 0.9329591770648956, + 0.9217451201438904, + 0.8799381763935089, + 0.9203727130889893, + 0.9129298717975617, + 0.8228008040904998, + 0.723678154373169, + 0.6765096341133118, + 0.7649027530670166, + 0.8161859791755677, + 0.6514515069007873, + 0.7141245938301086, + 0.7329993425369262, + 0.7307948766708374, + 0.7585475451469421, + 0.6689410001754761, + 0.624963953590393, + 0.6088551391601562, + 0.6095617308139801, + 0.5894894409894943, + 0.5563288737297059, + 0.5322869329929352, + 0.4976848304748535, + 0.524449465751648, + 0.5014263719558716, + 0.4898082717895508, + 0.46659274439811704, + 0.5616481122970581, + 0.4971419037818909, + 0.4274770281791687, + 0.46093521366119383, + 0.4697890731334686, + 0.43194802646636965, + 0.4221532721042633, + 0.4475786390304565, + 0.42143903999328614, + 0.4458761687278748, + 0.45337565126419066, + 0.4238472384929657, + 0.40281684017181396, + 0.38932490911483764, + 0.3897231784820557, + 0.38490687227249143, + 0.38104017810821533, + 0.3687279556751251, + 0.3669544050216675, + 0.36931539878845215, + 0.36263137147426605, + 0.349668848323822, + 0.34732296204566954, + 0.3342470671653748, + 0.33395242664813996, + 0.33387985258102415, + 0.33358972406387327, + 0.3530650995254517, + 0.3312079078435898, + 0.31177036271095276, + 0.3145587480545044, + 0.3253957736968994, + 0.31588549439907077 + ], + "term_loss": [ + 1.7951480650424958, + 0.3761807126045227, + 0.4006756747245789, + 0.3907634472846985, + 0.33307474012374877, + 0.33421838104128837, + 0.3550305375099182, + 0.3851635645866394, + 0.4342513330459595, + 0.45601325892210004, + 0.45521873558163645, + 0.5165402359724045, + 0.5361827510595322, + 0.5454751461267471, + 0.5646561876296997, + 0.5965961949110031, + 0.6103998653411865, + 0.7111995510339737, + 0.8167527445793152, + 0.6931714932918549, + 0.747134658908844, + 0.7326245096206665, + 0.6787485965967178, + 0.7093002405881882, + 0.6855188606858253, + 0.595027423453331, + 0.5057091500282288, + 0.4579630083799362, + 0.5400014482975006, + 0.5755828867912293, + 0.43018956017494203, + 0.477418512403965, + 0.49788543190956114, + 0.4815887330055237, + 0.5000800666809082, + 0.4204012803554535, + 0.3826768821001053, + 0.3597612362623215, + 0.3625356485247612, + 0.34448800829648973, + 0.3180155368089676, + 0.28404023527503014, + 0.2569198631286621, + 0.27715443172454834, + 0.2526350587069988, + 0.2411904234647751, + 0.22838947129249573, + 0.299795917224884, + 0.246653905916214, + 0.191054323387146, + 0.21536591811180114, + 0.217297107899189, + 0.1931860875606537, + 0.1848979764148593, + 0.20436019200086594, + 0.18643514511585235, + 0.2030245313167572, + 0.2116449776649475, + 0.18160687791109084, + 0.16249994401931764, + 0.15484164142608642, + 0.1528463675737381, + 0.1489361402630806, + 0.14461671495437622, + 0.13463031718730928, + 0.1294142901301384, + 0.13273104189634324, + 0.12744402947425842, + 0.11626906907856464, + 0.11444123766869306, + 0.10322715325504542, + 0.10297624860405923, + 0.10388474629819393, + 0.10207910882234573, + 0.1196654408454895, + 0.10161699144244193, + 0.08757407498955727, + 0.08594336168766022, + 0.09848421711921691, + 0.09000624770522117 + ], + "bridge_loss": [ + 1.0729727275717247, + 0.11431841832399368, + 0.023766263148188593, + 0.007563671678304672, + 0.013874480509757996, + 0.021678775465488433, + 0.025472599875926972, + 0.025822595372796058, + 0.01795407388061285, + 0.011467179806530475, + 0.01033123205602169, + 0.01144010070860386, + 0.012751704286038876, + 0.013523769325017929, + 0.014328493074327707, + 0.015080985119193792, + 0.01630606939792633, + 0.01711897891610861, + 0.020690989595651625, + 0.02325695974826813, + 0.028962209689617158, + 0.027630632358789445, + 0.03822321012318134, + 0.041376910424232485, + 0.050044859862327574, + 0.04990889082849026, + 0.04164786594510078, + 0.03684647643864155, + 0.03118742448091507, + 0.03392234752178192, + 0.029907469933480025, + 0.03319982000291347, + 0.024718015414476394, + 0.030926838570833205, + 0.036485740578174594, + 0.027715866570174694, + 0.02814151096343994, + 0.033959431263804435, + 0.03254524117708206, + 0.029349126595258714, + 0.02586204304397106, + 0.03363803274035454, + 0.02803821322321892, + 0.0314576941460371, + 0.03330667742192745, + 0.03362447772026062, + 0.0266525205463171, + 0.04000154567956925, + 0.03556216908097267, + 0.026239325052499773, + 0.029197816705703736, + 0.033797084963321684, + 0.029408058428764344, + 0.027986173009872436, + 0.032767310640215874, + 0.026094853281974792, + 0.029071284955739976, + 0.02895135208964348, + 0.032204047930240634, + 0.030318710601329804, + 0.026927110385894775, + 0.026824868822097777, + 0.02698569309413433, + 0.02751481302976608, + 0.02610580772459507, + 0.02898943041563034, + 0.02892138159275055, + 0.028138772577047347, + 0.026615089032053948, + 0.02712062079310417, + 0.025527843962609768, + 0.026397538816928863, + 0.025526897245645525, + 0.026975207622349263, + 0.029337245070934295, + 0.02542050951719284, + 0.02072744626104832, + 0.025458942368626593, + 0.023841479897499084, + 0.023082720217108728 + ], + "tgrad_loss": [ + 0.29538979725837705, + 0.2835028868198395, + 0.20320821890830992, + 0.1723863210439682, + 0.15459553496837616, + 0.14245957915782928, + 0.13703485209941865, + 0.1370067240715027, + 0.13767500700950622, + 0.13672504227161408, + 0.13586905403137206, + 0.13577345745563507, + 0.1356575172126293, + 0.13373572314977647, + 0.13350917862653733, + 0.1328895225763321, + 0.13560380978584288, + 0.1449965008020401, + 0.14576953587532043, + 0.14442804169654846, + 0.15686230430603026, + 0.16148997682332994, + 0.16296637887954712, + 0.1696955554485321, + 0.17736615447998047, + 0.17786449105739593, + 0.17632114362716675, + 0.18170014889240266, + 0.1937138816833496, + 0.20668074293136596, + 0.1913544800758362, + 0.20350626287460327, + 0.21039589591026306, + 0.2182793056488037, + 0.22198174507617952, + 0.22082385530471801, + 0.21414556305408478, + 0.21513447856903076, + 0.21448083605766297, + 0.2156523087978363, + 0.21245129132270812, + 0.21460866712331772, + 0.21272675414085387, + 0.21583734347820283, + 0.21548463908433915, + 0.21499337368011476, + 0.21155075321197508, + 0.22185065126419068, + 0.2149258313894272, + 0.21018337931632997, + 0.21637148156166078, + 0.2186948810338974, + 0.2093538791656494, + 0.20926912331581116, + 0.21045113792419434, + 0.2089090428352356, + 0.2137803575515747, + 0.2127793226003647, + 0.21003631122112273, + 0.20999818406105042, + 0.20755615634918212, + 0.21005194301605223, + 0.2089850417137146, + 0.20890865128040315, + 0.2079918318271637, + 0.20855068507194519, + 0.20766297452449797, + 0.20704856889247894, + 0.20678469212055206, + 0.20576110424995422, + 0.20549206850528717, + 0.20457864027023315, + 0.20446821138858795, + 0.20453540694713593, + 0.20406241462230681, + 0.20417041058540344, + 0.20346884107589722, + 0.20315644788742065, + 0.2030700761795044, + 0.20279652795791625 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.08927787840366364, + 0.2430092990398407 + ], + "perturbation_rho": [ + 0.16060538589954376, + 0.35060590505599976 + ], + "nudging": { + "0.001": [ + -0.004890232812613249, + -0.001682603731751442 + ], + "0.003": [ + -0.01459127850830555, + -0.005042100325226784 + ], + "0.01": [ + -0.047705113887786865, + -0.016734274104237556 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L4_s123.json b/results/synth_ladder_v2_lo/synth_a0.0_L4_s123.json new file mode 100644 index 0000000..9d86d3b --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L4_s123.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.3597635933876038, + 0.4536431095123291, + 0.3459823863983154, + 0.3341377299308777, + 0.32835464673042297, + 0.2696523241996765, + 0.27801587681770323, + 0.24306170365810395, + 0.23653682124614717, + 0.215101296377182, + 0.2301153823494911, + 0.20403413383960725, + 0.20097120499610902, + 0.22046247262954713, + 0.2552937029838562, + 0.21473501553535462, + 0.21990597033500672, + 0.19129086129665374, + 0.212379501581192, + 0.16677302420139312, + 0.15547462480068205, + 0.186291242647171, + 0.18397651748657226, + 0.16398042314052583, + 0.1707391785144806, + 0.16971807260513305, + 0.16760108163356782, + 0.16507963252067565, + 0.1741574893474579, + 0.1611321299791336, + 0.1508718879699707, + 0.1727994635283947, + 0.1291253708600998, + 0.1493298847913742, + 0.1369689993739128, + 0.11946097416877746, + 0.13066255633831025, + 0.11778032405376435, + 0.11688732101917267, + 0.11105217039585114, + 0.10557443997859955, + 0.10357953503131867, + 0.10208219905346631, + 0.09509066256284714, + 0.09412468841969968, + 0.09085212640762329, + 0.09300690701007842, + 0.10208991168737412, + 0.09088193004131317, + 0.09341149046421052, + 0.09043532534837723, + 0.0881039730668068, + 0.08196499594449996, + 0.07785149207115173, + 0.07818879878520965, + 0.08360754170417786, + 0.08134148994684219, + 0.07631582351922989, + 0.07548105678558349, + 0.07233029038906097, + 0.07013705761432648, + 0.0682597011089325, + 0.0686048051595688, + 0.06799649763703346, + 0.0662772851228714, + 0.06585792093835771, + 0.06456468963623047, + 0.06448650191426278, + 0.06374172894954681, + 0.06366113255023956, + 0.06288158102035522, + 0.06201381566524505, + 0.061693436133861544, + 0.06130597965121269, + 0.06098243209123611, + 0.06075502749085426, + 0.060538161253929135, + 0.06037251279354095, + 0.060264147567749025, + 0.060201747500896456 + ], + "train_acc": [ + 0.5469, + 0.8466, + 0.8731, + 0.8675, + 0.8726, + 0.8934, + 0.8903, + 0.9035, + 0.9056, + 0.9159, + 0.9072, + 0.9191, + 0.9196, + 0.9081, + 0.8992, + 0.9099, + 0.9158, + 0.9243, + 0.9152, + 0.9351, + 0.9413, + 0.9245, + 0.9283, + 0.9337, + 0.9353, + 0.9357, + 0.9329, + 0.9358, + 0.931, + 0.9387, + 0.9413, + 0.9337, + 0.9518, + 0.9419, + 0.945, + 0.9548, + 0.9509, + 0.9574, + 0.9556, + 0.9605, + 0.9631, + 0.9646, + 0.9651, + 0.9708, + 0.9709, + 0.9736, + 0.9711, + 0.9635, + 0.9714, + 0.9693, + 0.9719, + 0.9699, + 0.9779, + 0.9786, + 0.9795, + 0.9744, + 0.9765, + 0.9797, + 0.9796, + 0.9828, + 0.9838, + 0.9862, + 0.9861, + 0.9862, + 0.9869, + 0.9876, + 0.9883, + 0.9879, + 0.9884, + 0.9893, + 0.9888, + 0.9893, + 0.9892, + 0.9899, + 0.9896, + 0.9901, + 0.9901, + 0.9901, + 0.9901, + 0.9901 + ], + "test_acc": [ + 0.803, + 0.8665, + 0.8645, + 0.8795, + 0.8855, + 0.8825, + 0.8945, + 0.885, + 0.889, + 0.8915, + 0.8925, + 0.898, + 0.905, + 0.8975, + 0.884, + 0.8955, + 0.9, + 0.902, + 0.902, + 0.916, + 0.907, + 0.9015, + 0.9105, + 0.896, + 0.9095, + 0.916, + 0.9225, + 0.9055, + 0.9095, + 0.916, + 0.9135, + 0.907, + 0.9135, + 0.9115, + 0.9085, + 0.9065, + 0.9185, + 0.914, + 0.914, + 0.916, + 0.9185, + 0.9185, + 0.9225, + 0.921, + 0.921, + 0.9205, + 0.9195, + 0.9165, + 0.9215, + 0.926, + 0.9245, + 0.9255, + 0.922, + 0.923, + 0.926, + 0.9225, + 0.9245, + 0.9245, + 0.9235, + 0.922, + 0.923, + 0.924, + 0.924, + 0.924, + 0.9255, + 0.927, + 0.925, + 0.927, + 0.925, + 0.9265, + 0.925, + 0.9265, + 0.9245, + 0.926, + 0.9265, + 0.926, + 0.9255, + 0.926, + 0.926, + 0.926 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.808335542678833, + 0.780368447303772, + 0.7579712271690369, + 0.7386088371276855 + ], + "perturbation_rho": [ + 0.9999986886978149, + 0.999996542930603, + 0.9999827146530151, + 0.9999296069145203 + ], + "nudging": { + "0.001": [ + -0.024415872991085052, + -0.010280027985572815, + -0.0043833074159920216, + -0.002259491942822933 + ], + "0.003": [ + -0.06437402963638306, + -0.029320701956748962, + -0.012876948341727257, + -0.006704050116240978 + ], + "0.01": [ + -0.13544964790344238, + -0.08136264234781265, + -0.039826083928346634, + -0.02149367332458496 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.217821652793884, + 1.3246940484046936, + 0.7493350847244262, + 0.538270884513855, + 0.44736879706382754, + 0.3983163408279419, + 0.39004899067878723, + 0.3853191681861877, + 0.41915534315109254, + 0.39315735092163084, + 0.47443838696479795, + 0.4305809484481812, + 0.4602065758705139, + 0.4855801467895508, + 0.544716870880127, + 0.6184461592674255, + 0.48602481198310854, + 0.511720466041565, + 0.5636395650863647, + 0.5762063206672668, + 0.6417800651550293, + 0.6123115917682648, + 0.5502352278709411, + 0.5557829687118531, + 0.6617294226646423, + 0.6650739029884338, + 0.7917305309295655, + 0.6830677656173706, + 0.5279762314796448, + 0.5275279850006104, + 0.7316341178894042, + 0.8045071473598481, + 0.5481081441879272, + 0.6501041484832764, + 0.670727561199665, + 0.4684417116165161, + 0.6186270072937011, + 0.466635973739624, + 0.5074456503868103, + 0.5474989008903504, + 0.6431586159706115, + 0.5485258643150329, + 0.5743701865196228, + 0.6116557616233825, + 0.49257451605796815, + 0.45059744175672534, + 0.442867475605011, + 0.41883020987510683, + 0.48730407762527467, + 0.4751015350818634, + 0.4839245565414429, + 0.6619925937652588, + 0.4038557548522949, + 0.42862871398925784, + 0.42465049457550047, + 0.4021777713537216, + 0.3575906034708023, + 0.37100726470947265, + 0.44350298371315, + 0.37363572471141815, + 0.35096964074373244, + 0.3305072016239166, + 0.3425370252609253, + 0.33376783447265623, + 0.33789163026809693, + 0.3560477269053459, + 0.33696223058700564, + 0.3281270618438721, + 0.3405058237075806, + 0.3135561194419861, + 0.3187324108123779, + 0.3193257817268372, + 0.31392969816923144, + 0.3078404443740845, + 0.3086083073616028, + 0.30346697087287905, + 0.3060754126548767, + 0.3020245785713196, + 0.3013403681755066, + 0.3004632753372192 + ], + "train_acc": [ + 0.1919, + 0.5281, + 0.7258, + 0.7963, + 0.8319, + 0.8494, + 0.8467, + 0.8535, + 0.8446, + 0.8508, + 0.8274, + 0.8414, + 0.8308, + 0.8218, + 0.8056, + 0.7906, + 0.8203, + 0.8164, + 0.8014, + 0.801, + 0.7813, + 0.7929, + 0.8008, + 0.8026, + 0.7794, + 0.7745, + 0.7558, + 0.7777, + 0.8133, + 0.8094, + 0.7677, + 0.7531, + 0.8023, + 0.7904, + 0.7811, + 0.828, + 0.7935, + 0.8292, + 0.8167, + 0.8113, + 0.7979, + 0.8091, + 0.8019, + 0.7991, + 0.8229, + 0.8322, + 0.8354, + 0.8504, + 0.828, + 0.8261, + 0.8283, + 0.8013, + 0.8476, + 0.8422, + 0.8432, + 0.8514, + 0.8646, + 0.862, + 0.8393, + 0.8586, + 0.8673, + 0.8731, + 0.8716, + 0.8738, + 0.8731, + 0.8669, + 0.8707, + 0.8738, + 0.8703, + 0.8794, + 0.8792, + 0.8773, + 0.8792, + 0.8832, + 0.8817, + 0.8849, + 0.8831, + 0.8865, + 0.8856, + 0.8849 + ], + "test_acc": [ + 0.3755, + 0.6615, + 0.758, + 0.8, + 0.807, + 0.8035, + 0.812, + 0.8155, + 0.832, + 0.7705, + 0.804, + 0.799, + 0.796, + 0.7725, + 0.6785, + 0.7665, + 0.7685, + 0.7155, + 0.774, + 0.726, + 0.68, + 0.6745, + 0.763, + 0.7305, + 0.602, + 0.661, + 0.627, + 0.684, + 0.742, + 0.741, + 0.6955, + 0.773, + 0.676, + 0.597, + 0.7755, + 0.7595, + 0.7705, + 0.7325, + 0.71, + 0.716, + 0.707, + 0.6835, + 0.7205, + 0.7695, + 0.7395, + 0.742, + 0.746, + 0.7305, + 0.768, + 0.7255, + 0.72, + 0.762, + 0.797, + 0.749, + 0.788, + 0.813, + 0.7895, + 0.7935, + 0.798, + 0.8085, + 0.8275, + 0.8285, + 0.8155, + 0.8315, + 0.814, + 0.8125, + 0.829, + 0.8125, + 0.834, + 0.8345, + 0.834, + 0.833, + 0.8285, + 0.833, + 0.8365, + 0.829, + 0.834, + 0.8415, + 0.8385, + 0.8375 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.028116505593061447, + 0.29581546783447266, + 0.170908123254776, + 0.12216862291097641 + ], + "perturbation_rho": [ + -0.07312458753585815, + 0.3015226125717163, + 0.09657395631074905, + 0.12382403016090393 + ], + "nudging": { + "0.001": [ + 0.0003163664659950882, + -0.0007488747360184789, + -0.0004035384044982493, + -0.0003090125974267721 + ], + "0.003": [ + 0.000998551258817315, + -0.0022399011068046093, + -0.0012046258198097348, + -0.0009229769930243492 + ], + "0.01": [ + 0.0038727924693375826, + -0.007415304891765118, + -0.0039948043413460255, + -0.0030613194685429335 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7790241302490235, + 0.7654216047286987, + 0.46630783150196076, + 0.47609069652557373, + 0.5295370441436767, + 0.6392696193695069, + 0.8025703903675079, + 0.8035835893630981, + 0.7054816937446594, + 0.7188894889831543, + 0.723155996131897, + 0.7175666692256928, + 0.7450492376327514, + 0.8028973734855652, + 0.7876711024284363, + 0.8558139623641968, + 0.9155208786010742, + 0.9130255826950073, + 0.8950250951766968, + 0.8848126942634582, + 0.8685707977294922, + 0.8587310639381409, + 0.8291590257644653, + 0.8409093645095825, + 0.8759365214824677, + 0.8694478960990906, + 0.8698111413955688, + 0.8271794857025146, + 0.7845186081886292, + 0.7641353513717651, + 0.8730007939338684, + 0.7617129602432251, + 0.8081050999641418, + 0.7825005729675293, + 0.8260969108581543, + 0.788632160949707, + 0.785611438369751, + 0.7567414481163025, + 0.7519236874580383, + 0.7204991332054138, + 0.6952073329925537, + 0.6957939908981323, + 0.6553646293640136, + 0.6512393726348877, + 0.6812118953704834, + 0.6507732427597046, + 0.6394011632919312, + 0.6314525890350342, + 0.6011349618911743, + 0.6011737225532532, + 0.6056679985046387, + 0.5851486385583877, + 0.5611786159515381, + 0.5698102533340454, + 0.573320036649704, + 0.5536427591323853, + 0.5558445056915283, + 0.5360203624725342, + 0.5445126184463501, + 0.5587158493041993, + 0.5366106060028076, + 0.5330157579421997, + 0.5352685430526734, + 0.5297672599315644, + 0.5239216472625733, + 0.5195175980091095, + 0.5199703005313874, + 0.5157433489561081, + 0.5121160847663879, + 0.5126092442512512, + 0.5086378963470459, + 0.5108375263214111, + 0.5078012703418732, + 0.5062523377895355, + 0.5038812646865845, + 0.5041313044309617, + 0.5022756348133087, + 0.5015905421257019, + 0.5012978015899658, + 0.5010596646308899 + ], + "train_acc": [ + 0.3594, + 0.7146, + 0.8235, + 0.8186, + 0.8051, + 0.7814, + 0.7432, + 0.7361, + 0.7595, + 0.7514, + 0.7429, + 0.74, + 0.7308, + 0.7178, + 0.7278, + 0.7089, + 0.6963, + 0.7038, + 0.7026, + 0.7037, + 0.7077, + 0.7078, + 0.7158, + 0.7134, + 0.7102, + 0.712, + 0.715, + 0.7232, + 0.7355, + 0.7393, + 0.7201, + 0.7444, + 0.7367, + 0.7377, + 0.7323, + 0.7432, + 0.7453, + 0.7439, + 0.7481, + 0.7521, + 0.7572, + 0.757, + 0.7669, + 0.7734, + 0.7688, + 0.7735, + 0.7733, + 0.7809, + 0.7902, + 0.7857, + 0.7875, + 0.7929, + 0.7995, + 0.7974, + 0.7971, + 0.8058, + 0.8039, + 0.8103, + 0.8086, + 0.8045, + 0.8106, + 0.8073, + 0.8086, + 0.8128, + 0.8122, + 0.8158, + 0.8171, + 0.8151, + 0.8149, + 0.8175, + 0.8169, + 0.8165, + 0.8181, + 0.8173, + 0.82, + 0.8182, + 0.8196, + 0.8202, + 0.82, + 0.8192 + ], + "test_acc": [ + 0.61, + 0.777, + 0.8045, + 0.7855, + 0.7695, + 0.743, + 0.699, + 0.728, + 0.7265, + 0.7325, + 0.717, + 0.722, + 0.697, + 0.725, + 0.685, + 0.6885, + 0.6915, + 0.677, + 0.685, + 0.6855, + 0.671, + 0.7015, + 0.6895, + 0.69, + 0.6625, + 0.6745, + 0.6885, + 0.7165, + 0.718, + 0.7145, + 0.7225, + 0.715, + 0.7155, + 0.7125, + 0.72, + 0.732, + 0.7175, + 0.7335, + 0.74, + 0.7355, + 0.7315, + 0.7365, + 0.742, + 0.731, + 0.755, + 0.7395, + 0.7525, + 0.7595, + 0.775, + 0.7535, + 0.776, + 0.773, + 0.779, + 0.7765, + 0.7815, + 0.7785, + 0.787, + 0.785, + 0.784, + 0.777, + 0.7825, + 0.7805, + 0.78, + 0.7915, + 0.78, + 0.7855, + 0.784, + 0.784, + 0.787, + 0.7865, + 0.782, + 0.79, + 0.7875, + 0.7845, + 0.785, + 0.7875, + 0.789, + 0.788, + 0.788, + 0.788 + ], + "state_pred_error": [ + 0.731694634437561, + 0.23417646443843843, + 0.16782856330871582, + 0.16226573445796966, + 0.17099161510467528, + 0.18394631323814392, + 0.2019855978012085, + 0.2017958946466446, + 0.18371798615455628, + 0.16329481868743898, + 0.14329309587478636, + 0.12559115798473358, + 0.11022487533092498, + 0.09227231090068817, + 0.08201295229792595, + 0.0791339715719223, + 0.08487667949199676, + 0.08578719186782836, + 0.08310736228227615, + 0.07845945283174514, + 0.07394840196371079, + 0.07031645606756211, + 0.06856394438743592, + 0.06723007636070251, + 0.06694858776330948, + 0.06499523911476135, + 0.0608354157447815, + 0.058438737750053406, + 0.05698145393133163, + 0.052568575745821, + 0.050997378104925155, + 0.05048060681819916, + 0.05061923050284386, + 0.050916296947002414, + 0.05144686884880066, + 0.049674761563539505, + 0.04818300241231918, + 0.04592841443419456, + 0.04362559068500996, + 0.04214356968998909, + 0.040407472240924835, + 0.0395667809009552, + 0.03697864121794701, + 0.035583154261112214, + 0.034380488550662995, + 0.033168623971939086, + 0.03175738565921783, + 0.030352817764878273, + 0.02928148764371872, + 0.028111288553476332, + 0.027019555035233497, + 0.025773531574010848, + 0.024918644481897356, + 0.02384750773906708, + 0.022921911144256592, + 0.02203721873164177, + 0.021401436349749565, + 0.020324303320050238, + 0.01945747507214546, + 0.019061913284659386, + 0.018533632457256317, + 0.01755019921064377, + 0.017115412124991417, + 0.01673678147494793, + 0.016080432334542274, + 0.015739672049880027, + 0.014881113383173942, + 0.014514415556192399, + 0.014839580875635148, + 0.013830390541255474, + 0.013450295147299767, + 0.013125950311124325, + 0.01287915479838848, + 0.012489116263389588, + 0.012440057030320167, + 0.012103424173593521, + 0.011794415658712388, + 0.011523600345849991, + 0.011835576038062573, + 0.011463819001615047 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8812471032142639, + 0.4430118799209595, + 0.14485391974449158, + 0.12024529278278351 + ], + "perturbation_rho": [ + 0.803270697593689, + 0.4108988642692566, + 0.12428833544254303, + 0.13494184613227844 + ], + "nudging": { + "0.001": [ + -0.024419698864221573, + -0.0013216643128544092, + -0.0002967847976833582, + -0.00024071265943348408 + ], + "0.003": [ + -0.07050125300884247, + -0.003957290668040514, + -0.000889409682713449, + -0.0007224518340080976 + ], + "0.01": [ + -0.20551547408103943, + -0.01310029998421669, + -0.0029572518542408943, + -0.0024035971146076918 + ] + }, + "state_pred_error_per_layer": [ + 6307.859375, + 4221.2177734375, + 3825.8369140625, + 3284.16064453125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2233777091979983, + 1.3201545307159424, + 0.7576372374534607, + 0.5368822441101074, + 0.4500424364089966, + 0.38826052474975586, + 0.39760261478424075, + 0.37347561759948733, + 0.3910197820663452, + 0.4118315992355347, + 0.540269495010376, + 0.42307977981567385, + 0.5061588063240051, + 0.4734330579280853, + 0.4749123188257217, + 0.5071706413269043, + 0.5010161249160766, + 0.6885399580955506, + 0.544177054977417, + 0.5456480445146561, + 0.6398725945472717, + 0.5177282638072968, + 0.614991586971283, + 0.8017618133783341, + 0.6560545772552491, + 0.6096531329154968, + 0.6245969655513763, + 0.7609677839279175, + 0.6611320633172989, + 0.6679078796386718, + 0.8986292762756347, + 1.0624667304039002, + 1.1147180395126344, + 1.1291320568084717, + 1.0890060359954834, + 0.9963282011032104, + 0.9234770161628724, + 0.8350841384887695, + 0.7985178932189941, + 0.7377351993560791, + 0.6755618171691895, + 0.6427918606758117, + 0.6642848100662232, + 0.6907006132125855, + 0.7195065155029297, + 0.7240495725631714, + 0.7414470927238465, + 0.7254366884231568, + 0.7317997849464416, + 0.7184565709114075, + 0.7197928576469421, + 0.736747712135315, + 0.7459960594177246, + 0.7461433578968049, + 0.7599917417526245, + 0.7754338600158691, + 0.7704233293533325, + 0.7772411148071289, + 0.7732292792320251, + 0.7953451323509216, + 0.7916302759170533, + 0.7988780770301819, + 0.7872319763183594, + 0.7829252526283265, + 0.7787840461730957, + 0.7778675572395325, + 0.769661307477951, + 0.758454351234436, + 0.7563795409679412, + 0.7561245315551758, + 0.7567275346755982, + 0.7507296043395996, + 0.7509326208114624, + 0.7505197130203247, + 0.749734306716919, + 0.7463954158782959, + 0.7466216814041138, + 0.7459904764175415, + 0.7456792185783386, + 0.7455195524215699 + ], + "train_acc": [ + 0.1943, + 0.5348, + 0.7198, + 0.799, + 0.8296, + 0.8514, + 0.8485, + 0.8563, + 0.8515, + 0.8431, + 0.8126, + 0.8404, + 0.8209, + 0.8292, + 0.8287, + 0.8186, + 0.819, + 0.7762, + 0.809, + 0.8056, + 0.793, + 0.8161, + 0.7959, + 0.7597, + 0.7784, + 0.7888, + 0.7822, + 0.7508, + 0.7724, + 0.7708, + 0.7283, + 0.7004, + 0.6836, + 0.6831, + 0.689, + 0.6989, + 0.7143, + 0.7324, + 0.7395, + 0.7549, + 0.7631, + 0.7728, + 0.7685, + 0.7624, + 0.754, + 0.7545, + 0.7474, + 0.7515, + 0.749, + 0.7485, + 0.7501, + 0.7473, + 0.7401, + 0.7421, + 0.7359, + 0.7375, + 0.7374, + 0.7341, + 0.7342, + 0.7265, + 0.7332, + 0.731, + 0.7336, + 0.733, + 0.7325, + 0.736, + 0.7365, + 0.7374, + 0.7408, + 0.7383, + 0.7403, + 0.7414, + 0.7393, + 0.7371, + 0.7397, + 0.7404, + 0.7394, + 0.7412, + 0.7414, + 0.7407 + ], + "test_acc": [ + 0.3715, + 0.648, + 0.7525, + 0.7905, + 0.819, + 0.826, + 0.806, + 0.8, + 0.807, + 0.7125, + 0.8075, + 0.8035, + 0.761, + 0.728, + 0.7605, + 0.7535, + 0.6975, + 0.7105, + 0.679, + 0.6655, + 0.79, + 0.72, + 0.6645, + 0.7405, + 0.724, + 0.7155, + 0.7075, + 0.744, + 0.7375, + 0.7115, + 0.646, + 0.615, + 0.6355, + 0.6425, + 0.6855, + 0.693, + 0.6975, + 0.7135, + 0.7245, + 0.7355, + 0.744, + 0.7495, + 0.7445, + 0.726, + 0.7345, + 0.7295, + 0.7375, + 0.7205, + 0.7325, + 0.7325, + 0.7315, + 0.725, + 0.7175, + 0.717, + 0.7235, + 0.722, + 0.7205, + 0.7155, + 0.7065, + 0.7145, + 0.711, + 0.717, + 0.72, + 0.7205, + 0.714, + 0.7105, + 0.7145, + 0.7235, + 0.729, + 0.7285, + 0.7265, + 0.725, + 0.73, + 0.728, + 0.728, + 0.7275, + 0.7295, + 0.731, + 0.732, + 0.7305 + ], + "value_loss": [ + 2.8550353353500366, + 0.8866892028808594, + 0.7480095406532288, + 0.6082758625984191, + 0.5294733749389648, + 0.4669463201522827, + 0.5216086049079895, + 0.4541858399868011, + 0.4832085543632507, + 0.5550105792999268, + 0.9533118436336517, + 0.6223780393600464, + 0.8233321074962616, + 0.7200716451644897, + 0.7445190457582473, + 0.761704793548584, + 0.7307724816322326, + 1.308116909313202, + 0.847868885421753, + 0.8612865437030792, + 1.1462507836341858, + 0.8061599975585938, + 1.0712029182434082, + 1.6493792618513108, + 1.0849245027542114, + 0.9315045223712921, + 0.9024537401676178, + 1.1654763233184815, + 0.831434667301178, + 0.802046495628357, + 1.4604990215301514, + 1.8645850904464722, + 1.9254398429870605, + 1.901911312484741, + 1.908003631401062, + 1.3320872589588166, + 1.159297624206543, + 1.0534205688476563, + 1.022995594406128, + 0.8503112316131591, + 0.6928019966125488, + 0.5846758200645447, + 0.6259316144943238, + 0.737749203491211, + 0.7123853011608123, + 0.7282990433692932, + 0.7251070489883423, + 0.6488828766226769, + 0.6383351172924042, + 0.5482705329895019, + 0.5401105587005616, + 0.6111136708259582, + 0.6008573663949967, + 0.5928836660385132, + 0.587500508594513, + 0.6057562492847443, + 0.5744828891277314, + 0.5471131669998169, + 0.5470271216392517, + 0.5842728374481201, + 0.5563190423965454, + 0.5892029490470886, + 0.5781536190032959, + 0.559272833108902, + 0.5027279161453247, + 0.5155309186935425, + 0.4943126286268234, + 0.48159287810325624, + 0.47510195388793947, + 0.4727193992614746, + 0.4602918514728546, + 0.4717276556968689, + 0.4678098875999451, + 0.44807784576416015, + 0.4467434461593628, + 0.4619509654998779, + 0.4547319677352905, + 0.4616655399799347, + 0.4558076531887054, + 0.454630423784256 + ], + "term_loss": [ + 1.6017029710769652, + 0.5620692476034165, + 0.5624156644821167, + 0.45781700096130373, + 0.3847409117221832, + 0.3312454249382019, + 0.38407751197814943, + 0.32735779056549075, + 0.3551049388170242, + 0.41827326583862307, + 0.7827223787307739, + 0.4792309603691101, + 0.6631194186210633, + 0.56457426404953, + 0.5845303027391434, + 0.5921518229961396, + 0.560609471321106, + 1.0828363707065582, + 0.6606335117340087, + 0.6683305771827698, + 0.9340125537872315, + 0.6249504384040833, + 0.8550516845703126, + 1.3669306713342666, + 0.8527113088130951, + 0.7162394056797028, + 0.682893370962143, + 0.9105785119056702, + 0.6048965015590191, + 0.5712942959785462, + 1.1673702945709228, + 1.5335067611694335, + 1.5751249431610108, + 1.5584389656066895, + 1.5522349954605104, + 0.9972099202394485, + 0.8370615739822388, + 0.754201112651825, + 0.6871392876505852, + 0.5123987158775329, + 0.37408054313659667, + 0.2995497988522053, + 0.3503581358909607, + 0.43231560316085815, + 0.41566086394786833, + 0.42524624509811404, + 0.4210509229183197, + 0.37233240249752997, + 0.3575580341219902, + 0.28671212253570555, + 0.276478619146347, + 0.34283951930999756, + 0.33277941216230394, + 0.32401346683502197, + 0.3095528627634048, + 0.33110152459144593, + 0.3003123944878578, + 0.27548920292854306, + 0.2802939491033554, + 0.3095864547729492, + 0.28826558628082277, + 0.3132749440193176, + 0.30294250259399413, + 0.2914313010454178, + 0.23652310552597045, + 0.25194979372024534, + 0.23297107075452805, + 0.22141846432685852, + 0.213679298555851, + 0.21105558428764343, + 0.198782471460104, + 0.21103085417747497, + 0.20293742198944092, + 0.18831457014083863, + 0.18615080082416535, + 0.19670715589523316, + 0.19051085848808288, + 0.19064104088544845, + 0.18662560603618622, + 0.185297670173645 + ], + "bridge_loss": [ + 0.9507376404299052, + 0.07687758333981037, + 0.010045724719017744, + 0.007879937368631363, + 0.01797304810285568, + 0.022158381700515747, + 0.01883206216990948, + 0.013739564181864262, + 0.009246241227537394, + 0.00828621684461832, + 0.013158259350061416, + 0.009157512763142585, + 0.008230384607613087, + 0.010887455415725708, + 0.01082873924607411, + 0.011825704242289067, + 0.011146052476763726, + 0.020588019510917367, + 0.014733550934493541, + 0.018946828547120095, + 0.0171926746442914, + 0.012086341893672943, + 0.02020258846729994, + 0.04198084568008781, + 0.020474260175228118, + 0.017216893035918474, + 0.016566254922747613, + 0.02010813295543194, + 0.011718014118075371, + 0.009661335621774196, + 0.014811528635025025, + 0.025247243924438955, + 0.02885524544119835, + 0.02420730111002922, + 0.04327671680450439, + 0.041912767720222475, + 0.05198930660188198, + 0.04971838068962097, + 0.0946202084183693, + 0.10887049219608307, + 0.09956775677204133, + 0.07377382544577121, + 0.05807075983285904, + 0.07968466079235077, + 0.06396899864077568, + 0.07015788811445237, + 0.0661502730846405, + 0.04226519621908665, + 0.04419996572732925, + 0.02805532423853874, + 0.02968351852297783, + 0.03154238290339708, + 0.030124809206277133, + 0.030319892784953117, + 0.03490727263391018, + 0.029208701252937317, + 0.030425633952021598, + 0.027547460222244264, + 0.02228509824424982, + 0.025416205316781997, + 0.020846416425704957, + 0.025860949020087717, + 0.029329672813415527, + 0.02281882424093783, + 0.02173859670162201, + 0.02062494530826807, + 0.019635991206765176, + 0.021509875628352167, + 0.024021596324443818, + 0.02360761443376541, + 0.023896243134140967, + 0.024439388674497603, + 0.028702323484420776, + 0.022215539541840554, + 0.02425522618293762, + 0.029845060449838638, + 0.029500862574577333, + 0.03606419536471367, + 0.03410082252025604, + 0.03432008520960808 + ], + "tgrad_loss": [ + 0.3025947289943695, + 0.24774237773418425, + 0.17554815773963928, + 0.14257892484664916, + 0.12675941741466523, + 0.11354251420497895, + 0.11869904023408889, + 0.11308848708868027, + 0.11885737178325653, + 0.12845109815597533, + 0.15743120503425598, + 0.1339895663022995, + 0.1519823107242584, + 0.14460992698669434, + 0.14916000380814076, + 0.1577272620677948, + 0.15901696157455444, + 0.2046925228357315, + 0.17250181584358215, + 0.17400914220809938, + 0.19504555777311325, + 0.16912321989536286, + 0.19594864068031312, + 0.2404677330493927, + 0.21173893311023712, + 0.1980482220649719, + 0.20299411978721618, + 0.23478967311382293, + 0.21482015360593795, + 0.22109085936546324, + 0.27831719441413877, + 0.3058310720920563, + 0.32145967130661013, + 0.3192650461196899, + 0.31249191117286684, + 0.29296456089019773, + 0.27024675250053404, + 0.2495010799407959, + 0.24123610022068023, + 0.2290420253276825, + 0.21915370206832885, + 0.21135219641923905, + 0.21750271730422974, + 0.22574893996715545, + 0.23275544457435607, + 0.23289490954875947, + 0.2379058575630188, + 0.23428526936769486, + 0.23657712292671204, + 0.23350308730602265, + 0.23394841928482055, + 0.23673176517486572, + 0.2379531442165375, + 0.23855031342506408, + 0.2430403748035431, + 0.2454460260629654, + 0.24374487085342408, + 0.24407650451660157, + 0.24444807255268097, + 0.24927017650604247, + 0.24720704221725465, + 0.25006705377101895, + 0.245881445145607, + 0.24502270793914796, + 0.24446621508598326, + 0.24295618000030517, + 0.24170556166172028, + 0.23866453852653505, + 0.23740106127262114, + 0.23805620374679565, + 0.23761313960552216, + 0.23625741076469423, + 0.2361701448917389, + 0.23754773426055908, + 0.23633741874694825, + 0.23539874830245971, + 0.2347202454328537, + 0.234960302066803, + 0.23508122134208678, + 0.2350126650452614 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03434538468718529, + 0.12379913777112961, + 0.1433446854352951, + 0.13808263838291168 + ], + "perturbation_rho": [ + 0.03924814611673355, + 0.21971622109413147, + 0.26409071683883667, + 0.20994533598423004 + ], + "nudging": { + "0.001": [ + -0.002085629850625992, + -0.000930527166929096, + -0.0010337861021980643, + -0.0009522428154014051 + ], + "0.003": [ + -0.00620113592594862, + -0.002788654062896967, + -0.00309766735881567, + -0.002854354679584503 + ], + "0.01": [ + -0.020018436014652252, + -0.00925234891474247, + -0.010285570286214352, + -0.009476927109062672 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L4_s42.json b/results/synth_ladder_v2_lo/synth_a0.0_L4_s42.json new file mode 100644 index 0000000..ea8fed5 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L4_s42.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.393444329071045, + 0.4656594688892364, + 0.3387208812713623, + 0.3310880187511444, + 0.2834443459033966, + 0.274416100025177, + 0.27555663251876833, + 0.2919650815010071, + 0.27522954301834107, + 0.23417099084854126, + 0.25085752539634704, + 0.23627781853675842, + 0.22855967761278154, + 0.18523962483406067, + 0.21957328805923462, + 0.21457258567810059, + 0.1951643503189087, + 0.2028646148085594, + 0.17204643013477325, + 0.1741173769235611, + 0.17967198448181151, + 0.2015627604007721, + 0.18227966165542603, + 0.1597546272277832, + 0.18108189311623574, + 0.13940092482566835, + 0.17725008516311647, + 0.16082020609378814, + 0.14163353414535523, + 0.18069012370109558, + 0.13981632175445557, + 0.17373259100914, + 0.14335163850188257, + 0.11797005029916763, + 0.1098598550081253, + 0.12287375556230545, + 0.11599228973388671, + 0.13744940540790557, + 0.11864437719583511, + 0.10169189417362214, + 0.11369898817539215, + 0.11818749423027039, + 0.12267465643882751, + 0.10739170112609864, + 0.10322156901359558, + 0.09787526609897614, + 0.09492687509059906, + 0.09019990837574005, + 0.09442386355400086, + 0.08670992460250855, + 0.08388052983283996, + 0.09170566325187683, + 0.08163954379558563, + 0.0846316162109375, + 0.07659096655249596, + 0.07475700554847717, + 0.07641377507448197, + 0.07337763814926147, + 0.072775554728508, + 0.0721108490049839, + 0.06907813559770584, + 0.06751610193252564, + 0.06612331621646882, + 0.06645804003477096, + 0.06647891576737165, + 0.06381897580623627, + 0.06374451096057891, + 0.06368994359970093, + 0.06230272837877274, + 0.06174979591369629, + 0.061164255321025846, + 0.06092808446884155, + 0.06049565544426441, + 0.05998984745144844, + 0.05971836262345314, + 0.05945266941785812, + 0.0592673523157835, + 0.059102416515350344, + 0.05901545432806015, + 0.058958782851696014 + ], + "train_acc": [ + 0.5424, + 0.8445, + 0.872, + 0.8691, + 0.8872, + 0.8945, + 0.8899, + 0.8867, + 0.8926, + 0.908, + 0.9016, + 0.9067, + 0.9102, + 0.9315, + 0.9151, + 0.915, + 0.923, + 0.9194, + 0.9324, + 0.9339, + 0.931, + 0.9216, + 0.9259, + 0.9363, + 0.927, + 0.9478, + 0.9299, + 0.9384, + 0.9472, + 0.9319, + 0.9471, + 0.9343, + 0.9444, + 0.9583, + 0.9624, + 0.957, + 0.9581, + 0.949, + 0.9573, + 0.9665, + 0.9617, + 0.9571, + 0.9557, + 0.9597, + 0.9643, + 0.9678, + 0.9689, + 0.9725, + 0.9692, + 0.9744, + 0.9771, + 0.9728, + 0.9764, + 0.9742, + 0.9821, + 0.9815, + 0.9798, + 0.9822, + 0.983, + 0.9823, + 0.9865, + 0.986, + 0.9874, + 0.9871, + 0.9859, + 0.9891, + 0.9891, + 0.9885, + 0.9899, + 0.9905, + 0.9909, + 0.9915, + 0.9915, + 0.9914, + 0.9918, + 0.992, + 0.9922, + 0.9921, + 0.9923, + 0.9924 + ], + "test_acc": [ + 0.806, + 0.8735, + 0.8755, + 0.8855, + 0.8975, + 0.8865, + 0.8865, + 0.8855, + 0.896, + 0.897, + 0.9005, + 0.901, + 0.9055, + 0.9075, + 0.895, + 0.905, + 0.903, + 0.8995, + 0.9155, + 0.91, + 0.912, + 0.909, + 0.9155, + 0.9125, + 0.9175, + 0.909, + 0.913, + 0.9085, + 0.917, + 0.913, + 0.9215, + 0.9195, + 0.919, + 0.9195, + 0.923, + 0.919, + 0.9155, + 0.9115, + 0.926, + 0.92, + 0.9215, + 0.922, + 0.9235, + 0.921, + 0.921, + 0.921, + 0.922, + 0.9245, + 0.9255, + 0.93, + 0.924, + 0.923, + 0.926, + 0.9225, + 0.9265, + 0.925, + 0.9255, + 0.923, + 0.9235, + 0.925, + 0.929, + 0.925, + 0.923, + 0.9235, + 0.9275, + 0.9245, + 0.924, + 0.924, + 0.925, + 0.925, + 0.925, + 0.9245, + 0.925, + 0.926, + 0.925, + 0.925, + 0.9255, + 0.9255, + 0.9255, + 0.925 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8599773645401001, + 0.8422204256057739, + 0.8250665664672852, + 0.8009470701217651 + ], + "perturbation_rho": [ + 0.9999991655349731, + 0.9999953508377075, + 0.9999807476997375, + 0.9999338984489441 + ], + "nudging": { + "0.001": [ + -0.021187957376241684, + -0.008892672136425972, + -0.003854521783068776, + -0.002078109886497259 + ], + "0.003": [ + -0.05588283762335777, + -0.02533331699669361, + -0.01131636556237936, + -0.006165246479213238 + ], + "0.01": [ + -0.12188813835382462, + -0.07056954503059387, + -0.034971628338098526, + -0.019762540236115456 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2351631088256836, + 1.2604516805648804, + 0.6909901732444763, + 0.5023803288459778, + 0.4199826082229614, + 0.3939720664024353, + 0.36745505712032317, + 0.36464036779403686, + 0.36945423431396485, + 0.37754397621154784, + 0.41259857263565064, + 0.3929980557441711, + 0.3836580101966858, + 0.42829677181243897, + 0.45100361251831056, + 0.4771954530715942, + 0.45615267324447634, + 0.47997308826446533, + 0.519016338443756, + 0.4339796148777008, + 0.48482293429374695, + 0.4760143366098404, + 0.41006571016311644, + 0.4283779393434525, + 0.4630606350660324, + 0.4736118658065796, + 0.47070072836875915, + 0.5205575771808624, + 0.43153712959289553, + 0.6288577288150787, + 0.49815777282714846, + 0.5681126009941101, + 0.4582767408490181, + 0.4725220314502716, + 0.4469193904876709, + 0.4821565442085266, + 0.4843693884849548, + 0.5006482328891754, + 0.44061602096557617, + 0.4250831531524658, + 0.4099806285858154, + 0.4905092445373535, + 0.5239814792633056, + 0.43106476440429686, + 0.42259651679992677, + 0.4021846671104431, + 0.41326967359781264, + 0.36481091504096985, + 0.3732275875091553, + 0.38772435383796694, + 0.3595582166671753, + 0.4164277789950371, + 0.3571169295310974, + 0.3573374299049377, + 0.3340035634994507, + 0.3495286958694458, + 0.34169850187301637, + 0.36254877605438235, + 0.3357857964515686, + 0.3260487530708313, + 0.3146523279190063, + 0.32904662322998046, + 0.3236200043678284, + 0.3109028839111328, + 0.30532244243621826, + 0.3066009913444519, + 0.29923178367614744, + 0.31248617701530457, + 0.30051798222064974, + 0.29083643901348116, + 0.289837948679924, + 0.28680111265182495, + 0.2866984937429428, + 0.284077316904068, + 0.2823953621149063, + 0.2806439053058624, + 0.28072562822103503, + 0.27919705109596255, + 0.2788663013458252, + 0.2786029499530792 + ], + "train_acc": [ + 0.1823, + 0.5598, + 0.7406, + 0.8059, + 0.8373, + 0.8477, + 0.857, + 0.8613, + 0.859, + 0.8612, + 0.8538, + 0.8613, + 0.8658, + 0.857, + 0.8547, + 0.8475, + 0.8567, + 0.8558, + 0.8472, + 0.864, + 0.854, + 0.8592, + 0.8691, + 0.8692, + 0.8595, + 0.8599, + 0.8604, + 0.8496, + 0.8638, + 0.8323, + 0.8575, + 0.8423, + 0.8613, + 0.8581, + 0.8604, + 0.855, + 0.852, + 0.8511, + 0.8644, + 0.8643, + 0.8698, + 0.8532, + 0.8413, + 0.8641, + 0.8633, + 0.8688, + 0.8668, + 0.8784, + 0.8777, + 0.8732, + 0.8802, + 0.8646, + 0.8806, + 0.8813, + 0.8854, + 0.8824, + 0.8856, + 0.876, + 0.8839, + 0.8899, + 0.8921, + 0.8875, + 0.8856, + 0.8889, + 0.8933, + 0.8918, + 0.8969, + 0.8906, + 0.8936, + 0.8976, + 0.8998, + 0.8993, + 0.8996, + 0.899, + 0.8987, + 0.9003, + 0.8989, + 0.9013, + 0.9017, + 0.9017 + ], + "test_acc": [ + 0.3805, + 0.658, + 0.763, + 0.8055, + 0.802, + 0.799, + 0.8135, + 0.83, + 0.818, + 0.818, + 0.8195, + 0.821, + 0.822, + 0.7695, + 0.8265, + 0.821, + 0.8265, + 0.8005, + 0.8295, + 0.8195, + 0.8175, + 0.837, + 0.825, + 0.7865, + 0.813, + 0.783, + 0.7715, + 0.7985, + 0.767, + 0.8315, + 0.782, + 0.82, + 0.819, + 0.8365, + 0.777, + 0.8205, + 0.7815, + 0.7855, + 0.8065, + 0.823, + 0.835, + 0.774, + 0.805, + 0.812, + 0.8135, + 0.813, + 0.837, + 0.834, + 0.841, + 0.8225, + 0.8385, + 0.8245, + 0.8455, + 0.8425, + 0.8365, + 0.8515, + 0.8475, + 0.8555, + 0.847, + 0.854, + 0.854, + 0.836, + 0.8465, + 0.843, + 0.853, + 0.848, + 0.8515, + 0.849, + 0.8545, + 0.8535, + 0.8525, + 0.8535, + 0.853, + 0.854, + 0.855, + 0.855, + 0.855, + 0.8565, + 0.8555, + 0.856 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.004014266654849052, + 0.16519895195960999, + 0.13244280219078064, + 0.11504888534545898 + ], + "perturbation_rho": [ + 0.042726192623376846, + 0.18379396200180054, + 0.108277827501297, + 0.03345024213194847 + ], + "nudging": { + "0.001": [ + -0.0005973952356725931, + -0.0005849459557794034, + -0.00033618923043832183, + -0.0002846581628546119 + ], + "0.003": [ + -0.0017661447636783123, + -0.0017487092409282923, + -0.0010064283851534128, + -0.0008522539865225554 + ], + "0.01": [ + -0.005573366768658161, + -0.005793239921331406, + -0.003338021691888571, + -0.002831015270203352 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8313716026306153, + 0.7926182842254639, + 0.46973575134277346, + 0.48155548248291014, + 0.5448596946716309, + 0.6645664943695069, + 0.7318389461517334, + 0.7279546222686768, + 0.7492408039093018, + 0.7303381389141083, + 0.7058333037376404, + 0.7079017165184021, + 0.7165615272521972, + 0.7146007489204407, + 0.7339236400604248, + 0.7427304380893708, + 0.760910213470459, + 0.8237569445610047, + 0.7993208209991455, + 0.8246796663284301, + 0.8065732408523559, + 0.8133731035232544, + 0.7934063248634339, + 0.8101628801345825, + 0.8197265989303589, + 0.8273739593505859, + 0.8092071041584015, + 0.7728347238540649, + 0.7805830051422119, + 0.7523685384750366, + 0.6997231612205506, + 0.7115532672405243, + 0.6899057216644288, + 0.7243086003780365, + 0.7161950044155121, + 0.6915306072235108, + 0.7306950844287873, + 0.7001749244689941, + 0.7435074928283691, + 0.7183393833160401, + 0.6917117639541626, + 0.6912902464389801, + 0.7219114833831787, + 0.7060039350509644, + 0.7032419225692749, + 0.7001213099002838, + 0.6712141176223755, + 0.6735524456977844, + 0.6646129000663757, + 0.6637430681228638, + 0.6549304262876511, + 0.6523052272796631, + 0.6376511907577515, + 0.6561032221794129, + 0.6557626156806946, + 0.6385821124076844, + 0.6371082330703736, + 0.622728742980957, + 0.6358778423309326, + 0.6097657412528992, + 0.5984001077651978, + 0.6008862220764161, + 0.6019291736602783, + 0.5893378508806228, + 0.5775623394012451, + 0.5764101420402526, + 0.5693036109924317, + 0.5785774702072144, + 0.5725307025909424, + 0.5699037223815918, + 0.5678042579650879, + 0.5655107064247131, + 0.5588490388393402, + 0.5583755543708802, + 0.5569040360450744, + 0.555097555732727, + 0.5553366912841797, + 0.5538557461977005, + 0.5529845510482788, + 0.5527793859481811 + ], + "train_acc": [ + 0.3425, + 0.7013, + 0.8169, + 0.8155, + 0.8002, + 0.7747, + 0.7521, + 0.7467, + 0.7366, + 0.7402, + 0.7432, + 0.7511, + 0.7483, + 0.7529, + 0.7435, + 0.7501, + 0.7443, + 0.7278, + 0.737, + 0.729, + 0.7347, + 0.7305, + 0.7339, + 0.7327, + 0.7272, + 0.7248, + 0.7394, + 0.7436, + 0.7445, + 0.7497, + 0.7621, + 0.7597, + 0.7682, + 0.7574, + 0.7627, + 0.7629, + 0.7527, + 0.7656, + 0.7528, + 0.7589, + 0.7652, + 0.7627, + 0.7557, + 0.7562, + 0.7584, + 0.7611, + 0.7712, + 0.7672, + 0.7691, + 0.77, + 0.7688, + 0.7715, + 0.7805, + 0.7717, + 0.7726, + 0.7796, + 0.7806, + 0.784, + 0.7781, + 0.7916, + 0.7943, + 0.7897, + 0.788, + 0.7945, + 0.7966, + 0.7954, + 0.7997, + 0.7948, + 0.7941, + 0.7979, + 0.7973, + 0.7998, + 0.8028, + 0.8015, + 0.8024, + 0.8021, + 0.8017, + 0.8049, + 0.8036, + 0.8043 + ], + "test_acc": [ + 0.582, + 0.7605, + 0.805, + 0.7815, + 0.7585, + 0.739, + 0.7315, + 0.7055, + 0.709, + 0.716, + 0.7225, + 0.7035, + 0.714, + 0.7025, + 0.6895, + 0.71, + 0.682, + 0.684, + 0.6935, + 0.6815, + 0.663, + 0.6735, + 0.6475, + 0.6625, + 0.687, + 0.691, + 0.691, + 0.6855, + 0.708, + 0.711, + 0.7175, + 0.7135, + 0.7035, + 0.7, + 0.702, + 0.7015, + 0.719, + 0.69, + 0.722, + 0.7085, + 0.711, + 0.6865, + 0.7155, + 0.693, + 0.727, + 0.717, + 0.726, + 0.7125, + 0.734, + 0.7355, + 0.7235, + 0.721, + 0.7245, + 0.703, + 0.7315, + 0.7205, + 0.733, + 0.735, + 0.745, + 0.7455, + 0.742, + 0.7425, + 0.757, + 0.754, + 0.7545, + 0.754, + 0.7585, + 0.753, + 0.7545, + 0.755, + 0.7585, + 0.7635, + 0.758, + 0.76, + 0.762, + 0.763, + 0.759, + 0.76, + 0.762, + 0.7615 + ], + "state_pred_error": [ + 0.738724960899353, + 0.23754536838531495, + 0.17166675362586975, + 0.16519432184696198, + 0.17659714086055756, + 0.1853035955429077, + 0.18247937891483307, + 0.1752823434829712, + 0.16551947779655457, + 0.15197912480831147, + 0.14014595470428468, + 0.12900954908132553, + 0.11189029586315155, + 0.09048521988391876, + 0.07707659014463425, + 0.06862674397230148, + 0.0619474271774292, + 0.057251011681556704, + 0.05508155573606491, + 0.053471049499511716, + 0.05379626307487488, + 0.05419672028422356, + 0.052421370673179625, + 0.049650419402122496, + 0.047358448946475985, + 0.04709382080435753, + 0.04492674662470818, + 0.04099081097245216, + 0.038694602066278456, + 0.03637899459600449, + 0.035295955044031144, + 0.03464271750450134, + 0.03390544964671135, + 0.0339607761323452, + 0.03294503695368767, + 0.03164411043822765, + 0.030480435860157012, + 0.030075301492214202, + 0.028113591521978377, + 0.027257576552033425, + 0.02627144229412079, + 0.026506870889663695, + 0.024739411950111388, + 0.02403323279619217, + 0.023340081292390822, + 0.022683567291498185, + 0.021613040015101434, + 0.020623113670945166, + 0.01925096574127674, + 0.018227936267852782, + 0.017412171779572962, + 0.01633626956343651, + 0.015502833461761475, + 0.01486019978672266, + 0.014131347727775573, + 0.013682181715965271, + 0.013298307892680168, + 0.012884229637682439, + 0.01228856347501278, + 0.012014592817425727, + 0.011584452259540558, + 0.011723892691731453, + 0.011077864146232606, + 0.010830551779270172, + 0.01048019336760044, + 0.010463275627046823, + 0.010006480371952058, + 0.010270701536536217, + 0.009520307847857476, + 0.009370259954035282, + 0.009139169569313526, + 0.009051338295638561, + 0.0087209147721529, + 0.0086469930768013, + 0.00830997234582901, + 0.008232304611802101, + 0.00801251590847969, + 0.007979873966425657, + 0.007716833171993494, + 0.0075651704967021945 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8646283149719238, + 0.4090673327445984, + 0.1404263973236084, + 0.114067442715168 + ], + "perturbation_rho": [ + 0.7375176548957825, + 0.33617356419563293, + 0.14259827136993408, + 0.06911392509937286 + ], + "nudging": { + "0.001": [ + -0.02527385950088501, + -0.0013827341608703136, + -0.0003888161154463887, + -0.00030949554638937116 + ], + "0.003": [ + -0.07343459129333496, + -0.004140978213399649, + -0.0011658729054033756, + -0.0009282166138291359 + ], + "0.01": [ + -0.218303382396698, + -0.013712376356124878, + -0.003879058640450239, + -0.0030895976815372705 + ] + }, + "state_pred_error_per_layer": [ + 6951.521484375, + 6099.5322265625, + 5877.8310546875, + 3832.076416015625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.235261058425903, + 1.262081871986389, + 0.6915569072723389, + 0.4963927393436432, + 0.41897850689888, + 0.3801000884056091, + 0.3732742650032043, + 0.360334720993042, + 0.40119956569671633, + 0.40856367979049685, + 0.39234666719436645, + 0.38830075261592867, + 0.42427587156295776, + 0.39181271744966506, + 0.3884301266908646, + 0.40899407005310057, + 0.5711139780521393, + 0.44214163110256194, + 0.5412520337820053, + 0.5265979358673095, + 0.6395262619018555, + 0.6767067618846894, + 0.8079449705123901, + 0.8860318534851074, + 0.7464127262115479, + 0.8458122653961182, + 0.8400936029434204, + 0.8388831905364991, + 0.7874737511634826, + 0.8481869525909423, + 0.9002291926383972, + 0.8685866487503052, + 0.9101456764221192, + 0.8837849536895752, + 0.972322064781189, + 0.9345996368408203, + 0.9418193544387817, + 1.0260784551620483, + 0.9719976706504821, + 0.9391058128356934, + 0.9489206720352172, + 0.9835691333770752, + 0.967494802236557, + 0.9707959476470948, + 1.0399179498672486, + 1.0601639880180358, + 0.985697636795044, + 1.008144894504547, + 1.0092436389923096, + 1.0680249240875244, + 1.0354044677734375, + 1.0328852564811706, + 1.015745788383484, + 1.0277701950073241, + 1.0103555604934693, + 1.0488319797515868, + 1.0303876429557801, + 1.0285811204433442, + 1.0417894123077394, + 1.0004704116821288, + 1.0626476989746094, + 0.9951508989334107, + 1.0081708417892457, + 0.9910860794067383, + 0.9883740512847901, + 0.9812014641761779, + 0.9917335124969482, + 0.9694048974990844, + 0.9646705657958984, + 0.9635228799819946, + 0.9591471391677856, + 0.9535331716537475, + 0.9531492277145386, + 0.9459964708328247, + 0.9468160850524903, + 0.9449826847076416, + 0.9444061769485473, + 0.9419779738426208, + 0.940774139881134, + 0.9405258314132691 + ], + "train_acc": [ + 0.1859, + 0.5571, + 0.7419, + 0.8077, + 0.8355, + 0.854, + 0.8566, + 0.8623, + 0.8544, + 0.8542, + 0.8635, + 0.863, + 0.8534, + 0.8702, + 0.8695, + 0.8666, + 0.8423, + 0.8592, + 0.8456, + 0.8478, + 0.8218, + 0.8173, + 0.7867, + 0.777, + 0.7871, + 0.7663, + 0.7597, + 0.7502, + 0.7552, + 0.7402, + 0.7275, + 0.7264, + 0.7154, + 0.721, + 0.7022, + 0.7062, + 0.7027, + 0.6832, + 0.689, + 0.6948, + 0.6911, + 0.68, + 0.6843, + 0.6828, + 0.6613, + 0.6613, + 0.6731, + 0.669, + 0.6672, + 0.6584, + 0.6651, + 0.6658, + 0.6648, + 0.6609, + 0.661, + 0.6587, + 0.6615, + 0.6583, + 0.6597, + 0.6641, + 0.6535, + 0.6622, + 0.6598, + 0.6636, + 0.6656, + 0.6651, + 0.6674, + 0.6666, + 0.6709, + 0.6665, + 0.6731, + 0.6714, + 0.673, + 0.6717, + 0.6727, + 0.6728, + 0.6735, + 0.6738, + 0.6744, + 0.6741 + ], + "test_acc": [ + 0.384, + 0.66, + 0.757, + 0.791, + 0.815, + 0.826, + 0.7975, + 0.8165, + 0.8125, + 0.799, + 0.83, + 0.8025, + 0.8145, + 0.822, + 0.808, + 0.8145, + 0.8015, + 0.8145, + 0.8205, + 0.785, + 0.8, + 0.744, + 0.738, + 0.764, + 0.7405, + 0.713, + 0.729, + 0.7045, + 0.7025, + 0.7025, + 0.677, + 0.6385, + 0.721, + 0.592, + 0.627, + 0.694, + 0.6495, + 0.6515, + 0.637, + 0.6755, + 0.6155, + 0.673, + 0.6715, + 0.628, + 0.6315, + 0.6485, + 0.635, + 0.62, + 0.5955, + 0.622, + 0.636, + 0.63, + 0.637, + 0.643, + 0.6265, + 0.6445, + 0.6375, + 0.6175, + 0.649, + 0.6255, + 0.656, + 0.652, + 0.643, + 0.644, + 0.6555, + 0.6575, + 0.647, + 0.6605, + 0.656, + 0.6575, + 0.6565, + 0.661, + 0.655, + 0.6575, + 0.664, + 0.657, + 0.663, + 0.6585, + 0.6585, + 0.6585 + ], + "value_loss": [ + 2.789435099697113, + 0.8181893708229065, + 0.7272053227424622, + 0.5833633841991425, + 0.5203261951446533, + 0.487560515499115, + 0.5104867960453033, + 0.5071568609237671, + 0.7265350058555603, + 0.6770524631500244, + 0.6544264476060867, + 0.6184350404918194, + 0.82130862698555, + 0.7288621360361576, + 0.6920311128377914, + 0.7491695034027099, + 1.436285315656662, + 0.9137073722839355, + 1.3024319067001342, + 1.1969394775390625, + 1.5527768714904786, + 1.7683637444019318, + 2.1371090829849244, + 2.7897338537216188, + 1.7251617815971374, + 2.1219203945159912, + 1.8316284656524657, + 1.6271437129974364, + 1.533262328338623, + 1.4435790887832642, + 1.425470267868042, + 1.2025170761942863, + 1.3155294904232024, + 1.1143611429214477, + 1.2226881009578705, + 1.4462114141464233, + 1.0543560623168946, + 1.0660594150543212, + 0.9147385849952697, + 0.8270027490615844, + 0.8281644924163818, + 1.0131224609851837, + 0.8204657958984375, + 0.7915476408958435, + 1.0112078512191773, + 0.9825851963043213, + 0.7297250129699707, + 0.7310111741065979, + 0.8675759086608886, + 0.8777669506072998, + 0.7935477031707764, + 0.7559813811302185, + 0.6910819556236267, + 0.7187119407653808, + 0.7091325038909913, + 0.8288764345169067, + 0.6835856030464172, + 0.696506120300293, + 0.7955103742599487, + 0.6248370735168457, + 0.7264847853183747, + 0.6357070183992386, + 0.6640777275085449, + 0.6200332149505615, + 0.6066704128265381, + 0.6134613354206085, + 0.624502198600769, + 0.5682870136260987, + 0.5714269968986512, + 0.5611187159061432, + 0.560384591293335, + 0.5337265998840331, + 0.518946839427948, + 0.5066715524673462, + 0.5192569964408874, + 0.5218038980484009, + 0.515819926071167, + 0.5021115490913391, + 0.5022512309074402, + 0.5270826056480408 + ], + "term_loss": [ + 1.6281806005001067, + 0.5260812068939209, + 0.5574779790878296, + 0.4467624794960022, + 0.38560171570777896, + 0.35132181377410887, + 0.3726922478437424, + 0.3839768423080444, + 0.5983181779623031, + 0.5458563985824585, + 0.5328782257556915, + 0.49554837535619733, + 0.6895202607631683, + 0.6041087128341198, + 0.5711961905956269, + 0.622646349143982, + 1.2603772453427315, + 0.773075110912323, + 1.1336991445064544, + 1.0312418762207032, + 1.3463582670211791, + 1.5365228524684906, + 1.8501261821746826, + 2.4006380270242693, + 1.451894647026062, + 1.8385419921875, + 1.5503413744926453, + 1.348254576587677, + 1.2533037424087525, + 1.162389670753479, + 1.1130255826950073, + 0.9006625356771052, + 1.0001833762645722, + 0.8168405591964721, + 0.9015608322620392, + 1.099498508644104, + 0.723140911102295, + 0.7195442680358887, + 0.5906892456054688, + 0.5117025557518006, + 0.5222296411037445, + 0.6893843678474426, + 0.5126559923410415, + 0.47389315984249114, + 0.6742367547988891, + 0.6494622436523437, + 0.42108994102478026, + 0.42529633424282076, + 0.5564227697372437, + 0.562213070678711, + 0.4802745559692383, + 0.4539243455886841, + 0.3954838166773319, + 0.41656764430999754, + 0.407904678440094, + 0.5054427813529968, + 0.3801931502342224, + 0.3841923901736736, + 0.47365911989212034, + 0.32998718037605285, + 0.4120689484864473, + 0.334956028342247, + 0.3557816318035126, + 0.31811208209991454, + 0.3048724256515503, + 0.31001371720433235, + 0.3186835240840912, + 0.27292693586349487, + 0.2744087711334228, + 0.26349675579071047, + 0.26173307815790176, + 0.24325768327713013, + 0.22855849746465684, + 0.21712086362838745, + 0.2279037822365761, + 0.22775145735740662, + 0.2218828114748001, + 0.21318944548368454, + 0.2103438462257385, + 0.22659661755561827 + ], + "bridge_loss": [ + 0.8669556872836547, + 0.06360601794421673, + 0.008560461984574795, + 0.005917139887809754, + 0.01696948218345642, + 0.025800688429176807, + 0.02753051795810461, + 0.015897551971673966, + 0.012487161195278167, + 0.011549899433553218, + 0.009167527516558766, + 0.010144380106031895, + 0.012813932079076768, + 0.014643209081888198, + 0.012564446350932122, + 0.013087814033031464, + 0.0355284596927464, + 0.019168835720419882, + 0.028831265807896852, + 0.029531528568267823, + 0.04496059722006321, + 0.05906419792771339, + 0.08262725896835327, + 0.17684709503650664, + 0.07839597351551056, + 0.07206453119516373, + 0.06329247436523437, + 0.05826105718612671, + 0.06393873658180237, + 0.05167575533390045, + 0.06876316456794739, + 0.06094803668484092, + 0.06672434015274048, + 0.05214060747623444, + 0.059061125856637954, + 0.0942545708656311, + 0.0740616250872612, + 0.07541715958714486, + 0.06009064224362373, + 0.05432415052056313, + 0.044301791000366214, + 0.05619173694849014, + 0.04468392983227968, + 0.05211084792613983, + 0.056994534659385684, + 0.0499825501203537, + 0.036443243896961214, + 0.032711439895629885, + 0.0384589661359787, + 0.0338902623295784, + 0.03647522128820419, + 0.02619726200699806, + 0.02073877650052309, + 0.025440873777866364, + 0.026828269357979297, + 0.04103488396704197, + 0.027947768175601958, + 0.03465887205153704, + 0.04586356149315834, + 0.023804297626018524, + 0.03421685046106577, + 0.031679686503112314, + 0.03704538420438767, + 0.03376271347999573, + 0.032853434824943545, + 0.037378453141450885, + 0.03849537320137024, + 0.031244005316495894, + 0.033646199870109555, + 0.033860014009475706, + 0.036484488779306413, + 0.029376127362251283, + 0.03004473757147789, + 0.03032349246442318, + 0.03176274458765983, + 0.03554704558849335, + 0.03567317904829979, + 0.030595304039120676, + 0.033694784569740295, + 0.04233165686130524 + ], + "tgrad_loss": [ + 0.29429881639480593, + 0.22850215055942535, + 0.161166881275177, + 0.13068375954627992, + 0.11775499715805053, + 0.11043801250457763, + 0.11026402975320816, + 0.1072824667930603, + 0.11572966387271881, + 0.1196461637020111, + 0.11238069614171982, + 0.11274228993058205, + 0.11897443695068359, + 0.1101102095194161, + 0.10827047473788261, + 0.11343533954620362, + 0.1403796047925949, + 0.12146342446804047, + 0.13990149824619294, + 0.13616608276367187, + 0.16145800683498382, + 0.17277670335769654, + 0.20435564041137697, + 0.2122487030506134, + 0.19487117614746094, + 0.2113138470888138, + 0.21799462871551514, + 0.22062808697223663, + 0.21601984961032866, + 0.2295136512517929, + 0.2436815215110779, + 0.24090649601221084, + 0.24862176179885864, + 0.24537998490333557, + 0.2620661392688751, + 0.2524583529949188, + 0.25715352358818055, + 0.27109798228740695, + 0.26395870418548584, + 0.26097603678703307, + 0.2616330534219742, + 0.26754635171890256, + 0.26312588040828705, + 0.26554363651275636, + 0.27997655792236326, + 0.283140408372879, + 0.27219182567596434, + 0.273003400182724, + 0.2726941707611084, + 0.28166362385749816, + 0.2767979258060455, + 0.27585977494716646, + 0.27485936024188995, + 0.27670341873168947, + 0.27439955916404724, + 0.28239877376556394, + 0.2754446792840958, + 0.2776548579931259, + 0.2759876941680908, + 0.2710455940723419, + 0.2801989861369133, + 0.26907129883766173, + 0.27125071516036986, + 0.2681584177017212, + 0.26894454793930056, + 0.2660691703081131, + 0.2673233015060425, + 0.26411607012748717, + 0.26337203187942504, + 0.2637619474411011, + 0.2621670220375061, + 0.2610927885055542, + 0.2603436091423035, + 0.2592271981239319, + 0.2595904722213745, + 0.2585053967475891, + 0.25826393089294436, + 0.2583268014431, + 0.2582126024246216, + 0.25815433073043825 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.049023956060409546, + 0.11911389231681824, + 0.12341275811195374, + 0.14533579349517822 + ], + "perturbation_rho": [ + 0.09633419662714005, + 0.23598268628120422, + 0.24357257783412933, + 0.28465405106544495 + ], + "nudging": { + "0.001": [ + -0.0026640507858246565, + -0.0008936430094763637, + -0.0009184350492432714, + -0.0010046247625723481 + ], + "0.003": [ + -0.00795636884868145, + -0.002677815966308117, + -0.0027562258765101433, + -0.00301147997379303 + ], + "0.01": [ + -0.026128236204385757, + -0.008897590450942516, + -0.009167088195681572, + -0.01000890415161848 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L4_s456.json b/results/synth_ladder_v2_lo/synth_a0.0_L4_s456.json new file mode 100644 index 0000000..7650767 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L4_s456.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.3731443418502807, + 0.45537459869384767, + 0.35577080373764036, + 0.31175249495506285, + 0.27360669269561766, + 0.2810947861671448, + 0.24048879499435424, + 0.24676378889083864, + 0.2759784088134766, + 0.24307160301208497, + 0.26237674512863157, + 0.23416826553344727, + 0.2248387837409973, + 0.21073892421722412, + 0.24063232788443564, + 0.1794070078253746, + 0.16393975179195405, + 0.17630366325974464, + 0.1611418173789978, + 0.18589975430965425, + 0.19959153530597687, + 0.18609004082679748, + 0.2101752697944641, + 0.18727956137657165, + 0.18735633269548416, + 0.15335247926712037, + 0.15109058359861374, + 0.13571504959762096, + 0.1245847250699997, + 0.14161244950294494, + 0.1458503407716751, + 0.13648778162002564, + 0.15326098034381866, + 0.13605039689540863, + 0.14244712383747102, + 0.12564499164819717, + 0.12560201988220215, + 0.123886791780591, + 0.10236743612289428, + 0.1362798055291176, + 0.12099106664657593, + 0.10914861574172974, + 0.12570393970012664, + 0.10449062542915344, + 0.10824102314710617, + 0.09449664130806923, + 0.08988672842979431, + 0.09423538935184479, + 0.086681573843956, + 0.08409314980506898, + 0.09122710851430893, + 0.08288905795812607, + 0.07891612914800644, + 0.08072301609516144, + 0.07801145380735397, + 0.07551923055648804, + 0.08653738065361977, + 0.07552462376207113, + 0.07158097697496414, + 0.06908470562696457, + 0.07035302019119263, + 0.0688866972208023, + 0.06807387411594391, + 0.06748173639774323, + 0.06727217892408371, + 0.06582817186415195, + 0.0644117630302906, + 0.06337794905900955, + 0.06335201333165169, + 0.06263100127875805, + 0.061897891375422474, + 0.06139995861053467, + 0.061135529518127445, + 0.06082992137670517, + 0.060517309045791626, + 0.06032120343446731, + 0.06014305528700352, + 0.05998744894862175, + 0.059879496657848356, + 0.05982443904429674 + ], + "train_acc": [ + 0.5436, + 0.8483, + 0.8663, + 0.8784, + 0.8941, + 0.8913, + 0.9035, + 0.905, + 0.8901, + 0.9066, + 0.8969, + 0.9066, + 0.909, + 0.9154, + 0.9038, + 0.9302, + 0.9381, + 0.9348, + 0.9379, + 0.9263, + 0.9193, + 0.9257, + 0.9166, + 0.9258, + 0.9252, + 0.9404, + 0.9411, + 0.9484, + 0.9558, + 0.9448, + 0.9436, + 0.9492, + 0.941, + 0.9459, + 0.9449, + 0.9524, + 0.9517, + 0.9544, + 0.9659, + 0.9472, + 0.9539, + 0.9594, + 0.9519, + 0.9626, + 0.9611, + 0.9693, + 0.9708, + 0.9683, + 0.9725, + 0.9741, + 0.972, + 0.9759, + 0.9773, + 0.9767, + 0.9781, + 0.9808, + 0.9724, + 0.9803, + 0.9835, + 0.9843, + 0.9837, + 0.9842, + 0.9845, + 0.9851, + 0.9866, + 0.9865, + 0.9873, + 0.9891, + 0.9886, + 0.9882, + 0.9892, + 0.9897, + 0.9899, + 0.9895, + 0.9902, + 0.9903, + 0.9903, + 0.9903, + 0.9905, + 0.9904 + ], + "test_acc": [ + 0.8105, + 0.863, + 0.8775, + 0.8835, + 0.8925, + 0.891, + 0.887, + 0.8875, + 0.894, + 0.9015, + 0.8975, + 0.8955, + 0.895, + 0.898, + 0.8995, + 0.9105, + 0.9045, + 0.91, + 0.9115, + 0.9025, + 0.899, + 0.908, + 0.8935, + 0.903, + 0.911, + 0.917, + 0.9115, + 0.918, + 0.914, + 0.917, + 0.9165, + 0.923, + 0.922, + 0.911, + 0.9185, + 0.9145, + 0.9095, + 0.917, + 0.9165, + 0.914, + 0.918, + 0.919, + 0.919, + 0.9215, + 0.919, + 0.926, + 0.925, + 0.927, + 0.927, + 0.928, + 0.9255, + 0.928, + 0.9295, + 0.9275, + 0.931, + 0.9255, + 0.929, + 0.929, + 0.9295, + 0.929, + 0.9285, + 0.928, + 0.928, + 0.927, + 0.9275, + 0.927, + 0.927, + 0.93, + 0.9285, + 0.9285, + 0.9285, + 0.9275, + 0.928, + 0.9285, + 0.929, + 0.9285, + 0.9285, + 0.9285, + 0.9285, + 0.9285 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8268355131149292, + 0.7960893511772156, + 0.7726784944534302, + 0.758276104927063 + ], + "perturbation_rho": [ + 0.9999993443489075, + 0.999996542930603, + 0.999983549118042, + 0.9999449253082275 + ], + "nudging": { + "0.001": [ + -0.025982849299907684, + -0.011168255470693111, + -0.004903188906610012, + -0.00263153831474483 + ], + "0.003": [ + -0.0689958781003952, + -0.031877096742391586, + -0.014398043975234032, + -0.0078039406798779964 + ], + "0.01": [ + -0.15056422352790833, + -0.08916378021240234, + -0.04451071470975876, + -0.024980343878269196 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.224132486343384, + 1.301893235874176, + 0.7188028474807739, + 0.5128707235813141, + 0.42812706022262575, + 0.37687723331451417, + 0.36274061586856843, + 0.37224565534591675, + 0.409719740486145, + 0.363206641292572, + 0.4132363173484802, + 0.3830319176673889, + 0.4377296754837036, + 0.5042400701522827, + 0.4587587996959686, + 0.40405231256484986, + 0.4265386765956879, + 0.46920745529383423, + 0.4496193967103958, + 0.5309565215110779, + 0.47508658266067505, + 0.5223682291030883, + 0.5833926257848739, + 0.4541007481098175, + 0.486807417678833, + 0.6768758428573608, + 0.6182225590750575, + 0.44827224477529526, + 0.4793268074035644, + 0.5156525156021118, + 0.6022252152085305, + 0.5234319113731384, + 0.579210432434082, + 0.6143261737346649, + 0.5015040687561035, + 0.5146571145176887, + 0.445119722366333, + 0.5691154903054237, + 0.448343026638031, + 0.4685825558662415, + 0.4096014291524887, + 0.5122244827270508, + 0.6234302169322967, + 0.45217046575546266, + 0.47220536499023436, + 0.4531041558265686, + 0.4435129361629486, + 0.41575306297540665, + 0.3937792213439941, + 0.41530909223556517, + 0.3755643924176693, + 0.3749552250266075, + 0.3837516236305237, + 0.4414386757850647, + 0.37744559860229493, + 0.3851316329956055, + 0.4645349792003632, + 0.3641450496673584, + 0.33832284042835237, + 0.3521949558258057, + 0.3619681317090988, + 0.32718548822402954, + 0.3552513185501099, + 0.3407223903656006, + 0.35497476048469545, + 0.33103148469924926, + 0.3239391952753067, + 0.3205251240491867, + 0.3142642366409302, + 0.3211916448712349, + 0.31001556646823886, + 0.30832804889678955, + 0.30703437480926515, + 0.30306859114170076, + 0.3034073314666748, + 0.30061344475746155, + 0.2995585773333907, + 0.2981973441004753, + 0.29732816677093504, + 0.29705501853227617 + ], + "train_acc": [ + 0.1974, + 0.5468, + 0.7323, + 0.8055, + 0.8397, + 0.8578, + 0.8597, + 0.8554, + 0.8508, + 0.8621, + 0.8543, + 0.8596, + 0.8544, + 0.8409, + 0.8505, + 0.8624, + 0.8606, + 0.8605, + 0.8591, + 0.849, + 0.8606, + 0.8512, + 0.847, + 0.8642, + 0.8642, + 0.8388, + 0.8457, + 0.8726, + 0.8708, + 0.8639, + 0.8488, + 0.8655, + 0.8584, + 0.8527, + 0.8736, + 0.8691, + 0.879, + 0.8616, + 0.8812, + 0.8705, + 0.8883, + 0.8723, + 0.8579, + 0.8837, + 0.877, + 0.8811, + 0.8823, + 0.89, + 0.8942, + 0.8841, + 0.898, + 0.8937, + 0.8918, + 0.8832, + 0.8939, + 0.8931, + 0.8814, + 0.8987, + 0.9038, + 0.9009, + 0.8973, + 0.9057, + 0.9007, + 0.9047, + 0.8983, + 0.9058, + 0.9078, + 0.9061, + 0.9088, + 0.9077, + 0.9092, + 0.9088, + 0.9106, + 0.9119, + 0.9088, + 0.9119, + 0.9103, + 0.9118, + 0.9119, + 0.9122 + ], + "test_acc": [ + 0.403, + 0.649, + 0.7545, + 0.7955, + 0.8085, + 0.8145, + 0.8085, + 0.822, + 0.819, + 0.816, + 0.7925, + 0.7795, + 0.768, + 0.797, + 0.8135, + 0.816, + 0.811, + 0.7945, + 0.778, + 0.8085, + 0.8, + 0.811, + 0.7915, + 0.797, + 0.777, + 0.7965, + 0.8235, + 0.809, + 0.82, + 0.82, + 0.792, + 0.787, + 0.814, + 0.8055, + 0.8135, + 0.833, + 0.7875, + 0.8145, + 0.819, + 0.826, + 0.8285, + 0.7855, + 0.827, + 0.8245, + 0.8305, + 0.844, + 0.8395, + 0.83, + 0.8305, + 0.837, + 0.8445, + 0.8275, + 0.8325, + 0.842, + 0.853, + 0.821, + 0.831, + 0.848, + 0.85, + 0.8495, + 0.845, + 0.858, + 0.8535, + 0.856, + 0.8565, + 0.859, + 0.8565, + 0.8555, + 0.862, + 0.857, + 0.8585, + 0.8565, + 0.8635, + 0.8615, + 0.862, + 0.864, + 0.8635, + 0.8655, + 0.8655, + 0.8655 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.012256121262907982, + 0.07949584722518921, + 0.0787847638130188, + 0.09904449433088303 + ], + "perturbation_rho": [ + -0.003950485959649086, + 0.06165219843387604, + 0.14469987154006958, + 0.16344788670539856 + ], + "nudging": { + "0.001": [ + 0.00019160524243488908, + -0.0005540554411709309, + -0.0002737665781751275, + -0.0003133100690320134 + ], + "0.003": [ + 0.0006248276331461966, + -0.0016580942319706082, + -0.0008215569541789591, + -0.0009416901739314198 + ], + "0.01": [ + 0.002696676878258586, + -0.005506287328898907, + -0.0027312645688652992, + -0.003131583333015442 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7803834889411927, + 0.732652216053009, + 0.45487410321235655, + 0.4741226222038269, + 0.5595431688308716, + 0.6150015846252441, + 0.6448732872009277, + 0.7614690663337708, + 0.7527310195922852, + 0.6854381818771362, + 0.69789430103302, + 0.7211309887886047, + 0.7422091772079468, + 0.771403307723999, + 0.7684701559066772, + 0.7899860233306885, + 0.785915501832962, + 0.7849839227676392, + 0.7681392771720886, + 0.7435544511795044, + 0.751194825553894, + 0.7936021596908569, + 0.7802497886657714, + 0.780384884262085, + 0.7791699929237366, + 0.7584754270553589, + 0.8155371535301208, + 0.7780845603942871, + 0.7793395760059356, + 0.7373061706542968, + 0.7489152907371521, + 0.7263450141906739, + 0.7460742810249329, + 0.6866057529449463, + 0.7141902516365052, + 0.703807559967041, + 0.7199574493408203, + 0.7092751522064209, + 0.6616440784454346, + 0.6884374785423278, + 0.6783149375915527, + 0.6543091285705567, + 0.6953400015354156, + 0.6466015434265137, + 0.6512385541915894, + 0.6394664388656616, + 0.6508148580551147, + 0.6421753215789795, + 0.6408709971427917, + 0.659412619304657, + 0.6453365729808808, + 0.6413490727424621, + 0.6515926889896393, + 0.6426593520641327, + 0.6448210357666015, + 0.6461298638343811, + 0.6379973960399627, + 0.6365840391635895, + 0.6462472536087036, + 0.6423500331401825, + 0.6288489917755127, + 0.6368016141891479, + 0.6358265670776367, + 0.6384655450820923, + 0.631528349018097, + 0.6209217232704163, + 0.6202675918579101, + 0.6212863056182861, + 0.614168495464325, + 0.6118847620964051, + 0.6091739875793457, + 0.6087853524208069, + 0.6050858163833618, + 0.603250790977478, + 0.6008227246522904, + 0.6006201690673828, + 0.5996918613433838, + 0.5988774878025055, + 0.5984367890357971, + 0.5981314883232117 + ], + "train_acc": [ + 0.3598, + 0.7233, + 0.8271, + 0.8268, + 0.8049, + 0.7872, + 0.7751, + 0.7489, + 0.745, + 0.7539, + 0.7478, + 0.7413, + 0.7351, + 0.7251, + 0.7302, + 0.7287, + 0.7275, + 0.7273, + 0.7377, + 0.7392, + 0.7399, + 0.7321, + 0.7351, + 0.7354, + 0.7407, + 0.748, + 0.7371, + 0.7431, + 0.7437, + 0.7604, + 0.7542, + 0.76, + 0.7521, + 0.7689, + 0.7628, + 0.7629, + 0.7559, + 0.7656, + 0.7767, + 0.7703, + 0.7741, + 0.7826, + 0.7689, + 0.7867, + 0.782, + 0.7838, + 0.7823, + 0.784, + 0.7867, + 0.7803, + 0.7829, + 0.7858, + 0.7799, + 0.7847, + 0.7848, + 0.7865, + 0.7889, + 0.7883, + 0.7786, + 0.7867, + 0.7864, + 0.7874, + 0.7889, + 0.7865, + 0.7892, + 0.7911, + 0.7941, + 0.7912, + 0.7911, + 0.7912, + 0.7945, + 0.796, + 0.7962, + 0.7951, + 0.7976, + 0.7975, + 0.7968, + 0.7959, + 0.7968, + 0.7965 + ], + "test_acc": [ + 0.602, + 0.757, + 0.81, + 0.7795, + 0.771, + 0.7595, + 0.7525, + 0.7185, + 0.7265, + 0.7125, + 0.7215, + 0.7035, + 0.6955, + 0.696, + 0.671, + 0.689, + 0.655, + 0.676, + 0.694, + 0.692, + 0.682, + 0.6875, + 0.684, + 0.677, + 0.695, + 0.6915, + 0.708, + 0.6805, + 0.705, + 0.689, + 0.7165, + 0.7085, + 0.7085, + 0.7135, + 0.6955, + 0.7125, + 0.7225, + 0.723, + 0.6925, + 0.736, + 0.728, + 0.7205, + 0.726, + 0.746, + 0.731, + 0.721, + 0.735, + 0.737, + 0.731, + 0.741, + 0.7455, + 0.731, + 0.744, + 0.743, + 0.7445, + 0.749, + 0.7415, + 0.749, + 0.74, + 0.746, + 0.742, + 0.7375, + 0.751, + 0.7475, + 0.7455, + 0.739, + 0.744, + 0.747, + 0.744, + 0.743, + 0.7435, + 0.745, + 0.747, + 0.7455, + 0.7465, + 0.747, + 0.746, + 0.746, + 0.7455, + 0.7455 + ], + "state_pred_error": [ + 0.7301947330474854, + 0.2293994782924652, + 0.15949859266281127, + 0.15117296252250673, + 0.15491236505508424, + 0.16152297229766846, + 0.16639477663040161, + 0.16297674663066863, + 0.1474767792701721, + 0.13462664729356766, + 0.1192866288304329, + 0.10311011584997178, + 0.08718618566989898, + 0.07007366203069687, + 0.059906782633066175, + 0.05418295328617096, + 0.05250892471075058, + 0.053210784059762956, + 0.05376021633148193, + 0.0505560393512249, + 0.04665645271539688, + 0.04122237099409103, + 0.035260846930742266, + 0.029457686340808868, + 0.02472122933268547, + 0.020959654900431633, + 0.018036982771754265, + 0.01579355520308018, + 0.014835753314197063, + 0.013916902904212474, + 0.013557420775294303, + 0.013417310911417008, + 0.013456771358847618, + 0.013404925701022148, + 0.013516017714142799, + 0.013791045615077019, + 0.013860506749153137, + 0.013912296595424414, + 0.01376565940529108, + 0.01364058257341385, + 0.016863438057899475, + 0.013605340698361397, + 0.01336009669303894, + 0.013293599289655686, + 0.01339816378504038, + 0.01297538487315178, + 0.012990520419180394, + 0.012765769854187965, + 0.012577315384149551, + 0.012284608180820942, + 0.012003655248880387, + 0.011748795488476753, + 0.011465166535973549, + 0.011208864139020443, + 0.010971895548701286, + 0.010833216698467731, + 0.010546348862349987, + 0.010316753853857517, + 0.01005659337937832, + 0.009844934567809105, + 0.009683808153867721, + 0.009427979576587676, + 0.009225837172567844, + 0.009161983558535576, + 0.008829943571984768, + 0.008661615046858787, + 0.008553683330118656, + 0.008285431960225105, + 0.008538309474289418, + 0.007964446505904197, + 0.007747227008640766, + 0.0076069540724158285, + 0.007299331539869308, + 0.007200139582157135, + 0.007046559315174818, + 0.006977505052089691, + 0.006643858262896538, + 0.006649243193119764, + 0.006426095798611641, + 0.006344281244277954 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8436356782913208, + 0.46039146184921265, + 0.16277557611465454, + 0.13905379176139832 + ], + "perturbation_rho": [ + 0.7277628183364868, + 0.48849108815193176, + 0.1771586537361145, + 0.09970887005329132 + ], + "nudging": { + "0.001": [ + -0.027422115206718445, + -0.0018765792483463883, + -0.0004788438673131168, + -0.0003904813784174621 + ], + "0.003": [ + -0.07989989221096039, + -0.0056180888786911964, + -0.001435610232874751, + -0.0011701165931299329 + ], + "0.01": [ + -0.2401106357574463, + -0.018598388880491257, + -0.004775169305503368, + -0.0038934119511395693 + ] + }, + "state_pred_error_per_layer": [ + 3442.556884765625, + 2195.27490234375, + 2035.546875, + 2293.3291015625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.21667213973999, + 1.3028536838531495, + 0.7136714351654053, + 0.5170062650680542, + 0.428484773182869, + 0.3893401426315308, + 0.3633166349887848, + 0.3759902914404869, + 0.3800179394721985, + 0.374489461517334, + 0.41736346807479857, + 0.4102055465698242, + 0.4892664265632629, + 0.4714547214508057, + 0.4549084837436676, + 0.4638775846004486, + 0.4697629602909088, + 0.5410322017669678, + 0.455058971118927, + 0.5534555526733398, + 0.5718941131830215, + 0.5692951575756073, + 0.7074480386734009, + 0.8779852552890778, + 0.7194037189483643, + 0.7017252969741822, + 0.7141246451377868, + 0.8214343783378601, + 0.860213596200943, + 0.8622452178955078, + 0.9510571762084961, + 0.9425890031814576, + 0.9824190010070801, + 1.0797506145477296, + 0.9800792013168335, + 0.9507031625747681, + 1.0324596477508545, + 0.9877136844635009, + 1.00947436542511, + 1.0367300788879394, + 1.0976514343261718, + 1.1145684359550476, + 1.1553843279838563, + 1.1054404956817627, + 1.1235701330184937, + 1.104157660484314, + 1.084609769821167, + 1.0474918176651, + 1.0699964389801024, + 1.1043497201919557, + 1.1458708742141723, + 1.1705602006912232, + 1.1516906476974487, + 1.1598484769821167, + 1.1815660175323486, + 1.2148106037139892, + 1.2095819049835206, + 1.1930717593193054, + 1.2089854690551758, + 1.2108521512985229, + 1.1752276388168335, + 1.1807297292709351, + 1.1614444935798645, + 1.1496624534606934, + 1.1391552867889405, + 1.1303464347839356, + 1.1392961274147033, + 1.1198745210647583, + 1.107233187866211, + 1.1058051456451417, + 1.1052214641571045, + 1.103658806848526, + 1.0945639568328858, + 1.0903655527114868, + 1.0888818534851075, + 1.0861711362838744, + 1.0846550971984863, + 1.083442396068573, + 1.082554894256592, + 1.0821752315998077 + ], + "train_acc": [ + 0.1941, + 0.539, + 0.7388, + 0.8041, + 0.837, + 0.8521, + 0.8595, + 0.8565, + 0.8598, + 0.8592, + 0.8536, + 0.8592, + 0.8407, + 0.8492, + 0.8514, + 0.8502, + 0.8553, + 0.8478, + 0.8617, + 0.8493, + 0.8419, + 0.8356, + 0.8135, + 0.7864, + 0.8069, + 0.8035, + 0.79, + 0.7629, + 0.7469, + 0.7452, + 0.718, + 0.7185, + 0.7087, + 0.6877, + 0.7011, + 0.7004, + 0.687, + 0.6925, + 0.6908, + 0.6827, + 0.6795, + 0.6783, + 0.6698, + 0.6789, + 0.6776, + 0.6689, + 0.6723, + 0.6756, + 0.6708, + 0.6601, + 0.6588, + 0.6492, + 0.6589, + 0.6555, + 0.6509, + 0.6513, + 0.651, + 0.6547, + 0.6524, + 0.6504, + 0.6618, + 0.6563, + 0.6608, + 0.6593, + 0.6637, + 0.667, + 0.6641, + 0.6633, + 0.6724, + 0.6698, + 0.6683, + 0.6682, + 0.6699, + 0.6721, + 0.6704, + 0.6736, + 0.6716, + 0.6722, + 0.6723, + 0.6729 + ], + "test_acc": [ + 0.415, + 0.662, + 0.754, + 0.7975, + 0.793, + 0.7945, + 0.817, + 0.811, + 0.8205, + 0.8045, + 0.8105, + 0.7925, + 0.81, + 0.799, + 0.7945, + 0.8085, + 0.8125, + 0.812, + 0.815, + 0.773, + 0.7865, + 0.7505, + 0.7205, + 0.7745, + 0.7635, + 0.726, + 0.7075, + 0.641, + 0.663, + 0.654, + 0.659, + 0.598, + 0.603, + 0.6775, + 0.662, + 0.609, + 0.667, + 0.663, + 0.662, + 0.6265, + 0.621, + 0.623, + 0.653, + 0.6325, + 0.6035, + 0.661, + 0.655, + 0.644, + 0.6515, + 0.6325, + 0.608, + 0.6305, + 0.624, + 0.6245, + 0.622, + 0.6345, + 0.6375, + 0.6435, + 0.611, + 0.629, + 0.633, + 0.6365, + 0.638, + 0.6355, + 0.634, + 0.637, + 0.6385, + 0.643, + 0.637, + 0.635, + 0.6355, + 0.6385, + 0.6425, + 0.6395, + 0.641, + 0.643, + 0.645, + 0.6455, + 0.642, + 0.644 + ], + "value_loss": [ + 2.98627366771698, + 0.8837935139656067, + 0.7089252394676209, + 0.5627537595748902, + 0.4647229739665985, + 0.4527482861757278, + 0.42183804416656495, + 0.44746375745534894, + 0.5015264921665191, + 0.5325376167297363, + 0.67313133187294, + 0.6454255343437195, + 0.9217477686882019, + 0.8973391900062561, + 0.8749618107795716, + 0.8525666799545288, + 0.9360130718708038, + 1.3155556218147277, + 0.9591496783256531, + 1.3932193581581116, + 1.3368174820899963, + 1.4153075652837754, + 1.8522763618469238, + 2.692264319419861, + 1.987386597442627, + 1.7064623640060426, + 1.5963992614746094, + 1.8007077737808228, + 1.8428632176399231, + 1.8114418548583984, + 2.151936915397644, + 1.9110771072387696, + 2.018029465484619, + 1.8322255165100099, + 1.645587540435791, + 1.3747720615386962, + 1.5352789054870606, + 1.2163612977981568, + 1.1944268989562987, + 1.2833883277893066, + 1.3255775995254517, + 1.4826569160461425, + 1.5467321198940278, + 1.284308567047119, + 1.7137093808174133, + 1.1552894416809083, + 1.1311728733062745, + 1.0472279965400695, + 1.0053806617736816, + 1.0010575477600097, + 0.9859790618896485, + 1.2155662194252015, + 1.003822357082367, + 1.0635619995355605, + 1.1148122986793518, + 1.1133179431915283, + 1.1314655995845795, + 1.063596166086197, + 1.08116314201355, + 1.2070675258636474, + 1.1020942071914672, + 1.0678428085327147, + 0.9401497948646546, + 0.9278912733078003, + 0.9080529265403747, + 0.9108555992126465, + 0.9342455106735229, + 0.8713727573394775, + 0.8542225917339324, + 0.7861682298660279, + 0.8850017538070679, + 0.8619107227563858, + 0.8038089787960052, + 0.7899838858604431, + 0.7701753869056701, + 0.769465737915039, + 0.7744430953979492, + 0.7900901956558227, + 0.7403188591003418, + 0.7469501955509186 + ], + "term_loss": [ + 1.7330207207679749, + 0.5570951914310456, + 0.5406998898506165, + 0.42358581104278564, + 0.330837759578228, + 0.3169518223524094, + 0.29698160467147827, + 0.3257715297937393, + 0.38289243738651274, + 0.41381053009033203, + 0.5447130520641804, + 0.5157749845981597, + 0.7718508359909058, + 0.7546274427890778, + 0.7339719145298004, + 0.7112689768791198, + 0.791866575551033, + 1.1592939472913741, + 0.8167946130514145, + 1.2256993349075318, + 1.1646487221479416, + 1.2383904585599899, + 1.631025779724121, + 2.4219681352615354, + 1.7584926077842713, + 1.4707476893424989, + 1.3351344179153442, + 1.520205120897293, + 1.5596533782958983, + 1.515875082397461, + 1.79064727973938, + 1.5599366078615189, + 1.6685857362747192, + 1.4755192764282226, + 1.3079399518966675, + 1.044541180229187, + 1.1824697380065918, + 0.9046971752166748, + 0.875753413772583, + 0.9598105868339538, + 0.9913295073509216, + 1.1304236074447631, + 1.1843891148805619, + 0.9457870094299317, + 1.3240039914131165, + 0.8169942698001862, + 0.7961643146514893, + 0.7154263019561767, + 0.6731688285827637, + 0.6658499521374702, + 0.6485110036373138, + 0.8649091658592224, + 0.6634476466417313, + 0.7145267177820206, + 0.7573314692020416, + 0.7621763240695, + 0.7773383576869964, + 0.7098418580263853, + 0.7351013217926026, + 0.8393829751968384, + 0.7465768881320953, + 0.7260645219802856, + 0.6062547987580299, + 0.5984976484775543, + 0.5737183202266694, + 0.5811108931541443, + 0.6015944788455964, + 0.5377804847717285, + 0.5286362272024154, + 0.46792872714996336, + 0.5465958580970764, + 0.523382218259573, + 0.47831321868896487, + 0.464987371301651, + 0.44250393846035, + 0.44271842584609983, + 0.44280669292211533, + 0.45500148746967317, + 0.41044492044448855, + 0.4142983556270599 + ], + "bridge_loss": [ + 0.9648801658940677, + 0.08952797002196312, + 0.010387033657729626, + 0.00868126191496849, + 0.019953231650590895, + 0.02652147726416588, + 0.020377826833724976, + 0.0113384807407856, + 0.008869929821789265, + 0.00884415243268013, + 0.010127060194313526, + 0.013834500606358052, + 0.015429657346010208, + 0.015005127727985382, + 0.01737220617234707, + 0.016507850235700606, + 0.017887714263796806, + 0.023489831846952438, + 0.02137830719947815, + 0.02939054045677185, + 0.026938988852500914, + 0.03005907730460167, + 0.0494566838145256, + 0.07397269518375396, + 0.05218240886628628, + 0.05718883774280548, + 0.07471259951591491, + 0.07095959825217724, + 0.058274264189600945, + 0.06374176431894302, + 0.11108007080554962, + 0.09976578676998615, + 0.08669499335289002, + 0.07870205481052399, + 0.07394435806274414, + 0.06967136498093605, + 0.080409853130579, + 0.04817635658979416, + 0.05157966592311859, + 0.05089826797246933, + 0.05235503783226013, + 0.06689172427654266, + 0.0671337242603302, + 0.05729759488105774, + 0.1062810962766409, + 0.05406412786245346, + 0.05491479247808456, + 0.054957729548215865, + 0.052455113303661344, + 0.04835679746866226, + 0.042898213720321654, + 0.05113928149938583, + 0.04518155987560749, + 0.051552925246953964, + 0.058847477835416794, + 0.04706944565176964, + 0.052829784095287324, + 0.05310420074760914, + 0.04631037278175354, + 0.06662687994241714, + 0.06011319470405579, + 0.04712236127257347, + 0.039016457271575926, + 0.03940267757177353, + 0.044726579827070234, + 0.043924689245224, + 0.045097052454948425, + 0.04810757489204407, + 0.04271955596804619, + 0.03583536728620529, + 0.057168651711940764, + 0.05612469773888588, + 0.04613451107442379, + 0.0457260724902153, + 0.0485022147655487, + 0.04867343447208405, + 0.05331066003292799, + 0.05733778126835823, + 0.05258702590465546, + 0.05541581681370735 + ], + "tgrad_loss": [ + 0.2883727689743042, + 0.23717035751342774, + 0.15783831593990327, + 0.1304866850376129, + 0.11393198389410973, + 0.10927498421669006, + 0.10447861251831055, + 0.11035374848097562, + 0.10976412500143051, + 0.10988293509483338, + 0.1182912248492241, + 0.11581605107784271, + 0.13446727237701417, + 0.12770662536621094, + 0.12361769351959229, + 0.12478985731601715, + 0.12625877491235732, + 0.1327718471288681, + 0.12097676041126251, + 0.13812946257591247, + 0.14522977732419967, + 0.14685802749991417, + 0.17179391975402833, + 0.1963234726667404, + 0.17671158585548402, + 0.1785258449792862, + 0.18655224494934083, + 0.20954303665161134, + 0.22493557806015016, + 0.2318249930381775, + 0.25020956571102143, + 0.2513746982336044, + 0.2627487404823303, + 0.27800417733192445, + 0.263703225851059, + 0.2605595135688782, + 0.27239930696487424, + 0.26348776059150697, + 0.26709380178451536, + 0.272679474067688, + 0.2818930588245392, + 0.2853415786743164, + 0.2952092591524124, + 0.28122395482063295, + 0.2834243035316467, + 0.2842310373783112, + 0.28009376602172853, + 0.276843967628479, + 0.2797567158699036, + 0.28685079827308657, + 0.2945698440313339, + 0.2995177795648575, + 0.2951931531190872, + 0.29748235273361207, + 0.2986333510398865, + 0.3040721726417541, + 0.3012974452495575, + 0.30065011866092684, + 0.299751437997818, + 0.3010576790332794, + 0.2954041223526001, + 0.2946559201717377, + 0.29487854740619657, + 0.28999093780517576, + 0.28960802850723266, + 0.2858200194358826, + 0.28755397300720215, + 0.28548469729423526, + 0.28286680579185486, + 0.28240412793159486, + 0.2812372575759888, + 0.2824038036108017, + 0.2793612523317337, + 0.2792704437494278, + 0.27916923666000365, + 0.2780738802909851, + 0.27832574605941773, + 0.27775092339515683, + 0.2772869101524353, + 0.2772360302686691 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.053475264459848404, + 0.17959368228912354, + 0.19590041041374207, + 0.18553033471107483 + ], + "perturbation_rho": [ + 0.04320300370454788, + 0.30398592352867126, + 0.35316282510757446, + 0.3741052448749542 + ], + "nudging": { + "0.001": [ + -0.002843886613845825, + -0.0015414394438266754, + -0.001540113240480423, + -0.0015225318493321538 + ], + "0.003": [ + -0.008491966873407364, + -0.004619893617928028, + -0.004617607686668634, + -0.004564257338643074 + ], + "0.01": [ + -0.027841825038194656, + -0.015361151657998562, + -0.015351004898548126, + -0.015173434279859066 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L8_s123.json b/results/synth_ladder_v2_lo/synth_a0.0_L8_s123.json new file mode 100644 index 0000000..e4a62d1 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L8_s123.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0751699994087218, + 0.5078761493682862, + 0.4315531859636307, + 0.3730073788642883, + 0.3855140475273132, + 0.3838132353544235, + 0.3313831533908844, + 0.3231501661300659, + 0.3923093918323517, + 0.31546831176280976, + 0.28469861125946044, + 0.31882518215179445, + 0.2853241161823273, + 0.30717134480476377, + 0.3008323100566864, + 0.25230099849700927, + 0.26736773533821107, + 0.290317884016037, + 0.28117715458869935, + 0.2628298757553101, + 0.27629507098197936, + 0.21616523714065553, + 0.23837570557594298, + 0.23259806416034698, + 0.20912184219360352, + 0.2282358638763428, + 0.23643302953243256, + 0.19742694540023803, + 0.19373424887657165, + 0.17873178114891053, + 0.21476234383583068, + 0.19948986144065856, + 0.19502384197711944, + 0.18266755771636964, + 0.1968197359085083, + 0.16177621128559114, + 0.16351565613746644, + 0.18049528713226318, + 0.17411686115264893, + 0.1877502377986908, + 0.1758611748933792, + 0.15605131125450133, + 0.1843089075088501, + 0.16815092163085937, + 0.16242712774276732, + 0.14932012376785278, + 0.13747083263397217, + 0.14795307011604308, + 0.14553518596887588, + 0.12967102394104005, + 0.12926516201496124, + 0.12882190299034119, + 0.1262246768951416, + 0.12236184301376343, + 0.11932372522354126, + 0.12124661664962769, + 0.1193896909236908, + 0.11769546012878418, + 0.11199279772043229, + 0.10861553268432617, + 0.11058963505029679, + 0.10696912100315094, + 0.10576842985153198, + 0.10256688792705536, + 0.10151043713092804, + 0.10045346193313599, + 0.10001536026597023, + 0.09882576355934143, + 0.09955769186019897, + 0.097229629945755, + 0.09649371477365494, + 0.09524589428305626, + 0.0947727505683899, + 0.0946026062130928, + 0.09410042756795883, + 0.09368885006904602, + 0.09331119285821915, + 0.09311075817346573, + 0.09294630281925201, + 0.0928657611489296 + ], + "train_acc": [ + 0.6186, + 0.8031, + 0.8268, + 0.8526, + 0.8455, + 0.8495, + 0.8701, + 0.8729, + 0.8484, + 0.8757, + 0.888, + 0.8728, + 0.8865, + 0.8801, + 0.8827, + 0.901, + 0.8965, + 0.8856, + 0.8887, + 0.8952, + 0.8927, + 0.917, + 0.9074, + 0.9096, + 0.9187, + 0.9067, + 0.9079, + 0.9245, + 0.9234, + 0.933, + 0.9146, + 0.9225, + 0.9254, + 0.9321, + 0.9224, + 0.9382, + 0.9376, + 0.9292, + 0.9326, + 0.9306, + 0.9328, + 0.9449, + 0.9316, + 0.9368, + 0.9386, + 0.9465, + 0.9512, + 0.9456, + 0.9435, + 0.9554, + 0.9547, + 0.9558, + 0.9586, + 0.9609, + 0.9611, + 0.9582, + 0.9615, + 0.9614, + 0.9655, + 0.9654, + 0.9633, + 0.9676, + 0.968, + 0.9707, + 0.9713, + 0.9729, + 0.9732, + 0.9731, + 0.9733, + 0.9743, + 0.9746, + 0.9761, + 0.976, + 0.976, + 0.9763, + 0.9767, + 0.9765, + 0.9767, + 0.9766, + 0.9766 + ], + "test_acc": [ + 0.813, + 0.8325, + 0.8525, + 0.8385, + 0.845, + 0.8585, + 0.871, + 0.8765, + 0.865, + 0.8745, + 0.8755, + 0.8695, + 0.8765, + 0.8855, + 0.877, + 0.8745, + 0.8755, + 0.88, + 0.883, + 0.885, + 0.8855, + 0.8835, + 0.891, + 0.8905, + 0.884, + 0.886, + 0.8865, + 0.899, + 0.897, + 0.8985, + 0.8885, + 0.8895, + 0.8865, + 0.9005, + 0.8965, + 0.9, + 0.8905, + 0.892, + 0.8955, + 0.9005, + 0.898, + 0.8985, + 0.893, + 0.9025, + 0.896, + 0.908, + 0.9095, + 0.9045, + 0.9095, + 0.9105, + 0.909, + 0.9125, + 0.907, + 0.9095, + 0.9065, + 0.906, + 0.9085, + 0.91, + 0.9105, + 0.911, + 0.9125, + 0.915, + 0.915, + 0.9135, + 0.9135, + 0.9155, + 0.9145, + 0.914, + 0.912, + 0.91, + 0.9125, + 0.914, + 0.9145, + 0.9135, + 0.9125, + 0.913, + 0.9125, + 0.9125, + 0.913, + 0.913 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9087610840797424, + 0.8890509605407715, + 0.8756387233734131, + 0.860000729560852, + 0.8513467311859131, + 0.8465403914451599, + 0.8431664705276489, + 0.8415512442588806 + ], + "perturbation_rho": [ + 0.9999994039535522, + 0.9999971389770508, + 0.9999857544898987, + 0.9999687671661377, + 0.9999316930770874, + 0.9999115467071533, + 0.9998936653137207, + 0.9998670816421509 + ], + "nudging": { + "0.001": [ + -0.028264127671718597, + -0.012846414931118488, + -0.006331811659038067, + -0.00377178774215281, + -0.002737606642767787, + -0.002249529119580984, + -0.001993998885154724, + -0.001851807115599513 + ], + "0.003": [ + -0.07839110493659973, + -0.037237778306007385, + -0.01868210732936859, + -0.011206002905964851, + -0.00815582275390625, + -0.006710343062877655, + -0.005951954051852226, + -0.005529414396733046 + ], + "0.01": [ + -0.19297254085540771, + -0.10940254479646683, + -0.05867426097393036, + -0.03609157353639603, + -0.026526644825935364, + -0.02192458137869835, + -0.019491419196128845, + -0.01812979206442833 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2520987983703615, + 1.1921777906417848, + 0.7223491347312927, + 0.569675174999237, + 0.5051876047611237, + 0.48127662410736083, + 0.4736270173072815, + 0.48385843744277957, + 0.5066647751808167, + 0.6151531973838806, + 0.5581183519363403, + 0.5944986409664154, + 0.5604664645195008, + 0.6437756621837616, + 0.5333342678070069, + 0.6594652740478516, + 0.6894421440124512, + 0.923525112915039, + 0.6622302152633667, + 0.716798538017273, + 0.878897295498848, + 0.744471817779541, + 0.7070304737091064, + 0.8442294884204864, + 0.7826246971130371, + 0.9029400730133057, + 0.8069341362476349, + 0.6115505308151246, + 0.6366227967739105, + 0.7032427085876465, + 0.7799454936504364, + 0.6853430420875549, + 0.5523268433570862, + 0.6605892517089844, + 0.7941808592796326, + 0.6566873438835144, + 0.6355799470424652, + 0.5692268901824952, + 0.5685003101348877, + 0.5846692030906677, + 0.5944320782661437, + 0.5346815711975098, + 0.5563252561569214, + 0.5020768721580505, + 0.5537538578987121, + 0.6320813038825989, + 0.5045045644760132, + 0.5110798831939697, + 0.5231480001449585, + 0.5048403442382813, + 0.5210682102203369, + 0.4949748097419739, + 0.4827910567998886, + 0.4423401186943054, + 0.4498805576324463, + 0.46643654356002806, + 0.4347722285270691, + 0.4337064916610718, + 0.41907463989257815, + 0.4191367287635803, + 0.419102601480484, + 0.40577776985168457, + 0.3929736733078957, + 0.37650615103244783, + 0.3740151602745056, + 0.3905257468223572, + 0.36958946516513824, + 0.3557390733718872, + 0.36144173402786256, + 0.3519090287685394, + 0.36009115864038466, + 0.3531981776714325, + 0.3487885144233704, + 0.3433017575263977, + 0.3405120318412781, + 0.3415103307723999, + 0.33846223516464236, + 0.3397556669831276, + 0.3369497664451599, + 0.33650312814712524 + ], + "train_acc": [ + 0.187, + 0.5683, + 0.7281, + 0.7834, + 0.8106, + 0.8164, + 0.8225, + 0.8247, + 0.8189, + 0.8058, + 0.8164, + 0.8143, + 0.8204, + 0.8133, + 0.8333, + 0.8131, + 0.8084, + 0.7864, + 0.8171, + 0.8117, + 0.7935, + 0.8132, + 0.8146, + 0.798, + 0.8052, + 0.7939, + 0.8041, + 0.8316, + 0.8288, + 0.8203, + 0.8082, + 0.8216, + 0.8393, + 0.8247, + 0.8002, + 0.8228, + 0.8243, + 0.8356, + 0.8345, + 0.8326, + 0.8294, + 0.8372, + 0.836, + 0.8491, + 0.8335, + 0.8282, + 0.8409, + 0.8445, + 0.8382, + 0.8452, + 0.8417, + 0.8476, + 0.8478, + 0.8554, + 0.8543, + 0.8507, + 0.8552, + 0.8554, + 0.8587, + 0.8575, + 0.856, + 0.8624, + 0.8653, + 0.8712, + 0.8715, + 0.8675, + 0.8736, + 0.8761, + 0.874, + 0.8767, + 0.8745, + 0.877, + 0.8782, + 0.8787, + 0.8819, + 0.8805, + 0.8819, + 0.8799, + 0.8804, + 0.8814 + ], + "test_acc": [ + 0.3945, + 0.6725, + 0.7445, + 0.7825, + 0.7695, + 0.7775, + 0.7865, + 0.7655, + 0.745, + 0.772, + 0.7825, + 0.7515, + 0.764, + 0.791, + 0.7455, + 0.7675, + 0.6775, + 0.7775, + 0.751, + 0.6575, + 0.782, + 0.758, + 0.7245, + 0.755, + 0.723, + 0.7655, + 0.7665, + 0.7775, + 0.789, + 0.777, + 0.7655, + 0.8005, + 0.7685, + 0.738, + 0.764, + 0.746, + 0.762, + 0.784, + 0.793, + 0.781, + 0.799, + 0.787, + 0.805, + 0.7865, + 0.7745, + 0.802, + 0.79, + 0.819, + 0.812, + 0.8105, + 0.8165, + 0.8025, + 0.8065, + 0.8135, + 0.8005, + 0.8165, + 0.821, + 0.8145, + 0.825, + 0.7965, + 0.8335, + 0.8345, + 0.821, + 0.827, + 0.838, + 0.841, + 0.8415, + 0.8475, + 0.847, + 0.847, + 0.8355, + 0.8485, + 0.849, + 0.8475, + 0.848, + 0.848, + 0.8475, + 0.8505, + 0.849, + 0.849 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.02848462387919426, + 0.15189720690250397, + 0.09141203761100769, + 0.07272940874099731, + 0.09136377274990082, + 0.0857112780213356, + 0.044680722057819366, + 0.0834236741065979 + ], + "perturbation_rho": [ + 0.03057212010025978, + 0.16072696447372437, + 0.13512857258319855, + 0.0885201245546341, + 0.1377822607755661, + 0.04239961504936218, + 0.0035119224339723587, + 0.15597838163375854 + ], + "nudging": { + "0.001": [ + 0.0014594306703656912, + -0.0004577417275868356, + -0.00020887120626866817, + -0.00015224868548102677, + -0.0001943351817317307, + -0.0002066612069029361, + -0.00010780030424939469, + -0.0001827073429012671 + ], + "0.003": [ + 0.00443669268861413, + -0.0013740381691604853, + -0.0006262905662879348, + -0.0004553776525426656, + -0.0005815139738842845, + -0.0006211799918673933, + -0.0003220687503926456, + -0.0005518731195479631 + ], + "0.01": [ + 0.015482441522181034, + -0.004561400040984154, + -0.0020816801115870476, + -0.0015152986161410809, + -0.0019329312490299344, + -0.002064004773274064, + -0.001068722689524293, + -0.0018352947663515806 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.6933611570358276, + 0.8735141654968261, + 0.7665568499565124, + 0.8385689164161683, + 0.9764881328582764, + 1.02570270652771, + 1.025010629272461, + 1.020008626461029, + 1.0027467712402345, + 1.0423539823532104, + 1.0425711331367493, + 1.0316707324981689, + 0.9828058090209961, + 1.010973007583618, + 0.986733434677124, + 0.9870936322212219, + 1.0305029682159423, + 0.9933851184844971, + 1.0522663254737854, + 0.9639181180000305, + 0.9579864252090454, + 0.9713263109207153, + 0.9710080772399903, + 0.958733812046051, + 0.9615955039978027, + 1.027508487701416, + 0.9683805879592895, + 0.9042373063087463, + 0.8988901743888855, + 0.9260022815704345, + 0.9189402528762818, + 0.9042542934417724, + 0.9470187347412109, + 0.9738248091697693, + 0.9535215856552124, + 0.9395688908576966, + 0.9090730375289917, + 0.885469716835022, + 0.8550978662490845, + 0.8035958326339722, + 0.8043856971740723, + 0.7268994374275207, + 0.6941964792251587, + 0.6895901699066163, + 0.6707516403198243, + 0.6721853691101074, + 0.6611783460140228, + 0.659359624004364, + 0.6429293818473816, + 0.6381944968223572, + 0.6279613481521606, + 0.6223987235546112, + 0.6126754106521607, + 0.6082254240989685, + 0.6074888929367065, + 0.6079129957199096, + 0.5843968881607056, + 0.5827842922210693, + 0.5797355854988098, + 0.5714883241653442, + 0.5579988807678222, + 0.562573088645935, + 0.5711278948783874, + 0.5605402961730958, + 0.5530248602867126, + 0.5467610740661621, + 0.5411503358840942, + 0.5433719402313233, + 0.540703071641922, + 0.5357308044433594, + 0.533350599193573, + 0.5327393305778504, + 0.5315601040363311, + 0.5277191678047181, + 0.5272269250869751, + 0.5260714418411255, + 0.5258072991371154, + 0.5249099862098694, + 0.5241127325057984, + 0.5239003022670746 + ], + "train_acc": [ + 0.3869, + 0.6741, + 0.7213, + 0.712, + 0.6916, + 0.6886, + 0.6666, + 0.651, + 0.6536, + 0.6405, + 0.6405, + 0.6462, + 0.6581, + 0.6553, + 0.6657, + 0.6618, + 0.656, + 0.6597, + 0.6499, + 0.6689, + 0.6689, + 0.6612, + 0.6713, + 0.6743, + 0.6725, + 0.6567, + 0.6765, + 0.6919, + 0.6986, + 0.6925, + 0.6938, + 0.6935, + 0.6785, + 0.6739, + 0.6752, + 0.6824, + 0.6969, + 0.7072, + 0.7205, + 0.7291, + 0.7284, + 0.7438, + 0.7548, + 0.7567, + 0.7589, + 0.766, + 0.7651, + 0.7677, + 0.7717, + 0.7795, + 0.7739, + 0.7796, + 0.7866, + 0.785, + 0.7854, + 0.786, + 0.7965, + 0.7908, + 0.7913, + 0.7964, + 0.7981, + 0.7981, + 0.7953, + 0.7985, + 0.8028, + 0.8024, + 0.8039, + 0.8051, + 0.8041, + 0.8085, + 0.8105, + 0.8086, + 0.8085, + 0.809, + 0.8111, + 0.8097, + 0.8101, + 0.8101, + 0.8108, + 0.8109 + ], + "test_acc": [ + 0.5935, + 0.72, + 0.6775, + 0.68, + 0.656, + 0.6325, + 0.6155, + 0.6255, + 0.615, + 0.6105, + 0.6085, + 0.6345, + 0.6185, + 0.6345, + 0.5905, + 0.6125, + 0.621, + 0.6105, + 0.6455, + 0.631, + 0.615, + 0.6305, + 0.602, + 0.639, + 0.615, + 0.618, + 0.6255, + 0.6465, + 0.618, + 0.632, + 0.635, + 0.608, + 0.633, + 0.624, + 0.64, + 0.642, + 0.6695, + 0.6785, + 0.6885, + 0.697, + 0.701, + 0.707, + 0.6975, + 0.7185, + 0.7175, + 0.7105, + 0.7225, + 0.724, + 0.7435, + 0.734, + 0.721, + 0.732, + 0.7455, + 0.724, + 0.7385, + 0.7435, + 0.749, + 0.761, + 0.7585, + 0.756, + 0.7515, + 0.758, + 0.754, + 0.76, + 0.7585, + 0.757, + 0.762, + 0.768, + 0.7695, + 0.764, + 0.7665, + 0.7705, + 0.7715, + 0.775, + 0.771, + 0.768, + 0.773, + 0.7715, + 0.7715, + 0.7725 + ], + "state_pred_error": [ + 0.6523542706489563, + 0.19193185296058654, + 0.14653349640369415, + 0.15872931728363038, + 0.18078227672576905, + 0.1991569593667984, + 0.2008796215057373, + 0.18525008442401886, + 0.16809621107578276, + 0.15999590849876405, + 0.15330226860046386, + 0.14592516691684723, + 0.13386850850582122, + 0.12190511665344238, + 0.10378667067289353, + 0.08404812656641006, + 0.07603342895507813, + 0.08103448238372803, + 0.08138266659975052, + 0.07272305935621262, + 0.05746607996225357, + 0.04692842020392418, + 0.043097834444046024, + 0.04099300811886787, + 0.0405810765504837, + 0.04342285684943199, + 0.048582996279001235, + 0.04889846543669701, + 0.0451542430460453, + 0.04271460177898407, + 0.04027070061564445, + 0.039503088825941085, + 0.04128472047448158, + 0.046091007149219515, + 0.050196210831403736, + 0.049017273938655855, + 0.04467248005867004, + 0.039510804724693295, + 0.038085958564281465, + 0.03630638051629066, + 0.03414194769263267, + 0.0312760682284832, + 0.028667821806669234, + 0.026828847748041153, + 0.02496851394176483, + 0.023867447009682654, + 0.022309034156799315, + 0.021144986769557, + 0.020247555989027024, + 0.019221594369411468, + 0.018156419448554516, + 0.017370658588409423, + 0.01632956005334854, + 0.015447458410263062, + 0.014759005525708198, + 0.013934719793498517, + 0.013313219195604324, + 0.012773487070202828, + 0.012312416805326938, + 0.01164230280816555, + 0.011094774509966373, + 0.010633055430650712, + 0.01053461185693741, + 0.009895847409218549, + 0.009508155985176563, + 0.009198328344523906, + 0.009013811707496643, + 0.008660282976180315, + 0.00837978694587946, + 0.008148924431949854, + 0.007967903938889503, + 0.007802195318043232, + 0.007647230580449104, + 0.007468716404587031, + 0.007320268598198891, + 0.007207962603121996, + 0.007048187575489283, + 0.006943403443694114, + 0.00690332992747426, + 0.006703724086284638 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8679102659225464, + 0.46438825130462646, + 0.22033852338790894, + 0.1893446445465088, + 0.16738475859165192, + 0.14945879578590393, + 0.1267041563987732, + 0.16090741753578186 + ], + "perturbation_rho": [ + 0.6897462606430054, + 0.42848390340805054, + 0.19369670748710632, + 0.19582855701446533, + 0.14048044383525848, + 0.12853404879570007, + 0.09809397161006927, + 0.18465319275856018 + ], + "nudging": { + "0.001": [ + -0.023718392476439476, + -0.0012583123752847314, + -0.00044915906619280577, + -0.0003827106556855142, + -0.00033165872446261346, + -0.0002987197949551046, + -0.0002500134869478643, + -0.0003117678570561111 + ], + "0.003": [ + -0.06893274188041687, + -0.0037688319571316242, + -0.0013465355150401592, + -0.001147672301158309, + -0.0009943797485902905, + -0.0008956906385719776, + -0.0007494555320590734, + -0.0009345603175461292 + ], + "0.01": [ + -0.2050759196281433, + -0.01248687319457531, + -0.004478689283132553, + -0.003817938268184662, + -0.00330835347995162, + -0.002980519086122513, + -0.002494834130629897, + -0.003109385259449482 + ] + }, + "state_pred_error_per_layer": [ + 7121.279296875, + 6133.4482421875, + 3940.991943359375, + 2496.587646484375, + 2560.85595703125, + 2498.587890625, + 3539.93115234375, + 2449.22607421875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2500952816009523, + 1.1873374975204467, + 0.7212190233230591, + 0.589605973815918, + 0.5065119435310363, + 0.49011473684310913, + 0.4700994392395019, + 0.49362938632965087, + 0.517937117767334, + 0.5726593207359314, + 0.5896924369812012, + 0.560268968963623, + 0.7397664501190185, + 0.5875084342956542, + 0.7278265399932862, + 0.6364062483787537, + 0.6483331825256348, + 0.6756553826332092, + 0.797479226398468, + 0.8857126516819, + 0.7695636330604553, + 0.8077825311660767, + 0.8752077760696411, + 0.9167019436836242, + 0.9218885593414307, + 1.1383125644683838, + 0.9534948586463928, + 1.0558939460754395, + 1.0323654453277589, + 1.116957998275757, + 1.1411346126556396, + 1.0218814598083497, + 0.9977903114318848, + 0.9335888034820556, + 0.8998320890426635, + 0.8658985606193542, + 0.8732052396774292, + 0.8411305795669556, + 0.8131478414535522, + 0.8340221326828003, + 0.8159633024215698, + 0.950879275226593, + 0.9489988649368286, + 1.0056487663269043, + 1.0859495765686036, + 0.9971291749954224, + 0.9133035232543946, + 0.9639798210144043, + 0.9673156415939331, + 0.9582165712356567, + 0.969321283531189, + 0.9587007732391357, + 0.9764175521850585, + 0.9668055473327637, + 1.0020932814121246, + 0.9464939272403717, + 0.934805569267273, + 0.9322779521942138, + 0.9594141904830933, + 0.9337027027130127, + 0.9510448094367981, + 0.9412529281616211, + 0.9553708855628967, + 0.9822353410720825, + 0.9803216348648072, + 0.9576361427307128, + 0.9710129974365235, + 0.9710078893661499, + 0.9533861350059509, + 0.9576114654541016, + 0.9587514167785645, + 0.9548089513778687, + 0.9527052781105042, + 0.9493050754547119, + 0.9484169096946716, + 0.9474969398975372, + 0.9456873325347901, + 0.9430316831588745, + 0.9420053770065308, + 0.9418123706817627 + ], + "train_acc": [ + 0.1872, + 0.5716, + 0.7344, + 0.7792, + 0.8089, + 0.8161, + 0.8276, + 0.8192, + 0.8187, + 0.8135, + 0.8124, + 0.8225, + 0.7924, + 0.8233, + 0.8001, + 0.8193, + 0.8194, + 0.8151, + 0.7973, + 0.7798, + 0.796, + 0.7956, + 0.7883, + 0.7818, + 0.7855, + 0.761, + 0.7843, + 0.7714, + 0.7577, + 0.7354, + 0.7261, + 0.7398, + 0.7285, + 0.72, + 0.7188, + 0.7159, + 0.7195, + 0.7271, + 0.7257, + 0.7217, + 0.7199, + 0.7001, + 0.7002, + 0.6867, + 0.6722, + 0.6834, + 0.6982, + 0.6896, + 0.6815, + 0.6799, + 0.6781, + 0.6785, + 0.677, + 0.6788, + 0.6645, + 0.6836, + 0.6862, + 0.6881, + 0.6786, + 0.6888, + 0.6833, + 0.6903, + 0.6823, + 0.6764, + 0.677, + 0.6797, + 0.676, + 0.6795, + 0.6773, + 0.6801, + 0.6781, + 0.6817, + 0.6793, + 0.6811, + 0.6811, + 0.6828, + 0.6822, + 0.6819, + 0.6819, + 0.681 + ], + "test_acc": [ + 0.396, + 0.6675, + 0.755, + 0.779, + 0.7785, + 0.7735, + 0.7875, + 0.773, + 0.7755, + 0.7345, + 0.7665, + 0.728, + 0.772, + 0.746, + 0.794, + 0.8, + 0.77, + 0.725, + 0.718, + 0.7665, + 0.781, + 0.735, + 0.78, + 0.7635, + 0.682, + 0.724, + 0.7315, + 0.7385, + 0.629, + 0.6065, + 0.678, + 0.687, + 0.6895, + 0.6655, + 0.6555, + 0.641, + 0.659, + 0.664, + 0.627, + 0.661, + 0.619, + 0.6305, + 0.656, + 0.656, + 0.6375, + 0.6495, + 0.6185, + 0.64, + 0.6445, + 0.6445, + 0.629, + 0.6205, + 0.654, + 0.649, + 0.665, + 0.66, + 0.6525, + 0.641, + 0.658, + 0.652, + 0.6675, + 0.663, + 0.6535, + 0.6515, + 0.6505, + 0.646, + 0.649, + 0.6555, + 0.652, + 0.6485, + 0.6555, + 0.6505, + 0.6615, + 0.66, + 0.6565, + 0.6615, + 0.6555, + 0.6565, + 0.657, + 0.656 + ], + "value_loss": [ + 3.0406550333023072, + 1.0739864919662476, + 0.8797902669906617, + 0.8119230751037597, + 0.7505124300003052, + 0.7688478637218475, + 0.7816700012207031, + 0.8277950994491577, + 0.9332238399505616, + 1.2073661733627319, + 1.2178748641967774, + 1.1489280862808227, + 2.049370337677002, + 1.3749836051940918, + 1.967809481048584, + 1.5042143379211426, + 1.784430411529541, + 1.8522346771240235, + 2.380785788345337, + 2.688079098987579, + 2.2121243869781493, + 2.5771859003067017, + 3.0177161417007445, + 3.1963249433517458, + 3.278499910736084, + 4.103906137943268, + 3.2893902530670167, + 3.538276944923401, + 3.4071033470153806, + 3.393061047363281, + 3.593107583808899, + 2.7045906631469725, + 2.323301078128815, + 1.6587140537261962, + 1.4096987594604493, + 1.1064665121078492, + 1.3018325449943542, + 0.9622974695205688, + 0.9416653045654297, + 1.137942492198944, + 0.8390110436439514, + 1.118818556213379, + 1.4351170351982117, + 1.4146549716949464, + 1.350854679107666, + 1.0553760808944703, + 0.9420531357765197, + 0.8516968212127686, + 0.8288311427116394, + 0.8953044918060302, + 1.0598519243240356, + 0.9243116011619568, + 0.8204109439849854, + 0.7235022459983825, + 0.7862601518392562, + 0.6927293693065644, + 0.6582143189430237, + 0.6549857058525086, + 0.6321955774307251, + 0.6534549119949341, + 0.6194889225959778, + 0.6070202907562255, + 0.6236599988937378, + 0.6771267072677613, + 0.627422360420227, + 0.5855028019428253, + 0.5894961810111999, + 0.6091744654655457, + 0.5452647192955017, + 0.5310998445272446, + 0.5282959970474244, + 0.5099697267055512, + 0.4917725399017334, + 0.5025618681430817, + 0.49637296361923217, + 0.5040994747161865, + 0.4880611917734146, + 0.49410484876632693, + 0.4913170972824097, + 0.5009399848937989 + ], + "term_loss": [ + 1.7701866647720337, + 0.8185793559074401, + 0.7281914510726929, + 0.6773546756744385, + 0.6231063483715057, + 0.6291931590080261, + 0.6409166412353515, + 0.6794824399948121, + 0.7937101348876953, + 1.0600441616535188, + 1.073026711654663, + 1.0124413738250733, + 1.872055620956421, + 1.2352364639282227, + 1.7976898548126221, + 1.3538026538848877, + 1.6288803262233733, + 1.6948101093292236, + 2.183274205303192, + 2.43363659965992, + 1.9681268157958984, + 2.2916102712631226, + 2.6780563119888305, + 2.800471863937378, + 2.8440163452148437, + 3.695234584617615, + 2.880801276016235, + 3.1201632221221924, + 2.9632775779724123, + 2.86259497795105, + 3.054944895553589, + 2.352185597229004, + 1.9367447420120238, + 1.3329054591178895, + 1.1181737011909485, + 0.8464344053268432, + 0.9961952589988708, + 0.7022396294593811, + 0.707889524269104, + 0.8871172556400299, + 0.6092679342508316, + 0.8543165489196778, + 1.115777855873108, + 1.1159364093780517, + 1.0589161104202272, + 0.788054754447937, + 0.6829598517417907, + 0.5953400208473205, + 0.5665688289642334, + 0.6170466102600097, + 0.7452212821960449, + 0.6295418489217758, + 0.5425786751747131, + 0.4624239018917084, + 0.5189494615197182, + 0.4438389172077179, + 0.4131625669956207, + 0.4099783119916916, + 0.39147601351737976, + 0.4156059757232666, + 0.38140970554351805, + 0.3751539804458618, + 0.3869523651123047, + 0.433263720870018, + 0.3870872139692306, + 0.3497257801055908, + 0.34638986687660217, + 0.36702115522623063, + 0.30950822319984433, + 0.2987165945053101, + 0.2955163496017456, + 0.2773493879556656, + 0.2587234512090683, + 0.2675587327003479, + 0.2639723771095276, + 0.2690547852039337, + 0.2558252832889557, + 0.2572220780849457, + 0.2568408847570419, + 0.26505257573127744 + ], + "bridge_loss": [ + 0.9756296471449372, + 0.05096207812726498, + 0.0040795450083911415, + 0.003944373325258493, + 0.010001258826255799, + 0.02449473536014557, + 0.028989047938585283, + 0.03089492822885513, + 0.017126886777579783, + 0.02114856996536255, + 0.015148569072782994, + 0.013431627827882767, + 0.025956531542539598, + 0.016493944716453553, + 0.026987479603290558, + 0.02172586493641138, + 0.024694513821601868, + 0.023027422791719435, + 0.04703930978775024, + 0.0878580693244934, + 0.0928592936873436, + 0.13349414933919906, + 0.17922042346000672, + 0.2330398242712021, + 0.26964373564720157, + 0.2232494835972786, + 0.24393825019598006, + 0.238459867978096, + 0.2615100040435791, + 0.33379141356945036, + 0.3384218771457672, + 0.16515041677951814, + 0.19477927612662316, + 0.1302941825270653, + 0.09851177232265472, + 0.07011229394674301, + 0.11377327572107315, + 0.07345656241178512, + 0.049081385147571564, + 0.06210354118570685, + 0.044834843748807904, + 0.06010619266033173, + 0.11214887998700142, + 0.08002942824363708, + 0.06650356951355935, + 0.05039359704554081, + 0.05662242863774299, + 0.04390023035407066, + 0.04950015317201614, + 0.06451151894330978, + 0.10136058478355407, + 0.08128330940008163, + 0.06231695182323456, + 0.04845148310661316, + 0.04830691860318184, + 0.04050123587995767, + 0.03742270451784134, + 0.038977445417642594, + 0.03015052459836006, + 0.033309116637706755, + 0.02923171687424183, + 0.026229538318514822, + 0.027924185514450073, + 0.030216664960980414, + 0.02713270623087883, + 0.026153411862254144, + 0.03055509918630123, + 0.030000684344768522, + 0.025569038861989975, + 0.021031512331962585, + 0.022238533282279968, + 0.02216599059700966, + 0.022519239933788775, + 0.025397614547610282, + 0.022649219024181367, + 0.025156321668624877, + 0.022629088670015333, + 0.028267720448970794, + 0.025573840299248696, + 0.027039055764675142 + ], + "tgrad_loss": [ + 0.29483874645233155, + 0.20444505448341369, + 0.14751926844120025, + 0.1306240245819092, + 0.11740482016801834, + 0.11515996508598328, + 0.11176430797576904, + 0.11741772980690002, + 0.1223868124961853, + 0.12617343007326126, + 0.12969958176612853, + 0.12305508751869201, + 0.15135818424224853, + 0.12325320014953613, + 0.14313213738203048, + 0.12868581702709198, + 0.13085558440685272, + 0.13439714648723602, + 0.15047225980758666, + 0.16658445747494696, + 0.15113828577399255, + 0.15208148312568665, + 0.16043939247131347, + 0.16281324887275697, + 0.1648398354291916, + 0.18542204723358155, + 0.16465072660446167, + 0.1796539167881012, + 0.18231577808856964, + 0.1966746131181717, + 0.19974080891609192, + 0.18725463242530824, + 0.19177704265117645, + 0.19551441068649292, + 0.19301328949928284, + 0.18991980985403062, + 0.191864014005661, + 0.18660128991603853, + 0.18469438967704774, + 0.18872169270515443, + 0.18490826721191406, + 0.2043958014011383, + 0.20719030148983, + 0.21868912653923034, + 0.2254349905014038, + 0.21692773156166076, + 0.2024708650588989, + 0.21245656762123108, + 0.21276216344833374, + 0.21374636619091034, + 0.2132700624704361, + 0.21348643493652344, + 0.21551531555652617, + 0.21262686700820924, + 0.21900376980304717, + 0.20838922061920165, + 0.20762904937267304, + 0.20602994527816773, + 0.21056903939247132, + 0.20453982200622559, + 0.20884749658107757, + 0.20563676958084107, + 0.20878344979286192, + 0.21364632172584533, + 0.21320244359970092, + 0.2096236107826233, + 0.21255121397972107, + 0.2121526288509369, + 0.21018745770454406, + 0.2113517366886139, + 0.21054111399650574, + 0.21045434730052948, + 0.21052985265254975, + 0.20960552549362182, + 0.20975136260986327, + 0.20988836765289307, + 0.209606822681427, + 0.20861505036354064, + 0.2089023720264435, + 0.20884835484027864 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.001700198045000434, + 0.04125010222196579, + 0.1112770289182663, + 0.11907510459423065, + 0.11768756806850433, + 0.11733907461166382, + 0.11329221725463867, + 0.117521733045578 + ], + "perturbation_rho": [ + 0.043069981038570404, + 0.1044735386967659, + 0.23828034102916718, + 0.18111932277679443, + 0.19782572984695435, + 0.1971191018819809, + 0.20729684829711914, + 0.2299107313156128 + ], + "nudging": { + "0.001": [ + -0.0006511092651635408, + -0.00034308910835534334, + -0.000792907492723316, + -0.0008164917235262692, + -0.0008322584326379001, + -0.0008019506931304932, + -0.0008090936462394893, + -0.0008134577656164765 + ], + "0.003": [ + -0.0019249932374805212, + -0.001026424579322338, + -0.002375826006755233, + -0.0024475236423313618, + -0.00249303737655282, + -0.0024030092172324657, + -0.002427314408123493, + -0.002439431846141815 + ], + "0.01": [ + -0.006082434207201004, + -0.003400696674361825, + -0.007903593592345715, + -0.008138573728501797, + -0.008289994671940804, + -0.007994470186531544, + -0.00807441771030426, + -0.008117234334349632 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L8_s42.json b/results/synth_ladder_v2_lo/synth_a0.0_L8_s42.json new file mode 100644 index 0000000..9a870b4 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L8_s42.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0757543913841248, + 0.5076081553459167, + 0.44924112920761106, + 0.4247585828781128, + 0.390476895737648, + 0.3476995074748993, + 0.34030030264854433, + 0.3316740375518799, + 0.3210986800670624, + 0.3004637783050537, + 0.3107565640449524, + 0.31333593788146974, + 0.3368205448627472, + 0.3013008052945137, + 0.24617022519111634, + 0.2921410479068756, + 0.2635057222366333, + 0.2468733805656433, + 0.2835908453464508, + 0.24917495551109314, + 0.23554206476211548, + 0.2440310100078583, + 0.2401031512260437, + 0.23388757339715957, + 0.22199509954452515, + 0.24858054161071777, + 0.2563783165931702, + 0.2575826109409332, + 0.21732676796913147, + 0.2173767949104309, + 0.22188423473834992, + 0.18563161835670472, + 0.20825975818634032, + 0.17853380255699158, + 0.16998590087890625, + 0.22122718925476073, + 0.17761884450912477, + 0.1721252568244934, + 0.18634113365411759, + 0.16172185846567155, + 0.14872372229099273, + 0.1512143076300621, + 0.1437873905658722, + 0.15217237317562105, + 0.15337150135040284, + 0.16384036836624147, + 0.1659779568195343, + 0.1543241171836853, + 0.14291128422021865, + 0.13691224701404572, + 0.13174424264132978, + 0.12449043486118316, + 0.12606769989728928, + 0.12063085582256317, + 0.1212635150194168, + 0.12218361542224884, + 0.11889479755163193, + 0.11501415977478027, + 0.11453091421127319, + 0.11233264380693436, + 0.10913959243297577, + 0.1080293738424778, + 0.10722576280832291, + 0.10587466154694557, + 0.10347079048156738, + 0.1029079300403595, + 0.1010995524764061, + 0.10133141717910767, + 0.10086093401908874, + 0.09952975501418114, + 0.09885214577913284, + 0.09803358337879181, + 0.09736436128616333, + 0.09699009905606508, + 0.0960432112455368, + 0.09560413639545441, + 0.09529533250927925, + 0.0950549742102623, + 0.09487758847773076, + 0.09478750932216644 + ], + "train_acc": [ + 0.6176, + 0.8033, + 0.8282, + 0.8365, + 0.8415, + 0.8594, + 0.8616, + 0.8667, + 0.8712, + 0.8777, + 0.8772, + 0.8762, + 0.8668, + 0.8811, + 0.9031, + 0.8815, + 0.8954, + 0.9032, + 0.8904, + 0.9, + 0.9054, + 0.9037, + 0.8994, + 0.9078, + 0.9118, + 0.9008, + 0.9003, + 0.8984, + 0.9117, + 0.912, + 0.9104, + 0.9275, + 0.9171, + 0.9301, + 0.9363, + 0.914, + 0.9305, + 0.9348, + 0.925, + 0.9397, + 0.9444, + 0.9459, + 0.9476, + 0.9444, + 0.9424, + 0.9364, + 0.9358, + 0.9404, + 0.9472, + 0.9511, + 0.9553, + 0.9594, + 0.9593, + 0.9604, + 0.9607, + 0.9597, + 0.962, + 0.962, + 0.9636, + 0.9656, + 0.967, + 0.9682, + 0.9697, + 0.9695, + 0.9704, + 0.9715, + 0.9735, + 0.9725, + 0.9739, + 0.9745, + 0.9728, + 0.9745, + 0.9752, + 0.975, + 0.976, + 0.9768, + 0.9773, + 0.977, + 0.9774, + 0.9775 + ], + "test_acc": [ + 0.787, + 0.8035, + 0.833, + 0.842, + 0.8535, + 0.8575, + 0.86, + 0.848, + 0.8745, + 0.866, + 0.8675, + 0.8635, + 0.867, + 0.8735, + 0.887, + 0.876, + 0.8785, + 0.8855, + 0.874, + 0.88, + 0.8865, + 0.8785, + 0.871, + 0.883, + 0.8995, + 0.8785, + 0.8715, + 0.875, + 0.896, + 0.8965, + 0.897, + 0.903, + 0.896, + 0.8985, + 0.895, + 0.8895, + 0.895, + 0.897, + 0.887, + 0.903, + 0.9035, + 0.9045, + 0.897, + 0.8945, + 0.9065, + 0.9025, + 0.904, + 0.9035, + 0.9045, + 0.903, + 0.905, + 0.908, + 0.9045, + 0.91, + 0.909, + 0.908, + 0.9075, + 0.9125, + 0.909, + 0.9085, + 0.9035, + 0.909, + 0.9085, + 0.905, + 0.9075, + 0.9105, + 0.91, + 0.909, + 0.9065, + 0.908, + 0.907, + 0.9065, + 0.9075, + 0.908, + 0.908, + 0.9075, + 0.9065, + 0.9065, + 0.906, + 0.906 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8854324817657471, + 0.8737501502037048, + 0.8630377054214478, + 0.8562113046646118, + 0.8509326577186584, + 0.8481521606445312, + 0.84560626745224, + 0.8443001508712769 + ], + "perturbation_rho": [ + 0.9999991655349731, + 0.9999963045120239, + 0.9999881386756897, + 0.9999630451202393, + 0.9999364614486694, + 0.9999151825904846, + 0.9998926520347595, + 0.9998775720596313 + ], + "nudging": { + "0.001": [ + -0.031868599355220795, + -0.014682772569358349, + -0.00733374897390604, + -0.0044118668884038925, + -0.0032190121710300446, + -0.002646001288667321, + -0.0023340615443885326, + -0.0021536401472985744 + ], + "0.003": [ + -0.08796128630638123, + -0.042457789182662964, + -0.021612998098134995, + -0.013098624534904957, + -0.00958542712032795, + -0.007890285924077034, + -0.006964934058487415, + -0.006429150700569153 + ], + "0.01": [ + -0.21767401695251465, + -0.12408202886581421, + -0.06762672960758209, + -0.04208396375179291, + -0.031123068183660507, + -0.025745777413249016, + -0.022784877568483353, + -0.021061642095446587 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.13472125415802, + 1.064750273513794, + 0.6787943045616149, + 0.5445983642578125, + 0.4691809035301209, + 0.44078434734344485, + 0.4589700782775879, + 0.4633651376724243, + 0.48622037637233734, + 0.5303937173843384, + 0.5300615015029907, + 0.5191615985870361, + 0.6124243753433227, + 0.6110803317785263, + 0.5108732610702514, + 0.6651096425056457, + 0.6519462231874465, + 0.6120770479202271, + 0.611581618309021, + 0.7067273505687713, + 0.6294481365203858, + 0.6680336037635803, + 0.7899993432998658, + 0.7286258486032486, + 0.7593296463012695, + 0.6259688374519348, + 0.7967933742523193, + 1.0146251457214355, + 0.8291450224876403, + 0.7330523146629333, + 0.8095165735721588, + 0.6667535767793655, + 0.6494596580505371, + 0.6892270953893661, + 0.6535914615631103, + 0.752629549407959, + 0.6489908882915973, + 0.7158377149581909, + 0.8427579293370246, + 0.7397276062965393, + 0.7076394484519959, + 0.680823688364029, + 0.6616308630347252, + 0.6541980605125427, + 0.7793759801864624, + 0.8009075149536132, + 0.6981098392486572, + 0.6555009291648864, + 0.6616069585680961, + 0.6934653346061707, + 0.6811443558603525, + 0.6117486233711242, + 0.6414114294528961, + 0.6468382164001465, + 0.6715234688282012, + 0.5874644180297851, + 0.617424130487442, + 0.5686914512634277, + 0.5897184799194336, + 0.563749632358551, + 0.5560783692359924, + 0.5561227001190185, + 0.5419582702159882, + 0.5483636920452117, + 0.5441933881878853, + 0.5452967376232147, + 0.5415290240168571, + 0.5169584144592285, + 0.5267872435450554, + 0.5149645379066468, + 0.5136418291330338, + 0.5051588420391083, + 0.5119852211952209, + 0.5085399871870875, + 0.50260826587677, + 0.4999133358955383, + 0.49910780143737793, + 0.49455464423894885, + 0.4937580402228981, + 0.4927313493728638 + ], + "train_acc": [ + 0.2241, + 0.6144, + 0.7485, + 0.7929, + 0.8238, + 0.8322, + 0.832, + 0.834, + 0.8279, + 0.828, + 0.8247, + 0.8309, + 0.8223, + 0.8173, + 0.843, + 0.8172, + 0.8248, + 0.8386, + 0.8341, + 0.824, + 0.8362, + 0.8351, + 0.8275, + 0.8305, + 0.8288, + 0.8519, + 0.8242, + 0.805, + 0.8315, + 0.8379, + 0.8337, + 0.8522, + 0.8513, + 0.8439, + 0.8553, + 0.8379, + 0.8559, + 0.8481, + 0.8328, + 0.8445, + 0.8516, + 0.8537, + 0.856, + 0.8561, + 0.837, + 0.8422, + 0.8485, + 0.8613, + 0.8568, + 0.8485, + 0.8541, + 0.8632, + 0.8631, + 0.8594, + 0.8544, + 0.8676, + 0.861, + 0.8701, + 0.866, + 0.8709, + 0.8731, + 0.8725, + 0.8749, + 0.8691, + 0.8736, + 0.8732, + 0.8747, + 0.8783, + 0.8739, + 0.8785, + 0.8784, + 0.8796, + 0.8797, + 0.8802, + 0.8794, + 0.8817, + 0.8804, + 0.8823, + 0.8814, + 0.8818 + ], + "test_acc": [ + 0.452, + 0.664, + 0.7355, + 0.773, + 0.7975, + 0.7885, + 0.7945, + 0.777, + 0.774, + 0.7755, + 0.792, + 0.763, + 0.7875, + 0.777, + 0.736, + 0.7485, + 0.789, + 0.7625, + 0.7415, + 0.784, + 0.739, + 0.772, + 0.797, + 0.704, + 0.7955, + 0.786, + 0.7635, + 0.7495, + 0.7615, + 0.771, + 0.7995, + 0.821, + 0.794, + 0.7825, + 0.773, + 0.8035, + 0.804, + 0.779, + 0.7465, + 0.7895, + 0.8165, + 0.783, + 0.8055, + 0.8015, + 0.7835, + 0.7945, + 0.798, + 0.8215, + 0.7735, + 0.8165, + 0.804, + 0.823, + 0.7875, + 0.811, + 0.8245, + 0.8195, + 0.8185, + 0.824, + 0.819, + 0.822, + 0.8275, + 0.821, + 0.8295, + 0.8295, + 0.8315, + 0.825, + 0.829, + 0.823, + 0.8335, + 0.834, + 0.836, + 0.8295, + 0.8315, + 0.8305, + 0.8355, + 0.8335, + 0.8345, + 0.8345, + 0.8325, + 0.8325 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.02968163788318634, + 0.08609121292829514, + 0.09377065300941467, + 0.10205866396427155, + 0.08807726949453354, + 0.053033627569675446, + 0.056919872760772705, + 0.04721488058567047 + ], + "perturbation_rho": [ + -0.09032663702964783, + 0.17043988406658173, + 0.18389353156089783, + 0.16770029067993164, + 0.1504741907119751, + 0.05179755389690399, + 0.050898581743240356, + -0.03670964762568474 + ], + "nudging": { + "0.001": [ + 0.002358348574489355, + -0.0005224555497989058, + -0.00029081435059197247, + -0.0002893093624152243, + -0.00024064714671112597, + -0.0001590531610418111, + -0.00014225264021661133, + -0.00011707056546583772 + ], + "0.003": [ + 0.0073735713958740234, + -0.0015679008793085814, + -0.0008718278259038925, + -0.0008626180933788419, + -0.000721139891538769, + -0.00047776539577171206, + -0.0004256684915162623, + -0.0003536291478667408 + ], + "0.01": [ + 0.028243789449334145, + -0.00520662497729063, + -0.0028999613132327795, + -0.002869710559025407, + -0.0023996694944798946, + -0.0015899656573310494, + -0.0014181910082697868, + -0.0011781371431425214 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7328739669799804, + 0.9811433526992798, + 0.7968745387077332, + 0.80839176197052, + 0.8580701364994049, + 0.9189817895889282, + 0.9484232675552369, + 0.9335546033859253, + 0.9336960997581482, + 0.9480458303451538, + 0.9517143133163453, + 0.9554149606704712, + 0.9504594124794007, + 0.97358454246521, + 1.0018829744338988, + 0.9550861362457276, + 0.9641454742431641, + 0.9438694232940674, + 0.9552924007415772, + 0.9330580535888672, + 0.8800268087387085, + 0.858905982208252, + 0.9175141490936279, + 0.920817092704773, + 0.9107141004562378, + 0.8834829970359802, + 0.845861376953125, + 0.8068534229278564, + 0.8613802621841431, + 0.8515079685211182, + 0.8195189044952392, + 0.8610365732192993, + 0.8288298233509064, + 0.7938063079833985, + 0.782201350402832, + 0.8223142776489257, + 0.8027304618835449, + 0.796955973815918, + 0.769949794960022, + 0.7569882241249084, + 0.7953457245826722, + 0.8144200666427612, + 0.7426586433410645, + 0.755963011932373, + 0.7787463603973389, + 0.743975663948059, + 0.759346683883667, + 0.7585860026836395, + 0.7371354169845581, + 0.7337988836288453, + 0.7494666588783264, + 0.7489494784355164, + 0.7316932228088379, + 0.7707076009750367, + 0.7418164071559906, + 0.7404774815559387, + 0.736026719045639, + 0.7313680733680725, + 0.7195740768432617, + 0.7385888179779053, + 0.7218243119239807, + 0.699979656791687, + 0.6981355967521667, + 0.6896988845348359, + 0.6775998549222946, + 0.6683120150566101, + 0.667447187423706, + 0.6596596981048584, + 0.6571299660205842, + 0.648965798997879, + 0.6483057856559753, + 0.6461096891403199, + 0.6408902339935303, + 0.6388658201217652, + 0.6380767006874084, + 0.6351657607078552, + 0.6342095012664795, + 0.6330936979293823, + 0.6321959840774536, + 0.631820877456665 + ], + "train_acc": [ + 0.3774, + 0.6438, + 0.702, + 0.7105, + 0.7005, + 0.6896, + 0.6819, + 0.6739, + 0.6689, + 0.6621, + 0.6589, + 0.6571, + 0.6607, + 0.6563, + 0.6563, + 0.6693, + 0.6647, + 0.6737, + 0.6748, + 0.6718, + 0.6874, + 0.6971, + 0.6821, + 0.6934, + 0.6935, + 0.7054, + 0.7122, + 0.7186, + 0.7057, + 0.7113, + 0.7256, + 0.7072, + 0.7181, + 0.7251, + 0.7255, + 0.7236, + 0.7238, + 0.7252, + 0.7354, + 0.7392, + 0.7232, + 0.7273, + 0.7429, + 0.7366, + 0.7356, + 0.738, + 0.7348, + 0.7376, + 0.741, + 0.7428, + 0.7398, + 0.7432, + 0.7433, + 0.7352, + 0.7398, + 0.7414, + 0.7443, + 0.7444, + 0.7476, + 0.7398, + 0.748, + 0.7523, + 0.7573, + 0.7549, + 0.7603, + 0.7642, + 0.7656, + 0.7656, + 0.7698, + 0.7711, + 0.7689, + 0.7716, + 0.7704, + 0.7718, + 0.7748, + 0.7733, + 0.7752, + 0.7752, + 0.7762, + 0.7765 + ], + "test_acc": [ + 0.5465, + 0.653, + 0.6825, + 0.6735, + 0.664, + 0.6365, + 0.64, + 0.6305, + 0.6235, + 0.621, + 0.6325, + 0.6335, + 0.633, + 0.6125, + 0.6295, + 0.6175, + 0.65, + 0.615, + 0.641, + 0.6645, + 0.6565, + 0.6625, + 0.6605, + 0.653, + 0.6765, + 0.6805, + 0.69, + 0.6625, + 0.678, + 0.6895, + 0.673, + 0.669, + 0.7, + 0.6975, + 0.6765, + 0.69, + 0.6845, + 0.6915, + 0.707, + 0.6645, + 0.6725, + 0.688, + 0.7195, + 0.701, + 0.7, + 0.682, + 0.7095, + 0.6985, + 0.712, + 0.6955, + 0.6935, + 0.713, + 0.698, + 0.688, + 0.7065, + 0.6865, + 0.7145, + 0.713, + 0.7025, + 0.708, + 0.7195, + 0.7155, + 0.714, + 0.726, + 0.718, + 0.7225, + 0.721, + 0.7275, + 0.721, + 0.7235, + 0.7295, + 0.724, + 0.7245, + 0.7225, + 0.7265, + 0.728, + 0.727, + 0.7265, + 0.727, + 0.726 + ], + "state_pred_error": [ + 0.6428197972297669, + 0.19351577122211455, + 0.1660344313621521, + 0.17652878823280335, + 0.18978006644248963, + 0.19631840877532958, + 0.19491800663471223, + 0.19226022069454193, + 0.18165790848731994, + 0.16527520124912262, + 0.14865010199546813, + 0.13212442252635956, + 0.1177069759130478, + 0.11029988080263138, + 0.10093973301649094, + 0.08951207721233367, + 0.08190780951976775, + 0.08566042828559875, + 0.08916603361368179, + 0.0825111199259758, + 0.07487273232936859, + 0.06487578954696656, + 0.059569144582748416, + 0.05982308453321457, + 0.05629802569746971, + 0.04989139791727066, + 0.0473561365544796, + 0.04492486463785172, + 0.044193212151527404, + 0.04343981958031654, + 0.041326461428403856, + 0.040116964304447174, + 0.03958643175363541, + 0.03792573779821396, + 0.03780722205638885, + 0.03684104197919369, + 0.035100384438037875, + 0.033475980192422865, + 0.03184100140333176, + 0.031417953404784205, + 0.03174956562519073, + 0.031464615708589556, + 0.030044199123978616, + 0.028851599764823915, + 0.027254376643896103, + 0.025502048003673554, + 0.023910949629545212, + 0.02216300364136696, + 0.020575732861459254, + 0.019327285060286522, + 0.018592858423292637, + 0.01823208925127983, + 0.018495164170861243, + 0.01851490514278412, + 0.018615340042114258, + 0.018319079437851906, + 0.017992605185508728, + 0.017830414324998857, + 0.017337585292756558, + 0.016755458490550518, + 0.01625010498762131, + 0.015588380454480648, + 0.015276109413802624, + 0.014523939031362534, + 0.013859204940497876, + 0.013518636293709278, + 0.013107557639479636, + 0.012660594460368156, + 0.012188548400998115, + 0.01179230693280697, + 0.011473847399652005, + 0.0111009864538908, + 0.010866704443097114, + 0.010644253891706467, + 0.01051605779528618, + 0.010096385054290294, + 0.009957369659096002, + 0.009735264672338963, + 0.009506795328110456, + 0.00936661482155323 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8151727914810181, + 0.4042307734489441, + 0.16176781058311462, + 0.1698867678642273, + 0.14891386032104492, + 0.1726662963628769, + 0.1322125643491745, + 0.14817725121974945 + ], + "perturbation_rho": [ + 0.7261759042739868, + 0.36915943026542664, + 0.17840053141117096, + 0.16105638444423676, + 0.14931628108024597, + 0.15696927905082703, + 0.17820878326892853, + 0.1840115785598755 + ], + "nudging": { + "0.001": [ + -0.023730942979454994, + -0.0011499840766191483, + -0.00041868066182360053, + -0.0004118153010495007, + -0.000386256433557719, + -0.0004230579361319542, + -0.0003364062577020377, + -0.0003734407073352486 + ], + "0.003": [ + -0.06960602104663849, + -0.003446865128353238, + -0.001256113639101386, + -0.0012356475926935673, + -0.0011594654060900211, + -0.001268491381779313, + -0.001009067753329873, + -0.0011201862944290042 + ], + "0.01": [ + -0.21425020694732666, + -0.011446774937212467, + -0.004181142896413803, + -0.004114024806767702, + -0.0038589704781770706, + -0.00422251783311367, + -0.003358659567311406, + -0.003728472860530019 + ] + }, + "state_pred_error_per_layer": [ + 7398.20849609375, + 5242.7607421875, + 3768.9609375, + 3258.12548828125, + 3060.2021484375, + 2786.609619140625, + 3211.44921875, + 2939.81005859375 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1370582035064696, + 1.0645069687843323, + 0.6801733062744141, + 0.5586606249332428, + 0.4881390431404114, + 0.46811703872680666, + 0.47793011622428894, + 0.491072265625, + 0.45632949471473694, + 0.49341422691345216, + 0.6391787099599838, + 0.5234632035255432, + 0.5246470190525055, + 0.6408189677238464, + 0.6090221863985061, + 0.5636324305534363, + 0.6122668931216001, + 0.6223794656276703, + 0.7977206924438477, + 0.7688750084877014, + 0.8809650159835816, + 0.9288559448242187, + 0.8847734958648682, + 0.9730628623962402, + 0.9568616161346436, + 1.0317223262786865, + 1.136458911895752, + 1.1702300283432008, + 0.9281893106460571, + 1.0470865356445314, + 1.1126060703277587, + 1.1764981075286864, + 0.9546853006362915, + 0.9108602264404296, + 0.8738015920639038, + 0.8948956307888031, + 0.813925849533081, + 0.9619963138580322, + 1.0160358333587647, + 0.9929837261199951, + 1.0878820617675782, + 0.991282360458374, + 1.0092166801452638, + 1.0004161891937255, + 1.0230372599601745, + 1.0760341178894044, + 0.9872162799835205, + 0.9739640418052673, + 1.0317725978851318, + 1.0004596428871155, + 0.9978432794094085, + 1.0264748498916625, + 1.073675299835205, + 1.0885952290534973, + 1.0659225395202636, + 1.0828760971069336, + 1.0679924612045288, + 1.0984314491271974, + 1.1133429298400879, + 1.0874613107681275, + 1.1088385950088502, + 1.080880365371704, + 1.1012449313163757, + 1.0722564311504363, + 1.063163561439514, + 1.0487949291229248, + 1.0663402166366578, + 1.0534990873336791, + 1.0597085929870604, + 1.0426021310806275, + 1.0364102695465087, + 1.0401461017608642, + 1.03147163105011, + 1.032290082359314, + 1.0253121829986571, + 1.023413536453247, + 1.0240816875457763, + 1.0224136894226075, + 1.0198726715087891, + 1.0197427711486817 + ], + "train_acc": [ + 0.2223, + 0.6146, + 0.7422, + 0.7889, + 0.8129, + 0.8208, + 0.8242, + 0.8254, + 0.8378, + 0.8275, + 0.8051, + 0.8348, + 0.8319, + 0.8211, + 0.8253, + 0.8405, + 0.8325, + 0.835, + 0.8078, + 0.8158, + 0.7949, + 0.791, + 0.7938, + 0.7747, + 0.7774, + 0.7745, + 0.7607, + 0.7438, + 0.7736, + 0.749, + 0.7511, + 0.7318, + 0.7493, + 0.7459, + 0.7528, + 0.7375, + 0.7445, + 0.7151, + 0.7011, + 0.707, + 0.6813, + 0.6985, + 0.6986, + 0.6899, + 0.6838, + 0.6775, + 0.6854, + 0.6941, + 0.6759, + 0.677, + 0.682, + 0.6713, + 0.666, + 0.6642, + 0.6638, + 0.6643, + 0.6642, + 0.6542, + 0.6521, + 0.6569, + 0.6636, + 0.6591, + 0.6569, + 0.662, + 0.6675, + 0.6717, + 0.667, + 0.6692, + 0.6706, + 0.6745, + 0.6756, + 0.6742, + 0.6741, + 0.6745, + 0.6746, + 0.6742, + 0.6751, + 0.6767, + 0.6778, + 0.6774 + ], + "test_acc": [ + 0.444, + 0.6745, + 0.7325, + 0.7745, + 0.7815, + 0.798, + 0.8035, + 0.798, + 0.8025, + 0.711, + 0.7895, + 0.7985, + 0.791, + 0.766, + 0.77, + 0.794, + 0.7735, + 0.7315, + 0.759, + 0.7495, + 0.752, + 0.735, + 0.705, + 0.732, + 0.721, + 0.752, + 0.7115, + 0.72, + 0.6915, + 0.7335, + 0.6465, + 0.7225, + 0.6795, + 0.709, + 0.697, + 0.6885, + 0.6295, + 0.6055, + 0.583, + 0.6355, + 0.583, + 0.659, + 0.6365, + 0.6345, + 0.5925, + 0.6095, + 0.666, + 0.602, + 0.6545, + 0.612, + 0.638, + 0.6155, + 0.611, + 0.6055, + 0.6135, + 0.6285, + 0.626, + 0.607, + 0.623, + 0.608, + 0.6185, + 0.6095, + 0.609, + 0.6265, + 0.626, + 0.622, + 0.629, + 0.626, + 0.633, + 0.6425, + 0.634, + 0.636, + 0.634, + 0.6375, + 0.6375, + 0.638, + 0.64, + 0.639, + 0.639, + 0.64 + ], + "value_loss": [ + 2.9023948707580565, + 0.9411828812599182, + 0.9784409198760986, + 0.9702556604385376, + 0.911243058013916, + 0.9411980567932129, + 1.0062726194381715, + 1.0051571633458138, + 0.7945024635076523, + 0.8636679088592529, + 1.351515377473831, + 0.9440338861465454, + 1.0237316113948822, + 1.6041599166870117, + 1.4913020963668824, + 1.3120978896141051, + 1.4634722517490386, + 1.5368283511161804, + 2.3160801666259765, + 2.31045254573822, + 2.833774365234375, + 3.385757903289795, + 2.9262950035095217, + 3.250738282775879, + 3.1019880832672118, + 3.6402773345947264, + 4.2429088134765625, + 4.023282150268555, + 2.689120644378662, + 3.2996597610473635, + 4.053308227157593, + 3.6391844707489014, + 2.5846795793533324, + 1.8673851746559142, + 1.6735054915428162, + 1.9220958820343017, + 1.271403459739685, + 1.567453321647644, + 2.111127665615082, + 1.4919785886764527, + 1.5718415649414061, + 1.237246979522705, + 1.4188125720977782, + 1.0745463274002076, + 1.0068994304180146, + 1.185745523071289, + 1.2835211219787597, + 0.8518369881629944, + 0.8437435919761658, + 0.8486205416202545, + 0.8211554767489433, + 0.7640671442985535, + 0.7999482116699219, + 0.9456826114654541, + 0.810999361205101, + 0.8642545461654663, + 0.8051076416015625, + 0.8193947722434998, + 0.8351191815376282, + 0.7857263399124146, + 0.9166569149971008, + 0.7972983899593353, + 0.9325546828269958, + 0.7981749772071839, + 0.8134522473335266, + 0.7371659188747406, + 0.7727094465255737, + 0.7542548943519592, + 0.7355351985931396, + 0.7110868342399597, + 0.7060981317520142, + 0.7146732750892639, + 0.7173495404720306, + 0.6977155768394471, + 0.6535471586227417, + 0.6667288435935974, + 0.6411734392166137, + 0.6943656763076782, + 0.6403075717926026, + 0.6615465266227722 + ], + "term_loss": [ + 1.6929137281417848, + 0.7076341553688049, + 0.832843780708313, + 0.8462161507606506, + 0.7989002693176269, + 0.8294573577880859, + 0.8796000757217407, + 0.8496675333380699, + 0.6641823264122009, + 0.734419527053833, + 1.1998622996211052, + 0.8190442297935486, + 0.8997376405477524, + 1.463374104309082, + 1.350538944530487, + 1.1835087180614472, + 1.3240371099829673, + 1.403322444820404, + 2.149280529022217, + 2.1371682680130006, + 2.6051794219970703, + 3.134266621398926, + 2.6367359077453614, + 2.9021682273864746, + 2.7777284118652346, + 3.2490100632667542, + 3.7669732330322265, + 3.564024981689453, + 2.304465440368652, + 2.9117907354354857, + 3.57571163482666, + 3.2041259724617004, + 2.1697021233558655, + 1.5657260522842407, + 1.3720391330718995, + 1.558706689453125, + 0.9739575270175934, + 1.2646527061462403, + 1.7258377660751343, + 1.2162893053054809, + 1.2816789051055908, + 0.9437851461410522, + 1.1169724729537964, + 0.8192238623142243, + 0.7615165826678276, + 0.9261411437988282, + 1.009357823753357, + 0.6213359757423401, + 0.6048593424797059, + 0.6017368167161942, + 0.5840524630784989, + 0.5252864897727967, + 0.5610690414428711, + 0.6845973509550095, + 0.5607477729558945, + 0.6126968932867051, + 0.5582075795173645, + 0.5701824194669723, + 0.5824683590888977, + 0.5440888320446015, + 0.6618193277835845, + 0.5566088491201401, + 0.6798252540588379, + 0.5569242746114731, + 0.5653092860221863, + 0.5025307513594628, + 0.5350002650260925, + 0.5163064182400704, + 0.5040774492263794, + 0.4812365728378296, + 0.47341508727073667, + 0.4825198311924934, + 0.4820213997364044, + 0.4671297842979431, + 0.4262480612754822, + 0.4348880102574825, + 0.4149773345947266, + 0.4545517260074615, + 0.4134101836204529, + 0.43013124598264696 + ], + "bridge_loss": [ + 0.9270794340786408, + 0.045553212680667636, + 0.003968565206974745, + 0.002537821502238512, + 0.0031120730198919773, + 0.0066142574056983, + 0.0196716277718544, + 0.04569760949611664, + 0.02804326199516654, + 0.021940968203544617, + 0.023567047103494405, + 0.016042337491363287, + 0.014572544375434518, + 0.01808674999922514, + 0.02120318498685956, + 0.020132692527770998, + 0.026115470457077027, + 0.022087446881830692, + 0.03340454182624817, + 0.04386694201231003, + 0.08512414672374725, + 0.10392638924121857, + 0.14596812286376953, + 0.19242930736541747, + 0.1708755298614502, + 0.2332140768289566, + 0.30846771535873413, + 0.28443601269721985, + 0.23180612392425537, + 0.21575192351341246, + 0.30160183690786363, + 0.2529610634982586, + 0.25124281091690065, + 0.13896957349777223, + 0.14441813020706176, + 0.199903391456604, + 0.13990903476476668, + 0.12412642853856087, + 0.19780184895992278, + 0.09088843083381652, + 0.09028354053497314, + 0.10483143763542176, + 0.10901366031169892, + 0.06172756772786379, + 0.048116388000547884, + 0.059933180809021, + 0.08071009765267372, + 0.040531087708473204, + 0.03966846313476562, + 0.049442718121409414, + 0.041820975951850414, + 0.03792309836894274, + 0.03355912851691246, + 0.054180008935928343, + 0.04611676089167595, + 0.046126355296373364, + 0.04175337711572647, + 0.03904522615373135, + 0.04093780878186226, + 0.03443106972575188, + 0.04773863691091537, + 0.03512803372144699, + 0.04503686083853245, + 0.03661287835687399, + 0.04466721993088722, + 0.03356916709542274, + 0.033895546194911, + 0.03588070866465569, + 0.030623928356170654, + 0.030353828406333924, + 0.03458711423873902, + 0.033419507718086244, + 0.037426383411884305, + 0.0331623010635376, + 0.030711766165494918, + 0.035254054686427116, + 0.029518259859085082, + 0.04370544706583023, + 0.03128685694634915, + 0.0357342723429203 + ], + "tgrad_loss": [ + 0.28240168471336363, + 0.1879955181479454, + 0.1416285768508911, + 0.12150168550014497, + 0.10923070974349976, + 0.10512643830776215, + 0.10700090990066528, + 0.10979201674461364, + 0.10227687674164772, + 0.1073074081659317, + 0.12808603233098984, + 0.1089473068356514, + 0.10942141929864883, + 0.12269907640218734, + 0.11955996571779251, + 0.1084564683675766, + 0.1133196670204401, + 0.1114184632062912, + 0.1333950751066208, + 0.1294173326253891, + 0.14347079792022704, + 0.1475648888349533, + 0.14359098019599914, + 0.15614077184200287, + 0.15338412828445436, + 0.1580532071352005, + 0.167467866563797, + 0.1748211373090744, + 0.15284905924797057, + 0.17211710295677185, + 0.17599477090835572, + 0.18209742259979247, + 0.16373461263179778, + 0.1626895320892334, + 0.15704822034835816, + 0.16348580796718598, + 0.1575368951320648, + 0.1786741998195648, + 0.1874880330324173, + 0.18480085792541504, + 0.19987909994125366, + 0.18863038229942322, + 0.1928264294862747, + 0.19359489631652832, + 0.19726645183563232, + 0.19967118492126465, + 0.1934531969308853, + 0.1899699252128601, + 0.19921578810214996, + 0.19744101244211196, + 0.19528203347921372, + 0.20085754714012147, + 0.20532003726959228, + 0.20690523879528044, + 0.20413482726812363, + 0.20543130034208298, + 0.2051466886997223, + 0.21016712760925294, + 0.21171300716400146, + 0.20720643639564515, + 0.2070989497900009, + 0.2055615005493164, + 0.20769256865978242, + 0.20463782558441163, + 0.20347574241161345, + 0.20106599922180177, + 0.20381363768577576, + 0.2020677721977234, + 0.20083382663726806, + 0.1994964292526245, + 0.19809593105316162, + 0.1987339344024658, + 0.19790175647735594, + 0.19742349796295167, + 0.1965873306274414, + 0.19658677837848662, + 0.1966778451681137, + 0.19610850033760072, + 0.19561053042411805, + 0.19568100452423096 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.010387556627392769, + 0.06787668168544769, + 0.11108389496803284, + 0.11367877572774887, + 0.11491300165653229, + 0.1093105673789978, + 0.11488444358110428, + 0.12266267836093903 + ], + "perturbation_rho": [ + 0.0504305437207222, + 0.11780044436454773, + 0.23789767920970917, + 0.24238067865371704, + 0.22429296374320984, + 0.25153419375419617, + 0.25647929310798645, + 0.22654107213020325 + ], + "nudging": { + "0.001": [ + -0.00042957920231856406, + -0.0005755086895078421, + -0.0007836788427084684, + -0.0008127648616209626, + -0.0008176113478839397, + -0.0008154284441843629, + -0.0008326433598995209, + -0.0008715562289580703 + ], + "0.003": [ + -0.0012653844896703959, + -0.0017247737850993872, + -0.002354162745177746, + -0.002438494935631752, + -0.002453066874295473, + -0.0024441296700388193, + -0.00249684345908463, + -0.002618872094899416 + ], + "0.01": [ + -0.003928218502551317, + -0.0057389335706830025, + -0.007835019379854202, + -0.008116443641483784, + -0.0081653306260705, + -0.00813683308660984, + -0.008312376216053963, + -0.00871281512081623 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.0_L8_s456.json b/results/synth_ladder_v2_lo/synth_a0.0_L8_s456.json new file mode 100644 index 0000000..98e3c0a --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.0_L8_s456.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0602704408168793, + 0.5027601260185242, + 0.43080672092437744, + 0.4305861669540405, + 0.35372886188030245, + 0.35343530569076537, + 0.3411521464467049, + 0.3113056640148163, + 0.3555877588272095, + 0.35838791880607607, + 0.310362742805481, + 0.2821650200843811, + 0.26945531539916995, + 0.27178956003189086, + 0.3010430852890015, + 0.28751621344089506, + 0.2822985043525696, + 0.28170071473121644, + 0.2461530613899231, + 0.2909035976409912, + 0.2241233106136322, + 0.22891775674819947, + 0.2648821008682251, + 0.29351482318639754, + 0.21875614569187166, + 0.19591772537231444, + 0.19844525773525237, + 0.1983874746322632, + 0.21039879322052002, + 0.1819182156085968, + 0.2276622181892395, + 0.191768607711792, + 0.18294820175170898, + 0.17453236331939698, + 0.20749281368255615, + 0.17378860583305358, + 0.1630034108877182, + 0.1688230975151062, + 0.1894659786939621, + 0.15866619582176208, + 0.17937585167884826, + 0.16238984402418136, + 0.15362602603435516, + 0.15638497247695923, + 0.14544389412403105, + 0.14327869791686534, + 0.13311278290748596, + 0.1496122142314911, + 0.15034341797828674, + 0.14216417129039766, + 0.14079184398651123, + 0.14070965950489045, + 0.12715232799053192, + 0.1181271733045578, + 0.12163998708724975, + 0.11910948114395141, + 0.12497851085662842, + 0.12175717628002167, + 0.11586888887882232, + 0.11415803298354149, + 0.10847577197551728, + 0.11201638069152832, + 0.10924316263198852, + 0.10966023950576782, + 0.10431095411777497, + 0.10155300235748291, + 0.10120472279787064, + 0.09946133661270141, + 0.09955022404193878, + 0.09832342414855957, + 0.09743722066879272, + 0.0961718876838684, + 0.09559566440582275, + 0.09503851671218871, + 0.0945616308093071, + 0.09419615615606308, + 0.09386814022064209, + 0.09363705427646637, + 0.09348938752114773, + 0.09341154512763024 + ], + "train_acc": [ + 0.6262, + 0.8013, + 0.8277, + 0.8347, + 0.8597, + 0.856, + 0.8639, + 0.8759, + 0.8605, + 0.8558, + 0.876, + 0.8879, + 0.8957, + 0.8886, + 0.8799, + 0.8868, + 0.8868, + 0.8889, + 0.898, + 0.8824, + 0.9111, + 0.9088, + 0.8934, + 0.8869, + 0.9131, + 0.9217, + 0.9206, + 0.9224, + 0.9156, + 0.928, + 0.9094, + 0.9244, + 0.9292, + 0.9307, + 0.9179, + 0.9306, + 0.938, + 0.9331, + 0.9251, + 0.9413, + 0.9292, + 0.9359, + 0.9409, + 0.9407, + 0.9444, + 0.9484, + 0.9544, + 0.9445, + 0.9418, + 0.9453, + 0.9472, + 0.9467, + 0.957, + 0.9605, + 0.9597, + 0.9608, + 0.9553, + 0.9582, + 0.9636, + 0.9629, + 0.968, + 0.9654, + 0.966, + 0.9668, + 0.9684, + 0.9709, + 0.9703, + 0.9731, + 0.9733, + 0.973, + 0.9743, + 0.9753, + 0.976, + 0.9762, + 0.9765, + 0.9766, + 0.9766, + 0.9769, + 0.9771, + 0.9771 + ], + "test_acc": [ + 0.786, + 0.819, + 0.8195, + 0.8455, + 0.8495, + 0.847, + 0.857, + 0.8615, + 0.851, + 0.862, + 0.862, + 0.8575, + 0.8705, + 0.86, + 0.8645, + 0.859, + 0.864, + 0.8685, + 0.866, + 0.8715, + 0.8755, + 0.869, + 0.8595, + 0.868, + 0.875, + 0.8755, + 0.8865, + 0.8725, + 0.8845, + 0.8835, + 0.871, + 0.881, + 0.881, + 0.891, + 0.883, + 0.8805, + 0.891, + 0.8805, + 0.889, + 0.889, + 0.89, + 0.8835, + 0.896, + 0.889, + 0.888, + 0.892, + 0.898, + 0.893, + 0.899, + 0.8955, + 0.892, + 0.895, + 0.9015, + 0.8965, + 0.8935, + 0.895, + 0.902, + 0.896, + 0.9005, + 0.8985, + 0.8925, + 0.9015, + 0.899, + 0.8965, + 0.8985, + 0.8985, + 0.9005, + 0.899, + 0.8965, + 0.9005, + 0.8975, + 0.901, + 0.899, + 0.8975, + 0.8975, + 0.898, + 0.8965, + 0.8965, + 0.8965, + 0.8965 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9283311367034912, + 0.9162832498550415, + 0.8925424814224243, + 0.8799441456794739, + 0.8746041655540466, + 0.8698863983154297, + 0.8666130304336548, + 0.863634467124939 + ], + "perturbation_rho": [ + 0.9999991059303284, + 0.9999967217445374, + 0.9999891519546509, + 0.9999651908874512, + 0.9999410510063171, + 0.9999043941497803, + 0.9998966455459595, + 0.9999027252197266 + ], + "nudging": { + "0.001": [ + -0.0268093291670084, + -0.012417184188961983, + -0.006203295662999153, + -0.0037101488560438156, + -0.0026736343279480934, + -0.002185049932450056, + -0.0019234392093494534, + -0.0017743848729878664 + ], + "0.003": [ + -0.07339517027139664, + -0.0357743538916111, + -0.018248513340950012, + -0.011002784594893456, + -0.007955053821206093, + -0.0065111806616187096, + -0.005736147053539753, + -0.005294123664498329 + ], + "0.01": [ + -0.17811693251132965, + -0.10346511751413345, + -0.05678309500217438, + -0.035222865641117096, + -0.025761041790246964, + -0.021198198199272156, + -0.01872769370675087, + -0.017311803996562958 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.130140475845337, + 1.068121821975708, + 0.6906124912261963, + 0.5849464416503907, + 0.539908002948761, + 0.5278588153839111, + 0.4802340653896332, + 0.4802248366832733, + 0.5312753393173217, + 0.5193623352050781, + 0.5183892659187317, + 0.5653032401919365, + 0.5576160436630249, + 0.5253325591087341, + 0.6005686638832092, + 0.600859852027893, + 0.6416343383789063, + 0.6754157733917237, + 0.6742553455352783, + 0.6983654169082641, + 0.7714478206634522, + 0.907026005935669, + 0.7574946401596069, + 0.7974853692531586, + 0.6163667502880097, + 0.6207158555030823, + 0.6624710424423218, + 0.767758971786499, + 0.7936295557022095, + 0.7818759674072265, + 0.6439841373443603, + 0.7241471338272095, + 0.7835567468881607, + 0.5556868800163269, + 0.7838432991981507, + 0.6678941816329956, + 0.5996702154159546, + 0.6219454681396485, + 0.6077403234004974, + 0.5930344202041626, + 0.7072095224380494, + 0.6957413219451904, + 0.6925682455062866, + 0.5746548117637634, + 0.5665205227851867, + 0.652870412158966, + 0.5017711290359497, + 0.5837478618621826, + 0.4854253540992737, + 0.4386099347114563, + 0.4709485713005066, + 0.5079970285415649, + 0.5075192336320877, + 0.49625477714538574, + 0.5056534718036652, + 0.4276254318237305, + 0.5216204251050949, + 0.41532413592338563, + 0.42688399028778073, + 0.4528659384965897, + 0.40737592430114744, + 0.4285537419319153, + 0.4251507745742798, + 0.3982658393383026, + 0.3921439680337906, + 0.4048129905462265, + 0.3849823941230774, + 0.37166397957801817, + 0.3756074117660522, + 0.37098817892074587, + 0.37144046624898913, + 0.36408291239738466, + 0.36373486807346345, + 0.3633287199020386, + 0.35742094442248346, + 0.35612085094451906, + 0.35380580410957335, + 0.3545500941991806, + 0.3522390522420406, + 0.3517058536529541 + ], + "train_acc": [ + 0.2243, + 0.6106, + 0.7399, + 0.7827, + 0.794, + 0.8004, + 0.8171, + 0.8253, + 0.8161, + 0.8205, + 0.8272, + 0.8178, + 0.8203, + 0.8305, + 0.8221, + 0.8243, + 0.8261, + 0.8204, + 0.8166, + 0.821, + 0.8069, + 0.7971, + 0.8102, + 0.8044, + 0.8348, + 0.8323, + 0.8294, + 0.8073, + 0.8135, + 0.8034, + 0.829, + 0.8167, + 0.811, + 0.8429, + 0.8065, + 0.8205, + 0.8317, + 0.8341, + 0.8319, + 0.8325, + 0.8167, + 0.8122, + 0.818, + 0.8326, + 0.8371, + 0.8246, + 0.8514, + 0.8328, + 0.8522, + 0.8603, + 0.8509, + 0.8455, + 0.8445, + 0.8496, + 0.8461, + 0.86, + 0.8445, + 0.8679, + 0.8654, + 0.8542, + 0.8667, + 0.8642, + 0.8677, + 0.8696, + 0.8685, + 0.8666, + 0.8719, + 0.8757, + 0.8746, + 0.8747, + 0.8768, + 0.8776, + 0.8759, + 0.8769, + 0.8774, + 0.8784, + 0.8793, + 0.8792, + 0.8796, + 0.8795 + ], + "test_acc": [ + 0.463, + 0.6815, + 0.744, + 0.7455, + 0.7515, + 0.7875, + 0.7565, + 0.7965, + 0.764, + 0.77, + 0.778, + 0.7455, + 0.768, + 0.7625, + 0.8125, + 0.745, + 0.7205, + 0.774, + 0.709, + 0.7445, + 0.7275, + 0.787, + 0.7495, + 0.7855, + 0.809, + 0.7825, + 0.718, + 0.7635, + 0.7445, + 0.7795, + 0.755, + 0.7165, + 0.7715, + 0.734, + 0.768, + 0.778, + 0.76, + 0.7275, + 0.7785, + 0.714, + 0.765, + 0.7515, + 0.779, + 0.713, + 0.7855, + 0.797, + 0.7775, + 0.79, + 0.811, + 0.7785, + 0.7895, + 0.7415, + 0.7975, + 0.7715, + 0.8085, + 0.7865, + 0.8095, + 0.8235, + 0.81, + 0.8135, + 0.8165, + 0.808, + 0.828, + 0.8165, + 0.8235, + 0.8185, + 0.8275, + 0.828, + 0.8235, + 0.824, + 0.823, + 0.824, + 0.8315, + 0.8305, + 0.832, + 0.834, + 0.831, + 0.833, + 0.8335, + 0.833 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.020978286862373352, + 0.16464680433273315, + 0.15073026716709137, + 0.08116275072097778, + 0.08070477098226547, + 0.0867747962474823, + 0.10854049026966095, + 0.11201675236225128 + ], + "perturbation_rho": [ + 0.032643549144268036, + 0.2071959227323532, + 0.2057623416185379, + 0.09326457977294922, + 0.06205561012029648, + 0.1389445811510086, + 0.11340519785881042, + 0.08505052328109741 + ], + "nudging": { + "0.001": [ + -0.0014469942543655634, + -0.000573523691855371, + -0.00041266781045123935, + -0.00018763300613500178, + -0.00020507823501247913, + -0.00022557468037120998, + -0.0002862402761820704, + -0.00027868736651726067 + ], + "0.003": [ + -0.004212609492242336, + -0.0017168434569612145, + -0.0012332911137491465, + -0.0005597122944891453, + -0.000612777890637517, + -0.0006744061829522252, + -0.0008597993873991072, + -0.0008341555367223918 + ], + "0.01": [ + -0.012655803002417088, + -0.005697320215404034, + -0.004094945732504129, + -0.0018561023753136396, + -0.0020380420610308647, + -0.0022426587529480457, + -0.002856952603906393, + -0.0027735023759305477 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.6613537705421448, + 0.8804613601207734, + 0.6975507205963135, + 0.7853355399608613, + 0.8572468722343445, + 0.9299439128875733, + 0.9885676727294922, + 1.0133089805603028, + 0.9962917245864868, + 0.9606268395423889, + 0.9880515659332275, + 0.9777737205505371, + 0.9968037183761597, + 0.9445726100921631, + 1.020095972442627, + 1.0027801685333253, + 0.9952171697616577, + 0.9394625225067139, + 0.9024322465896606, + 0.8761118396759033, + 0.8587080497741699, + 0.8608775177001953, + 0.858176763343811, + 0.8500239983558655, + 0.8605942026138306, + 0.8296343204498291, + 0.8473277267456054, + 0.9032470754623413, + 0.8595288021087647, + 0.8529232517242432, + 0.8514831623077392, + 0.7993372547149659, + 0.7925733268737793, + 0.7777183090209961, + 0.752255222415924, + 0.737820636177063, + 0.718349192905426, + 0.7632894110679627, + 0.7490254787445069, + 0.7206074246406555, + 0.72772101688385, + 0.7681838896751404, + 0.7500456344604493, + 0.7505516075134278, + 0.7438103253364563, + 0.7039294353485107, + 0.7070825775623322, + 0.7316446516036987, + 0.6909497563362121, + 0.6812596918106079, + 0.6990848143577576, + 0.6861800757408142, + 0.6805085423469543, + 0.6727995056152344, + 0.6663222888946533, + 0.6554413802146911, + 0.65927137966156, + 0.6400224656105041, + 0.626771753025055, + 0.6305665927886963, + 0.6282225363254547, + 0.6152347024440765, + 0.6126221405029297, + 0.6149387537956238, + 0.6082951297283172, + 0.5970498047828674, + 0.6011845873832703, + 0.5955050713539124, + 0.5878239162445068, + 0.5866915851593018, + 0.5876003602027893, + 0.5810875995635987, + 0.5816027210235596, + 0.5784582069873809, + 0.5760020084381103, + 0.5744486512184143, + 0.5738656497955322, + 0.5729139318466187, + 0.5723003579139709, + 0.5719887516021729 + ], + "train_acc": [ + 0.3893, + 0.6696, + 0.7401, + 0.7421, + 0.719, + 0.6886, + 0.6631, + 0.6603, + 0.6661, + 0.6592, + 0.6494, + 0.6491, + 0.6455, + 0.6682, + 0.6508, + 0.6536, + 0.6601, + 0.6722, + 0.6882, + 0.6953, + 0.7005, + 0.7068, + 0.6992, + 0.6956, + 0.7035, + 0.7091, + 0.703, + 0.689, + 0.6964, + 0.7009, + 0.7001, + 0.7172, + 0.7219, + 0.7283, + 0.7337, + 0.7369, + 0.745, + 0.7332, + 0.7355, + 0.7415, + 0.7396, + 0.7345, + 0.736, + 0.7369, + 0.7385, + 0.7482, + 0.7451, + 0.7373, + 0.7529, + 0.7547, + 0.7536, + 0.7591, + 0.7564, + 0.7642, + 0.7664, + 0.766, + 0.7665, + 0.7756, + 0.78, + 0.7785, + 0.7795, + 0.7829, + 0.7842, + 0.7826, + 0.7866, + 0.7876, + 0.7873, + 0.7893, + 0.7907, + 0.7927, + 0.7913, + 0.7943, + 0.7931, + 0.796, + 0.7968, + 0.7963, + 0.7959, + 0.7962, + 0.7964, + 0.7964 + ], + "test_acc": [ + 0.5895, + 0.683, + 0.724, + 0.7075, + 0.659, + 0.6335, + 0.64, + 0.645, + 0.645, + 0.6335, + 0.6375, + 0.6195, + 0.651, + 0.6245, + 0.648, + 0.6265, + 0.6325, + 0.663, + 0.644, + 0.634, + 0.6665, + 0.6655, + 0.6565, + 0.6745, + 0.6635, + 0.669, + 0.6515, + 0.631, + 0.6075, + 0.611, + 0.6985, + 0.6515, + 0.678, + 0.6845, + 0.6845, + 0.696, + 0.6915, + 0.689, + 0.7035, + 0.6985, + 0.695, + 0.6895, + 0.692, + 0.689, + 0.716, + 0.704, + 0.6965, + 0.708, + 0.7095, + 0.701, + 0.735, + 0.71, + 0.722, + 0.722, + 0.7365, + 0.734, + 0.7335, + 0.728, + 0.733, + 0.7315, + 0.728, + 0.74, + 0.7435, + 0.7445, + 0.746, + 0.7455, + 0.7425, + 0.7465, + 0.7495, + 0.7565, + 0.755, + 0.742, + 0.7545, + 0.7535, + 0.753, + 0.749, + 0.749, + 0.7495, + 0.7505, + 0.7495 + ], + "state_pred_error": [ + 0.6588439248561859, + 0.18840705387592316, + 0.14289978892803193, + 0.15212055261135102, + 0.17622629220485686, + 0.19014827156066894, + 0.1907501521587372, + 0.1974239867210388, + 0.20479401926994323, + 0.19324371876716614, + 0.1692460091352463, + 0.14547201271057128, + 0.13392872540950776, + 0.13207265970706938, + 0.12733380571603775, + 0.12442956283092499, + 0.11992262068986893, + 0.11454836254119873, + 0.10640433104038238, + 0.09588282935619354, + 0.08941714116334915, + 0.08326569969654084, + 0.08106024689674378, + 0.07807673720121383, + 0.06985928665399552, + 0.05780385282039642, + 0.04903316358923912, + 0.042540194964408876, + 0.03769502246379852, + 0.03340193069577217, + 0.030505492842197418, + 0.027835199296474458, + 0.026414455169439317, + 0.026154682007431984, + 0.027012317779660226, + 0.027285932829976083, + 0.02783989610671997, + 0.02848111428618431, + 0.02768479132056236, + 0.026838592088222504, + 0.025692131254076957, + 0.0250046414911747, + 0.024446581745147706, + 0.023822997540235518, + 0.023123727387189864, + 0.023240181931853295, + 0.022701505839824675, + 0.022446804578602313, + 0.02224079295396805, + 0.02201542984545231, + 0.022186503106355667, + 0.022374201011657716, + 0.022197162532806396, + 0.022024760249257088, + 0.021556022208929063, + 0.020752609607577324, + 0.02029846299290657, + 0.01939405950307846, + 0.01925926080942154, + 0.0179039378374815, + 0.01723805043101311, + 0.016645756682753563, + 0.016013126088678838, + 0.015421504980325698, + 0.014981058233976365, + 0.014707353785634042, + 0.014117280274629593, + 0.013762151800096035, + 0.013112149319052696, + 0.012881575208902358, + 0.01252510030567646, + 0.012011728531122208, + 0.011849733792245389, + 0.01146787409633398, + 0.011190799026191234, + 0.01094292304366827, + 0.01079139669984579, + 0.010453094108402729, + 0.010252758046984672, + 0.010227990358322859 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8467778563499451, + 0.3549606502056122, + 0.1711018681526184, + 0.12375819683074951, + 0.1153455525636673, + 0.12219913303852081, + 0.12895643711090088, + 0.10622675716876984 + ], + "perturbation_rho": [ + 0.7416437268257141, + 0.2796669900417328, + 0.14060860872268677, + 0.09820520132780075, + 0.10454020649194717, + 0.08740514516830444, + 0.10375625640153885, + 0.12008601427078247 + ], + "nudging": { + "0.001": [ + -0.02524612657725811, + -0.0010118680074810982, + -0.00039384554838761687, + -0.0002958686964120716, + -0.00027316075284034014, + -0.0002826714771799743, + -0.0002984246239066124, + -0.00024543559993617237 + ], + "0.003": [ + -0.07356468588113785, + -0.003032396547496319, + -0.0011817947961390018, + -0.0008877563523128629, + -0.0008196210255846381, + -0.0008473420166410506, + -0.0008945445879362524, + -0.0007367263897322118 + ], + "0.01": [ + -0.2212277054786682, + -0.010068328119814396, + -0.00393392750993371, + -0.002955838106572628, + -0.0027290289290249348, + -0.0028208147268742323, + -0.002979037119075656, + -0.002453283406794071 + ] + }, + "state_pred_error_per_layer": [ + 10942.7939453125, + 10293.740234375, + 7482.4482421875, + 5008.9619140625, + 4863.818359375, + 4492.451171875, + 3565.2744140625, + 3837.47998046875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1349513092041015, + 1.0799473155021668, + 0.6904095640182495, + 0.5730169864654541, + 0.5376711503982544, + 0.5217435983657837, + 0.5241446275711059, + 0.5752555076599121, + 0.5162794561386108, + 0.5799625160217285, + 0.5156625980377197, + 0.54727692527771, + 0.5622692403793335, + 0.6077177556037903, + 0.6142744152069092, + 0.5783923351287842, + 0.5948413852691651, + 0.7985807825088501, + 0.7876970001220703, + 1.0439940561294556, + 0.7259676246643066, + 0.8126457204818726, + 0.7394346284866333, + 0.8870538883209228, + 0.8942244791984558, + 1.018878134918213, + 1.1607880065917968, + 1.2915550483703613, + 1.0802051795959473, + 1.132888382291794, + 1.0752713064193726, + 1.2749524337768554, + 1.3533095266342163, + 1.254620951271057, + 1.327561699104309, + 1.3512781272888184, + 1.358589473247528, + 1.3133805484771728, + 1.3522217433929444, + 1.2569283782958984, + 1.2115153579711915, + 1.1729324398040772, + 1.458994796180725, + 1.1794059185028076, + 1.1593233011245727, + 1.1951527072906494, + 1.3532650127410888, + 1.2816025928497314, + 1.2753959981918335, + 1.3296147323608398, + 1.3296164437294007, + 1.4913486896514894, + 1.4076004596948624, + 1.4025042806625365, + 1.5456968538284301, + 1.5032260831832887, + 1.541390106201172, + 1.5214945098876953, + 1.5504541542053223, + 1.6073409852027893, + 1.5711617599487304, + 1.5610263828277589, + 1.5516953735351562, + 1.538286647415161, + 1.5312161500930785, + 1.5014611629486083, + 1.49632290391922, + 1.4762050870895387, + 1.4426008732795714, + 1.4320516025543213, + 1.4142663345336914, + 1.4014085182189941, + 1.3942050539970399, + 1.3843670928955079, + 1.381881692504883, + 1.3740321586608886, + 1.370679066848755, + 1.3696322021484375, + 1.3669484914779664, + 1.3658903411865235 + ], + "train_acc": [ + 0.2258, + 0.6057, + 0.7399, + 0.781, + 0.794, + 0.806, + 0.8037, + 0.7994, + 0.8165, + 0.809, + 0.8278, + 0.8214, + 0.825, + 0.8179, + 0.8185, + 0.8293, + 0.8265, + 0.7944, + 0.8036, + 0.7689, + 0.8042, + 0.7954, + 0.7949, + 0.7834, + 0.7894, + 0.767, + 0.7489, + 0.7289, + 0.7411, + 0.7199, + 0.7209, + 0.6906, + 0.6894, + 0.6987, + 0.6832, + 0.6712, + 0.6676, + 0.6648, + 0.6652, + 0.6608, + 0.665, + 0.6695, + 0.6347, + 0.6647, + 0.6674, + 0.6599, + 0.6289, + 0.637, + 0.6461, + 0.6344, + 0.6359, + 0.6245, + 0.6301, + 0.6303, + 0.6141, + 0.6183, + 0.6157, + 0.6167, + 0.6148, + 0.6119, + 0.6073, + 0.6164, + 0.6129, + 0.6116, + 0.6111, + 0.6167, + 0.6114, + 0.6142, + 0.6226, + 0.6232, + 0.625, + 0.6244, + 0.6286, + 0.628, + 0.6261, + 0.6275, + 0.6284, + 0.6295, + 0.6297, + 0.6298 + ], + "test_acc": [ + 0.452, + 0.688, + 0.7325, + 0.7685, + 0.7775, + 0.752, + 0.767, + 0.7435, + 0.757, + 0.785, + 0.76, + 0.7375, + 0.761, + 0.7525, + 0.786, + 0.766, + 0.681, + 0.745, + 0.6875, + 0.737, + 0.7465, + 0.7495, + 0.707, + 0.731, + 0.7445, + 0.7165, + 0.654, + 0.6635, + 0.699, + 0.6565, + 0.6125, + 0.609, + 0.6125, + 0.669, + 0.634, + 0.6155, + 0.6165, + 0.612, + 0.5675, + 0.669, + 0.619, + 0.514, + 0.632, + 0.6165, + 0.635, + 0.533, + 0.586, + 0.5425, + 0.554, + 0.6015, + 0.5345, + 0.586, + 0.6125, + 0.5765, + 0.5875, + 0.613, + 0.608, + 0.61, + 0.5825, + 0.5925, + 0.5925, + 0.5935, + 0.608, + 0.6025, + 0.6035, + 0.5975, + 0.611, + 0.605, + 0.6095, + 0.6115, + 0.6155, + 0.616, + 0.6105, + 0.6155, + 0.616, + 0.615, + 0.6185, + 0.6185, + 0.618, + 0.617 + ], + "value_loss": [ + 2.727321440219879, + 0.9396097582817078, + 0.8612026205062866, + 0.8072550956726074, + 0.7662750400066376, + 0.8116222425937653, + 0.7918028060913086, + 1.058762281036377, + 0.9410865303039551, + 1.1683196662902833, + 0.8891641233444214, + 1.0408354179382324, + 1.2426973400115966, + 1.3723524351119996, + 1.3864970308303832, + 1.2711094731330872, + 1.4452000873565674, + 2.0964325157165526, + 2.503941488647461, + 3.8773516985416414, + 2.1931466732025147, + 2.4717007579803467, + 1.8694116882324219, + 2.562740281677246, + 2.7024575206756594, + 3.388196944236755, + 4.119316976737976, + 4.325601746749878, + 3.317746393966675, + 3.243412302494049, + 2.8255897121429445, + 3.7306121185302734, + 4.122640119934082, + 3.4347802352905275, + 3.8012741462707518, + 3.5787492347717285, + 3.369715265369415, + 2.77193868560791, + 3.474485213088989, + 2.375825690841675, + 2.1312103996276854, + 1.956772960472107, + 3.083518902397156, + 1.9400283665657043, + 1.692312808418274, + 1.5720748712539674, + 1.8764948084831239, + 1.6743739032745362, + 1.567044317626953, + 1.7899606132507324, + 1.9826876150131225, + 2.5111199203491212, + 1.8491062855243683, + 1.746228759765625, + 2.085294245147705, + 1.9948427753448486, + 1.9512831954956054, + 2.158460530471802, + 2.0963551795959474, + 2.327825161552429, + 2.352580466079712, + 2.054654391479492, + 1.8559182556152343, + 1.8292891555786133, + 1.755587695646286, + 1.710701921081543, + 1.6332559819698333, + 1.5935078775405884, + 1.5094772003889083, + 1.5422865842342377, + 1.476211569213867, + 1.4243068096637725, + 1.2866611572265625, + 1.2408681606292724, + 1.2721347715377807, + 1.1996249546051025, + 1.210354462814331, + 1.1556780391693116, + 1.1320207769393922, + 1.2871107803344726 + ], + "term_loss": [ + 1.6279608231544496, + 0.704119206237793, + 0.7059318660736084, + 0.6708632150650025, + 0.6246756870269775, + 0.6474101797103882, + 0.6305780605316162, + 0.9013450145721436, + 0.8003977013587952, + 1.014212282562256, + 0.7516019021987915, + 0.8989673347473145, + 1.1009173652648925, + 1.221914840745926, + 1.2337085500240326, + 1.1299663187503814, + 1.2949002643585206, + 1.9072193572998046, + 2.2973386978149413, + 3.4965499984025956, + 1.9051358992099763, + 2.1613095233917234, + 1.5260497505187989, + 2.1684676694869993, + 2.3560955852508543, + 3.0179900035858154, + 3.702320911979675, + 3.7875602326393127, + 2.8640588617324827, + 2.8004565309524536, + 2.397008271789551, + 3.191488564300537, + 3.68539259185791, + 2.979008136749268, + 3.262051542663574, + 3.0784937271118165, + 2.832118960571289, + 2.343948299407959, + 2.996490676879883, + 1.9708608936309815, + 1.7158579580783844, + 1.5594909168243407, + 2.6169842109680177, + 1.5474250222682953, + 1.3258218050837516, + 1.1993716355800628, + 1.4649041637420654, + 1.2486765979766845, + 1.1667367574691772, + 1.3506693029403687, + 1.5352664937973022, + 2.035203108596802, + 1.457682236149907, + 1.3602924033164978, + 1.679940075302124, + 1.588972739124298, + 1.552276259613037, + 1.731438402557373, + 1.7071564056396484, + 1.8799896495819093, + 1.9350618648529052, + 1.6424618713378907, + 1.4868921995162965, + 1.446955292892456, + 1.3913815165519714, + 1.34365530128479, + 1.2715293394446372, + 1.2260353670597077, + 1.1480308882594108, + 1.1766893856525422, + 1.1144582271575927, + 1.0618839118480683, + 0.9506599808931351, + 0.9098234622478485, + 0.9204758085250855, + 0.8746725267410278, + 0.8588070724487304, + 0.8281577826499938, + 0.797250756931305, + 0.9274139808654785 + ], + "bridge_loss": [ + 0.8083143433531106, + 0.03534272773116827, + 0.004054905174672604, + 0.0025750217221677304, + 0.0111042478621006, + 0.03642336260080337, + 0.03164129929542542, + 0.01822726946026087, + 0.013087374910712242, + 0.01670566949248314, + 0.012304777045547962, + 0.013311486148834229, + 0.012470375210046769, + 0.015150112447142601, + 0.017846742632985114, + 0.012756926289200783, + 0.01719350122511387, + 0.029539665845036506, + 0.049753447246551515, + 0.19335796689391135, + 0.1377138121843338, + 0.14538880939483642, + 0.1858158534049988, + 0.22088744847774505, + 0.17615320081710814, + 0.17890373020172118, + 0.208697167468071, + 0.317703052854538, + 0.2462163796842098, + 0.21817022037506104, + 0.20710145602226257, + 0.2946344936847687, + 0.18753280954360962, + 0.21550205829143523, + 0.28386482191085816, + 0.238300489795208, + 0.2713253611803055, + 0.16291713156700136, + 0.21267032642364503, + 0.14305857858657836, + 0.1569474487543106, + 0.14258797616362573, + 0.18065397282838822, + 0.13496598809361457, + 0.11368236303329468, + 0.11145756494998932, + 0.12573257199525834, + 0.14761312683820724, + 0.12837004759311677, + 0.15965413780212404, + 0.1698465512096882, + 0.18340668123960496, + 0.10641542260348796, + 0.10253700153827668, + 0.10657473990917206, + 0.1121935983300209, + 0.10271678879261018, + 0.13303805556297302, + 0.09351474790573121, + 0.14432539250850676, + 0.11737795681953431, + 0.11367511397600175, + 0.07074648933410645, + 0.08508506771326065, + 0.06773971323072911, + 0.07468509637117386, + 0.06730701846480369, + 0.07540959911942482, + 0.07412677040994167, + 0.08127087873220444, + 0.07701363701820374, + 0.07957754820287227, + 0.05529560489952564, + 0.05010534638762474, + 0.0712317577123642, + 0.046139729899168015, + 0.072980900400877, + 0.04892427727878094, + 0.056062604546546935, + 0.0815536917924881 + ], + "tgrad_loss": [ + 0.2910462556838989, + 0.2001478245973587, + 0.15121584887504577, + 0.13381686885356903, + 0.13049510194063188, + 0.12778870586156846, + 0.129583452129364, + 0.13919000265598297, + 0.1276014597415924, + 0.13740170998573303, + 0.12525744400024413, + 0.12855659551620482, + 0.12930960359573365, + 0.13528747370243072, + 0.13494173312187194, + 0.12838622679710388, + 0.1331063397884369, + 0.15967349395751954, + 0.15684934887886048, + 0.18744370300769805, + 0.15029693999290467, + 0.16500240364074706, + 0.1575460779428482, + 0.17338516240119933, + 0.1702087482213974, + 0.19130323677062988, + 0.2082989068508148, + 0.22033847556114197, + 0.20747117023468017, + 0.2247855720281601, + 0.2214799639225006, + 0.2444890670776367, + 0.24971474064588547, + 0.24027000885009767, + 0.2553577440261841, + 0.26195502963066103, + 0.2662709293603897, + 0.2650732141494751, + 0.2653242133140564, + 0.261906224489212, + 0.2584049981594086, + 0.25469407353401186, + 0.28588071343898774, + 0.2576373676300049, + 0.25280862176418306, + 0.2612456651687622, + 0.28585807564258575, + 0.27808416323661805, + 0.27193750815391543, + 0.2796371641159058, + 0.2775745363712311, + 0.2925101243019104, + 0.2850086217224598, + 0.2833993576049805, + 0.2987794400215149, + 0.2936764407157898, + 0.2962901576042175, + 0.2939840517044067, + 0.2956840163230896, + 0.3035101066350937, + 0.30014064073562624, + 0.29851739921569825, + 0.2982795658111572, + 0.297248807144165, + 0.29646646108627317, + 0.2923615251541138, + 0.2944196360826492, + 0.2920629088878632, + 0.2873195513010025, + 0.2843263193130493, + 0.28473971853256225, + 0.28284534950256346, + 0.28070557026863097, + 0.2809393483161926, + 0.2804271911859512, + 0.27881269562244415, + 0.2785664937496185, + 0.2785959745883942, + 0.27870741724967957, + 0.2781431001186371 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03283574804663658, + 0.05836774408817291, + 0.11590129137039185, + 0.10100162029266357, + 0.1079024076461792, + 0.10276803374290466, + 0.11581481993198395, + 0.11350809782743454 + ], + "perturbation_rho": [ + 0.06095704063773155, + 0.13836193084716797, + 0.1803440898656845, + 0.1439131498336792, + 0.14064353704452515, + 0.15858328342437744, + 0.22606094181537628, + 0.17918413877487183 + ], + "nudging": { + "0.001": [ + -0.002448005136102438, + -0.0006180563941597939, + -0.0009603539947420359, + -0.0008934920188039541, + -0.0009336093789897859, + -0.0008919704705476761, + -0.0009885210311040282, + -0.000981275225058198 + ], + "0.003": [ + -0.007285828702151775, + -0.0018541133031249046, + -0.00287721143104136, + -0.0026775901205837727, + -0.00279964879155159, + -0.002672631060704589, + -0.002965346910059452, + -0.0029417702462524176 + ], + "0.01": [ + -0.023668643087148666, + -0.006166210863739252, + -0.009575091302394867, + -0.00891521479934454, + -0.00932026281952858, + -0.008899858221411705, + -0.009868312627077103, + -0.009792262688279152 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L12_s123.json b/results/synth_ladder_v2_lo/synth_a0.25_L12_s123.json new file mode 100644 index 0000000..80dd4af --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L12_s123.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0251480885505677, + 0.5381011812925339, + 0.41018714437484743, + 0.41668477268218995, + 0.3987781819820404, + 0.34647837781906127, + 0.3328484351158142, + 0.3411853968143463, + 0.31531344504356384, + 0.2811115964889526, + 0.3177991699934006, + 0.276431111907959, + 0.31507457468509675, + 0.23614442422389983, + 0.254969379901886, + 0.27476890687942507, + 0.2822477249979973, + 0.22857851524353026, + 0.2848317095279694, + 0.22646245069503784, + 0.19609259796142578, + 0.20422002878189086, + 0.2278106704711914, + 0.21199282817840576, + 0.22999722228050232, + 0.18927179362773897, + 0.1868197315096855, + 0.1624525843143463, + 0.16611186580657958, + 0.1776226815700531, + 0.18346555788517, + 0.18616020417213439, + 0.21773850283622742, + 0.17072519811987877, + 0.1434326003074646, + 0.14783699934482575, + 0.15042639310359954, + 0.12889793826341628, + 0.12356024625301361, + 0.1692313243865967, + 0.15909709224700927, + 0.1192699939250946, + 0.11174692940711975, + 0.11469121931791305, + 0.09951091033518314, + 0.09089980803132057, + 0.09371082916259765, + 0.10394041108489037, + 0.08837119708657265, + 0.0850338310956955, + 0.08094862339496613, + 0.08114566903114319, + 0.0906995141685009, + 0.078421424472332, + 0.0745745754480362, + 0.06969475071430206, + 0.0771757453918457, + 0.07762574458122254, + 0.07343646372556686, + 0.06731920648217202, + 0.06413565802574157, + 0.0694550199508667, + 0.06341172800064086, + 0.06010753145813942, + 0.0578922655582428, + 0.05571632192134857, + 0.05808653661012649, + 0.055248909771442416, + 0.05357116482257843, + 0.05281550569534302, + 0.05171134668439627, + 0.050705768856406215, + 0.04993012307882309, + 0.04970487477779388, + 0.04938072466850281, + 0.04907250826358795, + 0.048702222812175754, + 0.04849463161230087, + 0.04836083398014307, + 0.04829238135814667 + ], + "train_acc": [ + 0.6282, + 0.7909, + 0.8356, + 0.8387, + 0.8442, + 0.8678, + 0.864, + 0.8668, + 0.878, + 0.8879, + 0.8761, + 0.891, + 0.8781, + 0.9061, + 0.8998, + 0.8908, + 0.8897, + 0.9051, + 0.89, + 0.9092, + 0.924, + 0.9202, + 0.9112, + 0.9156, + 0.9113, + 0.922, + 0.9281, + 0.9346, + 0.9359, + 0.9311, + 0.9273, + 0.9257, + 0.9147, + 0.933, + 0.9439, + 0.9438, + 0.9417, + 0.9526, + 0.9544, + 0.9381, + 0.9407, + 0.9555, + 0.9599, + 0.9549, + 0.9662, + 0.9731, + 0.9685, + 0.9654, + 0.9715, + 0.9729, + 0.9751, + 0.975, + 0.9686, + 0.9772, + 0.9789, + 0.9812, + 0.9762, + 0.9755, + 0.9773, + 0.9815, + 0.9841, + 0.9801, + 0.9832, + 0.9859, + 0.9881, + 0.9893, + 0.9875, + 0.9879, + 0.9904, + 0.9916, + 0.9919, + 0.9924, + 0.993, + 0.9929, + 0.9935, + 0.9936, + 0.9937, + 0.9937, + 0.9939, + 0.9939 + ], + "test_acc": [ + 0.7655, + 0.7705, + 0.845, + 0.8445, + 0.856, + 0.8585, + 0.8535, + 0.863, + 0.863, + 0.8645, + 0.852, + 0.8735, + 0.876, + 0.868, + 0.8825, + 0.8725, + 0.869, + 0.873, + 0.8675, + 0.876, + 0.8745, + 0.8785, + 0.875, + 0.8745, + 0.8785, + 0.878, + 0.8905, + 0.881, + 0.883, + 0.889, + 0.8855, + 0.8835, + 0.8815, + 0.894, + 0.891, + 0.8865, + 0.8855, + 0.8865, + 0.884, + 0.8925, + 0.893, + 0.8995, + 0.9, + 0.894, + 0.8985, + 0.9, + 0.897, + 0.8975, + 0.895, + 0.9005, + 0.895, + 0.904, + 0.8985, + 0.899, + 0.9025, + 0.901, + 0.899, + 0.8985, + 0.8985, + 0.897, + 0.897, + 0.902, + 0.902, + 0.9025, + 0.899, + 0.9035, + 0.901, + 0.902, + 0.903, + 0.901, + 0.9035, + 0.902, + 0.901, + 0.901, + 0.901, + 0.9005, + 0.902, + 0.902, + 0.902, + 0.902 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8318638801574707, + 0.8205357789993286, + 0.8115277886390686, + 0.8032979965209961, + 0.7886118292808533, + 0.7801527976989746, + 0.7755030393600464, + 0.769822359085083, + 0.7656118869781494, + 0.7624454498291016, + 0.7592873573303223, + 0.7567087411880493 + ], + "perturbation_rho": [ + 0.9999992251396179, + 0.9999969005584717, + 0.9999886155128479, + 0.9999699592590332, + 0.9999390244483948, + 0.9998932480812073, + 0.9998554587364197, + 0.9998190999031067, + 0.9997619986534119, + 0.9997045397758484, + 0.9997037649154663, + 0.9996514916419983 + ], + "nudging": { + "0.001": [ + -0.02965891733765602, + -0.014755135402083397, + -0.007768464274704456, + -0.004644382745027542, + -0.0031942492350935936, + -0.0024470873177051544, + -0.002016209065914154, + -0.0017410764703527093, + -0.001558023039251566, + -0.0014324376825243235, + -0.001343877287581563, + -0.0012825119774788618 + ], + "0.003": [ + -0.0804542750120163, + -0.042193710803985596, + -0.022742247208952904, + -0.013738743960857391, + -0.00949312373995781, + -0.007289452478289604, + -0.006013792939484119, + -0.005197531543672085, + -0.004653473384678364, + -0.004280170891433954, + -0.004016467835754156, + -0.0038337684236466885 + ], + "0.01": [ + -0.19001588225364685, + -0.1191760003566742, + -0.0696173831820488, + -0.04359997808933258, + -0.030619269236922264, + -0.023702502250671387, + -0.019644131883978844, + -0.01702706888318062, + -0.015273808501660824, + -0.014067228883504868, + -0.01321301981806755, + -0.012620084919035435 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.1161888708114622, + 1.0705381093978883, + 0.7379587242126465, + 0.6230424444198608, + 0.5587224875450134, + 0.5511080667495728, + 0.5147961149215698, + 0.5059333966255188, + 0.5395212747573852, + 0.5567793758392334, + 0.6206620505332947, + 0.5265415138721466, + 0.5160172220230103, + 0.5400834962844848, + 0.5545318482398987, + 0.5883845041275024, + 0.6101506164550782, + 0.5516913089752197, + 0.6737783394813538, + 0.6081213068962097, + 0.811542774772644, + 0.6109004033088684, + 0.5861687495231629, + 0.6011404423713684, + 0.6571122856140137, + 0.6412208379745483, + 0.9013783811628818, + 0.5354073376655578, + 0.5708883996009827, + 0.6849057559967041, + 1.001942999124527, + 0.60237093501091, + 0.6511475246667862, + 0.6211171346664429, + 0.602404217338562, + 0.546023369216919, + 0.6272468940734863, + 0.6112368375778198, + 0.5450925559997558, + 0.7834748405456543, + 0.6081129229784011, + 0.5642386393815279, + 0.56300906457901, + 0.505311530637741, + 0.5361756405830383, + 0.4359512243270874, + 0.545820366859436, + 0.5309959113121032, + 0.5448329068422317, + 0.4796094952344894, + 0.4383549818992615, + 0.47926157960891724, + 0.46650244359970094, + 0.4291006091594696, + 0.4090529757976532, + 0.3741895474433899, + 0.46069719450473784, + 0.4360212215423584, + 0.43903335857391357, + 0.39378074131011964, + 0.3575065735816956, + 0.38047246384620664, + 0.3535813014984131, + 0.3860295336961746, + 0.35095718326568603, + 0.37885420265197756, + 0.3496265037059784, + 0.34361237716674803, + 0.3341560622692108, + 0.34267382655143735, + 0.3308092978477478, + 0.3239377063751221, + 0.32587551040649415, + 0.32046382219791414, + 0.31662249999046327, + 0.316526219534874, + 0.315068252658844, + 0.31297805325984956, + 0.3121805286288261, + 0.31114738615751264 + ], + "train_acc": [ + 0.2347, + 0.6109, + 0.7271, + 0.7668, + 0.7901, + 0.7911, + 0.8103, + 0.8109, + 0.8039, + 0.8057, + 0.7993, + 0.8217, + 0.8213, + 0.8225, + 0.8165, + 0.8147, + 0.8151, + 0.8288, + 0.8074, + 0.8169, + 0.7825, + 0.8202, + 0.8321, + 0.8321, + 0.8179, + 0.8169, + 0.787, + 0.8383, + 0.8308, + 0.8067, + 0.7794, + 0.8299, + 0.8183, + 0.8227, + 0.8221, + 0.84, + 0.8212, + 0.8258, + 0.8318, + 0.7943, + 0.8294, + 0.8284, + 0.8301, + 0.8396, + 0.8353, + 0.8567, + 0.8271, + 0.8324, + 0.8331, + 0.8414, + 0.8513, + 0.8441, + 0.8437, + 0.8564, + 0.8621, + 0.8661, + 0.8483, + 0.8563, + 0.8535, + 0.8627, + 0.8716, + 0.8674, + 0.873, + 0.867, + 0.8746, + 0.8692, + 0.8759, + 0.8763, + 0.8793, + 0.8761, + 0.8811, + 0.8839, + 0.8847, + 0.886, + 0.8883, + 0.8857, + 0.8871, + 0.8883, + 0.8883, + 0.889 + ], + "test_acc": [ + 0.4935, + 0.664, + 0.7105, + 0.7415, + 0.7515, + 0.749, + 0.738, + 0.7145, + 0.747, + 0.6885, + 0.779, + 0.747, + 0.7215, + 0.774, + 0.7765, + 0.737, + 0.7385, + 0.7485, + 0.7145, + 0.7095, + 0.746, + 0.6925, + 0.7445, + 0.733, + 0.7555, + 0.6975, + 0.744, + 0.758, + 0.7605, + 0.6015, + 0.7335, + 0.744, + 0.7155, + 0.76, + 0.742, + 0.6985, + 0.756, + 0.797, + 0.669, + 0.6595, + 0.7775, + 0.751, + 0.7825, + 0.792, + 0.7875, + 0.7185, + 0.7555, + 0.711, + 0.7865, + 0.7815, + 0.7525, + 0.7505, + 0.756, + 0.8095, + 0.8295, + 0.8095, + 0.7835, + 0.811, + 0.792, + 0.835, + 0.8165, + 0.8195, + 0.824, + 0.8365, + 0.83, + 0.8305, + 0.8355, + 0.8345, + 0.841, + 0.8435, + 0.845, + 0.8445, + 0.8385, + 0.8435, + 0.849, + 0.8425, + 0.852, + 0.846, + 0.8475, + 0.8475 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.007017737254500389, + 0.1750856339931488, + 0.09811605513095856, + 0.09870222210884094, + 0.06923168152570724, + 0.07072796672582626, + 0.1299426257610321, + 0.06372487545013428, + 0.05202930420637131, + 0.07090489566326141, + 0.04892899468541145, + 0.07766443490982056 + ], + "perturbation_rho": [ + -0.05082311853766441, + 0.15127798914909363, + 0.10723739117383957, + 0.1141807958483696, + 0.10590988397598267, + 0.05159565061330795, + 0.11685939878225327, + 0.06997300684452057, + 0.00848393514752388, + 0.09840574860572815, + 0.04575839638710022, + 0.015137266367673874 + ], + "nudging": { + "0.001": [ + -4.85350246890448e-05, + -0.00047083833487704396, + -0.0002036669902736321, + -0.00020484492415562272, + -0.00012755952775478363, + -0.0001312094391323626, + -0.00026341876946389675, + -0.00013891540584154427, + -8.587291813455522e-05, + -0.0001401761983288452, + -0.00010106117406394333, + -0.00013796932762488723 + ], + "0.003": [ + -0.00011904549319297075, + -0.0014130279887467623, + -0.0006089931703172624, + -0.0006149515393190086, + -0.00038236152613535523, + -0.0003897756978403777, + -0.0007856430020183325, + -0.00041487300768494606, + -0.00026209562201984227, + -0.0004224291769787669, + -0.0003004029858857393, + -0.00041531946044415236 + ], + "0.01": [ + -9.43206250667572e-05, + -0.004689650610089302, + -0.0020264536142349243, + -0.0020407852716743946, + -0.0012656663311645389, + -0.0012923413887619972, + -0.0026080894749611616, + -0.0013762509915977716, + -0.0008721412159502506, + -0.0014046088326722383, + -0.0009981195908039808, + -0.0013870256952941418 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7660392265319824, + 1.178251402759552, + 0.9799116178512574, + 0.9648374988555908, + 0.9458347319602967, + 0.9694253993034363, + 1.031941456604004, + 1.086812539100647, + 1.1742973445892333, + 1.19130708694458, + 1.1743286926269532, + 1.1457796726226808, + 1.1943257934570313, + 1.1683498153686522, + 1.1290361179351807, + 1.0556812404632567, + 1.0298576685905456, + 1.0394999574661254, + 1.0867010340690613, + 1.049304892539978, + 1.0673762855529785, + 1.0524308464050294, + 1.0844358332633972, + 1.1172401988983154, + 1.1323510132789611, + 1.1146858919143676, + 1.128648495578766, + 1.0949398155212402, + 1.0749667533874512, + 1.0532681093215943, + 0.9976370090484619, + 0.9771609001159668, + 1.0085774200439452, + 0.9589678119659424, + 1.0052671368122101, + 1.0016240659713744, + 0.9660814436912537, + 0.9806823503494263, + 0.9850459058761597, + 0.9981972049713135, + 0.9740466180801391, + 0.9784111059188842, + 1.0064473885536194, + 1.0063808506011962, + 1.0454398796081543, + 1.068976349067688, + 1.0449666645050049, + 0.9966327934265137, + 0.9869317514419556, + 0.9675295728683472, + 0.9301507671356202, + 0.9641815420150757, + 0.9217775179862976, + 0.9083558129310608, + 0.8999398115158082, + 0.9012471942901611, + 0.876110479068756, + 0.8611874293327332, + 0.8559818737030029, + 0.8613637584686279, + 0.8418010949134827, + 0.8399203823089599, + 0.822348624420166, + 0.8137641032218933, + 0.8099215194702148, + 0.8083343101501465, + 0.79866770362854, + 0.7958657787322998, + 0.7941301454544067, + 0.7885932938575745, + 0.7868301971435547, + 0.7845343255996704, + 0.7839029501914978, + 0.7834184554100037, + 0.7787990325927734, + 0.7778603867530822, + 0.7773278060913086, + 0.7761943964004516, + 0.7756718534469604, + 0.7753890983581543 + ], + "train_acc": [ + 0.3775, + 0.5866, + 0.6582, + 0.6737, + 0.6776, + 0.6691, + 0.6489, + 0.6323, + 0.615, + 0.6048, + 0.6065, + 0.6163, + 0.5998, + 0.6116, + 0.6105, + 0.6255, + 0.6347, + 0.6341, + 0.6203, + 0.6327, + 0.6274, + 0.6273, + 0.6222, + 0.6166, + 0.6221, + 0.6313, + 0.6286, + 0.6398, + 0.6346, + 0.6421, + 0.6539, + 0.6626, + 0.6542, + 0.6694, + 0.662, + 0.6658, + 0.6749, + 0.6665, + 0.6672, + 0.6647, + 0.6694, + 0.6657, + 0.6662, + 0.6634, + 0.6582, + 0.6572, + 0.6615, + 0.6692, + 0.6772, + 0.6794, + 0.6878, + 0.672, + 0.688, + 0.688, + 0.6891, + 0.6883, + 0.6942, + 0.6958, + 0.6969, + 0.6946, + 0.7045, + 0.7034, + 0.7078, + 0.7092, + 0.7115, + 0.7134, + 0.7138, + 0.7166, + 0.7183, + 0.7177, + 0.7171, + 0.7211, + 0.7219, + 0.7237, + 0.7234, + 0.7234, + 0.7229, + 0.7241, + 0.7237, + 0.7238 + ], + "test_acc": [ + 0.521, + 0.603, + 0.6275, + 0.638, + 0.64, + 0.6115, + 0.6005, + 0.5555, + 0.575, + 0.5755, + 0.5515, + 0.5135, + 0.563, + 0.5605, + 0.5765, + 0.5455, + 0.598, + 0.5825, + 0.5805, + 0.5785, + 0.5125, + 0.5985, + 0.57, + 0.5875, + 0.5775, + 0.571, + 0.6055, + 0.6095, + 0.6085, + 0.6005, + 0.6235, + 0.608, + 0.63, + 0.607, + 0.611, + 0.6395, + 0.6215, + 0.6065, + 0.609, + 0.622, + 0.62, + 0.619, + 0.62, + 0.6035, + 0.6035, + 0.614, + 0.611, + 0.615, + 0.6215, + 0.6185, + 0.6415, + 0.641, + 0.6365, + 0.634, + 0.6375, + 0.6385, + 0.638, + 0.638, + 0.6585, + 0.6345, + 0.6515, + 0.6415, + 0.6495, + 0.648, + 0.6535, + 0.649, + 0.6485, + 0.6535, + 0.6605, + 0.652, + 0.6495, + 0.656, + 0.6555, + 0.6525, + 0.6495, + 0.653, + 0.6515, + 0.6525, + 0.653, + 0.653 + ], + "state_pred_error": [ + 0.6562932591438293, + 0.23981053397655486, + 0.1903499266386032, + 0.19460821108818055, + 0.18526573693752288, + 0.17590652742385865, + 0.17703034114837646, + 0.18292365341186523, + 0.17384615654945373, + 0.15362654786109925, + 0.13457916014194488, + 0.10651036943197251, + 0.08625391768217087, + 0.07398555294275284, + 0.06209893840551376, + 0.05550870283842087, + 0.053596517646312715, + 0.04783650130033493, + 0.043200792515277864, + 0.04244589750766754, + 0.03850420281887054, + 0.034261447036266324, + 0.03740785131454468, + 0.05187485041022301, + 0.062013522326946256, + 0.06344651449918746, + 0.06347008838653564, + 0.05844136718511581, + 0.055137157082557675, + 0.0557414687871933, + 0.057311562991142276, + 0.054085967439413074, + 0.051402875846624375, + 0.05376452451944351, + 0.056453118932247165, + 0.058846011412143705, + 0.05783562337160111, + 0.05683179898262024, + 0.04931292141675949, + 0.046385925376415255, + 0.04792898969650269, + 0.04724597421884537, + 0.048053572791814804, + 0.05018840481638909, + 0.0515774268746376, + 0.051133309531211854, + 0.04661017266511917, + 0.040031638622283934, + 0.03488108472824097, + 0.034121088311076166, + 0.033728338706493374, + 0.0345772180557251, + 0.035495428866147996, + 0.0358143527507782, + 0.03543115886449814, + 0.034300058418512344, + 0.03347357029318809, + 0.03296002690792084, + 0.03150505864620209, + 0.031229876655340195, + 0.030605761355161666, + 0.029714866718649865, + 0.029429574620723726, + 0.028748987805843354, + 0.0280685770124197, + 0.027459417676925658, + 0.02690108307301998, + 0.0262698985517025, + 0.025815216612815856, + 0.025245039772987365, + 0.02476883113980293, + 0.024032312482595443, + 0.023628278690576553, + 0.02287783022224903, + 0.022595539873838423, + 0.022138828229904175, + 0.02166169041991234, + 0.021171285590529443, + 0.020910686141252518, + 0.020324308523535728 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7411977648735046, + 0.3599514067173004, + 0.24466437101364136, + 0.18324854969978333, + 0.1438049077987671, + 0.1288401186466217, + 0.12390943616628647, + 0.11832019686698914, + 0.1285572201013565, + 0.12467152625322342, + 0.12941977381706238, + 0.11911536008119583 + ], + "perturbation_rho": [ + 0.637965977191925, + 0.3033628761768341, + 0.22177954018115997, + 0.1946793794631958, + 0.08981841057538986, + 0.07293770462274551, + 0.06646254658699036, + 0.08072252571582794, + 0.1001453697681427, + 0.10873826593160629, + 0.08548736572265625, + 0.06633201241493225 + ], + "nudging": { + "0.001": [ + -0.021028487011790276, + -0.001058874186128378, + -0.0006181992357596755, + -0.0004633825155906379, + -0.00033575957058928907, + -0.00028632720932364464, + -0.0002752277650870383, + -0.00025989426649175584, + -0.0002959924750030041, + -0.0002790615544654429, + -0.0002817974309436977, + -0.00027173495618626475 + ], + "0.003": [ + -0.06181221827864647, + -0.0031739207915961742, + -0.0018536150455474854, + -0.0013895141892135143, + -0.0010071746073663235, + -0.0008582596783526242, + -0.0008251374820247293, + -0.0007799923187121749, + -0.0008870307938195765, + -0.0008369790157303214, + -0.0008445986313745379, + -0.000814296246971935 + ], + "0.01": [ + -0.19135718047618866, + -0.010539980605244637, + -0.006164146587252617, + -0.004623022396117449, + -0.003351652529090643, + -0.002855603815987706, + -0.002745934296399355, + -0.0025949627161026, + -0.002952038776129484, + -0.002784580923616886, + -0.002810355508700013, + -0.0027095736004412174 + ] + }, + "state_pred_error_per_layer": [ + 11398.169921875, + 8994.236328125, + 6843.07958984375, + 5338.4423828125, + 5392.61279296875, + 5254.96435546875, + 5057.08544921875, + 3968.3759765625, + 3609.97021484375, + 3456.01708984375, + 3801.56005859375, + 3800.938232421875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1167624181747438, + 1.0788958876609802, + 0.7283429620742797, + 0.6024269011974335, + 0.5713749401092529, + 0.5598325239181519, + 0.5255904386997223, + 0.4974329795598984, + 0.4899064763069153, + 0.5248763283252716, + 0.5883738929748535, + 0.5222483651161194, + 0.6248608678817749, + 0.6194486492156982, + 0.662178272819519, + 0.640893846309185, + 0.5865561918258667, + 0.885394397687912, + 0.6598452829360962, + 0.8222563210964203, + 0.754990729355812, + 0.8914188419342041, + 1.031625161933899, + 1.0454975284576415, + 1.2010375715255737, + 1.0348915752410888, + 1.165796419429779, + 1.231134867119789, + 1.1155884208679199, + 1.126976979446411, + 1.1689010509490967, + 1.2431681230545044, + 1.1928106174468993, + 1.2096030212402344, + 1.3011646310806275, + 1.4129821705818175, + 1.6691173180580139, + 1.7397695838928222, + 1.5034552973747253, + 1.4103708577156067, + 1.4138535682678222, + 1.426429981994629, + 1.403753551864624, + 1.3699013526916504, + 1.2783019632339478, + 1.4253152322292328, + 1.2403149646759033, + 1.2535520204544068, + 1.2423814392089845, + 1.2836143051147462, + 1.2725918060302734, + 1.459489345550537, + 1.3426179229736328, + 1.2982452480316162, + 1.2198686767578124, + 1.2035927333831786, + 1.189828524017334, + 1.1886818801879884, + 1.186541651058197, + 1.196483794784546, + 1.1956911575317384, + 1.1999056583404542, + 1.1884550790786743, + 1.16442092628479, + 1.1864193830490113, + 1.175171266555786, + 1.164777257537842, + 1.143490619659424, + 1.1616380886077882, + 1.148275350189209, + 1.1453337799072265, + 1.1361551708221436, + 1.1338137168884277, + 1.1356001434326173, + 1.1363445959091187, + 1.1320666946411133, + 1.1263005462646485, + 1.1265122992515564, + 1.1240507564544677, + 1.122698894882202 + ], + "train_acc": [ + 0.2326, + 0.6009, + 0.7284, + 0.782, + 0.7858, + 0.7932, + 0.8017, + 0.8211, + 0.821, + 0.8133, + 0.8013, + 0.8252, + 0.8039, + 0.8028, + 0.8062, + 0.8088, + 0.8267, + 0.7767, + 0.8198, + 0.7967, + 0.8033, + 0.7824, + 0.7618, + 0.7514, + 0.7357, + 0.7568, + 0.7255, + 0.7226, + 0.7436, + 0.7404, + 0.7352, + 0.7124, + 0.7168, + 0.7056, + 0.6906, + 0.6805, + 0.6348, + 0.6271, + 0.6467, + 0.6502, + 0.6414, + 0.6359, + 0.6329, + 0.6335, + 0.6483, + 0.6185, + 0.6446, + 0.6477, + 0.6504, + 0.6359, + 0.6434, + 0.6053, + 0.6247, + 0.6278, + 0.645, + 0.6464, + 0.6447, + 0.6448, + 0.6491, + 0.6438, + 0.6471, + 0.6432, + 0.6445, + 0.6451, + 0.642, + 0.6436, + 0.6457, + 0.6523, + 0.6477, + 0.6485, + 0.6528, + 0.6531, + 0.6558, + 0.6543, + 0.6514, + 0.6525, + 0.6535, + 0.6521, + 0.6561, + 0.6539 + ], + "test_acc": [ + 0.4875, + 0.677, + 0.7215, + 0.7555, + 0.711, + 0.746, + 0.749, + 0.766, + 0.737, + 0.781, + 0.737, + 0.7375, + 0.682, + 0.752, + 0.741, + 0.753, + 0.7145, + 0.7665, + 0.7315, + 0.7535, + 0.735, + 0.693, + 0.6625, + 0.6565, + 0.6395, + 0.6925, + 0.6545, + 0.65, + 0.6975, + 0.6685, + 0.6285, + 0.624, + 0.6125, + 0.5815, + 0.637, + 0.595, + 0.569, + 0.6345, + 0.588, + 0.564, + 0.551, + 0.558, + 0.532, + 0.558, + 0.463, + 0.5915, + 0.592, + 0.605, + 0.5635, + 0.583, + 0.475, + 0.5865, + 0.5545, + 0.573, + 0.574, + 0.5875, + 0.6035, + 0.6145, + 0.5835, + 0.6215, + 0.5825, + 0.596, + 0.5915, + 0.595, + 0.5825, + 0.6105, + 0.6125, + 0.5925, + 0.611, + 0.6085, + 0.6045, + 0.614, + 0.6135, + 0.611, + 0.6095, + 0.6165, + 0.615, + 0.6175, + 0.617, + 0.6165 + ], + "value_loss": [ + 2.917377243423462, + 1.0885846445083618, + 0.8722483618736268, + 0.7590288893699646, + 0.6848006416320801, + 0.7795331933021545, + 0.7230647287368774, + 0.6652144893169403, + 0.6948482487678528, + 0.845168435049057, + 1.012792977142334, + 0.9757756937980652, + 1.377029209136963, + 1.2504926189422607, + 1.5225606134414673, + 1.4383921993494033, + 1.3322697761535645, + 2.4565747309207917, + 1.6300376277923585, + 2.823884797477722, + 2.3786984578609465, + 3.188929486846924, + 3.881624488592148, + 3.887029996871948, + 5.223129042053222, + 3.704177805709839, + 3.865027075386047, + 4.846107821583748, + 4.141783078241348, + 3.970493141937256, + 3.874847568798065, + 4.200226354598999, + 3.745213671684265, + 3.198570384597778, + 3.0785925355911257, + 3.9717932876586914, + 4.700067436790467, + 4.323802533721924, + 4.030013834190369, + 3.1393288494110108, + 2.987711456298828, + 2.7445001739501955, + 3.0291526428222655, + 2.3462921596527098, + 1.9060795955657959, + 2.258526708507538, + 1.7152527221679688, + 1.8757978493452072, + 1.7933397781372071, + 1.972236647605896, + 1.9309973197937012, + 2.1270628622055052, + 2.527687882232666, + 1.409256293106079, + 1.5656167263031007, + 1.207306969833374, + 1.161829356956482, + 1.1612982688903808, + 1.3352970541954041, + 1.0183050258636475, + 1.0635041744232179, + 1.1356115013122559, + 1.030290427494049, + 0.9526879192352294, + 0.9847541847229004, + 0.9769651292800904, + 1.0084786526679992, + 0.847856243610382, + 0.9065985995292664, + 0.8622876857757569, + 0.985212391090393, + 0.8992663670539855, + 0.8764174394369125, + 0.879221212387085, + 0.7656205827713013, + 0.7692451740264893, + 0.7758066005706787, + 0.7651944708824158, + 0.7469569927215576, + 0.7472030250549316 + ], + "term_loss": [ + 1.7071890327453614, + 0.8562626203536987, + 0.7217037587165832, + 0.6241729659080505, + 0.5283200964927673, + 0.6200158938407898, + 0.5797653388977051, + 0.5340959584653378, + 0.570998721408844, + 0.717055173254013, + 0.8720836116790771, + 0.8500968678474426, + 1.2321790990829469, + 1.1084193689346313, + 1.371880656862259, + 1.2907429981589318, + 1.1943902667999267, + 2.2709406319350003, + 1.4680245761871338, + 2.522774781036377, + 2.103910192489624, + 2.813427988433838, + 3.51185936422348, + 3.507211095714569, + 4.675780584716797, + 3.273686423397064, + 3.37993256855011, + 4.347406148648262, + 3.6078256138801574, + 3.477346031188965, + 3.3423506669521332, + 3.635915426635742, + 3.2431184103012085, + 2.731623638153076, + 2.569586363697052, + 3.3848239572525025, + 3.9930092430114748, + 3.6855425521850584, + 3.439471867132187, + 2.6192165103912353, + 2.430570825958252, + 2.2859115070343017, + 2.510902947998047, + 1.8956809158325196, + 1.5424002754211426, + 1.8663454635381698, + 1.3792756309509278, + 1.5096056005597114, + 1.4301966918945312, + 1.6093664487838746, + 1.5647689273834229, + 1.7485398204803466, + 2.0468893560409547, + 1.086868813419342, + 1.2306722325801849, + 0.9031556518554688, + 0.8638837631225585, + 0.8681535690307617, + 1.0182161829471588, + 0.7249538288116455, + 0.7807100736618042, + 0.8440699245452881, + 0.7501027065992355, + 0.6742322627067566, + 0.7051959021568298, + 0.7000651927947998, + 0.7283024723052979, + 0.5799991112709045, + 0.6314232111930848, + 0.5915066772460937, + 0.7066991906166077, + 0.6210276663541794, + 0.6052080447912216, + 0.6054580961704255, + 0.506322053527832, + 0.5056319164276123, + 0.5136490772247314, + 0.5038866362571717, + 0.4870232744216919, + 0.48659993648529054 + ], + "bridge_loss": [ + 0.934133678069734, + 0.04377672711312771, + 0.00621748416274786, + 0.009328789858520032, + 0.03208852110505104, + 0.03361516862809658, + 0.025169576000422238, + 0.016107972599565982, + 0.01099225374609232, + 0.009757265958189964, + 0.012258637046068907, + 0.009598278574645519, + 0.011902521315217018, + 0.01008907663524151, + 0.012962754887342453, + 0.016048321741446853, + 0.014013315912336111, + 0.02511794980466366, + 0.03051947158575058, + 0.14839042081832884, + 0.1288803307890892, + 0.21345752367973328, + 0.18923244893550872, + 0.1900414011478424, + 0.3374566346645355, + 0.2436180516242981, + 0.27291790237426755, + 0.2844627224907279, + 0.33504061785936357, + 0.28894724340438843, + 0.323739523935318, + 0.3439501903533936, + 0.2863821896791458, + 0.24004585890769958, + 0.2657137688159943, + 0.3297406603336334, + 0.4193671970367432, + 0.3435313666343689, + 0.3151414979636669, + 0.2521958198547363, + 0.286889494228363, + 0.18249824771881104, + 0.24513883123397828, + 0.1807411163687706, + 0.10391507806777954, + 0.11641201150417328, + 0.0781691556930542, + 0.11070946050584317, + 0.10752428450584411, + 0.09995526621341705, + 0.10843874815702438, + 0.09153415812253952, + 0.21060027264356612, + 0.05525967319011688, + 0.07939857324361801, + 0.052892149806022644, + 0.04809255766868591, + 0.043376958113908765, + 0.06525523254275321, + 0.041036498141288756, + 0.034595796847343444, + 0.039489244347810745, + 0.03204091534614563, + 0.03184057741165161, + 0.03210646907687187, + 0.03017198827266693, + 0.03566043748408556, + 0.026130416893959046, + 0.030878000298142434, + 0.028091139087080955, + 0.036872993779182434, + 0.037208085697889325, + 0.031016037890315058, + 0.03364388849139214, + 0.01882201724052429, + 0.022678672552108765, + 0.023471874904632567, + 0.022254053789377212, + 0.021548601961135866, + 0.02176231173723936 + ], + "tgrad_loss": [ + 0.2760545256614685, + 0.1885452966928482, + 0.14432712779045104, + 0.12552713549137115, + 0.1243920262336731, + 0.12590213398933411, + 0.11812981011867524, + 0.11501056258678437, + 0.1128572760105133, + 0.1183559935092926, + 0.12845072351694106, + 0.1160805418252945, + 0.1329475926876068, + 0.1319841867685318, + 0.13771721487045288, + 0.13160088445991278, + 0.12386620242595672, + 0.16051614969968797, + 0.1314936074256897, + 0.152719602394104, + 0.14590793343186378, + 0.1620439998626709, + 0.1805326670050621, + 0.18977752606868745, + 0.20989185056686402, + 0.18687333135604858, + 0.21217663090229033, + 0.21423892506957054, + 0.19891686100959777, + 0.20419985570907592, + 0.20875739620923997, + 0.22036073546409607, + 0.2157130225300789, + 0.22690090117454528, + 0.2432923877954483, + 0.2572286765575409, + 0.28769104671478274, + 0.29472856616973875, + 0.27540048587322236, + 0.26791652979850766, + 0.2702511163234711, + 0.2760904380321503, + 0.27311084804534913, + 0.2698701079368591, + 0.2597642467021942, + 0.27576921684741973, + 0.25780792813301084, + 0.25548279466629026, + 0.2556188053131104, + 0.26291491422653196, + 0.2577896447181702, + 0.2869888922214508, + 0.2701982216835022, + 0.2671278247833252, + 0.25554592900276185, + 0.2512591653585434, + 0.2498530375957489, + 0.249767742729187, + 0.25182563605308533, + 0.25231471223831176, + 0.24819831862449646, + 0.25205233681201933, + 0.24814680593013763, + 0.24661508560180664, + 0.24745180859565735, + 0.2467279472351074, + 0.2445157471895218, + 0.24172671518325806, + 0.2442973881959915, + 0.24268987379074097, + 0.24164021210670472, + 0.24103060722351075, + 0.24019335939884187, + 0.24011922693252563, + 0.240476509141922, + 0.24093458075523377, + 0.2386856475353241, + 0.23905378465652466, + 0.23838511614799499, + 0.23884078254699706 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.022855455055832863, + 0.05216163024306297, + 0.06243491545319557, + 0.06105152890086174, + 0.04914259910583496, + 0.0686616599559784, + 0.07184358686208725, + 0.06793813407421112, + 0.07173632830381393, + 0.07284142076969147, + 0.07256414741277695, + 0.07263204455375671 + ], + "perturbation_rho": [ + 0.035705771297216415, + 0.06484436988830566, + 0.15210987627506256, + 0.16708198189735413, + 0.14389753341674805, + 0.17870034277439117, + 0.1870872974395752, + 0.1476944386959076, + 0.15697413682937622, + 0.11093902587890625, + 0.14925891160964966, + 0.1440906673669815 + ], + "nudging": { + "0.001": [ + -0.001078948494978249, + -0.0004032487340737134, + -0.0004934167372994125, + -0.00047345247003249824, + -0.00039035180816426873, + -0.0005267527303658426, + -0.0005424739792943001, + -0.0005249894456937909, + -0.0005533735384233296, + -0.0005575859104283154, + -0.0005652024410665035, + -0.0005723442882299423 + ], + "0.003": [ + -0.0032069606240838766, + -0.0012108207447454333, + -0.0014771935530006886, + -0.001415132312104106, + -0.0011700796894729137, + -0.0015794191276654601, + -0.001628151978366077, + -0.0015758140943944454, + -0.0016569469589740038, + -0.0016708305338397622, + -0.001694234786555171, + -0.0017183286836370826 + ], + "0.01": [ + -0.010396174155175686, + -0.0040237451903522015, + -0.004916047677397728, + -0.004709047265350819, + -0.003890307154506445, + -0.005256335251033306, + -0.00541608827188611, + -0.005244302563369274, + -0.005511538591235876, + -0.005561722908169031, + -0.005636853165924549, + -0.0057196058332920074 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L12_s42.json b/results/synth_ladder_v2_lo/synth_a0.25_L12_s42.json new file mode 100644 index 0000000..c93276f --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L12_s42.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 0.9884123200893402, + 0.5460307235717774, + 0.4540341721534729, + 0.3844916480064392, + 0.3968988080024719, + 0.41963135101795196, + 0.29759747257232666, + 0.36947814264297485, + 0.3806398531913757, + 0.29335604696273804, + 0.2874252618789673, + 0.32758747911453245, + 0.30908223123550416, + 0.2971659957408905, + 0.23906751189231873, + 0.22946795601844788, + 0.2539147944688797, + 0.22845910873413086, + 0.3282787434577942, + 0.2661190662384033, + 0.24266858730316163, + 0.25516548223495483, + 0.23597899619340898, + 0.18901561794281005, + 0.2580148603916168, + 0.19427666611671449, + 0.19329874439239503, + 0.17538535070419312, + 0.17377141309976576, + 0.15650151609182358, + 0.15580351371765136, + 0.18987136631011964, + 0.207766206407547, + 0.14973504890799522, + 0.13435618991851805, + 0.17490362329483033, + 0.17151201934814453, + 0.15580902137756347, + 0.12738764666318894, + 0.12490283071994782, + 0.11846845669746399, + 0.11482198586463928, + 0.11522660837173462, + 0.13794113398194313, + 0.10947950057983398, + 0.1372414189338684, + 0.13609834372997284, + 0.1075260235697031, + 0.09584161682724952, + 0.08979704446792602, + 0.087031523630023, + 0.08224497293233872, + 0.08695690851807594, + 0.08022827257514, + 0.0766805015206337, + 0.07483255062103271, + 0.07608340452313424, + 0.07494754149019718, + 0.06930721849799157, + 0.06876047478914261, + 0.06823876276016236, + 0.07385597123503684, + 0.0662713002204895, + 0.0657794366121292, + 0.062218379247188565, + 0.06041689007431269, + 0.05945101605653763, + 0.06069924997091293, + 0.057991378545761106, + 0.05709035173952579, + 0.05598740013837814, + 0.055655374181270596, + 0.05501515428423882, + 0.05459572645425796, + 0.054142729806900027, + 0.05369558590054512, + 0.053477102118730545, + 0.053296024799346926, + 0.053159212905168535, + 0.05307692391872406 + ], + "train_acc": [ + 0.638, + 0.7898, + 0.8165, + 0.8465, + 0.8471, + 0.8347, + 0.8801, + 0.8604, + 0.8517, + 0.8827, + 0.8844, + 0.8688, + 0.878, + 0.8833, + 0.9033, + 0.9077, + 0.8992, + 0.9063, + 0.8739, + 0.8918, + 0.9022, + 0.9018, + 0.9059, + 0.9272, + 0.9005, + 0.9246, + 0.9247, + 0.9314, + 0.9311, + 0.9392, + 0.9379, + 0.9225, + 0.9168, + 0.9433, + 0.9502, + 0.9324, + 0.9331, + 0.937, + 0.9524, + 0.9527, + 0.9592, + 0.9569, + 0.9568, + 0.9483, + 0.961, + 0.9491, + 0.9465, + 0.9608, + 0.9677, + 0.9703, + 0.9725, + 0.9755, + 0.9724, + 0.9759, + 0.9782, + 0.9797, + 0.978, + 0.9785, + 0.9816, + 0.983, + 0.9827, + 0.9798, + 0.9827, + 0.9821, + 0.9868, + 0.9871, + 0.9884, + 0.9872, + 0.9893, + 0.9901, + 0.9904, + 0.9909, + 0.9918, + 0.9913, + 0.9914, + 0.9923, + 0.992, + 0.9921, + 0.9922, + 0.9922 + ], + "test_acc": [ + 0.771, + 0.8075, + 0.839, + 0.83, + 0.82, + 0.8445, + 0.8565, + 0.846, + 0.8415, + 0.8655, + 0.8635, + 0.8595, + 0.8405, + 0.8475, + 0.8725, + 0.868, + 0.8705, + 0.868, + 0.851, + 0.8605, + 0.8665, + 0.869, + 0.8725, + 0.8705, + 0.874, + 0.884, + 0.882, + 0.8835, + 0.878, + 0.8825, + 0.8835, + 0.8815, + 0.878, + 0.895, + 0.884, + 0.872, + 0.8725, + 0.8835, + 0.886, + 0.8845, + 0.8885, + 0.897, + 0.8805, + 0.887, + 0.891, + 0.8865, + 0.882, + 0.8885, + 0.893, + 0.8925, + 0.891, + 0.8945, + 0.898, + 0.897, + 0.8945, + 0.8965, + 0.894, + 0.896, + 0.897, + 0.902, + 0.897, + 0.8975, + 0.9005, + 0.9, + 0.895, + 0.8975, + 0.899, + 0.898, + 0.8975, + 0.8975, + 0.8965, + 0.8985, + 0.901, + 0.8975, + 0.897, + 0.897, + 0.8975, + 0.8975, + 0.897, + 0.897 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8824102282524109, + 0.865839958190918, + 0.8526839017868042, + 0.839972198009491, + 0.826134204864502, + 0.8190910220146179, + 0.8134430646896362, + 0.8095068335533142, + 0.8061133027076721, + 0.8034266233444214, + 0.8016149997711182, + 0.8001440167427063 + ], + "perturbation_rho": [ + 0.9999990463256836, + 0.9999975562095642, + 0.9999887347221375, + 0.9999736547470093, + 0.9999515414237976, + 0.9999052882194519, + 0.9998592138290405, + 0.999845027923584, + 0.99979567527771, + 0.9997392892837524, + 0.999713659286499, + 0.9996709227561951 + ], + "nudging": { + "0.001": [ + -0.03222742676734924, + -0.016009416431188583, + -0.008412450551986694, + -0.005028060637414455, + -0.003471477422863245, + -0.002676197327673435, + -0.002212640829384327, + -0.0019189234590157866, + -0.0017268857918679714, + -0.0015955264680087566, + -0.0015064922627061605, + -0.0014467197470366955 + ], + "0.003": [ + -0.088250532746315, + -0.04596046730875969, + -0.024666687473654747, + -0.014880567789077759, + -0.010317552834749222, + -0.007971002720296383, + -0.006598907522857189, + -0.005727590061724186, + -0.005157099571079016, + -0.004766468890011311, + -0.004501671064645052, + -0.004323706030845642 + ], + "0.01": [ + -0.21559840440750122, + -0.13125374913215637, + -0.0758625715970993, + -0.04728776216506958, + -0.03328181058168411, + -0.025909576565027237, + -0.021545151248574257, + -0.01875336468219757, + -0.016917269676923752, + -0.015656160190701485, + -0.014799138531088829, + -0.01422282587736845 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.091241591453552, + 1.0522155212402344, + 0.7197729051113129, + 0.5984360224723816, + 0.55927502784729, + 0.5319774662971497, + 0.48646941194534304, + 0.5328002332687378, + 0.5385726051807403, + 0.580863460111618, + 0.49310305881500244, + 0.5983066858291626, + 0.5821534514427185, + 0.5875922044754028, + 0.599033100938797, + 0.5862060243606567, + 0.7749097516059875, + 0.6087754693984986, + 0.7364706658363342, + 0.7253197401046753, + 0.933016799545288, + 0.8019046752929687, + 0.6908189784288407, + 0.5993604675292968, + 0.7429474418640136, + 0.7197145952224732, + 0.7374668367385864, + 0.676032237815857, + 0.7813192527770996, + 0.6604006807804108, + 0.8066447370529175, + 0.7775278373718262, + 0.8043575154304504, + 0.6516128785610199, + 0.6490189645051956, + 0.6631092401742935, + 0.6493145933866501, + 0.6440104596614837, + 0.6592015397071839, + 0.6828624240875244, + 0.8400594820022583, + 0.6588001432418823, + 0.7000653821468353, + 0.764811098241806, + 0.7084193643569946, + 0.6780031036376953, + 0.6745406296730041, + 0.6227908559322357, + 0.6173504204750061, + 0.6519232685089111, + 0.681457055580616, + 0.5612579683303833, + 0.7425640492200851, + 0.6078716424942017, + 0.5751205417633056, + 0.5557551406860352, + 0.5769869324684143, + 0.5574739450454712, + 0.5620601721048355, + 0.5108847286462784, + 0.5051990665435792, + 0.5577566593170166, + 0.5067275173187256, + 0.5076467472076416, + 0.500104681968689, + 0.4845377607345581, + 0.48600583753585813, + 0.48937382678985597, + 0.47086129837036134, + 0.4627019955635071, + 0.4640789652824402, + 0.4643590691566467, + 0.46600833835601807, + 0.4590310299873352, + 0.4536386815071106, + 0.4487397773385048, + 0.4473173204421997, + 0.44602737324237823, + 0.4437102550506592, + 0.44304467763900757 + ], + "train_acc": [ + 0.2446, + 0.6126, + 0.7299, + 0.7774, + 0.7913, + 0.8001, + 0.8152, + 0.8027, + 0.8023, + 0.7957, + 0.8231, + 0.8073, + 0.815, + 0.8163, + 0.8138, + 0.8282, + 0.7956, + 0.8249, + 0.8081, + 0.8089, + 0.7907, + 0.8088, + 0.8266, + 0.8447, + 0.8231, + 0.8263, + 0.828, + 0.8404, + 0.822, + 0.8396, + 0.8204, + 0.8226, + 0.8249, + 0.8469, + 0.842, + 0.8455, + 0.8456, + 0.8484, + 0.8434, + 0.8372, + 0.8221, + 0.8455, + 0.8401, + 0.8275, + 0.8357, + 0.8437, + 0.8472, + 0.8518, + 0.8517, + 0.8478, + 0.8481, + 0.864, + 0.8388, + 0.853, + 0.8583, + 0.8625, + 0.855, + 0.86, + 0.8625, + 0.8716, + 0.8695, + 0.861, + 0.8703, + 0.8702, + 0.8724, + 0.8745, + 0.875, + 0.8768, + 0.8766, + 0.8758, + 0.878, + 0.8759, + 0.8773, + 0.88, + 0.88, + 0.8819, + 0.8813, + 0.8822, + 0.8826, + 0.8829 + ], + "test_acc": [ + 0.48, + 0.6615, + 0.707, + 0.7425, + 0.715, + 0.7465, + 0.753, + 0.7765, + 0.69, + 0.721, + 0.719, + 0.7375, + 0.738, + 0.76, + 0.731, + 0.703, + 0.717, + 0.7535, + 0.716, + 0.68, + 0.6755, + 0.7735, + 0.781, + 0.708, + 0.7465, + 0.7725, + 0.7485, + 0.75, + 0.7325, + 0.7805, + 0.712, + 0.741, + 0.7685, + 0.7415, + 0.7955, + 0.777, + 0.762, + 0.76, + 0.783, + 0.691, + 0.774, + 0.7895, + 0.73, + 0.776, + 0.7745, + 0.771, + 0.7805, + 0.7785, + 0.765, + 0.781, + 0.774, + 0.7755, + 0.781, + 0.7965, + 0.8025, + 0.804, + 0.79, + 0.7915, + 0.8055, + 0.804, + 0.8095, + 0.805, + 0.8075, + 0.812, + 0.8065, + 0.806, + 0.806, + 0.817, + 0.8115, + 0.815, + 0.81, + 0.812, + 0.811, + 0.8145, + 0.8115, + 0.812, + 0.8155, + 0.8165, + 0.8165, + 0.8165 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.02035588026046753, + 0.09721152484416962, + 0.10017214715480804, + 0.06879279017448425, + 0.0898706465959549, + 0.0775061622262001, + 0.0738426148891449, + 0.022470442578196526, + 0.03698011115193367, + 0.09759337455034256, + 0.05344103276729584, + 0.06489317119121552 + ], + "perturbation_rho": [ + -0.041805852204561234, + 0.14336195588111877, + 0.21263040602207184, + 0.15326815843582153, + 0.04533267021179199, + 0.07981619238853455, + 0.08665720373392105, + 0.004602088592946529, + 0.0780038833618164, + 0.11769488453865051, + 0.1415681391954422, + 0.12027023732662201 + ], + "nudging": { + "0.001": [ + -0.0009545196662656963, + -0.0008363645756617188, + -0.0003885737678501755, + -0.00026890120352618396, + -0.0002675559953786433, + -0.00033352605532854795, + -0.0002601599844638258, + -0.00011189336510142311, + -0.0001840656332205981, + -0.0003697811043821275, + -0.0001971298042917624, + -0.00022067477402742952 + ], + "0.003": [ + -0.0027363700792193413, + -0.0025048283860087395, + -0.0011647494975477457, + -0.000811159610748291, + -0.0008012806065380573, + -0.0010005887597799301, + -0.0007811359828338027, + -0.00033516576513648033, + -0.0005535727832466364, + -0.0011049836175516248, + -0.0005915613146498799, + -0.0006592696299776435 + ], + "0.01": [ + -0.007749770302325487, + -0.008321389555931091, + -0.003876405069604516, + -0.0026999912224709988, + -0.0026630363427102566, + -0.0033310302533209324, + -0.0026011697482317686, + -0.0011158722918480635, + -0.0018408913165330887, + -0.0036767907440662384, + -0.0019704087171703577, + -0.0021951368544250727 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.843170643234253, + 1.193545725440979, + 0.9349142212867737, + 0.9590050317764283, + 0.9601007102966309, + 1.0591806930541992, + 1.0750218585968017, + 1.0594622192382812, + 1.0260618852615357, + 1.0633037223815918, + 1.1873747802734376, + 1.1900213710784913, + 1.1711347143173219, + 1.110907957649231, + 1.141725605583191, + 1.1908537561416626, + 1.1576408653259278, + 1.2335913299560546, + 1.1927038297653199, + 1.1675678352355956, + 1.1620887538909912, + 1.238514815044403, + 1.1467733171463013, + 1.1628135605812073, + 1.1169413381576538, + 1.1289218362808227, + 1.1431014865875244, + 1.0724326686859131, + 1.020245622253418, + 0.9871452375411988, + 1.013824908065796, + 1.057583949661255, + 1.0269935136795043, + 1.0403342270851135, + 1.0003446009635926, + 1.023628770160675, + 0.9621780359268188, + 0.9958351311683655, + 0.9854215185165405, + 0.94918332862854, + 0.9539219416618347, + 0.9634699941635132, + 0.9163962741851807, + 0.89243365650177, + 0.8894084901809692, + 0.9069821780204773, + 0.9070278909683227, + 0.9259662859916687, + 0.9052657639503479, + 0.8919173622131348, + 0.8811036640167237, + 0.877770324420929, + 0.8617347580909729, + 0.8443253430366516, + 0.8402864801406861, + 0.8299113247871399, + 0.8174763144493103, + 0.8079615959167481, + 0.796233709526062, + 0.7943985921859741, + 0.7881768466949463, + 0.7766195007324219, + 0.7731075840473175, + 0.767168036365509, + 0.7628648261070251, + 0.764765630197525, + 0.758231233215332, + 0.7616345821380616, + 0.7603204396247863, + 0.7553847047805786, + 0.7550768209457397, + 0.7540734338760376, + 0.7542704034805298, + 0.7539316363334656, + 0.7512542444229126, + 0.751466016960144, + 0.7500110761642456, + 0.7499307077407837, + 0.7494694025039673, + 0.7491868644714356 + ], + "train_acc": [ + 0.3634, + 0.584, + 0.6681, + 0.6817, + 0.6731, + 0.6436, + 0.6318, + 0.6412, + 0.6483, + 0.6338, + 0.6131, + 0.6092, + 0.6072, + 0.6194, + 0.6114, + 0.6033, + 0.6136, + 0.5971, + 0.6066, + 0.6075, + 0.6054, + 0.5811, + 0.6084, + 0.6094, + 0.6267, + 0.6203, + 0.6182, + 0.6388, + 0.6563, + 0.6621, + 0.656, + 0.6457, + 0.6542, + 0.6535, + 0.6622, + 0.6504, + 0.665, + 0.653, + 0.6581, + 0.6737, + 0.6644, + 0.6634, + 0.6761, + 0.6825, + 0.6815, + 0.6846, + 0.6805, + 0.6738, + 0.6866, + 0.6853, + 0.6905, + 0.6901, + 0.696, + 0.6979, + 0.7064, + 0.7099, + 0.7107, + 0.7138, + 0.7154, + 0.7173, + 0.7194, + 0.7222, + 0.7244, + 0.7262, + 0.7263, + 0.725, + 0.7318, + 0.732, + 0.7284, + 0.7291, + 0.7306, + 0.7327, + 0.7306, + 0.7294, + 0.7325, + 0.7319, + 0.7341, + 0.7327, + 0.7337, + 0.7334 + ], + "test_acc": [ + 0.4985, + 0.6215, + 0.6765, + 0.644, + 0.6285, + 0.602, + 0.593, + 0.6145, + 0.604, + 0.571, + 0.5675, + 0.55, + 0.58, + 0.5485, + 0.5415, + 0.5615, + 0.5325, + 0.498, + 0.495, + 0.5825, + 0.5105, + 0.547, + 0.575, + 0.5695, + 0.5825, + 0.5755, + 0.5925, + 0.605, + 0.626, + 0.624, + 0.6195, + 0.625, + 0.619, + 0.619, + 0.6005, + 0.631, + 0.6155, + 0.6075, + 0.616, + 0.637, + 0.5925, + 0.628, + 0.627, + 0.6325, + 0.6275, + 0.64, + 0.6285, + 0.6405, + 0.638, + 0.6405, + 0.6565, + 0.6465, + 0.659, + 0.666, + 0.6645, + 0.6575, + 0.682, + 0.669, + 0.674, + 0.6885, + 0.6815, + 0.679, + 0.6755, + 0.682, + 0.6795, + 0.686, + 0.682, + 0.68, + 0.6845, + 0.688, + 0.6865, + 0.686, + 0.687, + 0.687, + 0.687, + 0.686, + 0.688, + 0.6865, + 0.6865, + 0.687 + ], + "state_pred_error": [ + 0.6467912001609802, + 0.2545396152973175, + 0.20769398341178893, + 0.20405273129940033, + 0.18864516608715057, + 0.1722513226032257, + 0.1580212815761566, + 0.1571042188167572, + 0.1673955574989319, + 0.1630590828895569, + 0.14197517161369325, + 0.13434906735420227, + 0.14216270933151245, + 0.13005418779850006, + 0.12095460612773895, + 0.11327731199264526, + 0.0938235213279724, + 0.07791765773296357, + 0.07149236190319061, + 0.07858237608671188, + 0.0889093372106552, + 0.0929118694782257, + 0.0870423443198204, + 0.09221649793386459, + 0.10558602612018585, + 0.11078759597539901, + 0.09640501194000244, + 0.08363894666433334, + 0.07552479531764984, + 0.06893316633701324, + 0.07225388768911362, + 0.07809946043491363, + 0.07972891807556153, + 0.07829325978159904, + 0.07489659252166748, + 0.06952577213048936, + 0.06463980766534805, + 0.06346644792556763, + 0.06054295033812523, + 0.057002867662906645, + 0.04881957597732544, + 0.0461565929889679, + 0.045704828941822054, + 0.04578752514719963, + 0.044416132467985155, + 0.04437544884681702, + 0.04501764898300171, + 0.044673075044155124, + 0.04345381007194519, + 0.04358632897734642, + 0.04145509601831436, + 0.0403918799161911, + 0.039635618847608564, + 0.03812404837608337, + 0.036712032747268676, + 0.03498043670654297, + 0.03441862116456032, + 0.03294241904020309, + 0.03208653058409691, + 0.03133675431907177, + 0.030832906076312065, + 0.03027755205631256, + 0.02992823379933834, + 0.029483068200945855, + 0.0286442294716835, + 0.02817883363366127, + 0.027806038296222687, + 0.027423375517129898, + 0.027105927157402038, + 0.026499537679553032, + 0.025793941861391067, + 0.025682287681102752, + 0.025424988290667534, + 0.02452395534515381, + 0.024412634512782097, + 0.023537403476238252, + 0.023103883719444274, + 0.023237476989626884, + 0.022374696707725523, + 0.02213728377223015 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7618155479431152, + 0.3189862072467804, + 0.20356883108615875, + 0.1471748650074005, + 0.14541830122470856, + 0.13144558668136597, + 0.11054451763629913, + 0.12045299261808395, + 0.11467338353395462, + 0.1017053946852684, + 0.10614258050918579, + 0.10096963495016098 + ], + "perturbation_rho": [ + 0.6406711339950562, + 0.31470298767089844, + 0.1861359179019928, + 0.17725443840026855, + 0.11286133527755737, + 0.1387007087469101, + 0.07976903766393661, + 0.11419158428907394, + 0.13525697588920593, + 0.13865813612937927, + 0.10792528837919235, + 0.1288726031780243 + ], + "nudging": { + "0.001": [ + -0.02620597556233406, + -0.0011723835486918688, + -0.0006386470049619675, + -0.0004590698517858982, + -0.0004368656955193728, + -0.00040132386493496597, + -0.00033375341445207596, + -0.0003613364533521235, + -0.00034441970637999475, + -0.0003074322594329715, + -0.0003160890773870051, + -0.0002936453965958208 + ], + "0.003": [ + -0.07732252031564713, + -0.003513920586556196, + -0.0019150176085531712, + -0.0013760130386799574, + -0.0013105350080877542, + -0.0012034340761601925, + -0.0010010767728090286, + -0.0010843132622539997, + -0.0010324888862669468, + -0.0009225246030837297, + -0.0009475111728534102, + -0.000881188316270709 + ], + "0.01": [ + -0.24276113510131836, + -0.011681582778692245, + -0.006372842937707901, + -0.004580066539347172, + -0.004361784551292658, + -0.004005158320069313, + -0.0033329487778246403, + -0.003609130624681711, + -0.003437052248045802, + -0.003070915350690484, + -0.0031537071336060762, + -0.0029334095306694508 + ] + }, + "state_pred_error_per_layer": [ + 13069.6103515625, + 12902.267578125, + 5325.7177734375, + 4598.6796875, + 4871.38818359375, + 4525.17333984375, + 4230.712890625, + 4117.212890625, + 3694.05078125, + 3737.547607421875, + 3966.26025390625, + 4157.70654296875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1033826606750488, + 1.0748736568450927, + 0.7240967851638794, + 0.5924014734268188, + 0.561312539768219, + 0.5548838109970092, + 0.5445125359535218, + 0.5231592364311218, + 0.5370318948268891, + 0.5203416132450104, + 0.5313664150238037, + 0.5501730252742767, + 0.5255774791955948, + 0.6364645127296448, + 0.7171019055366517, + 0.5824658064305782, + 0.5903935560703277, + 0.6552688138961792, + 0.7979116170406342, + 0.8206407766342163, + 0.8171166659355164, + 0.9182533592224121, + 0.9087733953475953, + 0.9816526121139526, + 1.0274024284362793, + 0.9425600393295288, + 1.0292234921455383, + 1.0032360237121583, + 1.0786525871276855, + 0.9839243467330933, + 1.1140670619487762, + 1.24523821849823, + 1.6123345489501952, + 1.5466830284118653, + 1.4625207302093506, + 1.4497597217559814, + 1.2631195013046264, + 1.285225419998169, + 1.1248238891601563, + 1.3207208611488341, + 1.1724660835266114, + 1.1170583526611328, + 1.1232026329994202, + 1.1826211513519287, + 1.1198238399505616, + 1.2758455450057984, + 1.3378776414871216, + 1.3473635297775268, + 1.3659595549583434, + 1.3431388856887818, + 1.2782950267791748, + 1.2850243312835694, + 1.252669066619873, + 1.339367476272583, + 1.242458748817444, + 1.230945915222168, + 1.2400875186920166, + 1.2213593549728394, + 1.2046165678024292, + 1.2265458261489868, + 1.1864308532714845, + 1.1639758094787598, + 1.1673540477752686, + 1.1801281490325928, + 1.1353608043670653, + 1.1621911179542541, + 1.1203375988006592, + 1.1035721940040588, + 1.103725563430786, + 1.0981345941543579, + 1.0916361534118653, + 1.0767202972412109, + 1.077680862236023, + 1.0722866813659668, + 1.0760423473358154, + 1.070871086883545, + 1.069193116569519, + 1.0655735412597656, + 1.0649883579254151, + 1.064067266368866 + ], + "train_acc": [ + 0.2354, + 0.6085, + 0.7242, + 0.775, + 0.7907, + 0.7907, + 0.7949, + 0.8044, + 0.8041, + 0.8146, + 0.8192, + 0.819, + 0.8235, + 0.8034, + 0.7958, + 0.8229, + 0.8218, + 0.8163, + 0.8019, + 0.7992, + 0.8047, + 0.7917, + 0.7848, + 0.7655, + 0.7523, + 0.7595, + 0.7344, + 0.7334, + 0.7218, + 0.7249, + 0.6916, + 0.6803, + 0.6402, + 0.6413, + 0.6429, + 0.63, + 0.6482, + 0.6414, + 0.6647, + 0.6255, + 0.6497, + 0.6516, + 0.6494, + 0.6409, + 0.653, + 0.623, + 0.6096, + 0.6181, + 0.6077, + 0.6099, + 0.6135, + 0.6072, + 0.6083, + 0.5871, + 0.6069, + 0.608, + 0.6128, + 0.6105, + 0.6132, + 0.6069, + 0.6163, + 0.6195, + 0.6177, + 0.6132, + 0.6257, + 0.6214, + 0.6258, + 0.6301, + 0.6275, + 0.6326, + 0.6342, + 0.6369, + 0.6366, + 0.6378, + 0.6381, + 0.6404, + 0.6361, + 0.6387, + 0.6408, + 0.6389 + ], + "test_acc": [ + 0.4725, + 0.6485, + 0.709, + 0.696, + 0.7445, + 0.725, + 0.7285, + 0.7285, + 0.7285, + 0.7705, + 0.7485, + 0.759, + 0.7485, + 0.7405, + 0.7365, + 0.732, + 0.7405, + 0.718, + 0.739, + 0.739, + 0.718, + 0.7465, + 0.7445, + 0.7155, + 0.668, + 0.7365, + 0.6875, + 0.644, + 0.6715, + 0.573, + 0.628, + 0.5135, + 0.567, + 0.4905, + 0.576, + 0.522, + 0.544, + 0.568, + 0.537, + 0.5915, + 0.61, + 0.5865, + 0.5695, + 0.606, + 0.557, + 0.5285, + 0.5355, + 0.589, + 0.569, + 0.5705, + 0.559, + 0.543, + 0.526, + 0.5555, + 0.5485, + 0.577, + 0.567, + 0.5515, + 0.562, + 0.5815, + 0.5775, + 0.5885, + 0.5955, + 0.6, + 0.5825, + 0.59, + 0.6035, + 0.6035, + 0.606, + 0.6095, + 0.6165, + 0.613, + 0.615, + 0.6165, + 0.617, + 0.613, + 0.617, + 0.613, + 0.6145, + 0.6145 + ], + "value_loss": [ + 2.8795433490753175, + 1.138833139228821, + 0.8944398401260376, + 0.753239490032196, + 0.7442562434196472, + 0.7400344492912293, + 0.7306710628509522, + 0.7415657516479492, + 0.82294074883461, + 0.8365529833316803, + 0.8819458911895752, + 1.0201535857915878, + 0.9605329707860947, + 1.4210680746555329, + 1.7769229404449463, + 1.238111216878891, + 1.2918084540724755, + 1.5650643337249757, + 2.441974627304077, + 2.8493117763519287, + 3.0508531768798828, + 3.376968189239502, + 3.1227704570770265, + 3.2954182872772217, + 3.1305700786590576, + 2.5652926385879518, + 2.916162197494507, + 2.787790596961975, + 2.9674931542396545, + 2.2431891622543336, + 2.357407363319397, + 2.9580355476379396, + 4.707226892852783, + 4.06712333908081, + 3.4517571243286134, + 3.739633938217163, + 2.3796893051147463, + 2.312957144165039, + 1.6016325395584106, + 1.888862350463867, + 1.6106449718475342, + 1.6451952739715576, + 1.278008158302307, + 1.402012867116928, + 1.120068933391571, + 1.792665054321289, + 1.7022325145721435, + 1.8678716411590577, + 1.6293914850234985, + 1.4686889837265014, + 1.2121935440063476, + 1.2230595738887786, + 1.0494541343688966, + 1.3173374273300171, + 0.995644793176651, + 0.988969333744049, + 0.9092360616207122, + 0.931911379814148, + 0.9861841753005981, + 0.8858683162212372, + 0.9150554649353028, + 0.7729743946075439, + 0.8225113790512085, + 0.7946224576473236, + 0.7470991016387939, + 0.7245953347682953, + 0.6737630318641663, + 0.6625622462272645, + 0.6309533950805664, + 0.683922253704071, + 0.6013473030090332, + 0.640416144156456, + 0.5948970086336136, + 0.5904984499931335, + 0.7156881134033203, + 0.5747135852813721, + 0.5855776166915894, + 0.5862875978469848, + 0.5623929689884186, + 0.5342490439891815 + ], + "term_loss": [ + 1.6790412804603576, + 0.8982505217552185, + 0.7413894156932831, + 0.6220758651733398, + 0.6074585275650024, + 0.5809205256462097, + 0.5737000848770142, + 0.5971134037017822, + 0.6812812467336654, + 0.701437530875206, + 0.7465327880859375, + 0.8768298113107681, + 0.8273132968902588, + 1.2669593958616256, + 1.61081964635849, + 1.0948760835170745, + 1.1464744834303855, + 1.402798189163208, + 2.2375652463912963, + 2.523746669578552, + 2.6504026668548586, + 2.9341827514648435, + 2.691425150680542, + 2.7866681671142577, + 2.652672901535034, + 2.2063637409210206, + 2.547779343557358, + 2.468216030406952, + 2.5574094997406007, + 1.8789901941299438, + 1.9658982633590698, + 2.52254821395874, + 4.053012676239014, + 3.474026759338379, + 2.8665278963088987, + 2.968799212646484, + 1.9112021133422852, + 1.8258201915740966, + 1.2143830659866333, + 1.4988377429962159, + 1.2614112941741944, + 1.2955748889923095, + 0.9486180826187134, + 1.0766471548080445, + 0.818901381111145, + 1.425261696243286, + 1.3437454446792603, + 1.4943192962646485, + 1.275571553325653, + 1.1279070884227753, + 0.8779431870937348, + 0.8859598497360944, + 0.7277735261440277, + 0.9731939913749695, + 0.6878395918846131, + 0.680720578956604, + 0.6131223832130432, + 0.6315723412513733, + 0.6783120639801026, + 0.5902733963012695, + 0.6128241561889648, + 0.48777494831085205, + 0.5294700266361236, + 0.5069688389539718, + 0.46669540004730226, + 0.4496366826176643, + 0.40343587884902954, + 0.3926115131378174, + 0.3630800880432129, + 0.4072012848377228, + 0.3359340609073639, + 0.3683177730798721, + 0.3314026749163866, + 0.32736128149032595, + 0.4275485870361328, + 0.31639244627952573, + 0.31941745207309724, + 0.31965322036743166, + 0.3014388550043106, + 0.2775654150247574 + ], + "bridge_loss": [ + 0.9205643273350259, + 0.049716909077763556, + 0.006901342153549195, + 0.004086462584137917, + 0.011321419489383698, + 0.03111027323231101, + 0.028954532250761986, + 0.0201554466471076, + 0.014559349776804446, + 0.012043245652318001, + 0.009253665941953659, + 0.015398956954479218, + 0.010174707736074925, + 0.013219280099868775, + 0.014298373484611512, + 0.01533438156247139, + 0.017070907866954803, + 0.026255203837156297, + 0.05299281061887741, + 0.17080406608581544, + 0.24779340076446532, + 0.2782947730541229, + 0.2630520602226257, + 0.3237492141723633, + 0.2868452004909515, + 0.17925718649625777, + 0.17205788164138794, + 0.12203870689868927, + 0.1952126978158951, + 0.15671373710632325, + 0.16713737347126006, + 0.19014450411796568, + 0.36893905363082885, + 0.31131081352233886, + 0.31187417430877684, + 0.49280351762771607, + 0.21481027870178224, + 0.2258558230161667, + 0.14994133372306823, + 0.130926451587677, + 0.10678757133483886, + 0.11099275469779968, + 0.09215516982972621, + 0.07868353074193, + 0.059325709569454196, + 0.1034778290361166, + 0.08524036257266998, + 0.0978135336279869, + 0.07102513880133629, + 0.06375027797222138, + 0.06410591588020324, + 0.06628356148302555, + 0.05309232649803162, + 0.0602637135386467, + 0.041760663875937465, + 0.04346258090734482, + 0.0322291255697608, + 0.036784381067752836, + 0.047651028633117674, + 0.03259250336289406, + 0.044905204331874844, + 0.03081065520644188, + 0.03847316392660141, + 0.02912857881039381, + 0.031706764674186705, + 0.023801118858903646, + 0.023423786050081254, + 0.02463961470723152, + 0.022945232474803925, + 0.031977996022999285, + 0.02354992071390152, + 0.031676595094799996, + 0.022221289660036565, + 0.023916197538375854, + 0.04762986923456192, + 0.01927408311367035, + 0.02702880091071129, + 0.0285713312625885, + 0.022266658338904382, + 0.01819542294666171 + ], + "tgrad_loss": [ + 0.27993770937919615, + 0.19086571320295334, + 0.1461490781903267, + 0.12707716104984285, + 0.12547629919052125, + 0.1280036602139473, + 0.12801644196510314, + 0.1242969009399414, + 0.12710014595985414, + 0.12307221227884292, + 0.1261594377040863, + 0.12792480454444885, + 0.1230449640750885, + 0.14088939685821533, + 0.15180491466522217, + 0.12790074618458747, + 0.1282630600363016, + 0.13601094789505006, + 0.15141655212640762, + 0.15476103026866914, + 0.15265711691379547, + 0.16449068531990052, + 0.16829325798749925, + 0.1850009373664856, + 0.19105196151733397, + 0.1796716957807541, + 0.19632497339248658, + 0.1975358585357666, + 0.2148709450483322, + 0.20748521902561187, + 0.22437173571586608, + 0.24534283994436265, + 0.2852751801490784, + 0.2817857069015503, + 0.2733550168991089, + 0.27803118324279785, + 0.2536769271850586, + 0.261281143283844, + 0.23730815300941469, + 0.259098140335083, + 0.24244610705375672, + 0.23862764320373536, + 0.23723490653038026, + 0.24668219068050384, + 0.24184185400009156, + 0.2639255453109741, + 0.27324670872688295, + 0.27573881940841677, + 0.28279479751586917, + 0.2770316267490387, + 0.2701444469451904, + 0.27081617115736006, + 0.268588280916214, + 0.28387971448898314, + 0.2660445416927338, + 0.2647861789703369, + 0.2638845456361771, + 0.26355465149879453, + 0.260221079993248, + 0.26300240964889526, + 0.25732610797882083, + 0.2543887885093689, + 0.25456818895339967, + 0.25852504687309263, + 0.24869694046974183, + 0.2511575377345085, + 0.24690336623191833, + 0.24531111750602722, + 0.24492807807922362, + 0.24474297270774842, + 0.24186331791877747, + 0.2404217655658722, + 0.24127304337024688, + 0.23922096462249756, + 0.24050965766906737, + 0.23904705972671508, + 0.23913136382102967, + 0.2380630495071411, + 0.2386874575138092, + 0.2384882021665573 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.00034100248012691736, + 0.04912012815475464, + 0.07342620939016342, + 0.08266763389110565, + 0.08488726615905762, + 0.08897420018911362, + 0.09187051653862, + 0.09561659395694733, + 0.09157264232635498, + 0.0947732925415039, + 0.09517554938793182, + 0.10104557126760483 + ], + "perturbation_rho": [ + 0.03049650974571705, + 0.10809889435768127, + 0.08979646861553192, + 0.17959633469581604, + 0.1275440901517868, + 0.17255432903766632, + 0.16415373980998993, + 0.11534757167100906, + 0.17073199152946472, + 0.15983673930168152, + 0.15877583622932434, + 0.18294689059257507 + ], + "nudging": { + "0.001": [ + -0.000400771910790354, + -0.0004662078863475472, + -0.0005619406583718956, + -0.0006374302320182323, + -0.0006211107829585671, + -0.0006620356580242515, + -0.0006802619900554419, + -0.000695920898579061, + -0.000679123040754348, + -0.0006845796597190201, + -0.0006896791164763272, + -0.0007078879280015826 + ], + "0.003": [ + -0.0011788331903517246, + -0.0013967687264084816, + -0.00168684555683285, + -0.0019111934816464782, + -0.001862682867795229, + -0.001987476134672761, + -0.002041077706962824, + -0.0020898221991956234, + -0.0020393673330545425, + -0.0020541974809020758, + -0.0020654238760471344, + -0.002122731413692236 + ], + "0.01": [ + -0.003660556860268116, + -0.004647519439458847, + -0.005617665126919746, + -0.006360755302011967, + -0.006202561780810356, + -0.006613034754991531, + -0.006794797722250223, + -0.006956290453672409, + -0.006790010258555412, + -0.006838815752416849, + -0.006875438615679741, + -0.007062861695885658 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L12_s456.json b/results/synth_ladder_v2_lo/synth_a0.25_L12_s456.json new file mode 100644 index 0000000..2d51c87 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L12_s456.json @@ -0,0 +1,1722 @@ +{ + "bp": { + "log": { + "train_loss": [ + 0.9947674840927124, + 0.5959297422885895, + 0.4441185667037964, + 0.4238312294960022, + 0.4082300910949707, + 0.393765958237648, + 0.3456931649684906, + 0.31308822474479675, + 0.34416239910125734, + 0.27713756511211396, + 0.308809486413002, + 0.3001532375335693, + 0.3525312074661255, + 0.34459256377220154, + 0.2930661339998245, + 0.2344497579097748, + 0.23357478170394896, + 0.27331467504501344, + 0.2594615140080452, + 0.2084457780122757, + 0.22421327531337737, + 0.2495953950881958, + 0.26592646188735963, + 0.2653880777835846, + 0.20616664996147155, + 0.23063301057815552, + 0.2234852524280548, + 0.18022556896209715, + 0.19890744733810425, + 0.18154424366950989, + 0.189240668797493, + 0.19498020770549773, + 0.16609342606067656, + 0.16478614134788513, + 0.16893418736457824, + 0.1679157147884369, + 0.15672187466621398, + 0.15162110064029694, + 0.133504154253006, + 0.1337939938545227, + 0.184183518242836, + 0.1587675848007202, + 0.1786697045326233, + 0.16375601427555084, + 0.12898387837409972, + 0.12127504997253417, + 0.1357682282924652, + 0.10440323195457459, + 0.09760309319496155, + 0.11050140519142151, + 0.10689635886847973, + 0.08951765444278717, + 0.09638235607147216, + 0.09622903165221214, + 0.08356250081062316, + 0.09570504027605056, + 0.08704132456183433, + 0.07892893888950347, + 0.07683630051612854, + 0.07765760183334351, + 0.0783784222126007, + 0.07589095104932785, + 0.07282794521450997, + 0.07019219055175781, + 0.07221138014793396, + 0.06894144759178161, + 0.066200683760643, + 0.06355799829363823, + 0.0628858461380005, + 0.06295600434541702, + 0.06119969562292099, + 0.0605082638591528, + 0.05951749495267868, + 0.05923395432829857, + 0.058772369563579556, + 0.058454980385303494, + 0.058216135403513905, + 0.05801380957365036, + 0.05786988719701767, + 0.057799397979676724 + ], + "train_acc": [ + 0.6354, + 0.7735, + 0.8247, + 0.8317, + 0.8432, + 0.844, + 0.8605, + 0.8726, + 0.8612, + 0.8887, + 0.8785, + 0.8806, + 0.8632, + 0.8671, + 0.8851, + 0.9049, + 0.9085, + 0.8919, + 0.8975, + 0.9172, + 0.9096, + 0.901, + 0.8955, + 0.8924, + 0.9181, + 0.9095, + 0.911, + 0.9299, + 0.9217, + 0.9287, + 0.9245, + 0.9228, + 0.9328, + 0.9344, + 0.9341, + 0.9335, + 0.9386, + 0.9404, + 0.9484, + 0.9483, + 0.924, + 0.9353, + 0.9302, + 0.9351, + 0.9511, + 0.9544, + 0.9482, + 0.9636, + 0.97, + 0.9597, + 0.9625, + 0.9734, + 0.9669, + 0.9669, + 0.9761, + 0.9696, + 0.9733, + 0.9785, + 0.9784, + 0.9789, + 0.9784, + 0.9804, + 0.9831, + 0.9837, + 0.9821, + 0.9839, + 0.9859, + 0.9886, + 0.988, + 0.9867, + 0.9895, + 0.9897, + 0.9903, + 0.9901, + 0.9906, + 0.9906, + 0.9905, + 0.9906, + 0.9907, + 0.9907 + ], + "test_acc": [ + 0.757, + 0.798, + 0.8185, + 0.839, + 0.8365, + 0.831, + 0.859, + 0.8515, + 0.843, + 0.8645, + 0.8585, + 0.8575, + 0.857, + 0.855, + 0.8715, + 0.867, + 0.857, + 0.8595, + 0.879, + 0.8755, + 0.8675, + 0.864, + 0.869, + 0.869, + 0.8825, + 0.8745, + 0.8745, + 0.8825, + 0.872, + 0.879, + 0.8785, + 0.8805, + 0.8895, + 0.8745, + 0.8815, + 0.8835, + 0.886, + 0.8925, + 0.895, + 0.887, + 0.873, + 0.8845, + 0.884, + 0.8825, + 0.8935, + 0.8925, + 0.893, + 0.894, + 0.8895, + 0.895, + 0.901, + 0.899, + 0.9035, + 0.893, + 0.8915, + 0.8965, + 0.898, + 0.9, + 0.896, + 0.898, + 0.8935, + 0.899, + 0.898, + 0.899, + 0.9025, + 0.896, + 0.8975, + 0.9, + 0.8985, + 0.8985, + 0.9005, + 0.899, + 0.8975, + 0.898, + 0.898, + 0.8985, + 0.899, + 0.899, + 0.899, + 0.899 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8408721685409546, + 0.8110387921333313, + 0.7906323671340942, + 0.7719681262969971, + 0.7599710822105408, + 0.7539124488830566, + 0.7502779364585876, + 0.7483201026916504, + 0.7469743490219116, + 0.7455896139144897, + 0.7440224885940552, + 0.7427754402160645 + ], + "perturbation_rho": [ + 0.9999985694885254, + 0.9999968409538269, + 0.9999892711639404, + 0.9999746680259705, + 0.9999452233314514, + 0.9998985528945923, + 0.999815821647644, + 0.9998071789741516, + 0.9997591972351074, + 0.9997697472572327, + 0.9996993541717529, + 0.9996582269668579 + ], + "nudging": { + "0.001": [ + -0.023041635751724243, + -0.011698233895003796, + -0.006238154135644436, + -0.0037476818542927504, + -0.0025868481025099754, + -0.001987478695809841, + -0.0016404282068833709, + -0.0014207971980795264, + -0.0012741510290652514, + -0.0011747813550755382, + -0.0011064992286264896, + -0.001060901558957994 + ], + "0.003": [ + -0.06129148602485657, + -0.033079855144023895, + -0.01814448833465576, + -0.011038530617952347, + -0.0076637002639472485, + -0.005905331112444401, + -0.004882573150098324, + -0.004233422689139843, + -0.0037992263678461313, + -0.0035047021228820086, + -0.0033022318966686726, + -0.003166868584230542 + ], + "0.01": [ + -0.1375543624162674, + -0.0896252989768982, + -0.05422336980700493, + -0.034489020705223083, + -0.024439619854092598, + -0.019029833376407623, + -0.015829749405384064, + -0.013777680695056915, + -0.012396320700645447, + -0.011455517262220383, + -0.01080663874745369, + -0.01037222146987915 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.124322125816345, + 1.131116539478302, + 0.7928409598350525, + 0.6759025037765503, + 0.6115491585731506, + 0.6032277975082397, + 0.5580433654785156, + 0.6098665882110595, + 0.6155833411216736, + 0.6180649537801742, + 0.5471897947311402, + 0.7873612755775452, + 0.6355358539581298, + 0.9136189843177795, + 0.618724655532837, + 0.6802553035736084, + 0.5858199717521667, + 0.7376443414211273, + 0.7392737801551819, + 0.6306376735687256, + 0.7112307133674621, + 0.9737488382339478, + 0.9086463136672973, + 0.850034592628479, + 0.6517437356948853, + 1.2407935445785523, + 1.1789815021514893, + 1.020478351020813, + 0.7643687894821167, + 0.8357456016540528, + 1.1298155811309814, + 0.8742633706092835, + 0.6635566035270691, + 0.6822684181213379, + 1.066520718383789, + 1.0742153341770173, + 0.6373770482063293, + 0.6482282336235047, + 0.5901363306045532, + 0.7677202499389648, + 0.8966454248428345, + 0.6450998259544373, + 0.7499248750686646, + 0.6379090648174286, + 0.7380184473991394, + 0.6519559772491456, + 0.6984748714447021, + 0.7411647702217102, + 0.583937159729004, + 0.61994026222229, + 0.6090516567468643, + 0.47370276279449464, + 0.4794863220214844, + 0.6398159673810005, + 0.4859983974456787, + 0.4938936637878418, + 0.5712474269390106, + 0.4674346417427063, + 0.5590529252052308, + 0.46515351371765135, + 0.4210616909980774, + 0.44265751304626466, + 0.41583880286216734, + 0.3911753342151642, + 0.41973802375793456, + 0.4061159435272217, + 0.3860981136798859, + 0.3852514534473419, + 0.39405768866539004, + 0.37666168694496155, + 0.3830901497840881, + 0.3774588644981384, + 0.36966973986625673, + 0.3606788787841797, + 0.3621327772021294, + 0.35749068994522093, + 0.35715772972106935, + 0.35473382360935213, + 0.35407376971244814, + 0.35300638766288756 + ], + "train_acc": [ + 0.2313, + 0.5939, + 0.7093, + 0.7511, + 0.7705, + 0.7765, + 0.7968, + 0.7762, + 0.7721, + 0.7781, + 0.7964, + 0.7469, + 0.77, + 0.718, + 0.7773, + 0.7627, + 0.7806, + 0.751, + 0.7478, + 0.7717, + 0.7445, + 0.715, + 0.7042, + 0.722, + 0.7591, + 0.6789, + 0.6837, + 0.7078, + 0.7443, + 0.7261, + 0.6835, + 0.7268, + 0.7664, + 0.7658, + 0.7015, + 0.7169, + 0.7713, + 0.7713, + 0.7876, + 0.7577, + 0.7252, + 0.778, + 0.7595, + 0.7809, + 0.7548, + 0.7769, + 0.7671, + 0.7629, + 0.7883, + 0.7916, + 0.7826, + 0.8233, + 0.8234, + 0.7805, + 0.8201, + 0.8201, + 0.7993, + 0.8282, + 0.8048, + 0.8293, + 0.8378, + 0.8387, + 0.8424, + 0.8493, + 0.8397, + 0.8453, + 0.8508, + 0.8514, + 0.8478, + 0.8547, + 0.852, + 0.857, + 0.858, + 0.8598, + 0.8603, + 0.859, + 0.8612, + 0.862, + 0.8624, + 0.8626 + ], + "test_acc": [ + 0.476, + 0.659, + 0.709, + 0.6815, + 0.6795, + 0.726, + 0.7425, + 0.721, + 0.7035, + 0.733, + 0.5475, + 0.7095, + 0.564, + 0.627, + 0.7265, + 0.676, + 0.607, + 0.6305, + 0.6685, + 0.639, + 0.4255, + 0.663, + 0.6265, + 0.6955, + 0.6085, + 0.5685, + 0.5145, + 0.585, + 0.567, + 0.507, + 0.581, + 0.658, + 0.6685, + 0.647, + 0.5785, + 0.718, + 0.69, + 0.753, + 0.5325, + 0.6125, + 0.632, + 0.5605, + 0.6765, + 0.752, + 0.645, + 0.577, + 0.644, + 0.711, + 0.668, + 0.6685, + 0.7255, + 0.7025, + 0.6725, + 0.757, + 0.7645, + 0.7305, + 0.8015, + 0.7245, + 0.7565, + 0.7775, + 0.782, + 0.77, + 0.7985, + 0.7735, + 0.7885, + 0.7925, + 0.7955, + 0.804, + 0.8, + 0.8075, + 0.81, + 0.822, + 0.8155, + 0.817, + 0.82, + 0.8135, + 0.8165, + 0.8195, + 0.822, + 0.8205 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03703948110342026, + 0.2760871648788452, + 0.18428769707679749, + 0.1331849992275238, + 0.09719057381153107, + 0.1258918195962906, + 0.0748991146683693, + 0.08436713367700577, + 0.09110807627439499, + 0.10076140612363815, + 0.06335102021694183, + 0.08356402069330215 + ], + "perturbation_rho": [ + 0.048133689910173416, + 0.19754433631896973, + 0.16992174088954926, + 0.13566580414772034, + 0.05106702446937561, + 0.13118207454681396, + 0.057789772748947144, + 0.09156530350446701, + 0.05846566706895828, + 0.07805749773979187, + 0.11393842101097107, + 0.10566958785057068 + ], + "nudging": { + "0.001": [ + -0.0010935654863715172, + -0.0007910718559287488, + -0.0005110235651955009, + -0.0003657024062704295, + -0.0002454574278090149, + -0.00031436217250302434, + -0.00021353720512706786, + -0.00021881572320125997, + -0.00025353196542710066, + -0.00029741236357949674, + -0.00019224401330575347, + -0.00023414409952238202 + ], + "0.003": [ + -0.0032477299682796, + -0.0023589283227920532, + -0.0015236057806760073, + -0.0010900571942329407, + -0.0007291981601156294, + -0.0009313088376075029, + -0.0006336293881759048, + -0.0006524997879751027, + -0.0007575232302770019, + -0.0008877321379259229, + -0.0005692495033144951, + -0.0006953849224373698 + ], + "0.01": [ + -0.010506195947527885, + -0.007814407348632812, + -0.005055932328104973, + -0.003603969234973192, + -0.0024205115623772144, + -0.0030835624784231186, + -0.0020989018958061934, + -0.002160410862416029, + -0.0025065483059734106, + -0.0029421483632177114, + -0.0018882867880165577, + -0.0023007215932011604 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8810795295715332, + 1.2361003873825074, + 1.1001177528381347, + 1.0620904754638671, + 0.9923239807128906, + 1.0118637664794923, + 1.0294495058059692, + 1.035706482887268, + 1.1197983177185058, + 1.1272871920585632, + 1.1440982617378235, + 1.1798527102470397, + 1.2583636451721192, + 1.16342516040802, + 1.1545253436088563, + 1.1172974102020263, + 1.105135089302063, + 1.1267213039398194, + 1.1039850887298583, + 1.146181492614746, + 1.188433178806305, + 1.133612074279785, + 1.1646951875686646, + 1.1493542042732239, + 1.193199885559082, + 1.1990179855346679, + 1.1798026483535766, + 1.2109940435409545, + 1.1876913191795349, + 1.136012986755371, + 1.0995346645355224, + 1.1363990716934205, + 1.0839429043769837, + 1.036410266494751, + 1.0403498750686646, + 1.0100184856414796, + 1.0011023750305177, + 1.0164660669326782, + 1.0148341651916504, + 0.9997676483154296, + 1.079225712966919, + 1.0086151275634765, + 0.9838174611091614, + 0.9308564140319824, + 0.9210850870132447, + 0.9249866769790649, + 0.9204979789733887, + 1.0016128253936767, + 1.0033588279724122, + 0.9989631762504577, + 0.9597750957489014, + 0.9665767883300781, + 0.9695200438499451, + 0.979364437866211, + 1.0115489553451538, + 1.044701505279541, + 1.071289315032959, + 1.0969339916229248, + 1.0794300346374512, + 1.0735850115776062, + 1.0443150358200073, + 1.0285705953598023, + 1.011650534439087, + 0.9911880954742431, + 0.9808807865142822, + 0.9643822746276856, + 0.9543527652740479, + 0.9422026905059815, + 0.9374882905960084, + 0.9291035015106202, + 0.9215585130691528, + 0.9194198372840882, + 0.9146845828056336, + 0.9108321361541748, + 0.908439405822754, + 0.907101872253418, + 0.9050157958984375, + 0.9036195611000061, + 0.9028717960357666, + 0.9025129417419434 + ], + "train_acc": [ + 0.3648, + 0.5616, + 0.6071, + 0.6265, + 0.6596, + 0.652, + 0.6486, + 0.6435, + 0.6203, + 0.6245, + 0.6139, + 0.6054, + 0.5993, + 0.623, + 0.6222, + 0.6158, + 0.6189, + 0.619, + 0.6237, + 0.6187, + 0.6121, + 0.6181, + 0.6077, + 0.6086, + 0.6023, + 0.5997, + 0.6041, + 0.6032, + 0.6095, + 0.6156, + 0.6221, + 0.6192, + 0.6387, + 0.6512, + 0.6428, + 0.6486, + 0.6467, + 0.6543, + 0.653, + 0.6532, + 0.6402, + 0.6577, + 0.6606, + 0.6726, + 0.6731, + 0.6733, + 0.6713, + 0.6536, + 0.651, + 0.6492, + 0.6701, + 0.6638, + 0.6666, + 0.6661, + 0.6573, + 0.6522, + 0.6453, + 0.6405, + 0.6415, + 0.6428, + 0.6508, + 0.6514, + 0.6577, + 0.6609, + 0.6643, + 0.6653, + 0.6697, + 0.6684, + 0.6709, + 0.6743, + 0.6763, + 0.6755, + 0.6773, + 0.6788, + 0.6761, + 0.678, + 0.6792, + 0.6804, + 0.6803, + 0.6802 + ], + "test_acc": [ + 0.5295, + 0.5775, + 0.6065, + 0.6085, + 0.632, + 0.625, + 0.6215, + 0.583, + 0.6125, + 0.6035, + 0.5775, + 0.555, + 0.607, + 0.589, + 0.5885, + 0.601, + 0.5745, + 0.581, + 0.57, + 0.567, + 0.5955, + 0.529, + 0.582, + 0.5845, + 0.5495, + 0.585, + 0.556, + 0.578, + 0.579, + 0.5955, + 0.583, + 0.6235, + 0.602, + 0.609, + 0.626, + 0.6245, + 0.601, + 0.578, + 0.6385, + 0.5785, + 0.632, + 0.6265, + 0.626, + 0.656, + 0.648, + 0.657, + 0.624, + 0.618, + 0.6185, + 0.6325, + 0.6345, + 0.6375, + 0.6405, + 0.6395, + 0.632, + 0.6215, + 0.6005, + 0.6135, + 0.5985, + 0.6105, + 0.615, + 0.6215, + 0.6185, + 0.63, + 0.6265, + 0.628, + 0.629, + 0.6345, + 0.6345, + 0.6415, + 0.6415, + 0.6425, + 0.6395, + 0.644, + 0.6475, + 0.6465, + 0.644, + 0.6455, + 0.645, + 0.645 + ], + "state_pred_error": [ + 0.6453981456756592, + 0.23473459401130675, + 0.22407248733043672, + 0.22245599946975708, + 0.21019233787059785, + 0.18144550337791443, + 0.17582191152572632, + 0.17074397916793824, + 0.1751905428647995, + 0.1764908756017685, + 0.1641579815387726, + 0.15101692166328431, + 0.14769069714546204, + 0.14573342962265015, + 0.14323594300746917, + 0.1388802298069, + 0.13048029086589813, + 0.12313583681583405, + 0.1169026269197464, + 0.11280269784927369, + 0.1114406135559082, + 0.10753615816831588, + 0.09873319754600525, + 0.09379508064985276, + 0.09320075496435165, + 0.09452443287372589, + 0.08613354905843734, + 0.07822277886867524, + 0.06739198684692382, + 0.05750293148756027, + 0.04770064138174057, + 0.044405366152524946, + 0.04118964074850082, + 0.038421801435947416, + 0.035279463201761244, + 0.03239466397762299, + 0.02980326344370842, + 0.028275283205509184, + 0.027806608456373214, + 0.02775250583291054, + 0.027604129791259764, + 0.02825467872619629, + 0.03000386506319046, + 0.03052634057998657, + 0.030324843940138818, + 0.03044587863087654, + 0.030369041973352433, + 0.030169917958974838, + 0.029345124167203904, + 0.028020204293727875, + 0.026755033046007157, + 0.025642084258794783, + 0.025034043380618095, + 0.025460178035497664, + 0.025847621342539786, + 0.026586625242233278, + 0.027172537714242936, + 0.02762252908349037, + 0.027387323778867722, + 0.0279737877368927, + 0.027401061433553697, + 0.026677529415488243, + 0.026780897063016892, + 0.025761067128181457, + 0.02527744944691658, + 0.02493682624697685, + 0.02452848722934723, + 0.023785253030061723, + 0.023475021582841874, + 0.0230139014005661, + 0.022756616941094397, + 0.021971601372957228, + 0.02164053836464882, + 0.020801106786727905, + 0.020165389025211335, + 0.019814389663934708, + 0.01931059607863426, + 0.018816861334443092, + 0.018472328102588653, + 0.017988865703344344 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.7252062559127808, + 0.29899632930755615, + 0.17116883397102356, + 0.13035137951374054, + 0.11515486240386963, + 0.09652335941791534, + 0.0831163302063942, + 0.08587749302387238, + 0.1138496845960617, + 0.09370164573192596, + 0.10970423370599747, + 0.09861446917057037 + ], + "perturbation_rho": [ + 0.5776556730270386, + 0.24244043231010437, + 0.15723995864391327, + 0.11212021112442017, + 0.13527166843414307, + 0.09345141798257828, + 0.05218992009758949, + 0.09958191215991974, + 0.09601333737373352, + 0.05242425203323364, + 0.08741243183612823, + 0.08527539670467377 + ], + "nudging": { + "0.001": [ + -0.01889077201485634, + -0.0009189919801428914, + -0.0004775590787176043, + -0.000345642096363008, + -0.0003198374470230192, + -0.00027532177045941353, + -0.00023964255524333566, + -0.00024414859944954515, + -0.00032626462052576244, + -0.00024727743584662676, + -0.0003089705132879317, + -0.00028701225528493524 + ], + "0.003": [ + -0.05585412308573723, + -0.0027553164400160313, + -0.0014325750526040792, + -0.0010372890392318368, + -0.0009584734216332436, + -0.0008253002306446433, + -0.0007186426082625985, + -0.0007314274553209543, + -0.000978380674496293, + -0.0007414872525259852, + -0.0009262076346203685, + -0.0008607603958807886 + ], + "0.01": [ + -0.1766481101512909, + -0.00916180107742548, + -0.004768161568790674, + -0.00345130218192935, + -0.0031899111345410347, + -0.002747050253674388, + -0.002392321825027466, + -0.0024352066684514284, + -0.0032566720619797707, + -0.0024684183299541473, + -0.003083357820287347, + -0.0028652269393205643 + ] + }, + "state_pred_error_per_layer": [ + 14567.1396484375, + 8843.26171875, + 5969.56787109375, + 5045.4873046875, + 4699.3388671875, + 4805.94287109375, + 4535.58935546875, + 4793.4423828125, + 4549.9345703125, + 4690.251953125, + 4812.1875, + 4947.22509765625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1223959423065186, + 1.1308925502777099, + 0.7801009045600891, + 0.6729701273918152, + 0.6086994623184204, + 0.5650544769287109, + 0.557174564743042, + 0.635125132226944, + 0.6045203336715699, + 0.6104950213432312, + 0.6773919567108154, + 0.634354585647583, + 0.7008390525817871, + 0.5426709760665893, + 0.6239622621536255, + 0.6713327980041504, + 0.6004258505821228, + 0.679081558227539, + 0.8434337931632996, + 0.7248663192749023, + 0.5846601127624512, + 0.7091362628936767, + 0.7446982576370239, + 0.781251979637146, + 0.803330804347992, + 0.7121967086791993, + 0.6684488694190979, + 0.8766575017929077, + 0.9210894750595093, + 0.82434025888443, + 0.837844763469696, + 0.80740807056427, + 0.9366403986930847, + 0.9515004661560058, + 1.1598037229537963, + 1.10346333694458, + 1.1477074918746948, + 1.3325309940338135, + 1.7308238342285156, + 1.2630112736701966, + 1.162735636138916, + 1.4247036094665528, + 1.7260048475265504, + 1.7118493715286256, + 1.648465139770508, + 1.5406495670318603, + 1.438048271369934, + 1.336459242248535, + 1.3360411096572875, + 1.3773949566841126, + 1.27808166847229, + 1.2043107717514039, + 1.3566615823745727, + 1.2266771377563477, + 1.2032874032974243, + 1.3345542625427247, + 1.277489598464966, + 1.2574082427978515, + 1.3388423186302185, + 1.317376096725464, + 1.3218458183288575, + 1.3416841665267945, + 1.313708076095581, + 1.3063379524230958, + 1.324901369857788, + 1.3095571729660034, + 1.3367181018829346, + 1.3342665132522582, + 1.3231969213485717, + 1.2999568965911865, + 1.2956551901817321, + 1.283503600692749, + 1.282581994819641, + 1.2756302757263183, + 1.2712590478897094, + 1.2688031791687011, + 1.2658842399597168, + 1.2636978759765625, + 1.2609567411422729, + 1.2598623921394347 + ], + "train_acc": [ + 0.2364, + 0.5948, + 0.7131, + 0.7478, + 0.7703, + 0.7889, + 0.7914, + 0.7656, + 0.7862, + 0.7757, + 0.7658, + 0.7746, + 0.748, + 0.7989, + 0.7753, + 0.7604, + 0.7796, + 0.7569, + 0.7207, + 0.7579, + 0.7832, + 0.7498, + 0.7331, + 0.7337, + 0.7258, + 0.755, + 0.7684, + 0.7433, + 0.7383, + 0.7477, + 0.747, + 0.7533, + 0.7224, + 0.7082, + 0.6644, + 0.6817, + 0.6672, + 0.6219, + 0.5687, + 0.6204, + 0.6338, + 0.6038, + 0.5568, + 0.5556, + 0.557, + 0.5713, + 0.5855, + 0.5923, + 0.5942, + 0.5825, + 0.5996, + 0.61, + 0.5866, + 0.6144, + 0.6164, + 0.5915, + 0.6046, + 0.6063, + 0.5949, + 0.5979, + 0.5971, + 0.5942, + 0.5962, + 0.5992, + 0.5918, + 0.5979, + 0.5926, + 0.5951, + 0.5954, + 0.5958, + 0.6024, + 0.6052, + 0.6038, + 0.6006, + 0.6055, + 0.6049, + 0.6047, + 0.6063, + 0.6086, + 0.6089 + ], + "test_acc": [ + 0.48, + 0.644, + 0.7065, + 0.733, + 0.7315, + 0.7055, + 0.7035, + 0.67, + 0.695, + 0.669, + 0.708, + 0.6635, + 0.678, + 0.6665, + 0.554, + 0.6675, + 0.653, + 0.637, + 0.569, + 0.647, + 0.5995, + 0.702, + 0.5415, + 0.6205, + 0.6875, + 0.633, + 0.6135, + 0.6145, + 0.6435, + 0.706, + 0.6325, + 0.5855, + 0.633, + 0.525, + 0.588, + 0.668, + 0.6115, + 0.453, + 0.502, + 0.586, + 0.6, + 0.494, + 0.5125, + 0.445, + 0.5215, + 0.5165, + 0.535, + 0.5235, + 0.485, + 0.514, + 0.571, + 0.5115, + 0.5405, + 0.5585, + 0.488, + 0.5775, + 0.5685, + 0.5465, + 0.558, + 0.5425, + 0.5335, + 0.55, + 0.5565, + 0.5345, + 0.5465, + 0.555, + 0.565, + 0.562, + 0.5535, + 0.555, + 0.5625, + 0.5585, + 0.5685, + 0.5595, + 0.564, + 0.5655, + 0.5645, + 0.569, + 0.5645, + 0.5665 + ], + "value_loss": [ + 2.7805515005111694, + 1.081686860370636, + 0.797205941772461, + 0.6986260824680328, + 0.7140384963989258, + 0.676977529335022, + 0.6860679067611695, + 1.0100212257385255, + 1.0003583810806274, + 0.8196450786590577, + 1.0773170350074768, + 0.9696109293460846, + 1.0457900135040283, + 0.7022124642372132, + 0.8929926084518433, + 0.9564439485549927, + 0.7808498700141907, + 0.9953287747383117, + 1.468350359916687, + 1.2638125471115111, + 0.83949560546875, + 1.2727160860061646, + 1.3841882694244385, + 1.678631261253357, + 1.725769453048706, + 1.5402052530288697, + 1.2585258999824525, + 2.0741510969161987, + 2.4101175380706787, + 1.948118208217621, + 2.2736195261001586, + 1.8106961948394775, + 2.211885329437256, + 2.1651109546661376, + 2.5323298233032228, + 2.1501616649627686, + 2.2966494682312013, + 3.1301290969848634, + 4.273359652328491, + 2.197300305747986, + 1.5282178970336915, + 2.6804796546936034, + 3.514599729347229, + 3.5422376876831057, + 2.5286996788024902, + 1.9258211517333985, + 1.815034661102295, + 1.506567113494873, + 1.5045080892562865, + 1.7108898855209351, + 1.241757023048401, + 1.2125720126152038, + 1.3929070613861083, + 1.1463023363113403, + 1.1142121349334717, + 1.332335331916809, + 1.1768944136142732, + 1.1620534097671509, + 1.298662633562088, + 1.1294718536376953, + 1.1261915169715881, + 1.122890726852417, + 1.1405691360473633, + 1.0319907926559448, + 1.0340288082122804, + 0.9726796591758728, + 1.0593993881225585, + 1.050448949432373, + 1.100425945854187, + 1.0933582187652588, + 0.8975212239265442, + 0.8938636081695557, + 0.9166557600021362, + 0.977439419555664, + 0.8397266407966614, + 0.8533422320365905, + 0.874716013431549, + 0.8575616405487061, + 0.838136801624298, + 0.8463798692464829 + ], + "term_loss": [ + 1.6485074674129485, + 0.8297072814941406, + 0.634693399810791, + 0.5434339653253555, + 0.5507466105461121, + 0.5207709157943725, + 0.5341971765518189, + 0.846416844177246, + 0.841112010717392, + 0.6564387054443359, + 0.9049889453649521, + 0.798225192284584, + 0.8605166847705841, + 0.5482600785255433, + 0.7241384846687317, + 0.7684001558303833, + 0.6070996345996856, + 0.7962655972480774, + 1.2140521295547486, + 0.9860176255226135, + 0.608419938647747, + 0.9112939659118653, + 0.9734650965690613, + 1.2297438148498536, + 1.299837247133255, + 1.1938978694915772, + 0.9857995202064515, + 1.69483338432312, + 1.9083918838500977, + 1.6175825427293777, + 1.9212311550140382, + 1.5342649998188018, + 1.8532086339950562, + 1.8259620584487914, + 2.1624345304489134, + 1.806892790031433, + 1.8902231861114502, + 2.5273943916320802, + 3.5992365367889403, + 1.7663538317680358, + 1.1680109001159669, + 2.154721879196167, + 2.983940335559845, + 2.932674698829651, + 2.0614490547180178, + 1.522164292526245, + 1.4121819274902343, + 1.1339237529754638, + 1.1243637654304504, + 1.3226550352573394, + 0.8877180952310562, + 0.8467551987171174, + 1.0091370786666871, + 0.7961967350006104, + 0.7717182033538819, + 0.9400051207065582, + 0.8129089121699333, + 0.7943745586633683, + 0.9124063068151474, + 0.7582885841369629, + 0.757268895816803, + 0.7520805835723877, + 0.7614981719970703, + 0.672174573135376, + 0.664697764635086, + 0.6174597493886947, + 0.6784869749546051, + 0.6815483723163605, + 0.7197177550315857, + 0.7082983478546142, + 0.5514742812633514, + 0.5509846379041672, + 0.5635691103935242, + 0.6054943891525268, + 0.5014636739730834, + 0.5115930925846099, + 0.5238163274765014, + 0.5094047106742859, + 0.4961314143180847, + 0.5014169258773327 + ], + "bridge_loss": [ + 0.8486444220311474, + 0.057455028840899466, + 0.00647345672249794, + 0.010065643244981765, + 0.026260024583339692, + 0.02356478395164013, + 0.01767999943345785, + 0.011712782212346793, + 0.01253184175491333, + 0.00921778129786253, + 0.007642647423967719, + 0.008494817974418402, + 0.0081177446693182, + 0.007718402835354209, + 0.0076394867897033696, + 0.009256541520357132, + 0.009772012880444526, + 0.01316194803416729, + 0.03859584418535233, + 0.08582426563501358, + 0.0680036034822464, + 0.16674192352294923, + 0.2082908762693405, + 0.23976570377349854, + 0.2108058066368103, + 0.15342824853658676, + 0.09269820539355278, + 0.1716358684539795, + 0.2829114284992218, + 0.11972570022344589, + 0.14527669587135314, + 0.07409173301458359, + 0.13836023993194102, + 0.1047233594417572, + 0.10239493898153305, + 0.08479896945953369, + 0.14000908613204957, + 0.30332467155456544, + 0.31832720917463303, + 0.13028690763115883, + 0.06915579251646996, + 0.2068889322757721, + 0.1689413583636284, + 0.2432434256672859, + 0.10945895296931267, + 0.058291493260860444, + 0.0695342747092247, + 0.051727681058645246, + 0.05560128738582134, + 0.06204493397176266, + 0.04303289123028517, + 0.06258053659200669, + 0.06440504032969475, + 0.049851995158195495, + 0.04215986429452896, + 0.0714924750328064, + 0.05100864072740078, + 0.056615071886777876, + 0.06172715484499931, + 0.05179036730527878, + 0.04902632168531418, + 0.04722833627164364, + 0.05790429630279541, + 0.04115619099140167, + 0.047522115555405614, + 0.03584751927256584, + 0.059197174768149854, + 0.04522456908226013, + 0.0625448987364769, + 0.06798982162475586, + 0.03050621822923422, + 0.030018169784545898, + 0.03876454293727875, + 0.058579221987724306, + 0.026292440569400787, + 0.030662278072535992, + 0.03989438471794128, + 0.03742715321779251, + 0.031834218949079514, + 0.03549532132707536 + ], + "tgrad_loss": [ + 0.2833996032714844, + 0.19452454969882965, + 0.15603908603191377, + 0.14512648067474365, + 0.13703186490535735, + 0.1326418347477913, + 0.1341907325744629, + 0.1518915962100029, + 0.14671453332901002, + 0.15398859734535217, + 0.16468544862270354, + 0.16289091897010805, + 0.17715558688640595, + 0.14623399047851562, + 0.16121463856697082, + 0.17878725657463074, + 0.16397822947502136, + 0.18590123443603515, + 0.2157023815393448, + 0.19197065043449402, + 0.16307206680774688, + 0.19468018741607665, + 0.20243228673934938, + 0.20912174048423768, + 0.21512638583183288, + 0.192879146194458, + 0.18002817583084108, + 0.20768185408115386, + 0.21881421895027162, + 0.2108099551796913, + 0.20711168808937072, + 0.20233947868347169, + 0.2203164538860321, + 0.2344255461215973, + 0.26750037670135496, + 0.2584699326515198, + 0.2664172016143799, + 0.2994100332260132, + 0.355795917224884, + 0.3006595685005188, + 0.29105121412277224, + 0.3188688861846924, + 0.36171807627677915, + 0.36631957635879514, + 0.3577916645050049, + 0.34536534185409545, + 0.3333184560775757, + 0.3209156816482544, + 0.3245430320739746, + 0.32618993062973023, + 0.31100603489875794, + 0.30323628644943235, + 0.31936494970321655, + 0.30025360336303714, + 0.300334077167511, + 0.32083772625923157, + 0.31297685990333557, + 0.31106378889083863, + 0.32452915863990783, + 0.3193928955078125, + 0.31989630165100097, + 0.3235818109035492, + 0.3211666654109955, + 0.31866003241539004, + 0.3218089293956757, + 0.3193724016189575, + 0.3217152436733246, + 0.3236760053157806, + 0.31816329843997954, + 0.31707005248069764, + 0.3155407253742218, + 0.3128608033657074, + 0.3143221000671387, + 0.31336581163406374, + 0.3119705219507217, + 0.3110868597269058, + 0.3110053087234497, + 0.3107297755241394, + 0.3101711611270905, + 0.3094676312446594 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0279831662774086, + 0.034206733107566833, + 0.06341560930013657, + 0.0695083886384964, + 0.09047738462686539, + 0.09644618630409241, + 0.1011449545621872, + 0.09714356064796448, + 0.09739723801612854, + 0.09588810801506042, + 0.09328337758779526, + 0.08733686059713364 + ], + "perturbation_rho": [ + -0.01078212633728981, + 0.08389643579721451, + 0.09591226279735565, + 0.09822964668273926, + 0.15539337694644928, + 0.077084481716156, + 0.18135306239128113, + 0.13923753798007965, + 0.15523496270179749, + 0.1566530466079712, + 0.16011789441108704, + 0.12478099763393402 + ], + "nudging": { + "0.001": [ + -0.001502810511738062, + -0.00035649939673021436, + -0.0005188342183828354, + -0.0005870601162314415, + -0.0007064240635372698, + -0.0007271112990565598, + -0.000728512299247086, + -0.0007376023568212986, + -0.0007232739008031785, + -0.0007425217772834003, + -0.0007311765220947564, + -0.000725812220480293 + ], + "0.003": [ + -0.004485548473894596, + -0.001071919221431017, + -0.0015602593775838614, + -0.0017638156423345208, + -0.0021236937027424574, + -0.0021875915117561817, + -0.002183424076065421, + -0.002218396170064807, + -0.0021718533243983984, + -0.0022269198670983315, + -0.0021976742427796125, + -0.0021777376532554626 + ], + "0.01": [ + -0.014675050042569637, + -0.0035726604983210564, + -0.005193591117858887, + -0.005878218449652195, + -0.007073326967656612, + -0.007276617921888828, + -0.0072667524218559265, + -0.007385652512311935, + -0.00723686721175909, + -0.007413622923195362, + -0.0073149921372532845, + -0.007252625189721584 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L2_s123.json b/results/synth_ladder_v2_lo/synth_a0.25_L2_s123.json new file mode 100644 index 0000000..bdb0570 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L2_s123.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7654977563858032, + 0.8444957286834717, + 0.4950144814491272, + 0.36671135663986204, + 0.321284081697464, + 0.27993531551361084, + 0.27256134262084963, + 0.24975784158706665, + 0.23994892349243163, + 0.24492980494499206, + 0.22574045833349227, + 0.20097337501049042, + 0.1994509120464325, + 0.20277229657173157, + 0.18468337926864625, + 0.18727314873933792, + 0.1769370955467224, + 0.1838186579465866, + 0.17439295463562013, + 0.17294140467643737, + 0.1822731651544571, + 0.17028081703186035, + 0.1692028619647026, + 0.15768814945220946, + 0.14810290710926055, + 0.14752176475524903, + 0.16309453177452088, + 0.15764646480083466, + 0.14147279624938966, + 0.14498449137210845, + 0.1356404733657837, + 0.14475175623893738, + 0.13740543792247772, + 0.13167994917631148, + 0.12572967143058777, + 0.12563280085921288, + 0.11893130984306335, + 0.11800628488063812, + 0.11565658164024353, + 0.11688636230826378, + 0.11060135436058044, + 0.11006813128590584, + 0.1071192905664444, + 0.10655531152486801, + 0.10557044495344162, + 0.10469848154783248, + 0.10152105563879013, + 0.10145853953361511, + 0.09961113617420196, + 0.09860005731582641, + 0.10467973436117173, + 0.09797345906496048, + 0.09573235869407654, + 0.09314765231609344, + 0.09170019273757934, + 0.09269226717948914, + 0.09341713771820068, + 0.09100220992565156, + 0.08908436529636383, + 0.08798767466545104, + 0.08603315978050231, + 0.0854144489645958, + 0.08496862246394157, + 0.08380987513065338, + 0.08267026079893113, + 0.08210583221912383, + 0.08188264560699463, + 0.08136292295455932, + 0.08069994529485702, + 0.08029244214296341, + 0.07990814363956451, + 0.07976104700565338, + 0.07939706645011901, + 0.07912448803782463, + 0.07889298883974552, + 0.07872593634724617, + 0.0785790141582489, + 0.07847202535867691, + 0.0784075082063675, + 0.07836773316860199 + ], + "train_acc": [ + 0.4156, + 0.7664, + 0.8679, + 0.9013, + 0.8997, + 0.9114, + 0.9042, + 0.9112, + 0.9163, + 0.9084, + 0.9186, + 0.9294, + 0.9276, + 0.9251, + 0.9345, + 0.9343, + 0.9347, + 0.9319, + 0.9369, + 0.9368, + 0.9337, + 0.9361, + 0.9391, + 0.9422, + 0.9495, + 0.9487, + 0.9383, + 0.9407, + 0.952, + 0.9466, + 0.953, + 0.9474, + 0.9502, + 0.955, + 0.9573, + 0.9575, + 0.9618, + 0.9616, + 0.9634, + 0.9615, + 0.9654, + 0.9661, + 0.9677, + 0.9684, + 0.9667, + 0.9687, + 0.9705, + 0.9684, + 0.9714, + 0.9719, + 0.9662, + 0.9719, + 0.9735, + 0.9758, + 0.9764, + 0.9766, + 0.9741, + 0.9774, + 0.9768, + 0.9778, + 0.9801, + 0.9801, + 0.9817, + 0.9811, + 0.9818, + 0.9825, + 0.9823, + 0.9825, + 0.9838, + 0.9833, + 0.9839, + 0.9844, + 0.9845, + 0.9845, + 0.9849, + 0.9848, + 0.9852, + 0.9853, + 0.9853, + 0.9853 + ], + "test_acc": [ + 0.656, + 0.838, + 0.867, + 0.8815, + 0.886, + 0.8975, + 0.9005, + 0.895, + 0.901, + 0.8945, + 0.895, + 0.9035, + 0.9005, + 0.901, + 0.9045, + 0.909, + 0.904, + 0.898, + 0.906, + 0.908, + 0.9085, + 0.912, + 0.904, + 0.9015, + 0.904, + 0.9075, + 0.912, + 0.9105, + 0.9135, + 0.911, + 0.9175, + 0.913, + 0.913, + 0.9165, + 0.916, + 0.9145, + 0.912, + 0.9135, + 0.9165, + 0.919, + 0.9185, + 0.9205, + 0.916, + 0.916, + 0.9175, + 0.9155, + 0.9175, + 0.9155, + 0.9165, + 0.9155, + 0.913, + 0.9145, + 0.9165, + 0.9165, + 0.9185, + 0.9195, + 0.915, + 0.92, + 0.922, + 0.9225, + 0.919, + 0.922, + 0.919, + 0.921, + 0.923, + 0.9195, + 0.9205, + 0.921, + 0.92, + 0.921, + 0.921, + 0.92, + 0.9195, + 0.921, + 0.9205, + 0.92, + 0.92, + 0.92, + 0.92, + 0.92 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8569881916046143, + 0.8500438928604126 + ], + "perturbation_rho": [ + 0.9999989867210388, + 0.9999954700469971 + ], + "nudging": { + "0.001": [ + -0.02136343903839588, + -0.007668375503271818 + ], + "0.003": [ + -0.05757742375135422, + -0.022186852991580963 + ], + "0.01": [ + -0.13159069418907166, + -0.06504300236701965 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.222045899963379, + 1.5443243183135986, + 0.9165551806926727, + 0.6182797731399536, + 0.4814643452644348, + 0.4080216860771179, + 0.3821046540737152, + 0.3557525873661041, + 0.3617426670074463, + 0.3635426070213318, + 0.3631010500907898, + 0.3817070824146271, + 0.3703360957622528, + 0.4017043243922293, + 0.36939922463893893, + 0.3809434096813202, + 0.37349798345565793, + 0.4216185576438904, + 0.37035776710510254, + 0.4096152338027954, + 0.44324955769777297, + 0.37625437016487123, + 0.41346786515712736, + 0.38239140539169314, + 0.43430486598014834, + 0.4266927839279175, + 0.47304191370010373, + 0.42663185768127443, + 0.3726616260290146, + 0.39664573118686675, + 0.4000628391265869, + 0.3725332321166992, + 0.4474667528867722, + 0.3764329075098038, + 0.39272863276004794, + 0.3961232415050268, + 0.35540812203884126, + 0.3754589093208313, + 0.3967381541252136, + 0.37234801816940305, + 0.38604524369239807, + 0.38428880689144135, + 0.3889479875087738, + 0.39900728015899656, + 0.3657263102054596, + 0.3451460936665535, + 0.3340610753059387, + 0.3457312560558319, + 0.3312659737110138, + 0.3334344934463501, + 0.34277497341632845, + 0.3261671709060669, + 0.33543690328598025, + 0.32464828124046324, + 0.327925772857666, + 0.31421077461242675, + 0.3448867746353149, + 0.3114112159252167, + 0.31121128454208374, + 0.31479848520755765, + 0.3050527681350708, + 0.3033456075429916, + 0.29738776047229765, + 0.29894379968643187, + 0.2957280710220337, + 0.29328098392486573, + 0.29249357726573944, + 0.2907493370056152, + 0.2953320168852806, + 0.2873753551006317, + 0.2861742950439453, + 0.2886102059006691, + 0.2845136415481567, + 0.2840243721663952, + 0.2817679080247879, + 0.2821083644628525, + 0.2808473236083984, + 0.2805542977809906, + 0.28007913836240766, + 0.2798538848757744 + ], + "train_acc": [ + 0.1881, + 0.4863, + 0.6985, + 0.7856, + 0.8266, + 0.8435, + 0.8497, + 0.861, + 0.8595, + 0.8635, + 0.8666, + 0.8594, + 0.8676, + 0.8577, + 0.8692, + 0.8668, + 0.8652, + 0.8583, + 0.8715, + 0.8657, + 0.8559, + 0.8734, + 0.8662, + 0.8726, + 0.8565, + 0.8585, + 0.8527, + 0.8631, + 0.874, + 0.8676, + 0.8678, + 0.8728, + 0.8577, + 0.8711, + 0.8713, + 0.8663, + 0.8801, + 0.8751, + 0.8667, + 0.8762, + 0.8731, + 0.8725, + 0.8721, + 0.8695, + 0.8727, + 0.8817, + 0.8837, + 0.8817, + 0.886, + 0.8858, + 0.8819, + 0.8876, + 0.8819, + 0.8835, + 0.8853, + 0.8891, + 0.8824, + 0.8891, + 0.8926, + 0.8861, + 0.8912, + 0.8907, + 0.8944, + 0.8937, + 0.8928, + 0.8946, + 0.8933, + 0.895, + 0.8922, + 0.8964, + 0.8952, + 0.8949, + 0.8961, + 0.8957, + 0.8982, + 0.8974, + 0.898, + 0.8973, + 0.8976, + 0.8975 + ], + "test_acc": [ + 0.3455, + 0.586, + 0.718, + 0.775, + 0.8005, + 0.8085, + 0.831, + 0.832, + 0.8335, + 0.8355, + 0.8275, + 0.8195, + 0.8265, + 0.837, + 0.8305, + 0.8365, + 0.8095, + 0.8405, + 0.8095, + 0.8065, + 0.8115, + 0.826, + 0.816, + 0.8145, + 0.822, + 0.8205, + 0.799, + 0.837, + 0.814, + 0.8285, + 0.8325, + 0.826, + 0.813, + 0.824, + 0.8335, + 0.827, + 0.8205, + 0.8235, + 0.817, + 0.8355, + 0.823, + 0.802, + 0.8055, + 0.832, + 0.8375, + 0.85, + 0.8365, + 0.834, + 0.8335, + 0.8435, + 0.8335, + 0.8365, + 0.838, + 0.833, + 0.832, + 0.824, + 0.833, + 0.854, + 0.8455, + 0.8455, + 0.852, + 0.8435, + 0.848, + 0.848, + 0.8525, + 0.8485, + 0.851, + 0.8535, + 0.853, + 0.848, + 0.852, + 0.849, + 0.8485, + 0.8525, + 0.8525, + 0.8525, + 0.8555, + 0.852, + 0.8525, + 0.853 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.05345926433801651, + 0.1220134049654007 + ], + "perturbation_rho": [ + 0.09254007041454315, + 0.03279075771570206 + ], + "nudging": { + "0.001": [ + -0.0014900758396834135, + -0.00040765886660665274 + ], + "0.003": [ + -0.0044248285703361034, + -0.0012199780903756618 + ], + "0.01": [ + -0.0142319705337286, + -0.004036533646285534 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.035307823371887, + 1.0818795654296876, + 0.5848175754547119, + 0.4178084654331207, + 0.36943293256759646, + 0.36182685775756834, + 0.36377423672676085, + 0.3638772452354431, + 0.36289256069660186, + 0.35803506598472595, + 0.3521030779838562, + 0.36004641103744506, + 0.3508536817073822, + 0.3523506750106811, + 0.37145801367759707, + 0.35224308915138247, + 0.35803700803518296, + 0.35305213971138, + 0.3651015239715576, + 0.3836041011810303, + 0.3781185965538025, + 0.38939061965942384, + 0.42120680956840517, + 0.40723042488098143, + 0.4526292643547058, + 0.40323816947937013, + 0.415028613948822, + 0.41594237394332884, + 0.40914614896774293, + 0.40614798660278323, + 0.39321772956848144, + 0.38597395792007444, + 0.4012366283416748, + 0.39515967016220094, + 0.3989246150016785, + 0.40142448501586914, + 0.37222539920806885, + 0.3748494933605194, + 0.38571743087768556, + 0.3823385854721069, + 0.3849996451854706, + 0.37309266843795774, + 0.3707266288280487, + 0.3709278034210205, + 0.37044406490325926, + 0.3628380756378174, + 0.36986831691265104, + 0.35957499681711197, + 0.3573640037059784, + 0.37129577651023865, + 0.35399168338775633, + 0.3636847696185112, + 0.35051158096790314, + 0.3494784439086914, + 0.3490269979476929, + 0.34427729971408844, + 0.34917515044212344, + 0.34596708917617797, + 0.3457959949493408, + 0.3382417812347412, + 0.3398675190448761, + 0.33830025720596313, + 0.3366756670475006, + 0.3361509337425232, + 0.3335879071235657, + 0.3334713472366333, + 0.3317858941078186, + 0.33048621253967286, + 0.33019430565834046, + 0.3285010213851929, + 0.32787752251625063, + 0.32666881173849105, + 0.32629875988960266, + 0.3255439553260803, + 0.3254732527732849, + 0.3248609799385071, + 0.32443962535858156, + 0.3241093095779419, + 0.32383085441589354, + 0.32369576120376586 + ], + "train_acc": [ + 0.2759, + 0.6504, + 0.8027, + 0.8556, + 0.8617, + 0.8633, + 0.8603, + 0.8608, + 0.8597, + 0.8664, + 0.8637, + 0.8641, + 0.8664, + 0.8655, + 0.86, + 0.8672, + 0.869, + 0.8672, + 0.8576, + 0.8559, + 0.859, + 0.8534, + 0.8441, + 0.8506, + 0.8305, + 0.8495, + 0.8446, + 0.8438, + 0.8428, + 0.8449, + 0.8507, + 0.8543, + 0.8483, + 0.8496, + 0.8506, + 0.8483, + 0.862, + 0.8558, + 0.8543, + 0.8589, + 0.8602, + 0.8607, + 0.8587, + 0.8633, + 0.8606, + 0.8659, + 0.8625, + 0.8659, + 0.8671, + 0.8616, + 0.8693, + 0.8661, + 0.8696, + 0.8722, + 0.8714, + 0.8728, + 0.8713, + 0.8736, + 0.8725, + 0.875, + 0.8738, + 0.8752, + 0.8753, + 0.874, + 0.8781, + 0.8763, + 0.8786, + 0.8772, + 0.878, + 0.8784, + 0.879, + 0.8797, + 0.8798, + 0.8799, + 0.8798, + 0.8801, + 0.8797, + 0.8801, + 0.8813, + 0.8813 + ], + "test_acc": [ + 0.503, + 0.72, + 0.7965, + 0.826, + 0.8265, + 0.8335, + 0.8295, + 0.8315, + 0.8315, + 0.8335, + 0.823, + 0.823, + 0.831, + 0.826, + 0.8215, + 0.8205, + 0.828, + 0.8215, + 0.814, + 0.8145, + 0.817, + 0.812, + 0.806, + 0.788, + 0.8175, + 0.8145, + 0.808, + 0.793, + 0.8065, + 0.7955, + 0.807, + 0.812, + 0.816, + 0.8215, + 0.8125, + 0.8175, + 0.821, + 0.803, + 0.8285, + 0.8265, + 0.83, + 0.8215, + 0.824, + 0.8185, + 0.83, + 0.834, + 0.832, + 0.837, + 0.8375, + 0.8295, + 0.829, + 0.82, + 0.825, + 0.831, + 0.8365, + 0.8315, + 0.8395, + 0.834, + 0.83, + 0.831, + 0.841, + 0.839, + 0.831, + 0.838, + 0.8335, + 0.835, + 0.8365, + 0.831, + 0.8385, + 0.832, + 0.835, + 0.8365, + 0.8335, + 0.8325, + 0.8335, + 0.836, + 0.8345, + 0.834, + 0.834, + 0.834 + ], + "state_pred_error": [ + 0.7997600481987, + 0.3437161437034607, + 0.2014044310092926, + 0.16714438018798827, + 0.15179780702590942, + 0.13224747791290284, + 0.11098563377857208, + 0.0916959712266922, + 0.07569896295070648, + 0.061903948831558225, + 0.05011345111131668, + 0.04207257339954376, + 0.0351084869146347, + 0.030359905037283898, + 0.026254229775071143, + 0.02318112598657608, + 0.021127575582265853, + 0.018682509154081345, + 0.017222601471841334, + 0.016082065165042878, + 0.014975263381004333, + 0.014202502882480622, + 0.014144844499230385, + 0.01311485079973936, + 0.012837442517280579, + 0.012465586432814597, + 0.012172201824188232, + 0.01132886090874672, + 0.011098468725383281, + 0.010547183714807033, + 0.009977656623721123, + 0.009493274948000908, + 0.009209013964235782, + 0.008924346220493316, + 0.008761503490805626, + 0.00834588114619255, + 0.008196133199334144, + 0.008180657398700714, + 0.007771395539492369, + 0.007566665153205395, + 0.007358304584771395, + 0.007139906688034534, + 0.007039350777864456, + 0.007165508459508419, + 0.006619077945500612, + 0.006377335331588983, + 0.0062913012474775315, + 0.006098052710294724, + 0.006248931968957185, + 0.005887588227540255, + 0.005769434168934822, + 0.005733849746733904, + 0.005528700548410415, + 0.005712412436306476, + 0.005568497113138437, + 0.005270802947878838, + 0.005042337468266487, + 0.0052765426017344, + 0.004908596959710122, + 0.005113466054946184, + 0.004858688966929913, + 0.004781623714789748, + 0.004587523357570171, + 0.004601859824359417, + 0.004504906559363008, + 0.0047202605225145815, + 0.004451583327353001, + 0.004443144879117608, + 0.004247794686257839, + 0.004191487204283476, + 0.004164984770864248, + 0.004182276912778616, + 0.00406104885712266, + 0.004042744146287441, + 0.004139866654574871, + 0.003951248052343726, + 0.003766103806346655, + 0.0038973809622228146, + 0.004124714520573616, + 0.003765122526139021 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9177796840667725, + 0.47225815057754517 + ], + "perturbation_rho": [ + 0.7912815809249878, + 0.3786163330078125 + ], + "nudging": { + "0.001": [ + -0.02343657612800598, + -0.0025146803818643093 + ], + "0.003": [ + -0.06697157770395279, + -0.0075065759010612965 + ], + "0.01": [ + -0.187799870967865, + -0.02459421567618847 + ] + }, + "state_pred_error_per_layer": [ + 654.3871459960938, + 278.6759338378906 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2231978775024412, + 1.5435144302368164, + 0.9255192138671875, + 0.6231668456077576, + 0.47682934741973876, + 0.41253710989952086, + 0.38058802461624147, + 0.3612384679555893, + 0.3502673017501831, + 0.3541757307052612, + 0.36556007900238036, + 0.3836657918453217, + 0.3598676048755646, + 0.3682255392074585, + 0.3784599184989929, + 0.4032455762863159, + 0.3752034682035446, + 0.395582155418396, + 0.42088637284040453, + 0.4353969056129456, + 0.49382096910476686, + 0.46568728313446045, + 0.4780210087776184, + 0.5099774327039719, + 0.5591948669433594, + 0.5902343495845794, + 0.6529199718952179, + 0.6656437032699585, + 0.667899845123291, + 0.7424959661483764, + 0.796056184387207, + 0.814354309463501, + 0.8498922292709351, + 0.9181127500534058, + 0.8227109302520752, + 0.8799352335929871, + 0.9216915922164917, + 0.9162841287612915, + 0.961645627784729, + 0.934480671787262, + 0.9278618555068969, + 0.9472960815429687, + 0.977372176361084, + 0.9279924439430237, + 0.931221773815155, + 0.9409424783706665, + 0.9645380886077881, + 0.9430541513442993, + 0.9649716537475586, + 0.9659242866516113, + 0.9619326337814331, + 0.9567905778884888, + 0.9783849853515625, + 1.0015579802513122, + 1.00494115524292, + 1.0035569537639617, + 1.0050078544616698, + 1.0123552949905394, + 1.01352340259552, + 1.039237533378601, + 1.035588917160034, + 1.032976812839508, + 1.0407879976272583, + 1.0397173221588134, + 1.0423907831192016, + 1.0491719779968263, + 1.0476377964019776, + 1.0432713088989258, + 1.0447245557785034, + 1.0415431062698364, + 1.0402565887451172, + 1.0366182415008545, + 1.0374339856147765, + 1.034851577758789, + 1.034139908027649, + 1.03353916721344, + 1.0329146126270294, + 1.0321089252471924, + 1.031716856765747, + 1.0315448204040527 + ], + "train_acc": [ + 0.1876, + 0.4894, + 0.6908, + 0.7843, + 0.8259, + 0.842, + 0.8522, + 0.8611, + 0.865, + 0.8667, + 0.8621, + 0.8616, + 0.8682, + 0.8684, + 0.8649, + 0.8589, + 0.8678, + 0.8687, + 0.8575, + 0.8564, + 0.8445, + 0.8433, + 0.847, + 0.8404, + 0.8242, + 0.8214, + 0.8033, + 0.7973, + 0.7998, + 0.7819, + 0.7709, + 0.759, + 0.7496, + 0.7381, + 0.7503, + 0.7337, + 0.7231, + 0.7248, + 0.7162, + 0.7119, + 0.7086, + 0.704, + 0.6929, + 0.6995, + 0.6953, + 0.689, + 0.6838, + 0.6914, + 0.682, + 0.6818, + 0.6811, + 0.678, + 0.6733, + 0.6705, + 0.6659, + 0.6704, + 0.6677, + 0.664, + 0.6659, + 0.6563, + 0.6611, + 0.6626, + 0.659, + 0.6568, + 0.6604, + 0.6565, + 0.6579, + 0.6618, + 0.6593, + 0.6605, + 0.6601, + 0.6607, + 0.6624, + 0.6624, + 0.6629, + 0.6634, + 0.6626, + 0.663, + 0.6627, + 0.6634 + ], + "test_acc": [ + 0.336, + 0.581, + 0.72, + 0.7835, + 0.8075, + 0.8185, + 0.8225, + 0.8195, + 0.827, + 0.8205, + 0.824, + 0.8235, + 0.8285, + 0.818, + 0.8225, + 0.831, + 0.8015, + 0.8365, + 0.8205, + 0.765, + 0.8095, + 0.8035, + 0.7985, + 0.774, + 0.77, + 0.7605, + 0.738, + 0.75, + 0.739, + 0.731, + 0.7145, + 0.7115, + 0.6835, + 0.703, + 0.701, + 0.6735, + 0.6755, + 0.656, + 0.6585, + 0.6815, + 0.68, + 0.6655, + 0.6795, + 0.6795, + 0.675, + 0.665, + 0.665, + 0.659, + 0.6605, + 0.657, + 0.662, + 0.652, + 0.648, + 0.648, + 0.646, + 0.6455, + 0.6495, + 0.6455, + 0.646, + 0.6435, + 0.639, + 0.6315, + 0.6405, + 0.635, + 0.644, + 0.6405, + 0.637, + 0.6265, + 0.6335, + 0.6385, + 0.6355, + 0.631, + 0.637, + 0.635, + 0.6395, + 0.6365, + 0.639, + 0.6365, + 0.638, + 0.638 + ], + "value_loss": [ + 2.876306781387329, + 0.7856723394393921, + 0.5928473916530609, + 0.5013651826143265, + 0.44722279748916627, + 0.4374195610523224, + 0.4381609722137451, + 0.46451272745132444, + 0.5010983292698861, + 0.49245802602767946, + 0.5388860324859619, + 0.6111842860221863, + 0.5615375234603882, + 0.5658212431192398, + 0.6179779888391495, + 0.6809112598419189, + 0.6433888878822327, + 0.6772890575408935, + 0.7352884284079075, + 0.8157524694442749, + 0.9909413330078125, + 0.9366963150024414, + 0.9510981642961502, + 1.048841558933258, + 1.154732922744751, + 1.2454240258216858, + 1.4217876974105834, + 1.3324861633300782, + 1.383902477169037, + 1.4895198330879211, + 1.6056639788627625, + 1.427614409351349, + 1.3538882410049438, + 1.411731699848175, + 1.1238839833259582, + 1.2100854367256164, + 1.214574584853649, + 1.0777985618591308, + 1.1443535018444062, + 1.0253696113348008, + 0.919029998588562, + 0.8878245719909668, + 0.9744467445373535, + 0.824526634979248, + 0.8014205926895142, + 0.7634805387496948, + 0.7902832801818848, + 0.7393046459197998, + 0.7831286626815795, + 0.758888035583496, + 0.719997971534729, + 0.7418651414871216, + 0.7080020462989807, + 0.8019536107063293, + 0.7214265657424926, + 0.7120814613819122, + 0.717910733795166, + 0.7196631093978881, + 0.7238030241012573, + 0.7440049339294433, + 0.7167224275588989, + 0.6929942185401916, + 0.7202660966396331, + 0.6883848846435547, + 0.698680549621582, + 0.7095868293762208, + 0.6795802874088287, + 0.663805854511261, + 0.6624986004829406, + 0.6704760707855225, + 0.6755891981124877, + 0.7603735716819763, + 0.648806884264946, + 0.6449895093441009, + 0.6462680356025696, + 0.6254746982574463, + 0.6235096879005432, + 0.6025638544082642, + 0.6216146362304688, + 0.6248516966819763 + ], + "term_loss": [ + 1.639870400428772, + 0.3507210045337677, + 0.34477140822410585, + 0.29710007433891295, + 0.2601790674209595, + 0.25600365054607394, + 0.25877483711242677, + 0.29236667512655257, + 0.3331691867649555, + 0.3240827446460724, + 0.36899902091026304, + 0.4347284555196762, + 0.3967565870523453, + 0.39815111773014067, + 0.4507559413194656, + 0.5020932229995727, + 0.4743917005300522, + 0.5037893265724183, + 0.5480789810597897, + 0.6277814621925354, + 0.7829725056648255, + 0.7233813446044922, + 0.7467594781458378, + 0.8260618205308914, + 0.9186455319404602, + 1.0031881261825562, + 1.1540955222129823, + 1.0660843635559083, + 1.1143094442605972, + 1.2018714171886444, + 1.3037795733451842, + 1.1133485041618347, + 1.0332393661499024, + 1.0753915726184844, + 0.8136546610355377, + 0.8798294746398926, + 0.8744119406983256, + 0.7455172416687011, + 0.8011896505832672, + 0.6859100102216006, + 0.5815183532238006, + 0.5462483320474625, + 0.6176732580661773, + 0.4817309150695801, + 0.4554020172119141, + 0.4135750238418579, + 0.4313158232688904, + 0.39167013053894045, + 0.428555741071701, + 0.40601828079223634, + 0.3743584144592285, + 0.3892281187534332, + 0.3544705183029175, + 0.43724887987971306, + 0.35984939937591554, + 0.35236385194063186, + 0.3571020919799805, + 0.35568072917461396, + 0.361035050535202, + 0.3737378871917725, + 0.35216808892488477, + 0.32893878989219666, + 0.3490776247859001, + 0.32203044962882993, + 0.32965824136734007, + 0.33938146572113037, + 0.3120464255452156, + 0.30106174416542053, + 0.29664410429000854, + 0.30635549602508544, + 0.30906102600097657, + 0.375988377571106, + 0.29100386579036713, + 0.28118928681612015, + 0.2787789331912994, + 0.267332150387764, + 0.2657620764285326, + 0.2520246841192246, + 0.2673741018772125, + 0.2734043194293976 + ], + "bridge_loss": [ + 0.9365049929586589, + 0.13423291933834552, + 0.02359517429172993, + 0.009435658095777035, + 0.016151994919776917, + 0.019326301124691962, + 0.02228460746407509, + 0.017419311372935772, + 0.015196872821450233, + 0.015288333666324615, + 0.013569608584046364, + 0.013740351551026106, + 0.012244615394622087, + 0.012688239745795726, + 0.011124985119700432, + 0.012841972821950912, + 0.014346514343097807, + 0.015282003252208232, + 0.020628411626443268, + 0.01985876966714859, + 0.024889793342351915, + 0.03505476154237985, + 0.02604603983312845, + 0.03549123661220074, + 0.034647015199065205, + 0.037708253931999204, + 0.04363026385307312, + 0.04016457169055939, + 0.04331139268875122, + 0.041140395292639735, + 0.044560722640156744, + 0.049140659207105634, + 0.04577249918580055, + 0.04996752251982689, + 0.04400557230710983, + 0.048151988497376445, + 0.05200917733758688, + 0.04542869421243668, + 0.04608109139800072, + 0.046201552886515854, + 0.04489687628746033, + 0.04607596616744995, + 0.054255467438697816, + 0.049672819927334785, + 0.053708798533678055, + 0.053039796304702756, + 0.05734103150367737, + 0.051897763884067534, + 0.05335785975456238, + 0.05264690642356873, + 0.047083489751815796, + 0.05342354041486978, + 0.05028336017727852, + 0.05724046026468277, + 0.0501610916852951, + 0.05189191411733627, + 0.05292398271858692, + 0.053859466511011124, + 0.05355185590982437, + 0.054500432527065275, + 0.05102754718065262, + 0.052611512261629106, + 0.057694364416599274, + 0.05261626641750336, + 0.055332134974002835, + 0.05660939726829529, + 0.05285219025611877, + 0.05093574574589729, + 0.0517145704627037, + 0.05241333737373352, + 0.055536415910720824, + 0.07385429392457009, + 0.04720236387550831, + 0.05397108833789825, + 0.05832255332022905, + 0.04941890643239021, + 0.04918186986446381, + 0.04253149769902229, + 0.04644611543416977, + 0.04374015842676163 + ], + "tgrad_loss": [ + 0.2999313575744629, + 0.30071841287612916, + 0.2244808042049408, + 0.19482945413589478, + 0.17089173245429992, + 0.16208961111307144, + 0.15710153303146362, + 0.15472674567103387, + 0.15273226557970046, + 0.15308694994449615, + 0.15631739873886108, + 0.1627154801607132, + 0.15253631706237794, + 0.15498188679218292, + 0.15609705946445465, + 0.16597607221603394, + 0.154650675368309, + 0.15821772830486297, + 0.16658104096725584, + 0.1681122395515442, + 0.18307903990745544, + 0.17826021099090575, + 0.17829264632463454, + 0.18728849435448647, + 0.20144037680625915, + 0.20452762956619264, + 0.2240619119644165, + 0.22623722536563873, + 0.22628164014816285, + 0.24650802659988402, + 0.2573236642599106, + 0.26512524480819705, + 0.2748763925552368, + 0.28637262206077574, + 0.2662237548828125, + 0.2821039693832397, + 0.28815346791744234, + 0.2868526280403137, + 0.29708276128768923, + 0.2932580437421799, + 0.292614759683609, + 0.2955002767562866, + 0.3025180263757706, + 0.2931228996038437, + 0.29230977420806886, + 0.2968657133102417, + 0.30162642464637757, + 0.2957367503643036, + 0.30121506395339964, + 0.3002228458404541, + 0.2985560688495636, + 0.29921348223686217, + 0.3032481753349304, + 0.3074642710447311, + 0.3114160710811615, + 0.3078256957054138, + 0.30788465242385865, + 0.31012291219234467, + 0.30921611247062686, + 0.3157666190624237, + 0.31352679815292356, + 0.31144391264915466, + 0.31349411163330076, + 0.3137381648540497, + 0.31369017992019654, + 0.3135959681987762, + 0.3146816665649414, + 0.3118083592414856, + 0.31413992648124694, + 0.3117072313308716, + 0.3109917598247528, + 0.3105308976173401, + 0.3106006525039673, + 0.30982913246154786, + 0.30916655061244963, + 0.3087236411571503, + 0.3085657374978065, + 0.3080076750278473, + 0.3077944193840027, + 0.3077072183132172 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.09752383828163147, + 0.2814161777496338 + ], + "perturbation_rho": [ + 0.2172888070344925, + 0.46050792932510376 + ], + "nudging": { + "0.001": [ + -0.005947513971477747, + -0.0023629600182175636 + ], + "0.003": [ + -0.017743801698088646, + -0.007080004084855318 + ], + "0.01": [ + -0.05797416716814041, + -0.023506879806518555 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L2_s42.json b/results/synth_ladder_v2_lo/synth_a0.25_L2_s42.json new file mode 100644 index 0000000..08b20a6 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L2_s42.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.7909032949447632, + 0.8408651754379273, + 0.4797002552509308, + 0.3647427452087402, + 0.3124784866809845, + 0.2817441850662231, + 0.2590787395477295, + 0.25116723079681397, + 0.2374646141052246, + 0.22318382008075713, + 0.2223593633413315, + 0.1995730001926422, + 0.2196668884038925, + 0.19875684378147127, + 0.1934546858549118, + 0.18952004461288452, + 0.18683569231033326, + 0.19224771404266358, + 0.18635251063108443, + 0.16810201063156127, + 0.17770678448677063, + 0.17279608354568482, + 0.16727651731967927, + 0.1559371694803238, + 0.15815642802715302, + 0.14418157806396484, + 0.14997697926163672, + 0.1387534565925598, + 0.15129592059105634, + 0.13506835396289826, + 0.1424376358985901, + 0.1351928102493286, + 0.1380953494757414, + 0.12529992187023162, + 0.1325531720519066, + 0.1227368601322174, + 0.13023556920289994, + 0.12078996238708496, + 0.12364544925689697, + 0.11792606129646302, + 0.1153166356086731, + 0.11588856360912322, + 0.11642754650115966, + 0.11655678544044494, + 0.10944631642103195, + 0.10654066693782806, + 0.10285172426700592, + 0.10260429283976555, + 0.099968874502182, + 0.09773169926404952, + 0.097343274974823, + 0.09863903195858002, + 0.0987546160697937, + 0.0955238178730011, + 0.09478670574426651, + 0.09218684401512146, + 0.09407348573207855, + 0.09172552303671837, + 0.08920091514587403, + 0.08815436470508575, + 0.08759597380161285, + 0.0869701828956604, + 0.08645854530334472, + 0.08645270910263061, + 0.08507799062728882, + 0.08462890653610229, + 0.0839632087945938, + 0.08303676342964172, + 0.08232744481563568, + 0.08194958243370055, + 0.08150955953598023, + 0.08117919763922692, + 0.0808682661652565, + 0.08060784562826157, + 0.08038016645908355, + 0.08024281358420848, + 0.0800727246761322, + 0.07996719419956207, + 0.07990662084817886, + 0.07986213479042054 + ], + "train_acc": [ + 0.4015, + 0.7763, + 0.872, + 0.8957, + 0.9046, + 0.9098, + 0.9139, + 0.91, + 0.9202, + 0.92, + 0.9182, + 0.9316, + 0.9176, + 0.9279, + 0.9296, + 0.9311, + 0.9308, + 0.9279, + 0.9304, + 0.9406, + 0.9342, + 0.9348, + 0.9381, + 0.9455, + 0.9419, + 0.9511, + 0.9453, + 0.954, + 0.9456, + 0.9527, + 0.948, + 0.9541, + 0.9518, + 0.9601, + 0.9544, + 0.9613, + 0.9538, + 0.9586, + 0.9584, + 0.9612, + 0.962, + 0.9617, + 0.9613, + 0.9593, + 0.9645, + 0.9672, + 0.971, + 0.9708, + 0.9735, + 0.9739, + 0.9725, + 0.9731, + 0.9719, + 0.9745, + 0.9751, + 0.976, + 0.9732, + 0.9763, + 0.9781, + 0.9783, + 0.9781, + 0.9786, + 0.9791, + 0.9798, + 0.9821, + 0.9809, + 0.9808, + 0.9812, + 0.9818, + 0.9824, + 0.982, + 0.9824, + 0.9828, + 0.9828, + 0.9832, + 0.9836, + 0.9837, + 0.9836, + 0.9838, + 0.9838 + ], + "test_acc": [ + 0.6525, + 0.8175, + 0.8655, + 0.8835, + 0.8785, + 0.882, + 0.893, + 0.888, + 0.8855, + 0.8905, + 0.893, + 0.894, + 0.894, + 0.889, + 0.897, + 0.8985, + 0.8865, + 0.898, + 0.8935, + 0.897, + 0.8925, + 0.905, + 0.8995, + 0.9085, + 0.902, + 0.9065, + 0.9045, + 0.906, + 0.902, + 0.903, + 0.9015, + 0.9055, + 0.9075, + 0.9075, + 0.912, + 0.9065, + 0.9085, + 0.9065, + 0.9015, + 0.908, + 0.9045, + 0.9045, + 0.906, + 0.906, + 0.904, + 0.904, + 0.911, + 0.908, + 0.9085, + 0.9135, + 0.909, + 0.9075, + 0.9115, + 0.9135, + 0.917, + 0.914, + 0.91, + 0.9135, + 0.9105, + 0.91, + 0.911, + 0.908, + 0.9065, + 0.9075, + 0.908, + 0.909, + 0.907, + 0.907, + 0.9085, + 0.9095, + 0.9085, + 0.908, + 0.9075, + 0.9075, + 0.9085, + 0.9085, + 0.908, + 0.908, + 0.908, + 0.908 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9068200588226318, + 0.8893121480941772 + ], + "perturbation_rho": [ + 0.9999985098838806, + 0.9999943971633911 + ], + "nudging": { + "0.001": [ + -0.023899933323264122, + -0.008479279465973377 + ], + "0.003": [ + -0.0650826171040535, + -0.024595053866505623 + ], + "0.01": [ + -0.15680165588855743, + -0.07294036448001862 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.272149989128113, + 1.6072792436599732, + 0.9563953531265259, + 0.632236511516571, + 0.47902783765792845, + 0.4073201657772064, + 0.3671415810585022, + 0.35644190893173217, + 0.35256571426391603, + 0.3582359858751297, + 0.3660087926208973, + 0.36652003979682923, + 0.37060247931480406, + 0.3795734006881714, + 0.38890625929832456, + 0.3900839144229889, + 0.4118562028884888, + 0.4039736029624939, + 0.37663860700130464, + 0.37836415185928346, + 0.420570277929306, + 0.4127836347579956, + 0.41665606060028076, + 0.3981014615058899, + 0.400833323764801, + 0.41302710666656495, + 0.41561282229423524, + 0.3989115385055542, + 0.43917759885042906, + 0.39013743410110474, + 0.4253689344406128, + 0.40447203521728514, + 0.40794838209152223, + 0.4303056351661682, + 0.3982668053627014, + 0.3899207235336304, + 0.42121000814437864, + 0.4009185729980469, + 0.41895741519927976, + 0.41355561633110044, + 0.38559334030151365, + 0.39681776518821715, + 0.3590934567213058, + 0.37791539306640626, + 0.3702590451717377, + 0.37318263463974, + 0.3705978121757507, + 0.3725005265951157, + 0.34017645268440244, + 0.35172376317977905, + 0.35478726396560667, + 0.3520003671169281, + 0.3633641314744949, + 0.33544783420562746, + 0.3414689769744873, + 0.3352735348701477, + 0.344571617937088, + 0.32714939917325975, + 0.3172183589220047, + 0.3279861245632172, + 0.32109520440101624, + 0.316487836933136, + 0.31405309810638427, + 0.3157914097547531, + 0.30937249819040297, + 0.31022134857177736, + 0.31250496447086334, + 0.30788920271396636, + 0.3062834129333496, + 0.3069887036204338, + 0.3004336483001709, + 0.3017194701194763, + 0.29909859516620635, + 0.29890388836860654, + 0.2970484607696533, + 0.29831262575387957, + 0.29611629629135133, + 0.2954514974594116, + 0.2951315716266632, + 0.294859547996521 + ], + "train_acc": [ + 0.1683, + 0.4682, + 0.6752, + 0.7755, + 0.8224, + 0.8451, + 0.8605, + 0.8657, + 0.8635, + 0.8677, + 0.8698, + 0.8682, + 0.8697, + 0.8687, + 0.8672, + 0.87, + 0.865, + 0.8635, + 0.8739, + 0.8745, + 0.8605, + 0.8632, + 0.8674, + 0.8705, + 0.867, + 0.8662, + 0.8655, + 0.8703, + 0.8605, + 0.8701, + 0.8616, + 0.8678, + 0.8676, + 0.8661, + 0.8688, + 0.8706, + 0.8628, + 0.873, + 0.8626, + 0.8685, + 0.8731, + 0.8714, + 0.8803, + 0.8761, + 0.8799, + 0.8822, + 0.8754, + 0.8773, + 0.8849, + 0.883, + 0.8826, + 0.8826, + 0.8778, + 0.8878, + 0.8855, + 0.8878, + 0.882, + 0.885, + 0.8921, + 0.8867, + 0.8886, + 0.8925, + 0.8926, + 0.8922, + 0.8964, + 0.8934, + 0.8924, + 0.8942, + 0.8954, + 0.8958, + 0.898, + 0.8958, + 0.8981, + 0.898, + 0.8982, + 0.8972, + 0.8986, + 0.8991, + 0.8995, + 0.8986 + ], + "test_acc": [ + 0.3005, + 0.571, + 0.71, + 0.769, + 0.794, + 0.807, + 0.82, + 0.8205, + 0.8235, + 0.8205, + 0.8175, + 0.822, + 0.822, + 0.8075, + 0.8225, + 0.813, + 0.811, + 0.82, + 0.831, + 0.821, + 0.817, + 0.817, + 0.815, + 0.7975, + 0.8065, + 0.8205, + 0.826, + 0.7885, + 0.8195, + 0.792, + 0.8155, + 0.8325, + 0.809, + 0.826, + 0.8235, + 0.808, + 0.8195, + 0.8115, + 0.809, + 0.819, + 0.805, + 0.833, + 0.8255, + 0.824, + 0.8305, + 0.8195, + 0.806, + 0.8375, + 0.8325, + 0.8255, + 0.83, + 0.8185, + 0.836, + 0.832, + 0.8455, + 0.8335, + 0.8425, + 0.846, + 0.841, + 0.839, + 0.8405, + 0.843, + 0.8425, + 0.8405, + 0.8485, + 0.8445, + 0.8455, + 0.848, + 0.85, + 0.849, + 0.8445, + 0.8495, + 0.8475, + 0.843, + 0.8465, + 0.8485, + 0.846, + 0.8475, + 0.848, + 0.847 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.008382977917790413, + 0.06159647926688194 + ], + "perturbation_rho": [ + -0.022914212197065353, + 0.018335968255996704 + ], + "nudging": { + "0.001": [ + 0.0001649217592785135, + -0.00021235107851680368 + ], + "0.003": [ + 0.0006042401073500514, + -0.0006366041488945484 + ], + "0.01": [ + 0.0033093439415097237, + -0.002113340189680457 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.057672385406494, + 1.1166771314620971, + 0.6086244252204895, + 0.4245740672111511, + 0.36483576316833494, + 0.35679988889694214, + 0.3548254811286926, + 0.34793691511154173, + 0.3464306734323502, + 0.3435576392173767, + 0.34013770332932475, + 0.33322665920257566, + 0.33403541398048403, + 0.3319604155063629, + 0.3415149167060852, + 0.3399295929431915, + 0.3496535359382629, + 0.37121437792778017, + 0.362134037733078, + 0.38054348917007447, + 0.37667123994827273, + 0.36827400608062744, + 0.37283519170284274, + 0.3736583568572998, + 0.39922317066192625, + 0.38717319040298465, + 0.37632566776275633, + 0.39565731761455536, + 0.3784814638614655, + 0.3727163250207901, + 0.37778283381462097, + 0.36831437734365463, + 0.36310676040649414, + 0.4009634237289429, + 0.3620505106925964, + 0.3674455921173096, + 0.3772189566731453, + 0.3530207999229431, + 0.3573484922885895, + 0.3630984719753265, + 0.35662814855575564, + 0.37530835361480713, + 0.351890708065033, + 0.36676664543151855, + 0.3481761688232422, + 0.35212536692619323, + 0.34319338274002076, + 0.3521613523960114, + 0.337118542098999, + 0.3296779903411865, + 0.33185150694847104, + 0.3305467273712158, + 0.3442539291143417, + 0.33049997148513793, + 0.32896905941963195, + 0.327506383895874, + 0.3324374245882034, + 0.3221533220291138, + 0.3242107194542885, + 0.32271010704040526, + 0.318077142906189, + 0.3179136665344238, + 0.3174248493671417, + 0.3131567057132721, + 0.31502656025886533, + 0.31301859073638916, + 0.312909477519989, + 0.3118305783390999, + 0.31005851497650144, + 0.30886491203308103, + 0.3087408046722412, + 0.30726790990829467, + 0.3069364815831184, + 0.3057547236442566, + 0.3054956469535828, + 0.30528006699085236, + 0.30487773990631106, + 0.30455025148391723, + 0.304351772236824, + 0.30421765327453615 + ], + "train_acc": [ + 0.2627, + 0.6355, + 0.7918, + 0.8496, + 0.8661, + 0.8649, + 0.8652, + 0.8693, + 0.8681, + 0.8695, + 0.8729, + 0.8751, + 0.8734, + 0.8741, + 0.8698, + 0.8682, + 0.8684, + 0.8594, + 0.862, + 0.8585, + 0.8587, + 0.8606, + 0.8568, + 0.8597, + 0.8494, + 0.8553, + 0.8551, + 0.8509, + 0.8614, + 0.8609, + 0.861, + 0.8661, + 0.8636, + 0.8551, + 0.863, + 0.8613, + 0.859, + 0.8686, + 0.8678, + 0.8627, + 0.8657, + 0.8607, + 0.867, + 0.8651, + 0.8714, + 0.871, + 0.8732, + 0.8694, + 0.8748, + 0.8771, + 0.878, + 0.8747, + 0.8735, + 0.8772, + 0.8792, + 0.878, + 0.8762, + 0.8818, + 0.8768, + 0.8803, + 0.879, + 0.8811, + 0.8814, + 0.883, + 0.8825, + 0.8844, + 0.8823, + 0.8829, + 0.8866, + 0.8862, + 0.8846, + 0.8855, + 0.885, + 0.8869, + 0.8859, + 0.8861, + 0.8857, + 0.886, + 0.8862, + 0.8862 + ], + "test_acc": [ + 0.482, + 0.709, + 0.787, + 0.813, + 0.8285, + 0.8275, + 0.8345, + 0.826, + 0.826, + 0.8305, + 0.8215, + 0.819, + 0.8185, + 0.817, + 0.819, + 0.812, + 0.817, + 0.8125, + 0.8045, + 0.7905, + 0.7995, + 0.8055, + 0.801, + 0.8025, + 0.804, + 0.801, + 0.792, + 0.7925, + 0.807, + 0.798, + 0.7985, + 0.799, + 0.7915, + 0.8155, + 0.8095, + 0.804, + 0.811, + 0.814, + 0.803, + 0.8115, + 0.81, + 0.813, + 0.819, + 0.813, + 0.817, + 0.8165, + 0.8175, + 0.8245, + 0.82, + 0.814, + 0.8225, + 0.816, + 0.8245, + 0.817, + 0.8225, + 0.82, + 0.8225, + 0.826, + 0.823, + 0.823, + 0.8275, + 0.8235, + 0.8225, + 0.826, + 0.8255, + 0.827, + 0.8245, + 0.825, + 0.8255, + 0.8235, + 0.8245, + 0.826, + 0.8225, + 0.8265, + 0.8245, + 0.825, + 0.8255, + 0.827, + 0.827, + 0.827 + ], + "state_pred_error": [ + 0.7967377858638763, + 0.34598296966552733, + 0.2030195487499237, + 0.16683620121479034, + 0.15052817759513856, + 0.13117947192192078, + 0.10972135738134384, + 0.0900312513589859, + 0.07317366843223572, + 0.06010319168567657, + 0.04874778895378113, + 0.0407476614356041, + 0.03495406020283699, + 0.02987285739183426, + 0.026561988437175752, + 0.023144602596759795, + 0.021253752559423446, + 0.019422493594884873, + 0.017936924171447755, + 0.016594687747955323, + 0.015548654867708683, + 0.014461067456007004, + 0.013745320722460748, + 0.012979924492537976, + 0.01257009451687336, + 0.012221769727766514, + 0.011650261569023133, + 0.011007585345208645, + 0.010606600934267045, + 0.01016893789768219, + 0.00975934579372406, + 0.009299210277199745, + 0.009092474126815795, + 0.008728945380449295, + 0.008686305114626884, + 0.008494052711874247, + 0.007941164903342724, + 0.007641752201318741, + 0.007414149653911591, + 0.007252850785851478, + 0.007086898298561573, + 0.006903395959734917, + 0.0067314132377505305, + 0.006647216567397117, + 0.006545945912599564, + 0.006497067116945982, + 0.006256709571182728, + 0.006150986460596323, + 0.005971997079998255, + 0.005811705444008112, + 0.005608313149213791, + 0.005580492584407329, + 0.005637438614666462, + 0.005647444573789835, + 0.005466383482515812, + 0.005266562070697546, + 0.005138493876159191, + 0.00498729590177536, + 0.004910858514904976, + 0.004862993755191564, + 0.004731716811656952, + 0.0047377496108412746, + 0.0047596204489469525, + 0.004541794133931398, + 0.00446272025257349, + 0.004423295229673386, + 0.00430677450299263, + 0.0043451601408422, + 0.004428337071090937, + 0.004295985059812665, + 0.0042147732827812435, + 0.0040082332260906696, + 0.0041201773762702945, + 0.003969736605882645, + 0.00395717710107565, + 0.004493858044967055, + 0.003766924513503909, + 0.0037810308314859867, + 0.0038307637006044387, + 0.0036542431749403475 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9188902378082275, + 0.4362110495567322 + ], + "perturbation_rho": [ + 0.8401009440422058, + 0.41428011655807495 + ], + "nudging": { + "0.001": [ + -0.027256522327661514, + -0.0028760721907019615 + ], + "0.003": [ + -0.07801611721515656, + -0.008582176640629768 + ], + "0.01": [ + -0.21947401762008667, + -0.02806854248046875 + ] + }, + "state_pred_error_per_layer": [ + 753.1610107421875, + 333.87890625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2717817337036132, + 1.6044951431274415, + 0.9575855054855347, + 0.6274385880470276, + 0.479679812002182, + 0.4025820679664612, + 0.3722260438919067, + 0.35356286239624024, + 0.35820354251861575, + 0.37495428252220153, + 0.3565654326915741, + 0.3734219524860382, + 0.3754354688644409, + 0.39081022024154666, + 0.37834826040267944, + 0.4085339098930359, + 0.3934634296178818, + 0.40792312593460084, + 0.41530650129318236, + 0.45324366564750673, + 0.4508738428592682, + 0.5132140514850616, + 0.5059539035320282, + 0.5738642817497254, + 0.5628011140346527, + 0.5786454545974732, + 0.6376582353115082, + 0.6003107436180115, + 0.6011718498229981, + 0.6524772605895997, + 0.6472935548782348, + 0.6307102481842041, + 0.6182636840820313, + 0.63121531457901, + 0.6926726831436157, + 0.6685154367446899, + 0.7257110968589783, + 0.6795891889095307, + 0.6769815434455871, + 0.7017775566101074, + 0.7776780778884888, + 0.7102687572002411, + 0.7532470722198487, + 0.7802075752258301, + 0.7946839473724365, + 0.7761624695301056, + 0.8113742619514466, + 0.8059718873977662, + 0.8183923157691956, + 0.8154451040267945, + 0.8366338520050048, + 0.842187615776062, + 0.8577603224754333, + 0.8479723624229432, + 0.8778535093307495, + 0.876348822593689, + 0.8831672384738922, + 0.8729063333511352, + 0.8774579629898072, + 0.9124985290527343, + 0.8993189775466919, + 0.9178578794002533, + 0.9149423480987549, + 0.9265102993011475, + 0.9319318475723266, + 0.937051300239563, + 0.9444302869796752, + 0.9413692620277405, + 0.9406136125564575, + 0.9456098251342774, + 0.9459423446655273, + 0.9455011163711547, + 0.9455199542999267, + 0.9456782765388488, + 0.9462723201751709, + 0.9461660702705383, + 0.9455078218698502, + 0.9445678804397583, + 0.9438195475578308, + 0.943692198753357 + ], + "train_acc": [ + 0.1685, + 0.4663, + 0.6767, + 0.7776, + 0.8201, + 0.8482, + 0.8584, + 0.864, + 0.8674, + 0.8645, + 0.8725, + 0.8674, + 0.8708, + 0.8656, + 0.872, + 0.866, + 0.8661, + 0.8626, + 0.8645, + 0.8503, + 0.8526, + 0.8318, + 0.8337, + 0.8206, + 0.818, + 0.8111, + 0.7946, + 0.8, + 0.7977, + 0.7791, + 0.7799, + 0.782, + 0.7861, + 0.7743, + 0.7594, + 0.7633, + 0.746, + 0.7597, + 0.7585, + 0.7534, + 0.7343, + 0.7503, + 0.7375, + 0.734, + 0.7335, + 0.7346, + 0.7281, + 0.7262, + 0.7197, + 0.7231, + 0.7196, + 0.7156, + 0.7134, + 0.7144, + 0.7037, + 0.7092, + 0.7075, + 0.7085, + 0.7071, + 0.6968, + 0.6984, + 0.697, + 0.7003, + 0.6966, + 0.6967, + 0.6967, + 0.6951, + 0.6947, + 0.6952, + 0.6924, + 0.6928, + 0.693, + 0.6911, + 0.6925, + 0.6939, + 0.6929, + 0.6941, + 0.6926, + 0.6936, + 0.6938 + ], + "test_acc": [ + 0.3075, + 0.577, + 0.7165, + 0.765, + 0.805, + 0.806, + 0.825, + 0.822, + 0.816, + 0.816, + 0.812, + 0.8185, + 0.819, + 0.8245, + 0.822, + 0.8215, + 0.802, + 0.8235, + 0.8035, + 0.801, + 0.773, + 0.767, + 0.7385, + 0.763, + 0.775, + 0.731, + 0.745, + 0.738, + 0.7035, + 0.708, + 0.7235, + 0.6945, + 0.7005, + 0.694, + 0.699, + 0.7045, + 0.7055, + 0.704, + 0.6985, + 0.6615, + 0.7085, + 0.695, + 0.6765, + 0.6655, + 0.6895, + 0.6725, + 0.6775, + 0.6455, + 0.671, + 0.667, + 0.664, + 0.6685, + 0.6715, + 0.6655, + 0.662, + 0.657, + 0.657, + 0.6665, + 0.6665, + 0.6635, + 0.6485, + 0.663, + 0.6535, + 0.6595, + 0.6515, + 0.65, + 0.6535, + 0.6525, + 0.647, + 0.6465, + 0.6475, + 0.6505, + 0.648, + 0.6445, + 0.648, + 0.6455, + 0.645, + 0.6455, + 0.645, + 0.6455 + ], + "value_loss": [ + 2.9139820795059204, + 0.7781319219589233, + 0.6261702270507813, + 0.5631922412395477, + 0.5089643202781677, + 0.47773351917266843, + 0.49251684589385986, + 0.5094742440223694, + 0.5250778325080872, + 0.5757163972377777, + 0.5253688870429992, + 0.5867766951560974, + 0.5887034587860107, + 0.6342814973831177, + 0.6224288850784302, + 0.7040738446712493, + 0.6622943760871888, + 0.6909106607675553, + 0.6861579052448272, + 0.8070016531944275, + 0.7657489172935485, + 0.8981747324943542, + 0.8311526319503785, + 1.0680026486992835, + 0.9285434822559356, + 0.8835838872909546, + 0.9766024167537689, + 0.8232256447792053, + 0.7960768020629883, + 0.7652815974235535, + 0.7177574991226197, + 0.6208152499198913, + 0.5670896316051484, + 0.521339186668396, + 0.6030832626342774, + 0.5279540919303894, + 0.6378763611793518, + 0.4802740800619125, + 0.4685490375518799, + 0.46527220191955565, + 0.5925926671981812, + 0.4850484214305878, + 0.5189880228042603, + 0.5404599063873291, + 0.5865764006614685, + 0.5419052541732788, + 0.5603141060113906, + 0.559055899143219, + 0.6549916872501373, + 0.5873499877929688, + 0.5730865565299987, + 0.5765046960830689, + 0.6072168838500976, + 0.6075364608764648, + 0.6144091351985932, + 0.6132542675971985, + 0.6039235576629639, + 0.602211035656929, + 0.5848144401550293, + 0.6547185651779175, + 0.6224689907073975, + 0.6558543173074722, + 0.6365399208068848, + 0.6299452920913696, + 0.6250463237762451, + 0.6158743118286133, + 0.6338640846252441, + 0.6420701734542846, + 0.6022836451530457, + 0.6110358497619629, + 0.6228030502319336, + 0.6002978692770005, + 0.6006025218963623, + 0.6115713768005371, + 0.6018096000671387, + 0.6287955265522003, + 0.5901965017795563, + 0.5782727504730225, + 0.5828642177581788, + 0.5630231554031372 + ], + "term_loss": [ + 1.675116873073578, + 0.34430024371147155, + 0.3699357802391052, + 0.3608538656949997, + 0.32141098375320437, + 0.296013809967041, + 0.3145594831466675, + 0.3366319574356079, + 0.35779941773414614, + 0.41367546219825746, + 0.3742054052591324, + 0.4305104339599609, + 0.4350124341964722, + 0.47471349573135374, + 0.4695607521057129, + 0.5416271431207657, + 0.50037581397295, + 0.5279187945127487, + 0.5226932208895684, + 0.6252485764980316, + 0.5859362184286118, + 0.6939002041339875, + 0.634807921075821, + 0.8540068101286888, + 0.7134227627754212, + 0.6600253582000732, + 0.7331792865395546, + 0.5853852001190185, + 0.5587812387466431, + 0.5075105863571167, + 0.464410977602005, + 0.37542237077355384, + 0.3169003723859787, + 0.2732926230430603, + 0.3423420313835144, + 0.2687295290231705, + 0.35581202269792556, + 0.22913563103079795, + 0.21938599632382394, + 0.2144745792388916, + 0.31799187030792236, + 0.2320458871483803, + 0.2544168309211731, + 0.2703706371307373, + 0.3117321794748306, + 0.2738133100509644, + 0.27934123712182046, + 0.2817279294967651, + 0.3692713690519333, + 0.30682048025131226, + 0.2853371166229248, + 0.28265748102664945, + 0.30581441168785095, + 0.30762661685943604, + 0.30526128548383713, + 0.305000597679615, + 0.29075743298530576, + 0.29170473134592173, + 0.27489340591430667, + 0.32806511583328246, + 0.3060114824295044, + 0.3312658293545246, + 0.31389011993408206, + 0.3109654490470886, + 0.303177494096756, + 0.29685306973457337, + 0.311812850189209, + 0.31457807751893996, + 0.2882286059886217, + 0.2872561911582947, + 0.3006808135509491, + 0.2861353112459183, + 0.2760439012527466, + 0.29094672749638556, + 0.2810854609966278, + 0.3063315445184708, + 0.2749019814029336, + 0.2580472655415535, + 0.2624768678069115, + 0.2533654543399811 + ], + "bridge_loss": [ + 0.9121190248202939, + 0.12368383026123046, + 0.02325579553693533, + 0.00638287930637598, + 0.015633951807022095, + 0.0267038604259491, + 0.029089016681909562, + 0.03015945321023464, + 0.022946262511610985, + 0.01605847358852625, + 0.011836738139390946, + 0.013218694264441729, + 0.01344587414264679, + 0.01692773981690407, + 0.015606502836942673, + 0.017554944163560866, + 0.02013770264238119, + 0.01981841846704483, + 0.018635487586259842, + 0.026470916414260866, + 0.026284595650434495, + 0.029653245022892953, + 0.02730709999203682, + 0.02978192163705826, + 0.031069664573669435, + 0.03410405703783035, + 0.038268526667356494, + 0.040036833453178405, + 0.03885038551688194, + 0.04320903084874153, + 0.041191232109069824, + 0.036969611018896106, + 0.043973470589518546, + 0.03558493182659149, + 0.033664032626152036, + 0.036646516934037206, + 0.044948402404785155, + 0.026731023278832436, + 0.024752013075351714, + 0.02128150890469551, + 0.02616920839548111, + 0.021055375733971596, + 0.02227571759223938, + 0.022238678365945817, + 0.02414751509428024, + 0.021202504792809485, + 0.025903358660638334, + 0.02438402145802975, + 0.029620986983180046, + 0.026105598723888398, + 0.027550537937879562, + 0.03267939478158951, + 0.03767158226370811, + 0.038392514300346375, + 0.04036871939897537, + 0.04241352363824844, + 0.04498921741694212, + 0.04509584439694882, + 0.042803814631700514, + 0.05169626851081848, + 0.0450944231569767, + 0.04986252784132957, + 0.04847792634963989, + 0.04344110252559185, + 0.04525724016427994, + 0.04157515670657158, + 0.042778206980228425, + 0.04924657067060471, + 0.03752178891897202, + 0.04514836919307709, + 0.04305028664469719, + 0.035792450475692746, + 0.04672777749300003, + 0.042780098879337314, + 0.0434021101474762, + 0.044323261296749114, + 0.03760044357031584, + 0.04323315477967262, + 0.04370184513926506, + 0.03314736911058426 + ], + "tgrad_loss": [ + 0.3267462004184723, + 0.31014784474372864, + 0.23297864780426025, + 0.19595549144744873, + 0.1719193906068802, + 0.15501584944725036, + 0.14886834893226625, + 0.14268282673358917, + 0.14433215198516847, + 0.14598246383666993, + 0.1393267445087433, + 0.14304756488204, + 0.140245152425766, + 0.14264026589393616, + 0.13726163320541382, + 0.1448917584180832, + 0.141780867344141, + 0.14317344819307326, + 0.14482919363975524, + 0.15528216607570647, + 0.15352810034751893, + 0.17462128348350525, + 0.16903761179447174, + 0.18421390730142592, + 0.184051059871912, + 0.1894544795513153, + 0.20515460292696952, + 0.19780361485481263, + 0.19844518136978148, + 0.21456197862625123, + 0.21215528469085693, + 0.20842326607704162, + 0.20621578772068025, + 0.2124616316318512, + 0.22707719662189485, + 0.22257804441452025, + 0.23711593326330185, + 0.22440742473006248, + 0.22441103448867797, + 0.2295161123752594, + 0.24843158135414123, + 0.23194715747833253, + 0.24229546999931337, + 0.24785059971809387, + 0.25069670701026914, + 0.24688943903446198, + 0.25506951308250425, + 0.25294395008087156, + 0.2560993363618851, + 0.2544239068031311, + 0.26019890108108523, + 0.26116782383918763, + 0.26373088693618774, + 0.2615173279285431, + 0.2687791325092316, + 0.2658401421546936, + 0.26817690315246584, + 0.26541045472621916, + 0.26711721820831297, + 0.2749571761608124, + 0.2713630847454071, + 0.2747259566783905, + 0.2741718715667725, + 0.27553872985839845, + 0.2766115864753723, + 0.2774460829734802, + 0.27927302808761595, + 0.2782455343008041, + 0.27653324790000916, + 0.27863129014968874, + 0.2790719511032104, + 0.27837010283470154, + 0.2778308403968811, + 0.27784455041885375, + 0.27732203030586244, + 0.27814072003364565, + 0.27769407304525373, + 0.2769923341035843, + 0.27668550889492033, + 0.27651033034324646 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.07500731945037842, + 0.23077097535133362 + ], + "perturbation_rho": [ + 0.12894567847251892, + 0.37924277782440186 + ], + "nudging": { + "0.001": [ + -0.005560865625739098, + -0.0021081208251416683 + ], + "0.003": [ + -0.01659420132637024, + -0.006318465806543827 + ], + "0.01": [ + -0.05425257235765457, + -0.020995579659938812 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L2_s456.json b/results/synth_ladder_v2_lo/synth_a0.25_L2_s456.json new file mode 100644 index 0000000..57e685b --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L2_s456.json @@ -0,0 +1,1512 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.8000983072280883, + 0.8553262281417847, + 0.4930526713371277, + 0.3784203895568848, + 0.3197663818836212, + 0.29053169984817506, + 0.26875064196586607, + 0.25987493658065797, + 0.23892381181716918, + 0.22869952754974365, + 0.22458118422031403, + 0.21209806804656983, + 0.20757287468910218, + 0.19907629506587982, + 0.20321457154750824, + 0.18708656415939331, + 0.17637303404808044, + 0.1847076560974121, + 0.17682335205078126, + 0.187822900390625, + 0.18293290028572082, + 0.18654212374687196, + 0.17292806282043457, + 0.18349194377660752, + 0.1571652352333069, + 0.16827380738258363, + 0.15997591190338134, + 0.1580581651687622, + 0.14601466226577758, + 0.14226590123176575, + 0.14564169149398803, + 0.15921205137968064, + 0.13405996446609497, + 0.13091181358098983, + 0.12752190665006638, + 0.12275864148139953, + 0.1250006089925766, + 0.11982801494598389, + 0.12906549286842345, + 0.12449447993934154, + 0.11429075312614441, + 0.1164977291584015, + 0.11286599822044373, + 0.10972460707426071, + 0.10615357451438903, + 0.10912412519454956, + 0.1058990234375, + 0.10500219140052795, + 0.10486637511253356, + 0.10353950891494751, + 0.09869744987487793, + 0.09981467643976212, + 0.09713814241886139, + 0.09420502263009548, + 0.09280058851242065, + 0.0938924689769745, + 0.0941491194486618, + 0.09126792776584625, + 0.08973681110143661, + 0.08885353000164031, + 0.08794978060722351, + 0.08694391140937806, + 0.08604433858394622, + 0.0855510621547699, + 0.08556988172531128, + 0.08505082764625549, + 0.08439020845592021, + 0.08360161371231078, + 0.08313429535627365, + 0.08274500939846038, + 0.08240846571028232, + 0.08203878502845764, + 0.08169064269661903, + 0.08140706999301911, + 0.0811797592163086, + 0.08097635807991029, + 0.08089512157440186, + 0.08077903534770012, + 0.08070964171886444, + 0.08066833609938621 + ], + "train_acc": [ + 0.3997, + 0.7677, + 0.8688, + 0.8872, + 0.8985, + 0.9015, + 0.9094, + 0.9081, + 0.9159, + 0.9185, + 0.9183, + 0.9231, + 0.9244, + 0.9284, + 0.9244, + 0.9341, + 0.9376, + 0.932, + 0.9358, + 0.9307, + 0.9297, + 0.9255, + 0.9352, + 0.9308, + 0.9436, + 0.9367, + 0.9393, + 0.9413, + 0.9498, + 0.9492, + 0.9497, + 0.9404, + 0.9532, + 0.9557, + 0.9587, + 0.962, + 0.9591, + 0.9608, + 0.9572, + 0.9563, + 0.9638, + 0.9611, + 0.9661, + 0.9671, + 0.9679, + 0.9665, + 0.9689, + 0.9706, + 0.9675, + 0.9704, + 0.9741, + 0.9719, + 0.9733, + 0.9754, + 0.9772, + 0.9747, + 0.9759, + 0.9778, + 0.9787, + 0.9779, + 0.9799, + 0.9802, + 0.981, + 0.9812, + 0.9805, + 0.9816, + 0.9819, + 0.9817, + 0.9821, + 0.9823, + 0.9822, + 0.9832, + 0.9832, + 0.9834, + 0.9835, + 0.9838, + 0.9832, + 0.9833, + 0.9833, + 0.9833 + ], + "test_acc": [ + 0.658, + 0.831, + 0.867, + 0.8755, + 0.878, + 0.875, + 0.885, + 0.886, + 0.8885, + 0.8915, + 0.8895, + 0.886, + 0.8885, + 0.8965, + 0.8935, + 0.887, + 0.9, + 0.898, + 0.902, + 0.8875, + 0.8975, + 0.894, + 0.8955, + 0.894, + 0.904, + 0.9, + 0.8975, + 0.896, + 0.9055, + 0.903, + 0.8995, + 0.9035, + 0.9055, + 0.8975, + 0.905, + 0.9045, + 0.903, + 0.908, + 0.9045, + 0.9115, + 0.9075, + 0.906, + 0.91, + 0.912, + 0.9145, + 0.909, + 0.9145, + 0.915, + 0.914, + 0.9095, + 0.913, + 0.909, + 0.912, + 0.915, + 0.9135, + 0.912, + 0.9125, + 0.915, + 0.9125, + 0.916, + 0.9135, + 0.912, + 0.9135, + 0.9145, + 0.914, + 0.913, + 0.914, + 0.9135, + 0.9125, + 0.9125, + 0.912, + 0.912, + 0.9135, + 0.913, + 0.913, + 0.9135, + 0.914, + 0.914, + 0.914, + 0.914 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8855119943618774, + 0.8700143098831177 + ], + "perturbation_rho": [ + 0.9999988079071045, + 0.9999958276748657 + ], + "nudging": { + "0.001": [ + -0.025924552232027054, + -0.009314566850662231 + ], + "0.003": [ + -0.06999024748802185, + -0.026958726346492767 + ], + "0.01": [ + -0.16111940145492554, + -0.07906024903059006 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.283660962677002, + 1.585267567062378, + 0.9385803462982177, + 0.6367190747261048, + 0.49448280506134035, + 0.4259012367725372, + 0.39124873666763305, + 0.38015281138420104, + 0.37522998003959657, + 0.3701688726902008, + 0.37803883278369904, + 0.39746112833023073, + 0.3802763431549072, + 0.3912481979370117, + 0.4047987679004669, + 0.4151992503881454, + 0.4170101192951202, + 0.42453424332141876, + 0.4173937663078308, + 0.43686163773536685, + 0.42365531826019287, + 0.42363426294326784, + 0.4208437828063965, + 0.4529822621464729, + 0.4070855083465576, + 0.4689378917694092, + 0.4634589358329773, + 0.4367367925167084, + 0.4250321800231934, + 0.4287016040802002, + 0.4584434572219849, + 0.44194866588115694, + 0.4174223184347153, + 0.44547443580627444, + 0.46664287486076356, + 0.4065489921808243, + 0.4331810564517975, + 0.42899156646728515, + 0.5209377204418182, + 0.4371390515804291, + 0.4179263119697571, + 0.40993842480182646, + 0.4559203372001648, + 0.40942260138988495, + 0.3948855718612671, + 0.4338044833183289, + 0.4061251772403717, + 0.4279718475818634, + 0.4087572427749634, + 0.4140715950973332, + 0.38019427223205565, + 0.4078751751422882, + 0.383210799074173, + 0.38765000307559966, + 0.37216824359893796, + 0.41562538146972655, + 0.382677834546566, + 0.3672296663284302, + 0.3730851769924164, + 0.3590498920440674, + 0.36640932368040086, + 0.35998264112472533, + 0.36020482025146483, + 0.35171630606651305, + 0.35406614532470704, + 0.35089321160316467, + 0.3469816573232412, + 0.34033540658950806, + 0.3445661533117294, + 0.34326147508621213, + 0.3389697380542755, + 0.3388423357963562, + 0.33665650494098665, + 0.33594908571243287, + 0.33628645095825194, + 0.3349286338806152, + 0.3339044927597046, + 0.3329299204826355, + 0.33245518345832825, + 0.3322625407218933 + ], + "train_acc": [ + 0.1556, + 0.4765, + 0.6797, + 0.7739, + 0.8177, + 0.8382, + 0.8504, + 0.8549, + 0.8578, + 0.8611, + 0.8564, + 0.8512, + 0.863, + 0.8611, + 0.8578, + 0.8551, + 0.8564, + 0.8549, + 0.8564, + 0.8552, + 0.8586, + 0.8599, + 0.8615, + 0.8542, + 0.861, + 0.8548, + 0.8554, + 0.8602, + 0.8653, + 0.8605, + 0.8558, + 0.8606, + 0.865, + 0.8578, + 0.8578, + 0.8691, + 0.8625, + 0.8631, + 0.8471, + 0.8608, + 0.8684, + 0.8681, + 0.8555, + 0.871, + 0.8725, + 0.8647, + 0.8679, + 0.8651, + 0.8667, + 0.8681, + 0.8756, + 0.867, + 0.8762, + 0.8754, + 0.8796, + 0.8686, + 0.8744, + 0.8788, + 0.878, + 0.8809, + 0.8807, + 0.8805, + 0.8801, + 0.8841, + 0.8834, + 0.8841, + 0.8849, + 0.8869, + 0.886, + 0.8853, + 0.8881, + 0.8862, + 0.8874, + 0.8873, + 0.8878, + 0.8885, + 0.8897, + 0.8895, + 0.8893, + 0.8889 + ], + "test_acc": [ + 0.3075, + 0.5895, + 0.7175, + 0.763, + 0.794, + 0.803, + 0.8195, + 0.8175, + 0.814, + 0.8145, + 0.8165, + 0.8235, + 0.8225, + 0.8215, + 0.815, + 0.8135, + 0.8255, + 0.817, + 0.817, + 0.8195, + 0.8075, + 0.8145, + 0.817, + 0.824, + 0.7985, + 0.8095, + 0.8085, + 0.819, + 0.8165, + 0.814, + 0.826, + 0.821, + 0.828, + 0.8205, + 0.829, + 0.8335, + 0.82, + 0.824, + 0.8205, + 0.8235, + 0.8255, + 0.8195, + 0.832, + 0.8435, + 0.8155, + 0.8275, + 0.827, + 0.8165, + 0.8215, + 0.833, + 0.83, + 0.8285, + 0.8345, + 0.827, + 0.8315, + 0.836, + 0.8335, + 0.8405, + 0.8355, + 0.836, + 0.8375, + 0.838, + 0.8395, + 0.836, + 0.841, + 0.8405, + 0.838, + 0.836, + 0.8385, + 0.8395, + 0.8355, + 0.839, + 0.841, + 0.838, + 0.841, + 0.8415, + 0.8415, + 0.842, + 0.842, + 0.842 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.015632983297109604, + 0.08371198177337646 + ], + "perturbation_rho": [ + -0.06864285469055176, + 0.1325663924217224 + ], + "nudging": { + "0.001": [ + -0.000759319169446826, + -0.0003429622738622129 + ], + "0.003": [ + -0.002224094932898879, + -0.0010281240101903677 + ], + "0.01": [ + -0.006782663054764271, + -0.003414375241845846 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 2.0607079202651977, + 1.1337099237442017, + 0.647877628993988, + 0.4504327066421509, + 0.3940727692604065, + 0.3723359739303589, + 0.3689178777933121, + 0.3625231744766235, + 0.35998505368232725, + 0.35867741174697876, + 0.3579361547470093, + 0.35106793417930604, + 0.34446446766853334, + 0.3474297195911408, + 0.3416134696006775, + 0.345831178188324, + 0.3566520956993103, + 0.36237930603027346, + 0.3771623134613037, + 0.3816791586399078, + 0.39025780296325685, + 0.3933836591720581, + 0.4161139528751373, + 0.4057706892967224, + 0.3918828906059265, + 0.3976308813095093, + 0.3874743386268616, + 0.38788036189079284, + 0.3851133870601654, + 0.3756926311016083, + 0.3775329941749573, + 0.3970633387565613, + 0.4137820346355438, + 0.3905292279243469, + 0.40476176710128786, + 0.41149664545059206, + 0.4037230536460876, + 0.44066204071044923, + 0.41780310134887694, + 0.4295464913368225, + 0.42649631886482237, + 0.4284087491989136, + 0.4360576012611389, + 0.44457482340335847, + 0.4401917548656464, + 0.43505805568695066, + 0.44327515368461606, + 0.4325465172767639, + 0.43232013721466067, + 0.4275367980480194, + 0.427516703081131, + 0.4204970709323883, + 0.41822126712799074, + 0.4155596286773682, + 0.4231887112617493, + 0.4155136170387268, + 0.40704256649017334, + 0.40344800395965574, + 0.40768413548469545, + 0.4017280409812927, + 0.3982292408466339, + 0.39725692327022555, + 0.39136295738220217, + 0.3908126180648804, + 0.39189315357208254, + 0.3870381077766418, + 0.3879516251564026, + 0.3833280053138733, + 0.38215707620978356, + 0.3819090251922607, + 0.37943741810321807, + 0.3780518521785736, + 0.3775427331447601, + 0.37716020322442056, + 0.3760606771469116, + 0.37568101379871366, + 0.37528624348640444, + 0.3750066729545593, + 0.37472169427871704, + 0.37465501019954683 + ], + "train_acc": [ + 0.2642, + 0.6184, + 0.7763, + 0.8422, + 0.8529, + 0.8584, + 0.8561, + 0.8627, + 0.8625, + 0.8624, + 0.866, + 0.8646, + 0.8708, + 0.8681, + 0.8686, + 0.8658, + 0.8625, + 0.861, + 0.8542, + 0.8492, + 0.8519, + 0.849, + 0.8451, + 0.849, + 0.8487, + 0.8491, + 0.8527, + 0.853, + 0.8523, + 0.8552, + 0.8557, + 0.8487, + 0.8438, + 0.854, + 0.8489, + 0.849, + 0.8503, + 0.8455, + 0.8514, + 0.8453, + 0.8493, + 0.8484, + 0.8465, + 0.8434, + 0.8478, + 0.8538, + 0.8475, + 0.8494, + 0.8548, + 0.8534, + 0.8525, + 0.8562, + 0.8564, + 0.8563, + 0.8544, + 0.8563, + 0.8584, + 0.8601, + 0.8585, + 0.8604, + 0.8637, + 0.8612, + 0.8637, + 0.8637, + 0.8626, + 0.8657, + 0.8646, + 0.8662, + 0.8666, + 0.8676, + 0.8676, + 0.868, + 0.8692, + 0.8698, + 0.8692, + 0.8703, + 0.8696, + 0.8702, + 0.8703, + 0.87 + ], + "test_acc": [ + 0.514, + 0.7025, + 0.788, + 0.8215, + 0.826, + 0.8235, + 0.8205, + 0.824, + 0.824, + 0.8265, + 0.8285, + 0.8265, + 0.8315, + 0.832, + 0.8335, + 0.8255, + 0.8315, + 0.822, + 0.808, + 0.8155, + 0.8105, + 0.818, + 0.818, + 0.813, + 0.808, + 0.8085, + 0.813, + 0.811, + 0.811, + 0.81, + 0.8165, + 0.794, + 0.803, + 0.8115, + 0.7995, + 0.82, + 0.81, + 0.8005, + 0.798, + 0.806, + 0.806, + 0.815, + 0.809, + 0.806, + 0.807, + 0.8095, + 0.813, + 0.809, + 0.804, + 0.811, + 0.8095, + 0.804, + 0.8075, + 0.8085, + 0.8125, + 0.8055, + 0.8125, + 0.8085, + 0.812, + 0.8135, + 0.809, + 0.815, + 0.8085, + 0.8145, + 0.814, + 0.8155, + 0.816, + 0.8175, + 0.814, + 0.8135, + 0.817, + 0.8155, + 0.8155, + 0.8155, + 0.817, + 0.8175, + 0.8175, + 0.8175, + 0.817, + 0.817 + ], + "state_pred_error": [ + 0.7975846492767334, + 0.34740002810955045, + 0.20626533489227294, + 0.1688566227912903, + 0.14969556045532226, + 0.12686697702407837, + 0.10258943965435029, + 0.08248359158039092, + 0.06579203307628631, + 0.05322268953919411, + 0.043497616136074065, + 0.03624378236830234, + 0.03155959424376488, + 0.027837770199775697, + 0.025018838441371916, + 0.02305573586821556, + 0.021030399315059185, + 0.01895637398958206, + 0.01772472830414772, + 0.01661195346415043, + 0.01626126909852028, + 0.014910457614064216, + 0.014206837660074235, + 0.013685992537438869, + 0.012581391307711602, + 0.011982576858997345, + 0.011717106333374977, + 0.010968378871679306, + 0.010795737752318383, + 0.010089151945710181, + 0.009628403913974761, + 0.009443067149817944, + 0.00910616643279791, + 0.008941967545449734, + 0.00865904248803854, + 0.008406908518075943, + 0.008553840538859367, + 0.00796011516302824, + 0.007852698883414269, + 0.007530789855122566, + 0.007451776137948036, + 0.007600892862677574, + 0.007261194361746311, + 0.0070939825333654885, + 0.006930866247415543, + 0.0068556764483451845, + 0.0068909044548869135, + 0.006718636322021484, + 0.006451771011948586, + 0.0070287389852106575, + 0.006461447269469499, + 0.006300677789747715, + 0.006042939915508032, + 0.005973925769329071, + 0.005834758894145488, + 0.005728140544891357, + 0.005655132710933685, + 0.005581422328203916, + 0.005619841815531254, + 0.005785556498169899, + 0.005324072232097387, + 0.005209432889521122, + 0.005334047742933035, + 0.0049825638897717, + 0.004983069800212979, + 0.005002294857800007, + 0.004794969267398119, + 0.005065754823386669, + 0.004756338292360306, + 0.004534189984947443, + 0.004653947391360998, + 0.004516961539536715, + 0.004383903432264924, + 0.004468173056840896, + 0.004392227964103222, + 0.004369974558800459, + 0.00410505149140954, + 0.00409513374119997, + 0.004069356556236744, + 0.004237433210760355 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9367842674255371, + 0.5052818059921265 + ], + "perturbation_rho": [ + 0.846778392791748, + 0.5373459458351135 + ], + "nudging": { + "0.001": [ + -0.028559191152453423, + -0.0038118986412882805 + ], + "0.003": [ + -0.08209788799285889, + -0.011376685462892056 + ], + "0.01": [ + -0.23458413779735565, + -0.037239424884319305 + ] + }, + "state_pred_error_per_layer": [ + 626.5816650390625, + 277.74237060546875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2841781162261965, + 1.5920361112594605, + 0.9420625007629394, + 0.6396594805717468, + 0.49837059326171873, + 0.4280559380531311, + 0.3917586740493774, + 0.3806812261581421, + 0.37738553323745727, + 0.3776072946548462, + 0.39090942087173464, + 0.3836580893516541, + 0.39848621730804445, + 0.39414596700668336, + 0.4033576976776123, + 0.3954726212978363, + 0.4113054138183594, + 0.43227349529266357, + 0.4576970805168152, + 0.4727818874359131, + 0.4911901863098145, + 0.5089909892082214, + 0.5091109822273254, + 0.5419316413879395, + 0.5682882654190063, + 0.5794619635105133, + 0.5945024296760559, + 0.575393883895874, + 0.6467625747680664, + 0.6348539002418518, + 0.6088227634429931, + 0.6139724615097046, + 0.6312180225372315, + 0.6856759313583374, + 0.7260684799194336, + 0.6503768898010254, + 0.660949840927124, + 0.6826682937622071, + 0.6994050893783569, + 0.6910303967475891, + 0.7174594877243042, + 0.7371259686946869, + 0.7537702695846558, + 0.7966553500175476, + 0.7427541831970215, + 0.7614833879470825, + 0.756250295829773, + 0.7880895990371705, + 0.7913369228363037, + 0.7729651657104493, + 0.7882836460113526, + 0.8180274720668793, + 0.7788889380455017, + 0.7948621809005737, + 0.7926133176803589, + 0.8024183307647705, + 0.8282989875793457, + 0.8377448230743408, + 0.8504006636619568, + 0.8477847335815429, + 0.8469767751693725, + 0.8446590083122253, + 0.8462727046012879, + 0.8549996006011963, + 0.8553122864723206, + 0.8556031386375427, + 0.854762883234024, + 0.8593242017745971, + 0.8556238237857818, + 0.8551858370780945, + 0.8575570917129517, + 0.8572792016983032, + 0.8553469423294068, + 0.8568584102630615, + 0.856532636642456, + 0.8546321733474731, + 0.8542901330947876, + 0.8537617067337037, + 0.8532746227264404, + 0.8529878778457641 + ], + "train_acc": [ + 0.1573, + 0.4756, + 0.6808, + 0.7749, + 0.8136, + 0.836, + 0.85, + 0.8511, + 0.8553, + 0.8572, + 0.8527, + 0.8593, + 0.8568, + 0.8573, + 0.8619, + 0.8616, + 0.8571, + 0.8516, + 0.8481, + 0.845, + 0.8362, + 0.8339, + 0.8298, + 0.8249, + 0.8137, + 0.8071, + 0.7982, + 0.8014, + 0.7849, + 0.7847, + 0.7893, + 0.7842, + 0.7828, + 0.7569, + 0.7527, + 0.7649, + 0.7617, + 0.7532, + 0.7476, + 0.7466, + 0.737, + 0.7329, + 0.7298, + 0.7183, + 0.7324, + 0.7276, + 0.7238, + 0.7159, + 0.7157, + 0.7208, + 0.7177, + 0.7101, + 0.7191, + 0.7112, + 0.7126, + 0.712, + 0.708, + 0.703, + 0.7009, + 0.6985, + 0.7014, + 0.6962, + 0.7016, + 0.6946, + 0.6952, + 0.6951, + 0.6993, + 0.6922, + 0.6964, + 0.6993, + 0.6947, + 0.6965, + 0.6976, + 0.6974, + 0.6963, + 0.6979, + 0.6976, + 0.6964, + 0.6969, + 0.6966 + ], + "test_acc": [ + 0.3095, + 0.579, + 0.7105, + 0.771, + 0.793, + 0.81, + 0.813, + 0.8145, + 0.811, + 0.8295, + 0.819, + 0.811, + 0.812, + 0.8205, + 0.8205, + 0.811, + 0.816, + 0.818, + 0.8055, + 0.8055, + 0.807, + 0.794, + 0.7805, + 0.7755, + 0.7695, + 0.773, + 0.763, + 0.741, + 0.7355, + 0.727, + 0.731, + 0.7175, + 0.6985, + 0.7145, + 0.7185, + 0.716, + 0.717, + 0.7085, + 0.699, + 0.695, + 0.697, + 0.687, + 0.701, + 0.692, + 0.6795, + 0.683, + 0.672, + 0.6625, + 0.691, + 0.682, + 0.6745, + 0.6805, + 0.67, + 0.6715, + 0.6805, + 0.6615, + 0.668, + 0.655, + 0.6685, + 0.6685, + 0.6745, + 0.665, + 0.666, + 0.671, + 0.6685, + 0.668, + 0.6685, + 0.6655, + 0.6655, + 0.666, + 0.6695, + 0.6655, + 0.6675, + 0.669, + 0.667, + 0.667, + 0.668, + 0.6685, + 0.6685, + 0.6685 + ], + "value_loss": [ + 3.183600161743164, + 0.7750385164260865, + 0.6228227703094482, + 0.5807541069030762, + 0.5056938434600831, + 0.48559383153915403, + 0.48110757327079773, + 0.49592300415039064, + 0.5289546810626984, + 0.5474359282016754, + 0.5586690468311309, + 0.5815468026161194, + 0.5854624471187592, + 0.6134045516014099, + 0.6397341026306153, + 0.5935072565078735, + 0.6474540725708008, + 0.7058132423877717, + 0.7731063194274902, + 0.7794260215759278, + 0.759508763885498, + 0.8077074721336365, + 0.7146338634490966, + 0.8551284119606019, + 0.8034313897132873, + 0.7595964660644531, + 0.7274619615554809, + 0.6701016593933106, + 0.7542770774841309, + 0.6366281832695008, + 0.5932489609718323, + 0.5439536237716674, + 0.5317693880081177, + 0.5851134353637696, + 0.6304749866485596, + 0.48910887274742126, + 0.48204327812194825, + 0.4742885886192322, + 0.5095871998548508, + 0.4672426800251007, + 0.4669731388092041, + 0.5084928925275802, + 0.4811704207420349, + 0.5370424214363099, + 0.4818318892478943, + 0.46692917881011964, + 0.4602645688056946, + 0.5055856050491333, + 0.47017913327217103, + 0.44230168209075926, + 0.4720217893600464, + 0.48523768539428713, + 0.4182536519050598, + 0.45286598148345947, + 0.4380767108917236, + 0.44022146463394163, + 0.4837879237651825, + 0.4790394123077393, + 0.49754595942497254, + 0.4781929668426514, + 0.47548961482048036, + 0.49705342779159545, + 0.46111058979034425, + 0.47314323959350585, + 0.471123362159729, + 0.4637605622768402, + 0.45161292238235473, + 0.4605647190570831, + 0.44299064745903016, + 0.43606283235549925, + 0.4616440633773804, + 0.4356783237457275, + 0.4435445850849152, + 0.4211894090652466, + 0.4348035490036011, + 0.43359944195747374, + 0.44066416525840757, + 0.41140582780838014, + 0.4257257164001465, + 0.4186974630832672 + ], + "term_loss": [ + 1.8026321507453917, + 0.3518428315162659, + 0.37675947713851926, + 0.38276648654937745, + 0.32057882099151613, + 0.3065270788550377, + 0.30243567395210263, + 0.32378246574401853, + 0.3653831358909607, + 0.38932991545200346, + 0.39687480373382567, + 0.42393954174518583, + 0.4242467020750046, + 0.4532722057342529, + 0.4773832442760467, + 0.4362155035972595, + 0.486022850227356, + 0.5338006882667542, + 0.5966757208347321, + 0.5939437051773071, + 0.5678820415496826, + 0.6060017887592316, + 0.5143427636623382, + 0.6467780996322632, + 0.5846465341091156, + 0.5283182467222214, + 0.4983976370334625, + 0.44641116333007813, + 0.5112490447998047, + 0.3977337556183338, + 0.3648644490003586, + 0.31504709310531614, + 0.30084985260963437, + 0.3288579341888428, + 0.3635549578666687, + 0.24613730195462705, + 0.23489424538612366, + 0.22370255022048952, + 0.25498708676695825, + 0.20941324164271355, + 0.20957557492256165, + 0.23416928594112396, + 0.21175098605155945, + 0.2531614188194275, + 0.20988761026859284, + 0.18880151594877242, + 0.18631615471839905, + 0.21227661232948303, + 0.18683922771811484, + 0.16496461772918702, + 0.1820032048225403, + 0.19443978843688964, + 0.1429014762878418, + 0.16745004987716675, + 0.1578450297355652, + 0.1553781552016735, + 0.18760945184230804, + 0.1851514247894287, + 0.20025430124998092, + 0.1819072727203369, + 0.17955903453826905, + 0.19871407819390297, + 0.16792754082679748, + 0.17481803393363954, + 0.17089381370544435, + 0.1689176040560007, + 0.15707939043045044, + 0.16704212747812272, + 0.1522603622496128, + 0.14507856206297876, + 0.1677186560511589, + 0.14509016184806825, + 0.1506106904104352, + 0.13293324483036995, + 0.14293194253444672, + 0.1427909223496914, + 0.14778699822425842, + 0.12496376402378083, + 0.13453806335926055, + 0.13192469900846482 + ], + "bridge_loss": [ + 1.086148412281787, + 0.1292816480755806, + 0.02697447990477085, + 0.008380569902062415, + 0.014730357018113135, + 0.02233964946269989, + 0.027988237404823302, + 0.023968446946144105, + 0.01585049637556076, + 0.011189098839461804, + 0.010882902494072914, + 0.010902717466652393, + 0.01232607362344861, + 0.013465753997862338, + 0.015195865526795388, + 0.014546262636780738, + 0.014874154400080443, + 0.01984240630865097, + 0.019618313241004944, + 0.024393686729669573, + 0.024060676431655884, + 0.029791050812602044, + 0.02654157394170761, + 0.028435604375600814, + 0.03134429958462715, + 0.038252703151106834, + 0.031379878085851666, + 0.02969111566543579, + 0.03346356704235077, + 0.029296788448095322, + 0.02688776364326477, + 0.024821505990624427, + 0.02414622390270233, + 0.029408053064346313, + 0.03269558168053627, + 0.02531407674998045, + 0.026356512427330017, + 0.023581733375787735, + 0.024556355768442156, + 0.027951345092058183, + 0.022370386198163034, + 0.03287668476700783, + 0.025288420939445496, + 0.031219502943754196, + 0.02888429069519043, + 0.030735591688752173, + 0.02735620730817318, + 0.03810946992039681, + 0.028575557655096055, + 0.02718697527050972, + 0.03519773906469345, + 0.028369852031767367, + 0.024919191813468935, + 0.02968004021644592, + 0.02626986500620842, + 0.02845469582825899, + 0.03466393163204193, + 0.03076643509864807, + 0.030355132931470873, + 0.030078389501571656, + 0.029866657304763795, + 0.03281264351382852, + 0.028423517215251923, + 0.030412553095817568, + 0.03361335833966732, + 0.02742235606312752, + 0.028246861313283442, + 0.026277213674783705, + 0.024521710814535618, + 0.026038313943147658, + 0.027685920548439026, + 0.024189958955347538, + 0.028101330828666688, + 0.023092676632106304, + 0.026744831919670104, + 0.026103598928451537, + 0.027902939324080944, + 0.021766479524970055, + 0.027076039123535157, + 0.02328252377510071 + ], + "tgrad_loss": [ + 0.294819629573822, + 0.2939140326499939, + 0.219088809299469, + 0.18960705118179322, + 0.17038466613292694, + 0.15672710111141205, + 0.15068366177082063, + 0.14817209043502808, + 0.1477210487008095, + 0.1469169137120247, + 0.15091134042739868, + 0.14670454227924348, + 0.14888966951966287, + 0.14666659691333772, + 0.14715499559640885, + 0.14274549129009248, + 0.1465570687055588, + 0.1521701454281807, + 0.15681228353977203, + 0.16108862676620483, + 0.16756604113578796, + 0.17191463656425476, + 0.17374952573776245, + 0.17991471261978148, + 0.1874405568599701, + 0.19302551550865174, + 0.19768444393873214, + 0.193999383020401, + 0.20956446123123168, + 0.20959763660430908, + 0.20149674859046937, + 0.2040850329399109, + 0.20677331829071044, + 0.2268474468231201, + 0.2342244486808777, + 0.21765749232769013, + 0.22079251861572266, + 0.22700430588722229, + 0.2300437501192093, + 0.229878093290329, + 0.23502717609405518, + 0.2414469205379486, + 0.24413101263046263, + 0.25266150131225584, + 0.24305998911857604, + 0.24739206635951996, + 0.24659220705032348, + 0.2551995223045349, + 0.2547643501758575, + 0.25015008878707884, + 0.25482084245681763, + 0.26242804205417636, + 0.25043298604488373, + 0.2557358948945999, + 0.25396181850433347, + 0.25638861246109007, + 0.2615145419597626, + 0.2631215545654297, + 0.26693652296066284, + 0.2662073058128357, + 0.26606392068862916, + 0.26552670979499815, + 0.26475953006744385, + 0.26791265106201173, + 0.26661619596481323, + 0.2674205995321274, + 0.2662866680383682, + 0.2672453787326813, + 0.2662085753917694, + 0.2649459549665451, + 0.2662394880533218, + 0.2663982018470764, + 0.2648325638771057, + 0.26516348662376404, + 0.2651267763614655, + 0.26470492310523985, + 0.2649742301940918, + 0.26467558369636535, + 0.26411161279678347, + 0.2634902417182922 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.13380715250968933, + 0.28871580958366394 + ], + "perturbation_rho": [ + 0.2647465467453003, + 0.4448530077934265 + ], + "nudging": { + "0.001": [ + -0.007434769067913294, + -0.0024258592166006565 + ], + "0.003": [ + -0.022199923172593117, + -0.007270205765962601 + ], + "0.01": [ + -0.07276535779237747, + -0.024136800318956375 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L4_s123.json b/results/synth_ladder_v2_lo/synth_a0.25_L4_s123.json new file mode 100644 index 0000000..76c8d7a --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L4_s123.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.4145605772018432, + 0.4837885675907135, + 0.3509865976333618, + 0.3320046304702759, + 0.3153838852882385, + 0.26510489492416384, + 0.29119865114092824, + 0.23000359807014464, + 0.25192048209905626, + 0.22606405482292175, + 0.22339799184799194, + 0.24050125465393066, + 0.21707800154685974, + 0.24954306988716127, + 0.23637027411460876, + 0.21085137324333192, + 0.19512076714038848, + 0.17245010232925415, + 0.1894634276986122, + 0.1650419453382492, + 0.1778180214881897, + 0.21894844360351562, + 0.19933833799362183, + 0.1771628651380539, + 0.1553717818260193, + 0.1399657424926758, + 0.14071936559677123, + 0.1601772675037384, + 0.13696529176235198, + 0.14105643473863602, + 0.13802141556739808, + 0.16569645638465882, + 0.12720199494361878, + 0.14186724331378936, + 0.11719292199611664, + 0.11274782953262329, + 0.12050781357288361, + 0.10908292927742004, + 0.10698790650367737, + 0.10439169973134994, + 0.09679698523283005, + 0.10081665986776352, + 0.09919646325707436, + 0.09050822926163674, + 0.08451937192380428, + 0.08149686356782913, + 0.08619351840019226, + 0.08559241333007812, + 0.08397664375305176, + 0.08652843645811081, + 0.08116253237724304, + 0.08460511593818665, + 0.07957250861525536, + 0.07245188212394714, + 0.07476602460145951, + 0.07214559998512268, + 0.06864421527385711, + 0.06543551899790764, + 0.06294125034213066, + 0.06161921464204788, + 0.06044542417526245, + 0.05924299967288971, + 0.05897243957519531, + 0.05819726123511791, + 0.05668298012018204, + 0.057375379399955274, + 0.055825320994853975, + 0.05605454614162445, + 0.05520648413896561, + 0.05462213642001152, + 0.05396175765991211, + 0.05345057912766933, + 0.05290921161174774, + 0.05259452617168427, + 0.052336494362354276, + 0.05208745345771313, + 0.051927010026574134, + 0.05178932168483734, + 0.05169431391954422, + 0.05163790632486343 + ], + "train_acc": [ + 0.5311, + 0.8383, + 0.8684, + 0.8673, + 0.8741, + 0.8952, + 0.885, + 0.9126, + 0.9, + 0.9109, + 0.9124, + 0.903, + 0.9143, + 0.8996, + 0.9057, + 0.9155, + 0.9265, + 0.9344, + 0.9234, + 0.9368, + 0.9274, + 0.9132, + 0.9217, + 0.9312, + 0.9425, + 0.9491, + 0.9462, + 0.9374, + 0.9484, + 0.9474, + 0.9492, + 0.9317, + 0.9533, + 0.9466, + 0.9565, + 0.96, + 0.9521, + 0.962, + 0.9643, + 0.9634, + 0.9697, + 0.9658, + 0.967, + 0.9707, + 0.9744, + 0.976, + 0.973, + 0.9729, + 0.9738, + 0.9721, + 0.974, + 0.9728, + 0.9765, + 0.9806, + 0.9788, + 0.9807, + 0.9819, + 0.985, + 0.9862, + 0.9879, + 0.9879, + 0.9884, + 0.9892, + 0.9888, + 0.9906, + 0.9886, + 0.9909, + 0.9905, + 0.9906, + 0.9918, + 0.9922, + 0.9921, + 0.9931, + 0.9933, + 0.9934, + 0.994, + 0.9938, + 0.9942, + 0.9942, + 0.9942 + ], + "test_acc": [ + 0.7885, + 0.864, + 0.864, + 0.8825, + 0.878, + 0.8865, + 0.881, + 0.888, + 0.881, + 0.8775, + 0.898, + 0.894, + 0.891, + 0.885, + 0.8865, + 0.9005, + 0.8945, + 0.91, + 0.8925, + 0.9065, + 0.901, + 0.897, + 0.895, + 0.9, + 0.9015, + 0.9055, + 0.91, + 0.903, + 0.908, + 0.912, + 0.9095, + 0.902, + 0.9105, + 0.9025, + 0.9115, + 0.909, + 0.9045, + 0.913, + 0.9035, + 0.918, + 0.912, + 0.9045, + 0.912, + 0.9185, + 0.9135, + 0.9085, + 0.914, + 0.9175, + 0.913, + 0.915, + 0.916, + 0.9135, + 0.916, + 0.9145, + 0.919, + 0.918, + 0.9195, + 0.917, + 0.919, + 0.9155, + 0.917, + 0.9165, + 0.917, + 0.9195, + 0.918, + 0.9185, + 0.917, + 0.9175, + 0.9155, + 0.9165, + 0.9175, + 0.918, + 0.918, + 0.9175, + 0.917, + 0.9165, + 0.917, + 0.917, + 0.917, + 0.917 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8279672861099243, + 0.8114954233169556, + 0.7863935232162476, + 0.7482712268829346 + ], + "perturbation_rho": [ + 0.9999987483024597, + 0.9999956488609314, + 0.999983012676239, + 0.9999275207519531 + ], + "nudging": { + "0.001": [ + -0.024539310485124588, + -0.011202658526599407, + -0.004987813998013735, + -0.0025163067039102316 + ], + "0.003": [ + -0.06480148434638977, + -0.031804408878088, + -0.014610698446631432, + -0.00745969545096159 + ], + "0.01": [ + -0.14138484001159668, + -0.08725307881832123, + -0.04476301744580269, + -0.023845836520195007 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2260922397613525, + 1.3989790941238402, + 0.8063462790489196, + 0.5810352697372436, + 0.4776177051544189, + 0.4156474907875061, + 0.40407221131324766, + 0.3906784576416016, + 0.4220227051138878, + 0.408127818775177, + 0.48602376890182497, + 0.4391589762687683, + 0.4726590826034546, + 0.45469081001281736, + 0.46395344314575193, + 0.641008736038208, + 0.4606993099212646, + 0.48619530363082886, + 0.6209182878494263, + 0.579438009929657, + 0.5570708718299866, + 0.6080478384017944, + 0.5757816455364227, + 0.5000022046089172, + 0.554708060836792, + 0.6522365891456604, + 0.5476735515594482, + 0.7547416234016419, + 0.5390356698989868, + 0.5642839532852173, + 0.5649113851547242, + 0.6092495996952056, + 0.5237593853950501, + 0.7170518593788147, + 0.7146096199989319, + 0.4854401762008667, + 0.5638167533874512, + 0.4516558566093445, + 0.7109629370689392, + 0.5448078726768494, + 0.6100124780654907, + 0.647748377609253, + 0.5807090089797974, + 0.5962627920150757, + 0.4787724911212921, + 0.44061123929023743, + 0.45318230543136595, + 0.4324454571247101, + 0.48582389402389525, + 0.48784693965911863, + 0.4654889596939087, + 0.4910616933822632, + 0.44223530769348146, + 0.4255864576339722, + 0.43338484077453615, + 0.40529030129909516, + 0.3956596384048462, + 0.41429238247871397, + 0.4396337124347687, + 0.396600995016098, + 0.37550678915977476, + 0.36028911843299866, + 0.37281743416786195, + 0.36315483593940734, + 0.36328665294647217, + 0.3824797859072685, + 0.35487752180099486, + 0.35909159870147705, + 0.3572547873020172, + 0.336571563911438, + 0.34290257511138916, + 0.3480034410953522, + 0.3370935582637787, + 0.33314969940185546, + 0.33331610808372497, + 0.3301537363290787, + 0.3311965983390808, + 0.3278242862701416, + 0.32672062397003176, + 0.32609617538452146 + ], + "train_acc": [ + 0.1885, + 0.5103, + 0.7062, + 0.7826, + 0.8192, + 0.8434, + 0.8457, + 0.8501, + 0.8376, + 0.8434, + 0.8194, + 0.8365, + 0.8233, + 0.8306, + 0.8244, + 0.7857, + 0.8258, + 0.8158, + 0.7827, + 0.7945, + 0.8047, + 0.7925, + 0.7908, + 0.8134, + 0.797, + 0.7749, + 0.7952, + 0.7653, + 0.8022, + 0.7932, + 0.7963, + 0.7798, + 0.8089, + 0.7659, + 0.7638, + 0.8216, + 0.7988, + 0.8301, + 0.7648, + 0.7997, + 0.787, + 0.7806, + 0.7963, + 0.7918, + 0.8211, + 0.8302, + 0.8283, + 0.8372, + 0.8209, + 0.8197, + 0.8281, + 0.823, + 0.8352, + 0.8373, + 0.8393, + 0.8439, + 0.8478, + 0.8453, + 0.837, + 0.8479, + 0.8551, + 0.86, + 0.8595, + 0.8613, + 0.8576, + 0.8564, + 0.8631, + 0.8603, + 0.8618, + 0.8703, + 0.8667, + 0.8674, + 0.8688, + 0.8719, + 0.8714, + 0.8698, + 0.8719, + 0.8732, + 0.874, + 0.8739 + ], + "test_acc": [ + 0.3485, + 0.642, + 0.7375, + 0.7915, + 0.802, + 0.7915, + 0.807, + 0.812, + 0.804, + 0.767, + 0.8025, + 0.79, + 0.7975, + 0.7715, + 0.7125, + 0.757, + 0.7585, + 0.665, + 0.6875, + 0.6805, + 0.7355, + 0.6705, + 0.7525, + 0.742, + 0.6565, + 0.727, + 0.606, + 0.6405, + 0.7245, + 0.7345, + 0.715, + 0.745, + 0.6045, + 0.578, + 0.712, + 0.7905, + 0.733, + 0.7005, + 0.754, + 0.681, + 0.7345, + 0.6195, + 0.6645, + 0.7995, + 0.754, + 0.72, + 0.739, + 0.7355, + 0.7415, + 0.752, + 0.716, + 0.742, + 0.784, + 0.688, + 0.7865, + 0.8035, + 0.7615, + 0.808, + 0.796, + 0.8005, + 0.8245, + 0.814, + 0.823, + 0.801, + 0.806, + 0.8105, + 0.806, + 0.806, + 0.8265, + 0.8235, + 0.8115, + 0.82, + 0.8275, + 0.823, + 0.826, + 0.8175, + 0.8225, + 0.8235, + 0.8245, + 0.824 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.030194921419024467, + 0.3003618121147156, + 0.18209302425384521, + 0.12414582818746567 + ], + "perturbation_rho": [ + -0.038011275231838226, + 0.29912513494491577, + 0.1735759675502777, + 0.14118143916130066 + ], + "nudging": { + "0.001": [ + 0.0004484695091377944, + -0.0008491222397424281, + -0.0005047788145020604, + -0.0003660085494630039 + ], + "0.003": [ + 0.001385596813634038, + -0.0025426694191992283, + -0.0015110077802091837, + -0.0010910483542829752 + ], + "0.01": [ + 0.005076530389487743, + -0.00841662660241127, + -0.005011391825973988, + -0.0036195346619933844 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8123929222106934, + 0.7969598731994629, + 0.4681823432445526, + 0.4493808107376099, + 0.4859991237640381, + 0.5615512335777283, + 0.6788585278511048, + 0.769824936580658, + 0.7635405010223388, + 0.7253447900772094, + 0.7080011105537415, + 0.7129657225131989, + 0.7468086644172669, + 0.7786125428199768, + 0.7598382493972778, + 0.7637535655975342, + 0.784446928024292, + 0.791630249786377, + 0.8042271808624267, + 0.8116328013420105, + 0.7919122304916382, + 0.8624911094665527, + 0.8134118410110474, + 0.8004576719284058, + 0.826051163482666, + 0.7835210838317871, + 0.8537725872993469, + 0.8074887325286865, + 0.7989932650566101, + 0.7464404977798462, + 0.7878874625682831, + 0.7705603090286255, + 0.8202200212478638, + 0.7995859888076782, + 0.8566022305488586, + 0.8265386112213134, + 0.8467596694946289, + 0.8278987077713013, + 0.839235195350647, + 0.8700848264694214, + 0.8941480784416199, + 0.8706226264953614, + 0.8077309101104736, + 0.8231417049407959, + 0.8741218314170838, + 0.8338860015869141, + 0.7885824256896973, + 0.7956271339416504, + 0.7766273180007934, + 0.7837719497680664, + 0.7901550762176514, + 0.7942577618598938, + 0.7556007875442505, + 0.7318876386642456, + 0.7315496717453003, + 0.7372453187942505, + 0.7162431858062744, + 0.7204227170467377, + 0.7074315301895142, + 0.7244995565414428, + 0.7033161953926086, + 0.6938653470993043, + 0.7081535718917846, + 0.6887570705413818, + 0.6773336295127869, + 0.6713978358268737, + 0.6677473924636841, + 0.6675515371322632, + 0.6589781717300415, + 0.6592945998191834, + 0.6567529281616211, + 0.6525886249542237, + 0.6496815184593201, + 0.6495527265548706, + 0.6473081888198853, + 0.6461846683502197, + 0.6442305462837219, + 0.6443143812179566, + 0.6430024762630463, + 0.642762578868866 + ], + "train_acc": [ + 0.3465, + 0.7012, + 0.8236, + 0.8291, + 0.8176, + 0.8032, + 0.7708, + 0.7513, + 0.7483, + 0.7484, + 0.7417, + 0.74, + 0.7308, + 0.7243, + 0.7347, + 0.7333, + 0.7311, + 0.7299, + 0.7266, + 0.7204, + 0.732, + 0.7169, + 0.7258, + 0.7261, + 0.7164, + 0.7349, + 0.7103, + 0.7278, + 0.7384, + 0.7499, + 0.7403, + 0.7424, + 0.736, + 0.7367, + 0.7227, + 0.7313, + 0.7293, + 0.7359, + 0.7336, + 0.7305, + 0.7218, + 0.7235, + 0.7413, + 0.7317, + 0.7181, + 0.726, + 0.7331, + 0.7324, + 0.7392, + 0.7341, + 0.7313, + 0.7293, + 0.7439, + 0.7451, + 0.7482, + 0.7447, + 0.7498, + 0.7466, + 0.754, + 0.7472, + 0.7547, + 0.7577, + 0.7519, + 0.7566, + 0.7652, + 0.7641, + 0.7657, + 0.7642, + 0.767, + 0.7672, + 0.7684, + 0.7686, + 0.7703, + 0.7693, + 0.77, + 0.7684, + 0.7718, + 0.771, + 0.7711, + 0.7713 + ], + "test_acc": [ + 0.593, + 0.771, + 0.813, + 0.8005, + 0.7815, + 0.753, + 0.7255, + 0.708, + 0.739, + 0.7295, + 0.7435, + 0.7325, + 0.715, + 0.698, + 0.7005, + 0.6945, + 0.702, + 0.6985, + 0.6985, + 0.711, + 0.694, + 0.695, + 0.715, + 0.6785, + 0.6955, + 0.646, + 0.709, + 0.699, + 0.687, + 0.711, + 0.7145, + 0.692, + 0.6905, + 0.6385, + 0.676, + 0.6885, + 0.685, + 0.694, + 0.693, + 0.663, + 0.642, + 0.6935, + 0.6885, + 0.673, + 0.686, + 0.6815, + 0.693, + 0.704, + 0.686, + 0.6805, + 0.6965, + 0.7025, + 0.7115, + 0.71, + 0.706, + 0.705, + 0.7055, + 0.7155, + 0.709, + 0.714, + 0.7215, + 0.72, + 0.7195, + 0.7185, + 0.73, + 0.725, + 0.727, + 0.723, + 0.725, + 0.7305, + 0.7285, + 0.7285, + 0.728, + 0.734, + 0.733, + 0.733, + 0.734, + 0.7325, + 0.733, + 0.733 + ], + "state_pred_error": [ + 0.7424910880565644, + 0.24538831996917726, + 0.1696438634634018, + 0.1582905143260956, + 0.1631220199584961, + 0.1723755702495575, + 0.1831033411026001, + 0.18637536973953248, + 0.1819893986463547, + 0.16733712508678436, + 0.15095561995506288, + 0.132748974442482, + 0.11434644386768342, + 0.09421088438034057, + 0.08756505841016769, + 0.08341595257520676, + 0.0805468656539917, + 0.07775743334293365, + 0.07735535364151001, + 0.07478679238557816, + 0.06856273975372315, + 0.06119619631767273, + 0.05259707286357879, + 0.04269158652424812, + 0.03410064045786858, + 0.027179633522033692, + 0.023885729551315307, + 0.021235701763629912, + 0.02094485488831997, + 0.02022430610358715, + 0.01988106532692909, + 0.01952715065330267, + 0.019609414368867876, + 0.020033554589748384, + 0.020146991772949697, + 0.01961232684701681, + 0.01936790647506714, + 0.019153894048929216, + 0.01937529597133398, + 0.018842387399077416, + 0.018071847139298915, + 0.017307695150375366, + 0.016579271717369556, + 0.01552603451013565, + 0.015096754413843155, + 0.013859699180722237, + 0.012979740312695503, + 0.012281061121821403, + 0.011574527004361153, + 0.010909687869250775, + 0.010257076373696328, + 0.009821538998931647, + 0.009271138358861208, + 0.008785224071145058, + 0.008230697739124299, + 0.007849063183367252, + 0.0074681182123720645, + 0.007055782772600651, + 0.0067631045818328855, + 0.006486539483070373, + 0.006212053466588259, + 0.005942052242159843, + 0.005858693596720695, + 0.005584450083971023, + 0.005323304799944162, + 0.005180257834494114, + 0.0050939571440219876, + 0.004897539104521275, + 0.004757686843723059, + 0.004607934882491827, + 0.004440061054006219, + 0.004348039439320564, + 0.004419275801628828, + 0.0041590200409293175, + 0.004140176199376583, + 0.00423978632427752, + 0.003907272329181433, + 0.003829565724730492, + 0.003753288455680013, + 0.003695953545719385 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.821143627166748, + 0.36722686886787415, + 0.20176959037780762, + 0.1750764548778534 + ], + "perturbation_rho": [ + 0.6905952095985413, + 0.36183467507362366, + 0.19890159368515015, + 0.15810276567935944 + ], + "nudging": { + "0.001": [ + -0.021994680166244507, + -0.0013722439762204885, + -0.0006841139402240515, + -0.0005768820992670953 + ], + "0.003": [ + -0.06444752216339111, + -0.00411063339561224, + -0.0020494144409894943, + -0.0017298792954534292 + ], + "0.01": [ + -0.1973220407962799, + -0.013631552457809448, + -0.0068134344182908535, + -0.0057535795494914055 + ] + }, + "state_pred_error_per_layer": [ + 3017.568359375, + 2069.30517578125, + 2103.28662109375, + 1370.3270263671875 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2304506519317626, + 1.3942056268692016, + 0.8183312824249268, + 0.5797962010383606, + 0.4764002899169922, + 0.4094866346359253, + 0.4068061854362488, + 0.38665450406074525, + 0.3990870332241058, + 0.4220907788276672, + 0.496053104019165, + 0.4371034680366516, + 0.45066176986694334, + 0.5061244255065918, + 0.4739286370754242, + 0.4944791939735413, + 0.5044361748695374, + 0.6503571970939637, + 0.47436288118362424, + 0.5432016505241394, + 0.5854156719207764, + 0.47859073028564453, + 0.566104229259491, + 0.6238331944465637, + 0.6042083335876465, + 0.7139152729034424, + 0.6597491868972778, + 0.6986511729240418, + 0.6769212335586547, + 0.7593953706741333, + 0.7314193179130554, + 0.7335153755187989, + 0.7572157611846924, + 0.7321065183639527, + 0.7649673822879791, + 0.6976259819984436, + 0.7286087586402893, + 0.7189216842651367, + 0.7617496681213379, + 0.7480665018081665, + 0.7844495740890502, + 0.8273416324615479, + 0.843971639251709, + 0.8851293493270874, + 0.8638077151298523, + 0.8672280294895172, + 0.8649810727119446, + 0.8554271353721619, + 0.8371897335052491, + 0.8481480210304261, + 0.8235589872360229, + 0.8250558439731598, + 0.821573218536377, + 0.8396482845306397, + 0.8538236341476441, + 0.8500017461776733, + 0.8449060009002686, + 0.8542348052978516, + 0.85397573928833, + 0.8410406700134277, + 0.8542406044006348, + 0.8490435265541076, + 0.8294786353111268, + 0.8252912633419037, + 0.8250881828308105, + 0.8167968341827393, + 0.8243150682449341, + 0.810345893573761, + 0.8054994924545288, + 0.8062832556724548, + 0.803090742111206, + 0.7987750416755677, + 0.8018800824165344, + 0.7949400223731995, + 0.7933959410667419, + 0.7913647750854492, + 0.7914622924804687, + 0.7898741424560547, + 0.7892889207839966, + 0.7888304642677307 + ], + "train_acc": [ + 0.192, + 0.518, + 0.7025, + 0.7851, + 0.8191, + 0.8447, + 0.8429, + 0.8512, + 0.8493, + 0.8355, + 0.8181, + 0.8327, + 0.8287, + 0.8171, + 0.8261, + 0.8175, + 0.8159, + 0.7771, + 0.8218, + 0.803, + 0.7916, + 0.8252, + 0.8046, + 0.7807, + 0.7822, + 0.7604, + 0.7775, + 0.7722, + 0.7831, + 0.7659, + 0.7596, + 0.756, + 0.7421, + 0.7452, + 0.7408, + 0.7511, + 0.7441, + 0.744, + 0.7328, + 0.7355, + 0.7311, + 0.7234, + 0.7211, + 0.711, + 0.7102, + 0.7178, + 0.7071, + 0.7128, + 0.7173, + 0.7083, + 0.7174, + 0.7133, + 0.7121, + 0.7048, + 0.7029, + 0.7051, + 0.7006, + 0.7005, + 0.6974, + 0.7041, + 0.696, + 0.6999, + 0.7074, + 0.7052, + 0.7056, + 0.7099, + 0.7086, + 0.7113, + 0.7112, + 0.7122, + 0.7124, + 0.7142, + 0.7134, + 0.7167, + 0.7134, + 0.7162, + 0.7182, + 0.7158, + 0.7159, + 0.7162 + ], + "test_acc": [ + 0.3505, + 0.6215, + 0.7385, + 0.776, + 0.8105, + 0.819, + 0.809, + 0.811, + 0.8155, + 0.749, + 0.796, + 0.8045, + 0.752, + 0.729, + 0.786, + 0.7715, + 0.6865, + 0.72, + 0.7255, + 0.669, + 0.778, + 0.687, + 0.7285, + 0.7615, + 0.734, + 0.7575, + 0.71, + 0.777, + 0.735, + 0.744, + 0.742, + 0.701, + 0.7025, + 0.6955, + 0.7175, + 0.735, + 0.693, + 0.7025, + 0.7245, + 0.6985, + 0.698, + 0.716, + 0.668, + 0.6525, + 0.695, + 0.6575, + 0.702, + 0.7145, + 0.7045, + 0.705, + 0.6925, + 0.7065, + 0.7, + 0.6855, + 0.7, + 0.6935, + 0.696, + 0.6985, + 0.685, + 0.7045, + 0.6975, + 0.701, + 0.6955, + 0.7, + 0.699, + 0.699, + 0.712, + 0.7065, + 0.7075, + 0.7055, + 0.71, + 0.709, + 0.705, + 0.7095, + 0.7125, + 0.7095, + 0.7105, + 0.711, + 0.71, + 0.7085 + ], + "value_loss": [ + 2.875565072822571, + 0.8934291703224182, + 0.7643266316890717, + 0.6411794909477234, + 0.5538642876625061, + 0.5101048704147338, + 0.5553470899581909, + 0.4691417839050293, + 0.4629878062009811, + 0.555866827583313, + 0.7427106724739074, + 0.5367072154998779, + 0.6318443626403809, + 0.720150242805481, + 0.6702281295776367, + 0.6685273101329804, + 0.7366531593322754, + 1.1599597629070282, + 0.6955488331794739, + 0.8128993940353394, + 0.9401766692161561, + 0.7360081169128418, + 0.9247368459701538, + 0.9366291213035584, + 0.850796000289917, + 1.201850381565094, + 1.087157346343994, + 1.1369871886253358, + 1.0918189323425294, + 1.2658386784076692, + 0.9737425192832947, + 0.9713388110160828, + 0.8103028650283813, + 0.7689808444976807, + 0.7541267780303955, + 0.6178562547683716, + 0.6552725201368332, + 0.651333825969696, + 0.6328555109381676, + 0.6119258517742157, + 0.6578858529090882, + 0.7603759881734848, + 0.7731849906921386, + 0.8381655234336853, + 0.7553952046990394, + 0.7562767848968506, + 0.7243463092803956, + 0.6914454604864121, + 0.7287011550903321, + 0.7079713569641113, + 0.5950203428268432, + 0.61903060131073, + 0.6206758731842041, + 0.6741137755393982, + 0.638280230140686, + 0.5789763841867447, + 0.5631655465126038, + 0.6306552550315857, + 0.5531370044708251, + 0.5336048315048217, + 0.6597217742919922, + 0.5602773515224457, + 0.550052008497715, + 0.5294891984701157, + 0.50927531375885, + 0.5022766840934754, + 0.5141903561592102, + 0.4788236827850342, + 0.46827283239364625, + 0.44508712520599364, + 0.4594296352863312, + 0.4582284578323364, + 0.47078573088645936, + 0.4428159856557846, + 0.45073776305913926, + 0.440414612865448, + 0.438992391872406, + 0.44469812307357787, + 0.4330620062351227, + 0.44552071504592894 + ], + "term_loss": [ + 1.6042461963653565, + 0.5282565028190612, + 0.5590828673362732, + 0.47629781847000124, + 0.3978954189300537, + 0.3636821876525879, + 0.4072596705198288, + 0.3282800791442394, + 0.32510876396894456, + 0.4085556797027588, + 0.5720677609920501, + 0.38465584144592285, + 0.47195274906158446, + 0.5482156983375549, + 0.5044927421092987, + 0.49531292711496355, + 0.5535180912971497, + 0.928170532798767, + 0.5174768854379654, + 0.6144302132129669, + 0.7212574210643768, + 0.556490356349945, + 0.7165425998687744, + 0.7060825702667236, + 0.6239088512420654, + 0.9418239488124848, + 0.8416530807495117, + 0.8893139802455902, + 0.851651100063324, + 1.0026947542667388, + 0.7173096209526062, + 0.7091760641098023, + 0.5505894849777222, + 0.5145378706932068, + 0.4895065601348877, + 0.36691248669624327, + 0.3942630385398865, + 0.3903921950340271, + 0.35521844633817673, + 0.33440421884059907, + 0.36932155704498293, + 0.45691595553159714, + 0.4697963525772095, + 0.522415696144104, + 0.4547668980836868, + 0.4589268930077553, + 0.42205919748544696, + 0.3977071187138557, + 0.42937303175926206, + 0.41034482958316804, + 0.3034935749053955, + 0.3259772541999817, + 0.3256353075265884, + 0.3720514593601227, + 0.3364347091197967, + 0.2779531095802784, + 0.2669277866601944, + 0.33009841556549074, + 0.2530543705701828, + 0.24142619206905366, + 0.35455005407333373, + 0.26008426011800767, + 0.25793272792994976, + 0.23912566680461167, + 0.2228550751209259, + 0.21906529731750488, + 0.2285044935464859, + 0.19956185779571534, + 0.1911724850535393, + 0.16786679723262787, + 0.18276870269179343, + 0.18051835017204285, + 0.19217048416137694, + 0.16508175657987595, + 0.17382024183571337, + 0.16160465959310533, + 0.16125739208459855, + 0.1634468115568161, + 0.15457683594822882, + 0.1639193995475769 + ], + "bridge_loss": [ + 0.9688761974389432, + 0.09757226877212524, + 0.012632294435054064, + 0.006896629202365875, + 0.016848481428623198, + 0.02207008745521307, + 0.022640679097175598, + 0.017478782982379197, + 0.010638495054841041, + 0.0098322123169899, + 0.011913983760774136, + 0.00792585155069828, + 0.009292545095086098, + 0.009518902608752251, + 0.008932905950024723, + 0.009623992730677128, + 0.010149495212733745, + 0.01872984848022461, + 0.014103599740564823, + 0.012476106625795364, + 0.021234536376595496, + 0.015649695736169814, + 0.018796107818186282, + 0.017918908199667932, + 0.01956285170018673, + 0.02622278172969818, + 0.026339271712303162, + 0.020386182287335394, + 0.023761410945653916, + 0.027614238518476487, + 0.02414468483030796, + 0.023320833349227906, + 0.012906089831888675, + 0.01244986510872841, + 0.014011499826610088, + 0.014019607320427894, + 0.016671525955200196, + 0.020415333633124828, + 0.022233861681073903, + 0.02509751079156995, + 0.02855886407494545, + 0.03512386602535844, + 0.03239926918745041, + 0.03483687193393707, + 0.02414971941784024, + 0.021885205315425992, + 0.023786303965747355, + 0.01902258104905486, + 0.027144915854930878, + 0.021862186920642852, + 0.019822580271959305, + 0.02127928227558732, + 0.023540232962369918, + 0.024526968252658845, + 0.021736864572763442, + 0.022946330963075162, + 0.017184075573086738, + 0.02062335392832756, + 0.018120812475681303, + 0.015307850694656372, + 0.023829158449172973, + 0.018856425175070763, + 0.018164710475504397, + 0.01771858846768737, + 0.01473103111088276, + 0.013859573656320573, + 0.014396251887083053, + 0.012541232538223267, + 0.011693280148506164, + 0.011579178339242935, + 0.012598556798696517, + 0.014540255971252919, + 0.01518781537413597, + 0.01615833755284548, + 0.015597678692266345, + 0.018065750354528426, + 0.017838929241895677, + 0.02107308625280857, + 0.01863815703690052, + 0.022096455523371698 + ], + "tgrad_loss": [ + 0.3024426766872406, + 0.26760040110349653, + 0.19261146736145018, + 0.15798504416942596, + 0.13912039029598236, + 0.12435259215831757, + 0.12544673397541045, + 0.1233829214334488, + 0.12724055438041687, + 0.1374789370059967, + 0.15872892727851867, + 0.14412552337646484, + 0.15059907083511354, + 0.16241564388275145, + 0.15680248302221297, + 0.16359038968086242, + 0.17298557314872742, + 0.21305938571691513, + 0.16396834471225738, + 0.1859930724620819, + 0.1976847105026245, + 0.1638680607318878, + 0.1893981406211853, + 0.2126276472568512, + 0.20732428936958314, + 0.23380364923477173, + 0.21916499223709107, + 0.22728701264858245, + 0.2164064181804657, + 0.2355296877384186, + 0.23228821861743926, + 0.23884190742969513, + 0.24680728578567504, + 0.24199310512542724, + 0.2506087215423584, + 0.2369241587638855, + 0.24433795733451844, + 0.2405263027191162, + 0.2554032007455826, + 0.25242412157058713, + 0.2600054337501526, + 0.26833617506027224, + 0.2709893661499023, + 0.2809129590988159, + 0.27647859499454497, + 0.275464682662487, + 0.27850080614089967, + 0.27471575455665587, + 0.2721832049369812, + 0.27576433696746827, + 0.2717041887283325, + 0.2717740647315979, + 0.27150033550262453, + 0.2775353482723236, + 0.2801086558818817, + 0.27807693454027177, + 0.2790536849021912, + 0.27993348541259766, + 0.2819618251562119, + 0.2768707938671112, + 0.2813425661563873, + 0.2813366662502289, + 0.2739545676112175, + 0.2726449445486069, + 0.2716892107963562, + 0.26935181140899656, + 0.2712896113157272, + 0.2667205859661102, + 0.2654070652484894, + 0.26564114809036254, + 0.2640623729944229, + 0.26316985001564025, + 0.26342742853164675, + 0.26157588943243026, + 0.26131984198093416, + 0.26074419956207273, + 0.2598960707902908, + 0.26017822399139406, + 0.25984701359272006, + 0.2595048580646515 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.021101564168930054, + 0.1092284768819809, + 0.14931762218475342, + 0.16334021091461182 + ], + "perturbation_rho": [ + 0.026919251307845116, + 0.23688018321990967, + 0.28421375155448914, + 0.2676014304161072 + ], + "nudging": { + "0.001": [ + -0.0008864067494869232, + -0.0009627565741539001, + -0.0012677897466346622, + -0.001255445065908134 + ], + "0.003": [ + -0.0026319557800889015, + -0.0028857083525508642, + -0.003800811246037483, + -0.0037655923515558243 + ], + "0.01": [ + -0.008425744250416756, + -0.009595570154488087, + -0.012630455195903778, + -0.012512242421507835 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L4_s42.json b/results/synth_ladder_v2_lo/synth_a0.25_L4_s42.json new file mode 100644 index 0000000..ec28849 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L4_s42.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.453296373653412, + 0.4953095598220825, + 0.34828554306030274, + 0.34110426716804504, + 0.27771372408866885, + 0.2927352352142334, + 0.2706843049049377, + 0.3097882106781006, + 0.26225770044326785, + 0.25132905864715577, + 0.25332398891448976, + 0.2514034366607666, + 0.21332003959417342, + 0.1936976969242096, + 0.2505925059080124, + 0.20892606778144837, + 0.2087661534309387, + 0.20852603862285615, + 0.18916085431575774, + 0.1735510662317276, + 0.17585254753828047, + 0.1600837320804596, + 0.184162171459198, + 0.1619161043167114, + 0.18675716395378114, + 0.15804585781097413, + 0.16049944838285446, + 0.14615878117084502, + 0.13879444608688354, + 0.15593961148262023, + 0.1475718964099884, + 0.1584999119758606, + 0.16021934352219105, + 0.11994385460615158, + 0.11137195901870728, + 0.1309328990459442, + 0.11823977715969086, + 0.12014036464691162, + 0.11413699101507664, + 0.09933694800138473, + 0.10369804172515869, + 0.1288715265393257, + 0.10965070486068726, + 0.10025272550582885, + 0.09632523136138917, + 0.09258691647052765, + 0.09523829494118691, + 0.0850349404335022, + 0.09242999118566513, + 0.08526616468429565, + 0.0841564024925232, + 0.08719563089609146, + 0.07787569234371185, + 0.07688848695755005, + 0.07261240689754486, + 0.07009156805276871, + 0.06769767506122588, + 0.06889801435470581, + 0.06692594285011291, + 0.06540395164489746, + 0.06442964359521866, + 0.06337919898033142, + 0.06439190024137496, + 0.061882001066207885, + 0.0627123805642128, + 0.06019558189511299, + 0.05877050402164459, + 0.05892564465999603, + 0.05775531235933304, + 0.057336541628837584, + 0.05673237580060959, + 0.056307577848434445, + 0.05571542314887047, + 0.055296688014268874, + 0.055058483922481534, + 0.05481614050865173, + 0.054657079005241395, + 0.054507050532102586, + 0.054425559097528456, + 0.05437098300457001 + ], + "train_acc": [ + 0.521, + 0.8342, + 0.8734, + 0.8655, + 0.8922, + 0.884, + 0.8912, + 0.8784, + 0.8991, + 0.8983, + 0.9004, + 0.8998, + 0.9154, + 0.9258, + 0.9031, + 0.9158, + 0.9142, + 0.9177, + 0.9273, + 0.9349, + 0.932, + 0.9401, + 0.9262, + 0.9358, + 0.9253, + 0.9406, + 0.9371, + 0.9434, + 0.9492, + 0.9411, + 0.943, + 0.9396, + 0.9373, + 0.9596, + 0.9637, + 0.9514, + 0.9583, + 0.9562, + 0.959, + 0.967, + 0.9641, + 0.9512, + 0.961, + 0.9657, + 0.9694, + 0.9709, + 0.9696, + 0.9747, + 0.9695, + 0.974, + 0.9761, + 0.9749, + 0.9795, + 0.9789, + 0.9826, + 0.9832, + 0.986, + 0.9848, + 0.9866, + 0.9868, + 0.9877, + 0.9874, + 0.9867, + 0.9887, + 0.9889, + 0.9905, + 0.991, + 0.9897, + 0.9917, + 0.992, + 0.9922, + 0.9927, + 0.9928, + 0.9936, + 0.9933, + 0.9932, + 0.9936, + 0.9937, + 0.9935, + 0.9936 + ], + "test_acc": [ + 0.783, + 0.8685, + 0.8705, + 0.8805, + 0.8855, + 0.8775, + 0.8805, + 0.8805, + 0.883, + 0.8825, + 0.883, + 0.8885, + 0.8955, + 0.8915, + 0.8905, + 0.893, + 0.895, + 0.9, + 0.8935, + 0.902, + 0.9075, + 0.903, + 0.9015, + 0.903, + 0.896, + 0.899, + 0.904, + 0.905, + 0.905, + 0.903, + 0.9065, + 0.908, + 0.9055, + 0.914, + 0.907, + 0.909, + 0.9125, + 0.9045, + 0.907, + 0.9065, + 0.9105, + 0.9005, + 0.914, + 0.909, + 0.915, + 0.908, + 0.9105, + 0.9155, + 0.9055, + 0.9145, + 0.909, + 0.91, + 0.9105, + 0.911, + 0.9155, + 0.9125, + 0.9165, + 0.913, + 0.9105, + 0.913, + 0.911, + 0.91, + 0.912, + 0.9125, + 0.9155, + 0.9145, + 0.9135, + 0.9125, + 0.9115, + 0.9115, + 0.912, + 0.9115, + 0.9115, + 0.9115, + 0.911, + 0.9115, + 0.911, + 0.911, + 0.911, + 0.911 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.868922770023346, + 0.8429951667785645, + 0.8289605379104614, + 0.8231275081634521 + ], + "perturbation_rho": [ + 0.999998927116394, + 0.9999972581863403, + 0.9999882578849792, + 0.9999451637268066 + ], + "nudging": { + "0.001": [ + -0.029291702434420586, + -0.013265937566757202, + -0.0059385779313743114, + -0.0030764099210500717 + ], + "0.003": [ + -0.0787585899233818, + -0.03797435015439987, + -0.017459016293287277, + -0.009135493077337742 + ], + "0.01": [ + -0.17674864828586578, + -0.10683682560920715, + -0.05415143817663193, + -0.029372699558734894 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.2496918357849123, + 1.3387847526550294, + 0.7445953012466431, + 0.5398363877296448, + 0.44195732192993165, + 0.406708620595932, + 0.3705522078037262, + 0.37765975799560547, + 0.3639752985954285, + 0.3892137159347534, + 0.3852337788581848, + 0.4254111849784851, + 0.38780576059818267, + 0.41569334573745725, + 0.4350270037651062, + 0.43129599609375, + 0.44781311664581297, + 0.47839186553955076, + 0.48407614097595214, + 0.45144308986663817, + 0.5073113049447536, + 0.48227315073013305, + 0.5290714904785156, + 0.45285613021850585, + 0.4874774526119232, + 0.46561420321464536, + 0.43761558775901793, + 0.45178383803367617, + 0.43797643756866456, + 0.5157751927137375, + 0.4519074549674988, + 0.5198216260910035, + 0.47095790967941287, + 0.45483838151693345, + 0.44220186512470244, + 0.49421512649059296, + 0.5017378551483155, + 0.4660479995489121, + 0.41283108919858935, + 0.4158671610355377, + 0.42750406036376953, + 0.5042367227554321, + 0.47434177494049073, + 0.5477551186561584, + 0.43455731093883515, + 0.4315849390029907, + 0.4076690737605095, + 0.392881183385849, + 0.3990067440032959, + 0.3904748822212219, + 0.37085895271301267, + 0.40754292578697204, + 0.39559432973861697, + 0.3863873209953308, + 0.37049336433410646, + 0.36953919867277146, + 0.36928157291412356, + 0.40962127685546873, + 0.3643629170656204, + 0.3515832754135132, + 0.3692568906784058, + 0.3748962776184082, + 0.3622305648565292, + 0.34127199211120607, + 0.3452877820730209, + 0.3349293503880501, + 0.33011303119659424, + 0.3349422814369202, + 0.3320218985080719, + 0.3275007127761841, + 0.3277460176587105, + 0.32419858107566835, + 0.3230124948501587, + 0.32022189517021177, + 0.3179460354447365, + 0.31657396450042724, + 0.3161927330970764, + 0.3148143844127655, + 0.31444183547496796, + 0.3140971690177917 + ], + "train_acc": [ + 0.1757, + 0.5378, + 0.7229, + 0.7943, + 0.8272, + 0.8416, + 0.8544, + 0.8553, + 0.8624, + 0.859, + 0.8615, + 0.8498, + 0.8606, + 0.8573, + 0.8553, + 0.8551, + 0.8531, + 0.8525, + 0.8513, + 0.8535, + 0.8483, + 0.8558, + 0.8419, + 0.8546, + 0.852, + 0.8583, + 0.8637, + 0.8581, + 0.8621, + 0.848, + 0.8602, + 0.8478, + 0.8558, + 0.859, + 0.8595, + 0.8528, + 0.8544, + 0.8592, + 0.8692, + 0.8682, + 0.8691, + 0.8536, + 0.8621, + 0.8432, + 0.8668, + 0.8678, + 0.8758, + 0.8798, + 0.877, + 0.8799, + 0.8825, + 0.8738, + 0.8764, + 0.8796, + 0.8844, + 0.8804, + 0.8812, + 0.8732, + 0.8853, + 0.888, + 0.8859, + 0.8828, + 0.8854, + 0.8884, + 0.8882, + 0.8911, + 0.89, + 0.8878, + 0.8907, + 0.8914, + 0.893, + 0.8949, + 0.8946, + 0.8942, + 0.8967, + 0.8948, + 0.8971, + 0.8967, + 0.8965, + 0.8966 + ], + "test_acc": [ + 0.3575, + 0.648, + 0.7465, + 0.787, + 0.8045, + 0.817, + 0.82, + 0.822, + 0.8115, + 0.8225, + 0.786, + 0.821, + 0.81, + 0.7845, + 0.8205, + 0.826, + 0.8265, + 0.7955, + 0.8305, + 0.802, + 0.809, + 0.784, + 0.8185, + 0.805, + 0.824, + 0.822, + 0.802, + 0.808, + 0.8, + 0.8025, + 0.7915, + 0.803, + 0.81, + 0.8055, + 0.7815, + 0.8075, + 0.8135, + 0.813, + 0.8385, + 0.814, + 0.792, + 0.81, + 0.811, + 0.8125, + 0.8125, + 0.8265, + 0.833, + 0.8445, + 0.8385, + 0.8405, + 0.838, + 0.84, + 0.8335, + 0.847, + 0.841, + 0.8385, + 0.8335, + 0.848, + 0.843, + 0.8465, + 0.8445, + 0.8415, + 0.8445, + 0.8455, + 0.8475, + 0.8515, + 0.85, + 0.8505, + 0.8505, + 0.852, + 0.8505, + 0.851, + 0.8495, + 0.8515, + 0.8495, + 0.8515, + 0.8505, + 0.8515, + 0.851, + 0.8515 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.006489354185760021, + 0.12851163744926453, + 0.11991241574287415, + 0.11389133334159851 + ], + "perturbation_rho": [ + 0.029786743223667145, + 0.18639126420021057, + 0.11502038687467575, + 0.06601984798908234 + ], + "nudging": { + "0.001": [ + -0.0010971444426104426, + -0.0006575186271220446, + -0.0003536626463755965, + -0.00032158708199858665 + ], + "0.003": [ + -0.003264155238866806, + -0.0019673758652061224, + -0.0010591265745460987, + -0.0009630966233089566 + ], + "0.01": [ + -0.01056693121790886, + -0.006519604474306107, + -0.003515135496854782, + -0.003202090272679925 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8671920738220216, + 0.8245958818435669, + 0.47314112768173217, + 0.45674627771377563, + 0.4969047926664352, + 0.6115808282852173, + 0.7014055969238281, + 0.7080811479568482, + 0.7012172104358673, + 0.6735383527755737, + 0.649971604347229, + 0.6521630270957947, + 0.6687821681022644, + 0.6728867406845093, + 0.7074090370178223, + 0.698468556690216, + 0.7291404920578003, + 0.7727017598628998, + 0.7500046424865723, + 0.8085200922012329, + 0.779546489238739, + 0.801387744808197, + 0.7530522830963134, + 0.8084568103790283, + 0.8122323418617249, + 0.7676459170341492, + 0.7385737422943115, + 0.7743796340942383, + 0.791342021369934, + 0.7538952941894531, + 0.7233746746063232, + 0.7027450902938843, + 0.6739716813087463, + 0.6575725811958313, + 0.657341569519043, + 0.6534057109832764, + 0.6632411510944366, + 0.6651172963142395, + 0.6753239694595337, + 0.6706813243865967, + 0.6627065504074097, + 0.6668087734222412, + 0.6758873833417892, + 0.6484876903533936, + 0.6945558298110962, + 0.6871001857757568, + 0.6978039226531982, + 0.7010440427780151, + 0.7184338994979859, + 0.7164405530929565, + 0.6952354438781738, + 0.7032188013076782, + 0.7004193035125732, + 0.6734662980079651, + 0.6810175803661347, + 0.677333201789856, + 0.6784080492973328, + 0.6712752502441406, + 0.6656309762001038, + 0.6615614066123963, + 0.660873606300354, + 0.6580983083724976, + 0.6578487804412841, + 0.6565888023853302, + 0.6494241165161133, + 0.6526647891044617, + 0.6507426448822021, + 0.6518581859588624, + 0.653467121887207, + 0.6535044790267944, + 0.6530143226623535, + 0.6528809313774109, + 0.6519273241043091, + 0.6527892800331115, + 0.6520682262420654, + 0.6511607341766358, + 0.6508296747207641, + 0.650347448348999, + 0.6499623192787171, + 0.6497791537284852 + ], + "train_acc": [ + 0.3296, + 0.6941, + 0.8187, + 0.8252, + 0.8134, + 0.7893, + 0.7615, + 0.7534, + 0.7544, + 0.7589, + 0.7658, + 0.7632, + 0.7625, + 0.7609, + 0.7468, + 0.7618, + 0.7486, + 0.738, + 0.7459, + 0.73, + 0.7423, + 0.7321, + 0.7396, + 0.72, + 0.7227, + 0.7321, + 0.7446, + 0.7334, + 0.7344, + 0.7427, + 0.7491, + 0.7572, + 0.7686, + 0.7738, + 0.7677, + 0.7726, + 0.7698, + 0.7665, + 0.7646, + 0.76, + 0.7638, + 0.7633, + 0.7614, + 0.7672, + 0.755, + 0.7548, + 0.7577, + 0.759, + 0.7567, + 0.754, + 0.7634, + 0.7608, + 0.761, + 0.7743, + 0.7697, + 0.7705, + 0.772, + 0.7749, + 0.7764, + 0.7771, + 0.7775, + 0.7809, + 0.7773, + 0.7794, + 0.7836, + 0.7779, + 0.7812, + 0.7804, + 0.7813, + 0.781, + 0.78, + 0.7802, + 0.7855, + 0.7835, + 0.7826, + 0.7841, + 0.783, + 0.7847, + 0.7848, + 0.7848 + ], + "test_acc": [ + 0.5685, + 0.758, + 0.8165, + 0.805, + 0.777, + 0.7565, + 0.74, + 0.7235, + 0.723, + 0.7415, + 0.7465, + 0.7215, + 0.719, + 0.711, + 0.711, + 0.7105, + 0.6965, + 0.713, + 0.6995, + 0.7195, + 0.6795, + 0.708, + 0.679, + 0.66, + 0.664, + 0.711, + 0.7055, + 0.679, + 0.704, + 0.7085, + 0.704, + 0.713, + 0.715, + 0.7205, + 0.7155, + 0.7205, + 0.7165, + 0.702, + 0.719, + 0.717, + 0.7165, + 0.7065, + 0.7285, + 0.7165, + 0.7145, + 0.7105, + 0.7125, + 0.705, + 0.7095, + 0.7115, + 0.7205, + 0.714, + 0.721, + 0.724, + 0.726, + 0.7275, + 0.7335, + 0.732, + 0.734, + 0.727, + 0.7265, + 0.7305, + 0.7375, + 0.732, + 0.7325, + 0.7375, + 0.7365, + 0.7325, + 0.736, + 0.7335, + 0.74, + 0.7395, + 0.7355, + 0.735, + 0.738, + 0.7345, + 0.7375, + 0.737, + 0.7385, + 0.738 + ], + "state_pred_error": [ + 0.7487808745384217, + 0.24732994434833527, + 0.17313961231708527, + 0.16168231008052825, + 0.17035679717063903, + 0.18103363909721373, + 0.18245853021144867, + 0.17743719387054444, + 0.17188244462013244, + 0.16246572191715242, + 0.15361685829162597, + 0.14225484938621522, + 0.1289559740781784, + 0.11635132092237473, + 0.10436125522851944, + 0.09599733033180237, + 0.08721809136271477, + 0.08110790919065475, + 0.0771063295006752, + 0.07525849696397781, + 0.07354050797224045, + 0.0688812373816967, + 0.06121735058426857, + 0.04916935938000679, + 0.03849249759912491, + 0.032670543703436854, + 0.03231753547489643, + 0.03378260580301285, + 0.034706774830818174, + 0.03332062679231167, + 0.031204309898614883, + 0.028909587877988814, + 0.02718178628385067, + 0.025115732821822168, + 0.022915556079149246, + 0.020764808982610704, + 0.018696666319668293, + 0.017864737275242806, + 0.01723333814740181, + 0.016962407499551774, + 0.017021035474538804, + 0.01716751972436905, + 0.017350809542834758, + 0.017860741698741914, + 0.018610822199285032, + 0.019769935327768325, + 0.02077203135192394, + 0.022067637622356414, + 0.022644061627984047, + 0.023021951377391815, + 0.024246234822273255, + 0.02352409240603447, + 0.023992977035045625, + 0.023878568160533905, + 0.02291360137462616, + 0.022536616253852844, + 0.022139397828280925, + 0.021314597645401955, + 0.02067878492474556, + 0.02007001314163208, + 0.019347347635030748, + 0.019004285940527915, + 0.01821923423111439, + 0.01792956632822752, + 0.01759405211508274, + 0.017176553043723106, + 0.016862381353974342, + 0.016874016273021698, + 0.016504883515834807, + 0.016086394381523133, + 0.015596509897708893, + 0.015838253927230834, + 0.014799859385192394, + 0.014545651116967201, + 0.014143282814323902, + 0.01395568735897541, + 0.013814397670328616, + 0.013369649396836757, + 0.013002270936965942, + 0.012713338199257851 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8448630571365356, + 0.4407959580421448, + 0.15707260370254517, + 0.14386749267578125 + ], + "perturbation_rho": [ + 0.7033247947692871, + 0.34020179510116577, + 0.13395404815673828, + 0.1692604124546051 + ], + "nudging": { + "0.001": [ + -0.024531232193112373, + -0.001812139991670847, + -0.0004901132197119296, + -0.0004392624250613153 + ], + "0.003": [ + -0.07187046855688095, + -0.005427503027021885, + -0.0014687320217490196, + -0.001316926209256053 + ], + "0.01": [ + -0.2203540802001953, + -0.01797248050570488, + -0.004883656278252602, + -0.004377881996333599 + ] + }, + "state_pred_error_per_layer": [ + 3192.55322265625, + 2613.6337890625, + 1881.11669921875, + 2102.51953125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2491588119506836, + 1.3391401213645935, + 0.7448139661788941, + 0.529046625328064, + 0.4409893859386444, + 0.39295122833251955, + 0.3917396518230438, + 0.3638893904685974, + 0.3780584011077881, + 0.4088036222457886, + 0.3839244392633438, + 0.3965308126449585, + 0.4332325538396835, + 0.388488942027092, + 0.3860952439308166, + 0.4289595764160156, + 0.558712983417511, + 0.4192588807106018, + 0.5468189309835434, + 0.4735720682144165, + 0.5481147343516349, + 0.5364306289672851, + 0.6400549737930298, + 0.6401411312103271, + 0.6521704914093017, + 0.6980661613464355, + 0.7174948001861572, + 0.7452107217788696, + 0.7168677276611328, + 0.6955249413490295, + 0.6813755706787109, + 0.8467616846561432, + 0.7442628755569458, + 0.7809717464447021, + 0.835019677734375, + 0.9415380798339844, + 0.8470349615097046, + 0.9357274827957154, + 0.956027186203003, + 0.978194040107727, + 0.9993384301662445, + 1.0430794897079467, + 1.1107125093460084, + 1.0457960997581481, + 1.0835725379943848, + 1.0907151245117188, + 1.0002957998275757, + 1.007777456665039, + 0.9944101539611816, + 1.0391859111785888, + 0.9873703357696533, + 0.9624767935752868, + 0.9792510041236877, + 0.9836898254394532, + 0.9538689140319824, + 0.9946584331512451, + 0.9380921537399292, + 0.956259532213211, + 0.9596250736236572, + 0.94606699924469, + 0.9452685148239136, + 0.923868314743042, + 0.9321948112487793, + 0.9432626096725464, + 0.9381357315063477, + 0.9209384853363037, + 0.9391128986358642, + 0.9220459381103515, + 0.9200671195983887, + 0.9224453427314758, + 0.9143399673461914, + 0.9111755439758301, + 0.9145837394714356, + 0.9098482831001282, + 0.9112333339691162, + 0.9066373474121093, + 0.9067055240631103, + 0.9056244029521943, + 0.9049024011611938, + 0.9045989236831665 + ], + "train_acc": [ + 0.1799, + 0.5387, + 0.723, + 0.7962, + 0.8291, + 0.8477, + 0.8498, + 0.858, + 0.858, + 0.8495, + 0.8613, + 0.8581, + 0.8493, + 0.8637, + 0.8632, + 0.8572, + 0.8381, + 0.8665, + 0.8471, + 0.8543, + 0.8367, + 0.8369, + 0.8172, + 0.818, + 0.8175, + 0.8022, + 0.7871, + 0.78, + 0.7818, + 0.7836, + 0.7796, + 0.744, + 0.7563, + 0.7468, + 0.7334, + 0.7137, + 0.7236, + 0.7024, + 0.6963, + 0.6912, + 0.6787, + 0.6719, + 0.6558, + 0.6645, + 0.6544, + 0.654, + 0.6685, + 0.6631, + 0.6676, + 0.6645, + 0.6706, + 0.6704, + 0.6689, + 0.6688, + 0.6777, + 0.6677, + 0.6782, + 0.6754, + 0.6743, + 0.68, + 0.6768, + 0.6807, + 0.68, + 0.6778, + 0.6792, + 0.6783, + 0.6767, + 0.6821, + 0.6798, + 0.6832, + 0.6829, + 0.6852, + 0.6792, + 0.6853, + 0.6818, + 0.6858, + 0.6824, + 0.6836, + 0.6832, + 0.6832 + ], + "test_acc": [ + 0.3585, + 0.657, + 0.742, + 0.783, + 0.8185, + 0.8245, + 0.8105, + 0.817, + 0.812, + 0.824, + 0.812, + 0.8105, + 0.8235, + 0.8105, + 0.799, + 0.819, + 0.813, + 0.819, + 0.821, + 0.788, + 0.812, + 0.767, + 0.7685, + 0.7705, + 0.7635, + 0.756, + 0.7595, + 0.738, + 0.7195, + 0.7505, + 0.6595, + 0.699, + 0.6885, + 0.6555, + 0.6185, + 0.6805, + 0.685, + 0.6495, + 0.653, + 0.661, + 0.627, + 0.5955, + 0.6305, + 0.6025, + 0.57, + 0.646, + 0.6375, + 0.6485, + 0.6105, + 0.65, + 0.642, + 0.651, + 0.64, + 0.646, + 0.6565, + 0.6655, + 0.6555, + 0.6525, + 0.6325, + 0.655, + 0.6445, + 0.6625, + 0.652, + 0.66, + 0.665, + 0.6605, + 0.6505, + 0.6465, + 0.6585, + 0.6555, + 0.6575, + 0.663, + 0.6575, + 0.6575, + 0.662, + 0.6565, + 0.6605, + 0.661, + 0.662, + 0.662 + ], + "value_loss": [ + 2.8136747930526735, + 0.8132589956283569, + 0.7441051291465759, + 0.5935244509220123, + 0.5305544801712037, + 0.4809351634979248, + 0.5323177522659301, + 0.4937599531173706, + 0.5660051969528198, + 0.6462191902160644, + 0.5763734079837799, + 0.6280713613510132, + 0.7948557285785675, + 0.6167353689074516, + 0.6312321287155152, + 0.7788636138916015, + 1.24904136428833, + 0.8144484006881714, + 1.2646914062023162, + 0.9913992839813233, + 1.2167877242982388, + 1.1537877170562745, + 1.4896245155334473, + 1.4209841236591338, + 1.4288050296783448, + 1.5737432616233826, + 1.472049324798584, + 1.3558264159202575, + 1.2634898232460021, + 1.0622564476013183, + 0.9087878711700439, + 1.2522220923423768, + 0.8374090339660645, + 0.8644590536117553, + 0.9108287329673768, + 1.0323113090515137, + 0.7954086130142212, + 0.9589143196105957, + 0.9973226028442382, + 0.8696648183345794, + 0.9279479406356812, + 0.9467850358963013, + 0.9611213340044021, + 0.8860973155975341, + 0.9274569381713867, + 0.8928450954437256, + 0.7761943910598755, + 0.7452224809646606, + 0.7111061507225037, + 0.9079251007080078, + 0.7042157987594605, + 0.6186297750473022, + 0.6579183887004852, + 0.650217645072937, + 0.6726008516311646, + 0.7288588707923889, + 0.5969251877784729, + 0.6327752158164978, + 0.6609377601623535, + 0.6041857168197632, + 0.5917840515613556, + 0.5548734745502472, + 0.5744958362579345, + 0.5927253926277161, + 0.567703023815155, + 0.5330746456623078, + 0.5393640619277954, + 0.536778436088562, + 0.5437427759170532, + 0.5154631103515624, + 0.5084992980957032, + 0.5075871801376343, + 0.4997114695072174, + 0.4929317692756653, + 0.4871681167125702, + 0.5004887029647828, + 0.4816018688201904, + 0.4893035494327545, + 0.4769497550010681, + 0.5039997359514237 + ], + "term_loss": [ + 1.632562749004364, + 0.48681144256591796, + 0.5579757928848267, + 0.4446354372739792, + 0.38954342555999755, + 0.33837572212219236, + 0.3827962197303772, + 0.3628402814865112, + 0.43823430774211886, + 0.5091175779342652, + 0.44919354333877565, + 0.49555663242340087, + 0.6545826898813247, + 0.484098217099905, + 0.503711657333374, + 0.6411246375083923, + 1.0730022660255432, + 0.6760020233631134, + 1.0891792623758316, + 0.8359037994384766, + 1.0395685426205397, + 0.9751200185298919, + 1.2764028619766234, + 1.2068148810386659, + 1.2142266105651855, + 1.3360229535579682, + 1.2316911418914795, + 1.10275178129673, + 1.0232205655097961, + 0.8254292141914368, + 0.6746950702667236, + 0.9630538293838501, + 0.5811431129455567, + 0.605120336163044, + 0.6237313741922379, + 0.7302495213985443, + 0.5120967150211334, + 0.6533307945251465, + 0.6705779426574707, + 0.5572913918495178, + 0.601477882862091, + 0.619995453453064, + 0.6235214290976524, + 0.5553061120986938, + 0.5913957936286927, + 0.5468049569010734, + 0.4478747470855713, + 0.41719899480342865, + 0.39799570727348327, + 0.5387198917388916, + 0.389376504611969, + 0.3186599224090576, + 0.349000741147995, + 0.344887624168396, + 0.36766607322692874, + 0.40503488359451295, + 0.2990953638792038, + 0.3293440096095204, + 0.3466704918861389, + 0.30466876001358034, + 0.2939660704612732, + 0.2598868667215109, + 0.277480362701416, + 0.2899700213432312, + 0.26971954430937767, + 0.23886673400998115, + 0.24062761631011964, + 0.2402403997540474, + 0.24415884652137756, + 0.2247240812778473, + 0.21601913204193116, + 0.21670277047157288, + 0.20699720672369004, + 0.20146363933086395, + 0.19528962482213974, + 0.20751085200309755, + 0.1899980792403221, + 0.19427047532498837, + 0.1858817045211792, + 0.20441836426854135 + ], + "bridge_loss": [ + 0.8866691899295722, + 0.08224999148249626, + 0.010757447761297226, + 0.0061791808307170865, + 0.013211339366436004, + 0.02400260500907898, + 0.029208013555407523, + 0.016411626595258712, + 0.01054288158416748, + 0.009739568059891462, + 0.00857815499957651, + 0.010147648680210114, + 0.012416441324353218, + 0.013030582279339432, + 0.011700151482224464, + 0.012999499094486236, + 0.027916341756284237, + 0.016938312309980393, + 0.025221791119873525, + 0.020558533179759978, + 0.024548026264831425, + 0.02883436657488346, + 0.041062966972589494, + 0.04241552077531815, + 0.0413472350358963, + 0.053113183903694156, + 0.049302950567007064, + 0.05605897057652474, + 0.04239914432168007, + 0.04438741339594126, + 0.040503136277198794, + 0.05868587039113045, + 0.044476384896039965, + 0.03979057075381279, + 0.04996331431865692, + 0.04867027699947357, + 0.04424825751781464, + 0.048844764399528506, + 0.06250892872810364, + 0.043231787598133085, + 0.05235229188203812, + 0.044943358480930326, + 0.04317686275988817, + 0.04893158612549305, + 0.04527283647060394, + 0.052477565068006514, + 0.04906891460418701, + 0.04816573285460472, + 0.03766437851190567, + 0.08414143166542053, + 0.03915382572412491, + 0.028718653923273087, + 0.0357290733397007, + 0.030860403615236284, + 0.034851776957511904, + 0.04384376324117184, + 0.031289697197079656, + 0.03198159513771534, + 0.04347437092065811, + 0.031240173679590224, + 0.029294288346171378, + 0.030716246968507766, + 0.030886165726184845, + 0.034454310005903245, + 0.029435836976766588, + 0.030154093551635744, + 0.031540098917484286, + 0.032152002370357514, + 0.03537253759801388, + 0.026627822160720824, + 0.029674778524041177, + 0.02880360425710678, + 0.030208065378665924, + 0.029887308536469936, + 0.02994157576560974, + 0.03245688362717628, + 0.030067061227560043, + 0.03423906381428242, + 0.030539594569802285, + 0.03893857387006283 + ], + "tgrad_loss": [ + 0.2944428525924683, + 0.2441975613117218, + 0.17537188875675203, + 0.14270983247756958, + 0.12779971356391906, + 0.11855683698654175, + 0.12031352219581604, + 0.1145080406665802, + 0.11722800314426422, + 0.12736204500198364, + 0.11860171184539794, + 0.12236708498001099, + 0.12785659310817718, + 0.1196065666794777, + 0.11582032089233399, + 0.12473947501182556, + 0.14812274632453917, + 0.12150806620121002, + 0.15029035185575484, + 0.13493695669174194, + 0.152671147570014, + 0.1498333449602127, + 0.1721586901664734, + 0.17175372595787047, + 0.17323119621276856, + 0.18460711754560472, + 0.19105523586273193, + 0.19701567590236663, + 0.1978701251029968, + 0.19243981567621232, + 0.19358965730667113, + 0.23048239738941192, + 0.21178954000473021, + 0.21954814462661743, + 0.2371340503692627, + 0.25339151220321654, + 0.23906364424228668, + 0.2567387635707855, + 0.2642357376098633, + 0.26914163494110105, + 0.2741177690029144, + 0.2818462213039398, + 0.2944230457663536, + 0.2818596136331558, + 0.2907883113384247, + 0.2935625722646713, + 0.2792507260799408, + 0.2798577557086945, + 0.2754460638999939, + 0.28506377139091493, + 0.2756854686737061, + 0.27125119709968565, + 0.2731885812759399, + 0.2744696222305298, + 0.2700830017566681, + 0.2799802258014679, + 0.2665401251077652, + 0.2714496097326279, + 0.2707928934574127, + 0.26827678565979, + 0.2685236934185028, + 0.26427035608291627, + 0.26612931003570556, + 0.26830106143951415, + 0.26854763979911805, + 0.26405381517410276, + 0.267196342420578, + 0.2643860376358032, + 0.26421138830184937, + 0.2641112084388733, + 0.2628053893566132, + 0.26208080410957335, + 0.2625061942100525, + 0.2615808199882507, + 0.26193691883087156, + 0.26052096433639527, + 0.26153672609329226, + 0.2607940129995346, + 0.26052846012115477, + 0.26064279942512514 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.07093458622694016, + 0.19623729586601257, + 0.18378585577011108, + 0.18649986386299133 + ], + "perturbation_rho": [ + 0.14815130829811096, + 0.336488276720047, + 0.35506749153137207, + 0.3242703676223755 + ], + "nudging": { + "0.001": [ + -0.0034058368764817715, + -0.0015302924439311028, + -0.0013900859048590064, + -0.0013669544132426381 + ], + "0.003": [ + -0.010171962901949883, + -0.004587909206748009, + -0.0041659073904156685, + -0.004097048658877611 + ], + "0.01": [ + -0.033366985619068146, + -0.015239425003528595, + -0.013842864893376827, + -0.01361463125795126 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L4_s456.json b/results/synth_ladder_v2_lo/synth_a0.25_L4_s456.json new file mode 100644 index 0000000..a99f2a9 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L4_s456.json @@ -0,0 +1,1554 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.4280009566307068, + 0.4816410400390625, + 0.35641251850128175, + 0.31376885857582093, + 0.2785879302024841, + 0.2906965353012085, + 0.24813844954967498, + 0.2529641579627991, + 0.29037830834388734, + 0.24602493743896484, + 0.271309370470047, + 0.24193280544281007, + 0.21174109992980958, + 0.2022141403198242, + 0.19511151465177537, + 0.1747492593228817, + 0.16679265608787536, + 0.18226073577404023, + 0.178118130004406, + 0.1698817639350891, + 0.21180371685028077, + 0.22151261649131776, + 0.1692685513496399, + 0.15942963395118714, + 0.15639958801865578, + 0.13424310631752015, + 0.13393100074529649, + 0.1342959972321987, + 0.1233813103556633, + 0.1372558897972107, + 0.15687738795280456, + 0.15556601939201356, + 0.1386237049102783, + 0.12747760764360427, + 0.13082287336587906, + 0.12003014180660247, + 0.1110824688911438, + 0.11324274975061417, + 0.09755915361642838, + 0.09881812291145324, + 0.0983709388077259, + 0.08716794240474701, + 0.09951607349514961, + 0.08897512910366058, + 0.09945852316617966, + 0.08210971295237542, + 0.08215147442817688, + 0.09767722171843052, + 0.07982404861450196, + 0.08341489782333374, + 0.08445568187236786, + 0.07201690224409103, + 0.06894114913269878, + 0.06607745648026467, + 0.06452926009893417, + 0.06370570333003998, + 0.07323879662156105, + 0.06315056117884815, + 0.06021904794573784, + 0.05857481062412262, + 0.06132639021873474, + 0.05991591087579727, + 0.05866761998534203, + 0.0561151444196701, + 0.05675396573543549, + 0.05583441897928715, + 0.054332348388433455, + 0.05344627385139465, + 0.053293361806869506, + 0.05263606111109257, + 0.05185437820851803, + 0.05141058519482613, + 0.05099834645986557, + 0.0506766751408577, + 0.05050799320936203, + 0.050287041491270064, + 0.05010691736936569, + 0.04997352842092514, + 0.04987951598167419, + 0.04983126169741154 + ], + "train_acc": [ + 0.5303, + 0.8408, + 0.8692, + 0.8797, + 0.8918, + 0.8847, + 0.8988, + 0.9028, + 0.8848, + 0.9035, + 0.8886, + 0.9076, + 0.9163, + 0.919, + 0.9247, + 0.9325, + 0.936, + 0.9268, + 0.9308, + 0.9337, + 0.9165, + 0.912, + 0.9336, + 0.9374, + 0.9396, + 0.9515, + 0.9505, + 0.9497, + 0.9545, + 0.9492, + 0.9388, + 0.9385, + 0.9487, + 0.953, + 0.9536, + 0.9576, + 0.9612, + 0.9591, + 0.9682, + 0.9654, + 0.9665, + 0.973, + 0.9655, + 0.9697, + 0.9675, + 0.9764, + 0.9749, + 0.9655, + 0.9764, + 0.9743, + 0.9743, + 0.9809, + 0.9821, + 0.9841, + 0.9845, + 0.9855, + 0.98, + 0.9854, + 0.9889, + 0.989, + 0.9869, + 0.9883, + 0.9879, + 0.9902, + 0.9898, + 0.9906, + 0.9911, + 0.9918, + 0.9917, + 0.9921, + 0.9925, + 0.9929, + 0.9934, + 0.9941, + 0.994, + 0.9942, + 0.9945, + 0.9944, + 0.9942, + 0.9942 + ], + "test_acc": [ + 0.7945, + 0.8695, + 0.8905, + 0.8835, + 0.8885, + 0.892, + 0.88, + 0.883, + 0.881, + 0.9005, + 0.89, + 0.8905, + 0.897, + 0.9045, + 0.9025, + 0.8995, + 0.9025, + 0.9005, + 0.908, + 0.9035, + 0.894, + 0.8945, + 0.903, + 0.911, + 0.9075, + 0.911, + 0.9145, + 0.91, + 0.911, + 0.9065, + 0.9035, + 0.904, + 0.915, + 0.9095, + 0.911, + 0.9095, + 0.9115, + 0.9095, + 0.9175, + 0.9175, + 0.917, + 0.9115, + 0.914, + 0.913, + 0.907, + 0.9165, + 0.918, + 0.9145, + 0.9145, + 0.9175, + 0.915, + 0.913, + 0.9145, + 0.9215, + 0.916, + 0.9195, + 0.9215, + 0.9215, + 0.9185, + 0.919, + 0.921, + 0.919, + 0.9205, + 0.9185, + 0.9195, + 0.918, + 0.9195, + 0.918, + 0.9205, + 0.9195, + 0.9195, + 0.9185, + 0.92, + 0.918, + 0.919, + 0.92, + 0.9195, + 0.919, + 0.9185, + 0.9185 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8029586672782898, + 0.7900986075401306, + 0.7753629684448242, + 0.7581839561462402 + ], + "perturbation_rho": [ + 0.999998927116394, + 0.9999964237213135, + 0.999983549118042, + 0.9999468326568604 + ], + "nudging": { + "0.001": [ + -0.026280783116817474, + -0.012318434193730354, + -0.005662030540406704, + -0.002971941838040948 + ], + "0.003": [ + -0.07031507790088654, + -0.035108231008052826, + -0.016601495444774628, + -0.008812842890620232 + ], + "0.01": [ + -0.15638579428195953, + -0.09745092689990997, + -0.05102477967739105, + -0.028195563703775406 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.232069776535034, + 1.370755326461792, + 0.774408396434784, + 0.5504122185230255, + 0.4551778681755066, + 0.39543955364227296, + 0.3673446969985962, + 0.37010820665359495, + 0.40584990463256837, + 0.36630872459411623, + 0.3967540986061096, + 0.3843751923561096, + 0.4476522427558899, + 0.42575200576782224, + 0.42364864072799685, + 0.38030472977161406, + 0.4079951852798462, + 0.46959167435765264, + 0.4198760874271393, + 0.468362246465683, + 0.45476327400207517, + 0.5178915981292724, + 0.6004542631149292, + 0.5163716057777404, + 0.4734943875789642, + 0.5516410438537598, + 0.49744338874816896, + 0.46432403774261477, + 0.4892093751907349, + 0.6200435506820678, + 0.5751196828842163, + 0.5928933774709702, + 0.4814444019317627, + 0.5967060979366302, + 0.5415381860733032, + 0.4497476665496826, + 0.48320111837387086, + 0.5223149719312787, + 0.4452429738998413, + 0.5263340139627457, + 0.4467347893744707, + 0.4445894860267639, + 0.5922297267913819, + 0.4209597279548645, + 0.4198515675544739, + 0.4481225758552551, + 0.45345114040374757, + 0.4496061055518687, + 0.3991525866508484, + 0.4271981393814087, + 0.40415777770280836, + 0.4262519637107849, + 0.4017188970685005, + 0.38243411012291906, + 0.38553619861602784, + 0.38307219924926755, + 0.43748312458992006, + 0.3661682406932116, + 0.3464682363986969, + 0.3526681913375854, + 0.377327184009552, + 0.3567724729537964, + 0.37950509120225906, + 0.3511497905731201, + 0.36539844236373903, + 0.3426241901397705, + 0.3417411681175232, + 0.33409423093795776, + 0.3281999719619751, + 0.33597293905615805, + 0.32314492433071135, + 0.32010074100494385, + 0.3219986635684967, + 0.3155823324203491, + 0.3164848567008972, + 0.3139919088840485, + 0.3123295421615243, + 0.3108947002887726, + 0.31007582869529726, + 0.30983073345422746 + ], + "train_acc": [ + 0.1919, + 0.5317, + 0.7118, + 0.7954, + 0.8288, + 0.8488, + 0.8578, + 0.8594, + 0.8496, + 0.8626, + 0.855, + 0.8624, + 0.8463, + 0.8538, + 0.8558, + 0.8662, + 0.8636, + 0.8532, + 0.8616, + 0.8542, + 0.8592, + 0.8472, + 0.843, + 0.8527, + 0.8547, + 0.8479, + 0.8562, + 0.8623, + 0.8586, + 0.8466, + 0.8494, + 0.8489, + 0.8668, + 0.8461, + 0.8611, + 0.8737, + 0.867, + 0.8596, + 0.8767, + 0.8588, + 0.8748, + 0.8759, + 0.8555, + 0.8829, + 0.885, + 0.8748, + 0.8786, + 0.8778, + 0.8897, + 0.8793, + 0.8851, + 0.8811, + 0.885, + 0.8887, + 0.8917, + 0.8912, + 0.885, + 0.8906, + 0.8976, + 0.8989, + 0.8919, + 0.8952, + 0.8896, + 0.8976, + 0.8936, + 0.8974, + 0.8994, + 0.8992, + 0.9029, + 0.9, + 0.9028, + 0.9031, + 0.9044, + 0.9036, + 0.906, + 0.905, + 0.9046, + 0.906, + 0.9061, + 0.906 + ], + "test_acc": [ + 0.3785, + 0.6325, + 0.739, + 0.789, + 0.801, + 0.8095, + 0.826, + 0.813, + 0.8085, + 0.814, + 0.794, + 0.7895, + 0.7865, + 0.7875, + 0.815, + 0.825, + 0.83, + 0.802, + 0.7995, + 0.81, + 0.7955, + 0.799, + 0.7875, + 0.8035, + 0.7935, + 0.7985, + 0.8035, + 0.811, + 0.796, + 0.8155, + 0.805, + 0.796, + 0.7855, + 0.804, + 0.8, + 0.825, + 0.797, + 0.7985, + 0.8075, + 0.822, + 0.7985, + 0.787, + 0.8185, + 0.832, + 0.8345, + 0.811, + 0.8165, + 0.826, + 0.82, + 0.8375, + 0.8395, + 0.8275, + 0.823, + 0.8325, + 0.8375, + 0.821, + 0.833, + 0.8355, + 0.8435, + 0.8365, + 0.8435, + 0.845, + 0.8465, + 0.8445, + 0.8405, + 0.847, + 0.8445, + 0.846, + 0.848, + 0.85, + 0.847, + 0.8445, + 0.846, + 0.8495, + 0.848, + 0.848, + 0.85, + 0.8505, + 0.8515, + 0.8515 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.014162426814436913, + 0.0798005759716034, + 0.09311279654502869, + 0.10633827745914459 + ], + "perturbation_rho": [ + 0.041398823261260986, + 0.02247910387814045, + 0.1714327037334442, + 0.17666620016098022 + ], + "nudging": { + "0.001": [ + 0.00017435633344575763, + -0.0005363107775337994, + -0.00033184929634444416, + -0.000325117347529158 + ], + "0.003": [ + 0.000572163553442806, + -0.0016089004930108786, + -0.0009956255089491606, + -0.0009728462900966406 + ], + "0.01": [ + 0.002492401283234358, + -0.005343085154891014, + -0.0033098761923611164, + -0.003237517550587654 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.8165535574913025, + 0.763969938659668, + 0.456514367723465, + 0.4509699695587158, + 0.5203996650695801, + 0.5776345297813416, + 0.5986223049163818, + 0.6544226729393006, + 0.7238446506500245, + 0.7209402904510498, + 0.694066102218628, + 0.698754120349884, + 0.7061762592315673, + 0.7547999785423278, + 0.7718533777236939, + 0.7712728401184082, + 0.7895807289123535, + 0.772668758392334, + 0.7529318264007568, + 0.73342194814682, + 0.7342669651985169, + 0.7617962551116944, + 0.7271483485221862, + 0.7463216340065002, + 0.7824168462753296, + 0.7513881778717041, + 0.7485483713150024, + 0.8226748832702637, + 0.7728332638740539, + 0.7521475864410401, + 0.8052359797477722, + 0.7683963434219361, + 0.839831940460205, + 0.7288411888122559, + 0.7234952001571655, + 0.7603490391731262, + 0.7802042022705078, + 0.7887434216022492, + 0.7879969930648804, + 0.8280424799919128, + 0.8189708654403687, + 0.8561574056625366, + 0.8539019847869873, + 0.8538200400352478, + 0.8228381202697754, + 0.8735623681068421, + 0.8707358804702758, + 0.8457340757369995, + 0.857807723236084, + 0.8657875537872315, + 0.867585726261139, + 0.858120620059967, + 0.8555149084091187, + 0.8709949861526489, + 0.85430686378479, + 0.8638038631439209, + 0.8486660203933716, + 0.8263280488967896, + 0.8541519875526429, + 0.8399642889976502, + 0.8300949808120728, + 0.8287226734161377, + 0.8489915835380554, + 0.8436049571990967, + 0.8391613592147827, + 0.8280179216384888, + 0.828670958518982, + 0.8277772424697876, + 0.8266226589202881, + 0.8310329568862915, + 0.8256790163040161, + 0.8284158477783203, + 0.8229934953689575, + 0.8235222157478332, + 0.8218230583190917, + 0.8219074445724487, + 0.8209780731201172, + 0.8209145902633667, + 0.8202378884792327, + 0.819964693069458 + ], + "train_acc": [ + 0.35, + 0.7124, + 0.8289, + 0.8318, + 0.8146, + 0.7996, + 0.7877, + 0.7706, + 0.7516, + 0.7551, + 0.7457, + 0.7437, + 0.746, + 0.7313, + 0.7343, + 0.7337, + 0.7323, + 0.7287, + 0.7311, + 0.7381, + 0.7416, + 0.7315, + 0.7451, + 0.7449, + 0.7389, + 0.7512, + 0.7488, + 0.7377, + 0.7446, + 0.7504, + 0.7324, + 0.7408, + 0.7233, + 0.7466, + 0.746, + 0.7326, + 0.7295, + 0.726, + 0.7213, + 0.7144, + 0.7167, + 0.708, + 0.7134, + 0.7068, + 0.7173, + 0.7019, + 0.7061, + 0.7126, + 0.7135, + 0.704, + 0.7062, + 0.7064, + 0.7148, + 0.7132, + 0.7086, + 0.7095, + 0.712, + 0.7203, + 0.7144, + 0.7162, + 0.7194, + 0.7223, + 0.717, + 0.7173, + 0.7179, + 0.7248, + 0.723, + 0.7241, + 0.7231, + 0.7263, + 0.7268, + 0.7272, + 0.7299, + 0.7258, + 0.7277, + 0.7302, + 0.7301, + 0.7312, + 0.7319, + 0.7318 + ], + "test_acc": [ + 0.591, + 0.7695, + 0.8165, + 0.7925, + 0.784, + 0.7695, + 0.7725, + 0.7425, + 0.7335, + 0.7115, + 0.716, + 0.72, + 0.707, + 0.7115, + 0.695, + 0.7095, + 0.6895, + 0.68, + 0.711, + 0.7055, + 0.7155, + 0.711, + 0.697, + 0.69, + 0.7035, + 0.699, + 0.697, + 0.699, + 0.7065, + 0.6905, + 0.6875, + 0.698, + 0.6785, + 0.727, + 0.6635, + 0.684, + 0.6395, + 0.687, + 0.6475, + 0.66, + 0.625, + 0.6935, + 0.6905, + 0.695, + 0.664, + 0.6675, + 0.675, + 0.7065, + 0.6715, + 0.6965, + 0.7105, + 0.6765, + 0.6785, + 0.709, + 0.676, + 0.691, + 0.696, + 0.7165, + 0.684, + 0.6925, + 0.697, + 0.6985, + 0.6935, + 0.688, + 0.71, + 0.7075, + 0.708, + 0.713, + 0.7145, + 0.711, + 0.7095, + 0.711, + 0.705, + 0.7095, + 0.709, + 0.708, + 0.7075, + 0.707, + 0.7085, + 0.7085 + ], + "state_pred_error": [ + 0.7406987041473388, + 0.2411207477092743, + 0.16255244364738464, + 0.1493449520111084, + 0.14992456312179567, + 0.1555534377336502, + 0.16155459024906157, + 0.16035395340919495, + 0.15258878574371337, + 0.14208157248497008, + 0.12504443428516387, + 0.10508740864992142, + 0.08725720175504685, + 0.07344181394577026, + 0.06654016046524047, + 0.06139626076221466, + 0.0560697415292263, + 0.05169878583550453, + 0.0489024289727211, + 0.04750510221719742, + 0.04499284594655037, + 0.04229650926589966, + 0.03862137130498886, + 0.03419775420427323, + 0.030702023059129713, + 0.027638143730163576, + 0.02521895556151867, + 0.023234548729658126, + 0.02125667086541653, + 0.019339045375585555, + 0.017155453544855117, + 0.015024662992358207, + 0.013225329960882664, + 0.01183355233669281, + 0.010222357726842164, + 0.008752954179048538, + 0.007925371387600898, + 0.007087908421456813, + 0.0065649920910596845, + 0.005963414085656405, + 0.005528712090849876, + 0.005135756582021713, + 0.004901659817993641, + 0.004578842090815305, + 0.004355525939539075, + 0.004229336945712567, + 0.004050217913836241, + 0.003972229235991835, + 0.0038215931802988053, + 0.0038026397384703157, + 0.0036524082466959954, + 0.0036101686157286165, + 0.0035772004246711732, + 0.0035720416367053987, + 0.0035359943974763155, + 0.0035451125495135783, + 0.0035574036099016667, + 0.003586608001589775, + 0.0035653520226478575, + 0.003511827717348933, + 0.003500817520916462, + 0.0035023676201701164, + 0.003476817812025547, + 0.0034475730940699578, + 0.0036353183921426536, + 0.003350039096549153, + 0.0032939229547977447, + 0.003333185035735369, + 0.003172698828577995, + 0.003134825951978564, + 0.00305225969851017, + 0.003130577512830496, + 0.0029675849348306657, + 0.002851927667111158, + 0.002880720941722393, + 0.0027674298100173475, + 0.0026737776212394236, + 0.0025887268578633667, + 0.0025455289104953406, + 0.00247869050912559 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8312708735466003, + 0.37615716457366943, + 0.14436809718608856, + 0.15281778573989868 + ], + "perturbation_rho": [ + 0.7588610649108887, + 0.34236449003219604, + 0.14024245738983154, + 0.13689765334129333 + ], + "nudging": { + "0.001": [ + -0.02127787098288536, + -0.0016070354031398892, + -0.0004922817461192608, + -0.0005490813055075705 + ], + "0.003": [ + -0.06277377903461456, + -0.004812953062355518, + -0.0014764359220862389, + -0.0016460102051496506 + ], + "0.01": [ + -0.19714727997779846, + -0.01597677543759346, + -0.004914070479571819, + -0.005477628670632839 + ] + }, + "state_pred_error_per_layer": [ + 2233.37158203125, + 1546.82080078125, + 996.9107666015625, + 942.33251953125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2263490732192994, + 1.372786217880249, + 0.7703747777938843, + 0.5524767992019654, + 0.4545511021375656, + 0.39994027256965636, + 0.3738175000190735, + 0.38151370735168455, + 0.3779865933179855, + 0.3911576789855957, + 0.3810564842700958, + 0.40146919298171996, + 0.42358366951942444, + 0.4113857924461365, + 0.4117763772964477, + 0.4525391309261322, + 0.4548126799583435, + 0.45577107663154603, + 0.48783650531768796, + 0.5700982325077056, + 0.5109643290996552, + 0.5576292927265167, + 0.6397031135559083, + 0.8101890686035156, + 0.7712644341468811, + 0.7676936615467072, + 0.7088435866355896, + 0.785914805984497, + 0.8963895021915436, + 0.8323235744476318, + 0.9798989505767822, + 1.0398858805656432, + 1.0301771236419677, + 1.3176715976715088, + 1.2662531551361085, + 1.23117315826416, + 1.3725950134277343, + 1.2606015678405762, + 1.2498836280822754, + 1.1528087448120117, + 1.1365314014434815, + 1.085456252670288, + 1.1133746538162232, + 1.055409068107605, + 1.0885181948661804, + 1.06560675907135, + 1.06901422996521, + 1.0907034481048583, + 1.1203149961471557, + 1.0966930947303772, + 1.0746682907104492, + 1.1176004346847535, + 1.1059717803955078, + 1.1562017615318299, + 1.11426555519104, + 1.1417513759613036, + 1.1444835793495178, + 1.1437504034042358, + 1.118238719177246, + 1.140546536064148, + 1.1898473086357118, + 1.1313459493637086, + 1.1391136680603027, + 1.1409543603897094, + 1.1357797542572021, + 1.1393927207946777, + 1.1443831789016723, + 1.1221805687904358, + 1.1213734807968139, + 1.1244660341262818, + 1.123013041496277, + 1.1185321440696716, + 1.1202873462677, + 1.1144685082435608, + 1.1160181922912598, + 1.111833641242981, + 1.1105434167861938, + 1.1103411945343018, + 1.1097975526809691, + 1.109219861125946 + ], + "train_acc": [ + 0.1894, + 0.5237, + 0.7185, + 0.7925, + 0.8291, + 0.8455, + 0.8551, + 0.8513, + 0.857, + 0.8526, + 0.863, + 0.8587, + 0.8524, + 0.8549, + 0.8546, + 0.8499, + 0.8552, + 0.8539, + 0.8483, + 0.8349, + 0.843, + 0.832, + 0.8112, + 0.7818, + 0.7819, + 0.7829, + 0.7821, + 0.7697, + 0.7412, + 0.7477, + 0.7172, + 0.6987, + 0.6913, + 0.6398, + 0.6421, + 0.6419, + 0.6205, + 0.6293, + 0.626, + 0.629, + 0.6315, + 0.6442, + 0.637, + 0.6491, + 0.6356, + 0.6471, + 0.6461, + 0.6371, + 0.6321, + 0.6348, + 0.6389, + 0.6273, + 0.6282, + 0.6173, + 0.629, + 0.6242, + 0.6275, + 0.6208, + 0.6292, + 0.623, + 0.6118, + 0.6237, + 0.6201, + 0.6231, + 0.6227, + 0.6224, + 0.6191, + 0.6278, + 0.6266, + 0.6264, + 0.6257, + 0.6311, + 0.6259, + 0.6256, + 0.6278, + 0.6274, + 0.6264, + 0.6264, + 0.6292, + 0.6285 + ], + "test_acc": [ + 0.393, + 0.6405, + 0.739, + 0.789, + 0.7975, + 0.8, + 0.8065, + 0.8095, + 0.817, + 0.81, + 0.8, + 0.783, + 0.8035, + 0.8045, + 0.7975, + 0.793, + 0.809, + 0.8115, + 0.7955, + 0.775, + 0.745, + 0.7755, + 0.7355, + 0.7555, + 0.7295, + 0.751, + 0.6925, + 0.692, + 0.688, + 0.6855, + 0.645, + 0.65, + 0.607, + 0.6235, + 0.5915, + 0.5015, + 0.5855, + 0.61, + 0.5945, + 0.585, + 0.6215, + 0.608, + 0.6155, + 0.6135, + 0.568, + 0.627, + 0.5985, + 0.6045, + 0.6145, + 0.6265, + 0.5945, + 0.6045, + 0.5915, + 0.5945, + 0.602, + 0.609, + 0.6035, + 0.597, + 0.5985, + 0.5695, + 0.5985, + 0.6155, + 0.5825, + 0.609, + 0.6235, + 0.6, + 0.6115, + 0.6125, + 0.612, + 0.614, + 0.601, + 0.6125, + 0.6175, + 0.6085, + 0.616, + 0.615, + 0.614, + 0.6185, + 0.618, + 0.6185 + ], + "value_loss": [ + 3.004816132736206, + 0.8933181741714478, + 0.7472914004325867, + 0.6198880924224853, + 0.49928864874839785, + 0.4533773046016693, + 0.41804420566558836, + 0.45496133618354795, + 0.4769261270999908, + 0.5447554382324219, + 0.5463610198974609, + 0.6101527583122254, + 0.7323229121208191, + 0.654146611404419, + 0.6980391006469726, + 0.758187972164154, + 0.911613033914566, + 0.909905999135971, + 0.9661141172409058, + 1.3761654232025147, + 1.0848820183753967, + 1.2143970355033875, + 1.3779391033172608, + 2.1276612579345704, + 1.9363042541503905, + 1.8150593336105347, + 1.4350913431167602, + 1.5015435070037841, + 1.659292702293396, + 1.4041105354309082, + 1.84923672208786, + 1.7862740999221802, + 1.6408020364761353, + 2.2555280582427977, + 1.91716297416687, + 2.0696146953582764, + 2.0709165517807007, + 1.5185432472229003, + 1.4409057436943054, + 1.1394924449920654, + 1.0243006755828858, + 0.952573077583313, + 0.9513341785430908, + 0.7820314357757568, + 0.8732357313156128, + 0.8816683463096618, + 0.955579030418396, + 0.8554625137329102, + 0.8710546495437622, + 0.8312881650686264, + 0.7633189420700073, + 0.8019674183368682, + 0.7328131550788879, + 0.801051020526886, + 0.746859469127655, + 0.7501679012298584, + 0.8011223143577576, + 0.7507512192726136, + 0.6851235778808594, + 0.7360683244705201, + 0.8436295459747315, + 0.6853977672576904, + 0.7055689754962922, + 0.7252059488296508, + 0.6784087018966675, + 0.6884294319152832, + 0.6989397154808045, + 0.6959970206737518, + 0.6631160745620728, + 0.6498185919761658, + 0.6508113729476929, + 0.6804374390363693, + 0.6624282342433929, + 0.6588281253814697, + 0.6378821391105652, + 0.640788054561615, + 0.6657872777938842, + 0.6686323991775512, + 0.6098757619857789, + 0.64283842253685 + ], + "term_loss": [ + 1.7359011996269227, + 0.5260857672214508, + 0.5611789356231689, + 0.4691473718643189, + 0.35641581667661665, + 0.3125099868893623, + 0.28558482496738435, + 0.32663789620399475, + 0.3523272558569908, + 0.41566965317726134, + 0.4220249535560608, + 0.47944155356884005, + 0.5941028877735138, + 0.5197371693611145, + 0.5607707057952881, + 0.6142034781694412, + 0.7705422173976898, + 0.763801922082901, + 0.8096324970245361, + 1.2002689853668214, + 0.9151784264802932, + 1.0354011665344238, + 1.1660207389831543, + 1.8696075149536133, + 1.6795126104354858, + 1.5453345759391786, + 1.1913600902557373, + 1.2338994720458984, + 1.3612283717632294, + 1.109708225631714, + 1.4900855154037476, + 1.4270168464899062, + 1.2386046768188477, + 1.7514031993865966, + 1.4141266151428222, + 1.5366581008911133, + 1.5076081205368042, + 1.039527117919922, + 0.9725380240678787, + 0.7177947400093079, + 0.6169520056724548, + 0.5577969770908355, + 0.563669540643692, + 0.4297081172943115, + 0.5087772935390472, + 0.5115473824501038, + 0.5738656369566918, + 0.47277311363220215, + 0.4845442730903626, + 0.4545265218049288, + 0.4000856671333313, + 0.43755345803499224, + 0.3792450759291649, + 0.43464683275222776, + 0.39024128130078317, + 0.39411039242744444, + 0.43523220192193984, + 0.38444877996444704, + 0.3343185415267944, + 0.3722025054931641, + 0.4684031509578228, + 0.3343300027370453, + 0.3471951293349266, + 0.36705848178863526, + 0.3202661802768707, + 0.3312775411605835, + 0.3410617515563965, + 0.33340463732481, + 0.3072166344404221, + 0.29471828541755674, + 0.2949522229194641, + 0.31957108319103716, + 0.3035339130759239, + 0.2962215082168579, + 0.28110803384780886, + 0.28337024407982825, + 0.2973673318624496, + 0.2999136340618134, + 0.2588910343647003, + 0.27786159224510193 + ], + "bridge_loss": [ + 0.9794838696058141, + 0.11249453027248382, + 0.013401159876585007, + 0.007677992886304856, + 0.01801637165695429, + 0.02459342247545719, + 0.019867657536268235, + 0.010635345739126206, + 0.00908683493360877, + 0.009039432242512703, + 0.009218453142046928, + 0.010305291563272477, + 0.011811628636717796, + 0.01096362564265728, + 0.01361604914739728, + 0.012970232439041138, + 0.013068722119927406, + 0.018890924017131328, + 0.018672959452867507, + 0.023511534203588962, + 0.025741635078191757, + 0.024518935614824294, + 0.03324915931224823, + 0.04982591823339462, + 0.05101719571352005, + 0.06563201041221618, + 0.044432207286357876, + 0.05200507060289383, + 0.05663267287313938, + 0.06122437345683575, + 0.09713461356163025, + 0.08438427854776383, + 0.12429943964481353, + 0.17007733018398286, + 0.17665135183334352, + 0.21057933068275453, + 0.21602974219322205, + 0.14426904811859131, + 0.13473433861136436, + 0.10179099024534226, + 0.08914142102003098, + 0.08567614158391952, + 0.07007606126666069, + 0.047469612443447114, + 0.05075395459234715, + 0.06365043853521347, + 0.07418297004699707, + 0.06664204177856445, + 0.06561652043461799, + 0.06254049949645996, + 0.05376743358373642, + 0.04661431121826172, + 0.03791740040183067, + 0.04112119258642197, + 0.03973115736246109, + 0.034634311696887014, + 0.04343570882081985, + 0.0430182372033596, + 0.033620422554016115, + 0.040651659190654756, + 0.043216560313105584, + 0.031511343681812284, + 0.036411886563897135, + 0.03738419352769852, + 0.03682520034611225, + 0.034867337346076964, + 0.03554496579170227, + 0.043571460396051406, + 0.0371383314371109, + 0.035206140625476834, + 0.0369823433637619, + 0.04330120563060045, + 0.04176451569497585, + 0.04561741124391556, + 0.039754482871294024, + 0.04048171340227127, + 0.05201617316007614, + 0.05216843712329865, + 0.03526896152496338, + 0.049283357608318326 + ], + "tgrad_loss": [ + 0.2894310550689697, + 0.2547378748416901, + 0.17271129739284516, + 0.1430627270460129, + 0.1248564649105072, + 0.11627389514446258, + 0.11259172101020813, + 0.1176880983710289, + 0.11551203546524048, + 0.12004635149240493, + 0.11511761043071747, + 0.12040591526031494, + 0.1264083997964859, + 0.12344581875801086, + 0.12365235378742218, + 0.13101426265239716, + 0.1280020892560482, + 0.12721314759254457, + 0.13780866494178773, + 0.1523849036693573, + 0.14396195166707038, + 0.15447694187164307, + 0.17866920418739318, + 0.20822782695293426, + 0.20577443714141846, + 0.2040927549123764, + 0.19929904541969298, + 0.2156389590740204, + 0.24143166477680206, + 0.2331779284954071, + 0.26201657457351685, + 0.274872963142395, + 0.2778979238986969, + 0.334047527551651, + 0.32638501477241516, + 0.32237726650238036, + 0.34727867908477783, + 0.33474707689285277, + 0.33363337812423705, + 0.3199067116737366, + 0.3182072554111481, + 0.3090999599933624, + 0.31758857402801516, + 0.3048537001132965, + 0.31370448632240294, + 0.30647052822113036, + 0.3075304272651672, + 0.3160473554611206, + 0.3208938479423523, + 0.31422114033699033, + 0.30946583948135375, + 0.31779965109825137, + 0.3156506803035736, + 0.3252829941034317, + 0.3168870292663574, + 0.32142319972515104, + 0.32245441007614134, + 0.32328419771194455, + 0.3171846125602722, + 0.323214160490036, + 0.3320098324775696, + 0.3195564209461212, + 0.32196195921897885, + 0.32076327590942383, + 0.3213173161506653, + 0.32228455266952516, + 0.3223330054283142, + 0.31902092423439027, + 0.3187611020565033, + 0.3198941662788391, + 0.3188768042564392, + 0.31756515197753904, + 0.3171298073768616, + 0.3169892092704773, + 0.317019620513916, + 0.3169361008644104, + 0.3164037714958191, + 0.31655032963752744, + 0.3157157658576965, + 0.31569347660541536 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.048861026763916016, + 0.17950567603111267, + 0.17905107140541077, + 0.20378535985946655 + ], + "perturbation_rho": [ + 0.07314518839120865, + 0.3309200406074524, + 0.2789418697357178, + 0.3722173571586609 + ], + "nudging": { + "0.001": [ + -0.001814256189391017, + -0.0014669791562482715, + -0.001451535033993423, + -0.0015372845809906721 + ], + "0.003": [ + -0.005412348546087742, + -0.004398588091135025, + -0.004352094605565071, + -0.004607163369655609 + ], + "0.01": [ + -0.017692390829324722, + -0.014619983732700348, + -0.014469930902123451, + -0.015315238386392593 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L8_s123.json b/results/synth_ladder_v2_lo/synth_a0.25_L8_s123.json new file mode 100644 index 0000000..93d3f69 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L8_s123.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.1118465336799621, + 0.5127583791732788, + 0.4302346032857895, + 0.37507710180282594, + 0.37874902119636533, + 0.358110169172287, + 0.35485055913925173, + 0.33637689504623414, + 0.3376781231403351, + 0.3360303322792053, + 0.31282922410964964, + 0.3255835328102112, + 0.3264058362007141, + 0.2988388967514038, + 0.30576341066360474, + 0.24885234112739563, + 0.2645626920938492, + 0.23710116493701935, + 0.24498434176445008, + 0.25262943110466, + 0.2529470352172852, + 0.20808778538703918, + 0.2323320601463318, + 0.23393779978752136, + 0.21029739031791686, + 0.24577522869110108, + 0.22287568016052245, + 0.19683470277786255, + 0.1955713812351227, + 0.17762795400619508, + 0.1949590757369995, + 0.18015179319381713, + 0.1866455442428589, + 0.17878031969070435, + 0.19590353157520293, + 0.1689172378182411, + 0.15855673022270203, + 0.15442313380241393, + 0.16103034844398498, + 0.18334496784210205, + 0.16386926609277724, + 0.1371785285949707, + 0.16594724979400635, + 0.14151557245254517, + 0.14597930274009704, + 0.1496479096889496, + 0.13319487171173094, + 0.11989519445896149, + 0.12711271942853927, + 0.11571666107177735, + 0.11865356831550598, + 0.11254985160827637, + 0.11379962211847305, + 0.10502011337280273, + 0.10288234763145447, + 0.10125789151191711, + 0.10343788154125214, + 0.10045303144454956, + 0.09661244961619377, + 0.09317599536180496, + 0.09172046147584915, + 0.08994480850696564, + 0.08916794685721398, + 0.08730547853112221, + 0.08572156699895858, + 0.08500556135177613, + 0.08433900206089019, + 0.08323287000656128, + 0.0837702313899994, + 0.0822386646747589, + 0.08129152666330337, + 0.08034330849051476, + 0.0798836398601532, + 0.07978663072586059, + 0.07928232147693634, + 0.07865171662569045, + 0.07832024211883545, + 0.07813211903572083, + 0.07798754007816315, + 0.0779093979716301 + ], + "train_acc": [ + 0.6131, + 0.8006, + 0.8286, + 0.8535, + 0.85, + 0.8578, + 0.8604, + 0.8656, + 0.8674, + 0.8656, + 0.8772, + 0.8694, + 0.8738, + 0.8861, + 0.8785, + 0.9037, + 0.893, + 0.9038, + 0.9026, + 0.9001, + 0.9007, + 0.9186, + 0.9088, + 0.9052, + 0.9204, + 0.9002, + 0.9107, + 0.9242, + 0.9226, + 0.9326, + 0.922, + 0.9286, + 0.9288, + 0.9285, + 0.9246, + 0.934, + 0.9397, + 0.9436, + 0.939, + 0.9281, + 0.9353, + 0.9521, + 0.9383, + 0.9485, + 0.9444, + 0.9469, + 0.9521, + 0.9613, + 0.9543, + 0.96, + 0.9607, + 0.9629, + 0.9618, + 0.9687, + 0.9691, + 0.9694, + 0.9674, + 0.9696, + 0.9733, + 0.9745, + 0.9762, + 0.9756, + 0.9756, + 0.9781, + 0.979, + 0.9801, + 0.9806, + 0.9814, + 0.9808, + 0.9821, + 0.9825, + 0.9836, + 0.9836, + 0.9833, + 0.9839, + 0.9844, + 0.9849, + 0.9851, + 0.9853, + 0.9854 + ], + "test_acc": [ + 0.813, + 0.837, + 0.8425, + 0.8485, + 0.8455, + 0.8655, + 0.8635, + 0.8605, + 0.8615, + 0.865, + 0.867, + 0.856, + 0.874, + 0.8745, + 0.867, + 0.874, + 0.8805, + 0.8845, + 0.88, + 0.8655, + 0.8795, + 0.8875, + 0.8735, + 0.884, + 0.883, + 0.872, + 0.882, + 0.8835, + 0.889, + 0.8835, + 0.8805, + 0.8945, + 0.8845, + 0.879, + 0.8805, + 0.8875, + 0.8875, + 0.893, + 0.887, + 0.8885, + 0.888, + 0.888, + 0.888, + 0.89, + 0.8915, + 0.8925, + 0.8985, + 0.887, + 0.897, + 0.8925, + 0.892, + 0.897, + 0.891, + 0.8965, + 0.892, + 0.8875, + 0.8985, + 0.89, + 0.8895, + 0.893, + 0.8935, + 0.896, + 0.893, + 0.891, + 0.894, + 0.893, + 0.896, + 0.8975, + 0.8955, + 0.8945, + 0.896, + 0.8965, + 0.8955, + 0.894, + 0.893, + 0.895, + 0.895, + 0.8955, + 0.8955, + 0.896 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8995364308357239, + 0.8806806802749634, + 0.8653636574745178, + 0.852218508720398, + 0.8451849222183228, + 0.8416627645492554, + 0.8401176333427429, + 0.8391873240470886 + ], + "perturbation_rho": [ + 0.9999992251396179, + 0.9999973773956299, + 0.9999878406524658, + 0.9999729990959167, + 0.9999438524246216, + 0.9999128580093384, + 0.9999063611030579, + 0.9998599290847778 + ], + "nudging": { + "0.001": [ + -0.031149130314588547, + -0.015606172382831573, + -0.008217571303248405, + -0.0049289376474916935, + -0.0034725882578641176, + -0.0027561166789382696, + -0.002373086055740714, + -0.0021542953327298164 + ], + "0.003": [ + -0.08652011305093765, + -0.045093510299921036, + -0.02417786791920662, + -0.01461886614561081, + -0.010336171835660934, + -0.008218012750148773, + -0.00708259642124176, + -0.006432861555367708 + ], + "0.01": [ + -0.2192329615354538, + -0.13158643245697021, + -0.07524827122688293, + -0.04681030660867691, + -0.03351406753063202, + -0.026811176910996437, + -0.02318240888416767, + -0.02109483815729618 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.261511936378479, + 1.2388046113967897, + 0.7586671992301941, + 0.6045363289833069, + 0.5250408117294312, + 0.48988793330192565, + 0.5181452042102813, + 0.5053172904968262, + 0.5486225427627563, + 0.5680201857566833, + 0.5442982167243957, + 0.5434341896057129, + 0.5798220394134521, + 0.6215977661132812, + 0.6024371314048768, + 0.6234730455398559, + 0.7227652837753296, + 0.677713514328003, + 0.7502383768081665, + 0.6929981166839599, + 0.7150569809913635, + 0.7497701435089111, + 0.7523667077064514, + 0.6890098321437835, + 0.7717183069229125, + 0.8535002285003662, + 0.8195102759838104, + 0.7173164275169372, + 0.7014232642412186, + 0.715224802017212, + 0.8105577381134034, + 0.7098001989364624, + 0.708190748167038, + 0.6264257973670959, + 0.6868150623321533, + 0.8327555156707763, + 0.6983069515705108, + 0.5560035873413086, + 0.5894664196968079, + 0.6142511510848999, + 0.6013524094581604, + 0.6179712162017822, + 0.6110873061180114, + 0.631993100976944, + 0.5848042451381683, + 0.5451607653617859, + 0.5357456830024719, + 0.5887676968812943, + 0.4930126025676727, + 0.48339043197631837, + 0.5699405021667481, + 0.46138914337158204, + 0.5336585921287537, + 0.49541006507873536, + 0.48422760076522825, + 0.47822090463638306, + 0.43970393233299254, + 0.42637463035583495, + 0.4183799235343933, + 0.4340782505989075, + 0.41429271087646485, + 0.4338860253572464, + 0.4003063027858734, + 0.3960654589653015, + 0.3939968942642212, + 0.4079068598270416, + 0.38723310424238444, + 0.37670145826339724, + 0.3791983846902847, + 0.3762376324176788, + 0.37861898155212403, + 0.3750154300689697, + 0.3714167318344116, + 0.36765710716247557, + 0.3650678370475769, + 0.3651044800758362, + 0.3632787693023682, + 0.3633064881324768, + 0.3616319328308105, + 0.36102755069732667 + ], + "train_acc": [ + 0.1812, + 0.5543, + 0.7177, + 0.7696, + 0.8019, + 0.8181, + 0.8078, + 0.8178, + 0.8087, + 0.811, + 0.8164, + 0.8208, + 0.8133, + 0.8118, + 0.8191, + 0.8137, + 0.7918, + 0.8062, + 0.796, + 0.8068, + 0.808, + 0.8087, + 0.8089, + 0.8194, + 0.7966, + 0.7969, + 0.8, + 0.8094, + 0.8111, + 0.8104, + 0.7975, + 0.8106, + 0.8132, + 0.8255, + 0.8132, + 0.8011, + 0.8157, + 0.8347, + 0.8276, + 0.8217, + 0.8287, + 0.823, + 0.8201, + 0.8186, + 0.8244, + 0.8276, + 0.8337, + 0.8308, + 0.8433, + 0.8451, + 0.8317, + 0.8506, + 0.8363, + 0.8437, + 0.8446, + 0.8477, + 0.8536, + 0.8539, + 0.8546, + 0.8535, + 0.8587, + 0.8539, + 0.8631, + 0.8665, + 0.8647, + 0.8588, + 0.8681, + 0.8706, + 0.8658, + 0.8695, + 0.8679, + 0.8699, + 0.8709, + 0.8686, + 0.8715, + 0.8716, + 0.8723, + 0.8723, + 0.8727, + 0.8733 + ], + "test_acc": [ + 0.3855, + 0.659, + 0.7405, + 0.76, + 0.7855, + 0.7495, + 0.7865, + 0.7785, + 0.749, + 0.7695, + 0.799, + 0.774, + 0.773, + 0.77, + 0.738, + 0.753, + 0.759, + 0.774, + 0.7425, + 0.7075, + 0.7635, + 0.7665, + 0.7655, + 0.74, + 0.7105, + 0.7445, + 0.778, + 0.7455, + 0.7895, + 0.7475, + 0.7935, + 0.756, + 0.78, + 0.765, + 0.73, + 0.734, + 0.7685, + 0.8075, + 0.799, + 0.7535, + 0.797, + 0.754, + 0.759, + 0.7985, + 0.81, + 0.7925, + 0.772, + 0.7925, + 0.8055, + 0.7655, + 0.8105, + 0.7975, + 0.7865, + 0.795, + 0.8045, + 0.8255, + 0.824, + 0.808, + 0.8165, + 0.817, + 0.812, + 0.816, + 0.826, + 0.826, + 0.827, + 0.835, + 0.8315, + 0.8255, + 0.829, + 0.8355, + 0.827, + 0.8385, + 0.833, + 0.835, + 0.8305, + 0.8375, + 0.8345, + 0.835, + 0.8335, + 0.833 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.030230171978473663, + 0.1515132635831833, + 0.08784028142690659, + 0.07231537997722626, + 0.09554086625576019, + 0.09082843363285065, + 0.05412551760673523, + 0.0802278220653534 + ], + "perturbation_rho": [ + 0.04074572026729584, + 0.1662997603416443, + 0.08309999853372574, + 0.07389070093631744, + 0.14882703125476837, + 0.04519672691822052, + 0.0252661295235157, + 0.13430552184581757 + ], + "nudging": { + "0.001": [ + 0.0013187117874622345, + -0.00048215428250841796, + -0.0002008694427786395, + -0.00015290860028471798, + -0.0002134581736754626, + -0.00020460024825297296, + -0.00012665732356254011, + -0.00018164707580581307 + ], + "0.003": [ + 0.0040077767334878445, + -0.0014419222716242075, + -0.0006034976686351001, + -0.00045742784277535975, + -0.0006395922391675413, + -0.0006131009431555867, + -0.00037914267159067094, + -0.0005448061274364591 + ], + "0.01": [ + 0.013973418623209, + -0.0047885943204164505, + -0.0020089128520339727, + -0.0015227446565404534, + -0.002120924647897482, + -0.0020366935059428215, + -0.001262089004740119, + -0.0018124101916328073 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.6900189414978026, + 0.8411433074951172, + 0.7035821089744568, + 0.7662129473209381, + 0.9238048450469971, + 0.9465261736869812, + 0.9431295600891113, + 0.9430153847694397, + 0.8930066148757935, + 0.9253942659378052, + 0.9403049263000488, + 0.9278807380676269, + 0.8983365282058716, + 0.9111938871383667, + 0.9078270839691163, + 0.8715127088546752, + 0.8760508625030518, + 0.881078330039978, + 0.9000071779251099, + 0.8816269577026368, + 0.8535635885238647, + 0.8596017469406128, + 0.8243531321525573, + 0.7686523287773133, + 0.7980530646324158, + 0.8087049605369568, + 0.837258325958252, + 0.8231134150981904, + 0.7930005051612854, + 0.8175304112434387, + 0.8106185255527496, + 0.8360982533454895, + 0.8089555241584778, + 0.801400167274475, + 0.7769281364440918, + 0.7804566509246826, + 0.8003368796348572, + 0.7595265312194824, + 0.7870783394813538, + 0.7793847578048706, + 0.7527281112670898, + 0.7428017363548279, + 0.7277878652572631, + 0.7209976235866546, + 0.6881004619121551, + 0.6684544267654419, + 0.6671716670036316, + 0.6666352137565613, + 0.6382144281387329, + 0.6509482036590576, + 0.6767562778472901, + 0.654830322265625, + 0.6389662846565246, + 0.6350968457221985, + 0.6284485641479493, + 0.647821770477295, + 0.6315829051017762, + 0.6223490614891052, + 0.6269909280776977, + 0.6192478479385376, + 0.6175517374992371, + 0.6139361786365509, + 0.609162579536438, + 0.6077277057647705, + 0.6055359146118164, + 0.6021604907035828, + 0.5979869828224182, + 0.5947234419345856, + 0.5964722720146179, + 0.590346819114685, + 0.5898373236656189, + 0.5876562358856201, + 0.5882755388259888, + 0.5854528706550598, + 0.5841325942993164, + 0.5842094928741455, + 0.5827160774230957, + 0.5819865200996399, + 0.5816016881942749, + 0.5813780869483948 + ], + "train_acc": [ + 0.3832, + 0.6771, + 0.7406, + 0.7347, + 0.71, + 0.7016, + 0.686, + 0.678, + 0.6834, + 0.6698, + 0.6698, + 0.6718, + 0.6788, + 0.6772, + 0.6813, + 0.691, + 0.6899, + 0.695, + 0.6891, + 0.6964, + 0.707, + 0.7036, + 0.7172, + 0.7299, + 0.7151, + 0.7181, + 0.7095, + 0.7151, + 0.7253, + 0.7209, + 0.7192, + 0.7166, + 0.7258, + 0.725, + 0.7318, + 0.7339, + 0.7231, + 0.7392, + 0.7281, + 0.7321, + 0.7389, + 0.7402, + 0.7472, + 0.7497, + 0.7526, + 0.7587, + 0.7684, + 0.7649, + 0.7713, + 0.7675, + 0.7624, + 0.7696, + 0.7703, + 0.7689, + 0.7748, + 0.7647, + 0.7778, + 0.7745, + 0.7737, + 0.7737, + 0.7767, + 0.7766, + 0.777, + 0.7776, + 0.7778, + 0.7808, + 0.7852, + 0.7824, + 0.783, + 0.7826, + 0.7859, + 0.7833, + 0.7826, + 0.784, + 0.7842, + 0.7835, + 0.7839, + 0.7845, + 0.7851, + 0.7849 + ], + "test_acc": [ + 0.5965, + 0.721, + 0.702, + 0.7045, + 0.673, + 0.663, + 0.659, + 0.6615, + 0.6405, + 0.6295, + 0.6435, + 0.66, + 0.642, + 0.628, + 0.654, + 0.6645, + 0.66, + 0.673, + 0.6645, + 0.6425, + 0.667, + 0.6895, + 0.692, + 0.699, + 0.6915, + 0.655, + 0.6745, + 0.688, + 0.694, + 0.6655, + 0.6765, + 0.7015, + 0.7005, + 0.691, + 0.7035, + 0.7115, + 0.715, + 0.6985, + 0.698, + 0.7125, + 0.7095, + 0.728, + 0.7225, + 0.732, + 0.725, + 0.738, + 0.74, + 0.728, + 0.733, + 0.744, + 0.736, + 0.7385, + 0.7385, + 0.7355, + 0.7405, + 0.741, + 0.7445, + 0.744, + 0.7515, + 0.7385, + 0.755, + 0.754, + 0.752, + 0.7495, + 0.75, + 0.7515, + 0.7495, + 0.748, + 0.752, + 0.7535, + 0.7515, + 0.75, + 0.754, + 0.752, + 0.7535, + 0.751, + 0.752, + 0.7525, + 0.753, + 0.753 + ], + "state_pred_error": [ + 0.6595856385231018, + 0.18581391699314118, + 0.1389737048149109, + 0.15264776089191437, + 0.17834623737335206, + 0.19413653922080992, + 0.191989035487175, + 0.1882333307504654, + 0.17752823297977446, + 0.17005732750892638, + 0.15737969760894777, + 0.14760457775592803, + 0.13923091561794282, + 0.13096291363239287, + 0.11957425270080567, + 0.11095487377643586, + 0.10258402088880539, + 0.09473015838861465, + 0.08757123013734817, + 0.08079066828489304, + 0.07320248563289643, + 0.06493292402625084, + 0.06027614688873291, + 0.055440726804733276, + 0.05134773366451263, + 0.04849834374189377, + 0.04514253498911858, + 0.04645976569652557, + 0.04907238126993179, + 0.04952519537210465, + 0.04985421462655067, + 0.05048102289438248, + 0.04867895898222923, + 0.04612752487659454, + 0.04500051750540733, + 0.045100632554292676, + 0.046106376844644546, + 0.0457755237698555, + 0.04623996165394783, + 0.04506723956465721, + 0.043494783210754395, + 0.04170223961472511, + 0.03998277345299721, + 0.03828683572411537, + 0.03590715619921684, + 0.03458526620268822, + 0.03327381777763367, + 0.03220812490582466, + 0.03136191112399101, + 0.02989975645840168, + 0.02867936817407608, + 0.027766828721761703, + 0.02639162071943283, + 0.025170314267277717, + 0.02407517617344856, + 0.023122122532129287, + 0.022436111107468605, + 0.02156193360090256, + 0.021339575743675232, + 0.020296311607956887, + 0.019706446814537048, + 0.019259731712937354, + 0.018796706795692442, + 0.018336333370208742, + 0.01777996554672718, + 0.017483672569692136, + 0.017091735473275183, + 0.016544194155931474, + 0.016263828212022782, + 0.015896252320706843, + 0.015430272005498409, + 0.015053019705414773, + 0.014817306607961654, + 0.01454771189391613, + 0.01425941243469715, + 0.013928838320076466, + 0.013689049163460731, + 0.013394512391090393, + 0.013211432878673077, + 0.013250160820782184 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8559742569923401, + 0.48324936628341675, + 0.20313377678394318, + 0.15002062916755676, + 0.13207414746284485, + 0.11473802477121353, + 0.10703189671039581, + 0.10419630259275436 + ], + "perturbation_rho": [ + 0.712527871131897, + 0.4307812452316284, + 0.20181137323379517, + 0.13881561160087585, + 0.15075963735580444, + 0.09288278967142105, + 0.0890430212020874, + 0.0776105523109436 + ], + "nudging": { + "0.001": [ + -0.022853977978229523, + -0.0013667396269738674, + -0.0004074485623277724, + -0.00029726148932240903, + -0.0002571522491052747, + -0.00022330728825181723, + -0.00020516786025837064, + -0.0002069434995064512 + ], + "0.003": [ + -0.06612209230661392, + -0.004091121722012758, + -0.001220933860167861, + -0.0008915449725463986, + -0.0007706802571192384, + -0.0006697832723148167, + -0.0006152803543955088, + -0.0006209201528690755 + ], + "0.01": [ + -0.19413721561431885, + -0.013532894663512707, + -0.004060069564729929, + -0.0029658200219273567, + -0.00256463885307312, + -0.0022291922941803932, + -0.00204793200828135, + -0.002066785003989935 + ] + }, + "state_pred_error_per_layer": [ + 8381.830078125, + 6536.470703125, + 4195.43359375, + 3240.16162109375, + 3085.78857421875, + 3078.50390625, + 3156.81787109375, + 3267.9345703125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.2583779270172117, + 1.2328803764343261, + 0.7562720144271851, + 0.6132963244438171, + 0.5287181121349335, + 0.5030574288368225, + 0.48532198963165285, + 0.4846679763793945, + 0.5304994377136231, + 0.5362592101097107, + 0.583180138206482, + 0.6139261585235596, + 0.6087016160964965, + 0.5905431600570679, + 0.6277781929016113, + 0.6474135057091713, + 0.59157626247406, + 0.6946684947490692, + 0.8211458179473877, + 0.861908533668518, + 0.7924225975036621, + 0.7633697302818299, + 0.7515091026306152, + 0.720926753616333, + 0.7768987985610962, + 0.8449177289962768, + 0.9629317569732666, + 0.931460041809082, + 0.9021932872772217, + 0.9415567704200745, + 0.8805705249786377, + 0.7279726833343506, + 0.7522793537139892, + 0.8977339170455932, + 0.9053890051841735, + 1.0313119258880614, + 1.0500091316223144, + 1.081573693037033, + 1.0122951402664184, + 1.0065685977935792, + 0.9492526316642761, + 0.9367160196304322, + 1.049492422771454, + 0.979865022277832, + 0.9994352771759033, + 1.162679231929779, + 1.165749097442627, + 1.0634778610229492, + 1.14915854473114, + 1.1030800518035888, + 1.0413856769561767, + 1.0413285767555236, + 1.051336719417572, + 1.0110527751922607, + 1.0733316102981567, + 0.9999018778800964, + 0.9840315793991089, + 0.9711315458297729, + 0.9857265590667724, + 0.9506656970977784, + 0.9560299934387207, + 0.9371125869750977, + 0.9474420023918152, + 0.9461492855072021, + 0.9556923686981201, + 0.9554297721862793, + 0.9499578125, + 0.9548584213256835, + 0.9492132287979126, + 0.9530534173965454, + 0.9477035552978516, + 0.9484292861938477, + 0.9435903357505798, + 0.9424657020568847, + 0.9434539100646973, + 0.941624609375, + 0.9386807306289673, + 0.937810022354126, + 0.9365644121170044, + 0.936181538105011 + ], + "train_acc": [ + 0.1853, + 0.5561, + 0.7227, + 0.7667, + 0.8014, + 0.8089, + 0.816, + 0.8187, + 0.8118, + 0.8168, + 0.8048, + 0.812, + 0.8117, + 0.8194, + 0.8117, + 0.8144, + 0.8229, + 0.8042, + 0.7841, + 0.7748, + 0.7876, + 0.7866, + 0.797, + 0.8064, + 0.8003, + 0.795, + 0.7719, + 0.7755, + 0.7714, + 0.7484, + 0.7513, + 0.7644, + 0.7457, + 0.7144, + 0.7069, + 0.6809, + 0.6746, + 0.6693, + 0.674, + 0.6698, + 0.676, + 0.6723, + 0.6479, + 0.6576, + 0.6479, + 0.6187, + 0.6106, + 0.6341, + 0.6163, + 0.629, + 0.6411, + 0.6433, + 0.638, + 0.6516, + 0.6381, + 0.6526, + 0.6608, + 0.6575, + 0.6575, + 0.6638, + 0.6603, + 0.6717, + 0.6666, + 0.6704, + 0.6663, + 0.6646, + 0.6687, + 0.6665, + 0.6701, + 0.67, + 0.6699, + 0.6699, + 0.6689, + 0.6709, + 0.6748, + 0.67, + 0.6722, + 0.6723, + 0.6729, + 0.6723 + ], + "test_acc": [ + 0.3875, + 0.661, + 0.7345, + 0.771, + 0.7855, + 0.763, + 0.785, + 0.768, + 0.786, + 0.7535, + 0.748, + 0.75, + 0.7505, + 0.763, + 0.7635, + 0.784, + 0.7555, + 0.7285, + 0.7145, + 0.7325, + 0.769, + 0.7425, + 0.783, + 0.774, + 0.7725, + 0.7325, + 0.7345, + 0.7085, + 0.69, + 0.652, + 0.7025, + 0.7115, + 0.686, + 0.635, + 0.5775, + 0.619, + 0.607, + 0.6335, + 0.587, + 0.559, + 0.577, + 0.5445, + 0.6055, + 0.5975, + 0.5495, + 0.536, + 0.6035, + 0.578, + 0.5465, + 0.6125, + 0.632, + 0.6125, + 0.614, + 0.6215, + 0.644, + 0.646, + 0.654, + 0.6265, + 0.6415, + 0.646, + 0.651, + 0.656, + 0.655, + 0.66, + 0.656, + 0.655, + 0.6535, + 0.643, + 0.6525, + 0.65, + 0.657, + 0.6535, + 0.6525, + 0.653, + 0.652, + 0.65, + 0.651, + 0.651, + 0.651, + 0.651 + ], + "value_loss": [ + 3.048217420578003, + 1.0343286740779876, + 0.9000125793457031, + 0.8277910697937012, + 0.7453249110221862, + 0.7300011464118957, + 0.7402240177154541, + 0.7579312013626098, + 0.9181204793930053, + 0.975448628616333, + 1.1214078811645507, + 1.2724024196147918, + 1.3290605850219726, + 1.259645761871338, + 1.3672408729553223, + 1.5799061000347137, + 1.3602543179512023, + 1.712525807094574, + 2.2426450706481935, + 2.359542562866211, + 2.1532579238891603, + 1.9830763484954834, + 1.982039828968048, + 1.8818614783287049, + 2.2171711694717406, + 2.3556669063568116, + 3.0178351165771486, + 3.1578522092819212, + 2.68718074798584, + 2.373463029575348, + 1.8590419352769851, + 1.2517694076538086, + 1.02772789478302, + 1.2108542333602905, + 1.0830044956207276, + 2.0529207768440245, + 1.2919132787704468, + 1.2424284775733947, + 1.0443824444293976, + 1.1778054037094117, + 0.9631912262439728, + 0.8378017754554749, + 1.0295626225471497, + 0.7373762512207032, + 0.7012673536300659, + 0.98064923620224, + 0.862914551448822, + 0.7986299896240234, + 0.8213993213653564, + 0.7129971002578736, + 0.754508529138565, + 0.6246828708648682, + 0.7121831396102906, + 0.5870893394470215, + 0.6755351794242859, + 0.5818774876117706, + 0.5521341813087464, + 0.5238836415290833, + 0.5890642763614654, + 0.5481948862075806, + 0.5332052557468414, + 0.4778835234642029, + 0.49222251901626585, + 0.5597867136955261, + 0.4953978775501251, + 0.5712323989391327, + 0.49952770709991456, + 0.5085798627853394, + 0.45753829402923585, + 0.48174678115844727, + 0.4655922472000122, + 0.4551719659328461, + 0.4378785256385803, + 0.43562724137306214, + 0.4843036180496216, + 0.42520372521877287, + 0.4271356852054596, + 0.4239115475654602, + 0.41854572505950927, + 0.41045001599788666 + ], + "term_loss": [ + 1.7620765068054198, + 0.7570293057441712, + 0.7365578352928162, + 0.6820572528839112, + 0.607182498049736, + 0.5735599759578704, + 0.5921525184631348, + 0.6111434427261353, + 0.7693612571716308, + 0.8335376226425171, + 0.9712094970703125, + 1.1207456881999969, + 1.1779227069854736, + 1.1121969150543214, + 1.209087449645996, + 1.4206154627799987, + 1.2058612494468688, + 1.5412679631948472, + 2.0407606628417967, + 2.108829928779602, + 1.9323839492797852, + 1.738079938840866, + 1.738319782948494, + 1.668429842185974, + 1.9542716176986694, + 2.082409756851196, + 2.71076455078125, + 2.7950469175338744, + 2.3576751346588134, + 2.0379406468629835, + 1.5563349723756312, + 0.987390661239624, + 0.7408796440124512, + 0.8990295526981353, + 0.7904975162506104, + 1.5982429100751876, + 0.9677811861038208, + 0.9073515085697174, + 0.6968293826818466, + 0.8219095712423324, + 0.6385633600115777, + 0.5180883571147918, + 0.6821171250283719, + 0.42861852970123293, + 0.4132593111038208, + 0.6532857032775878, + 0.56343485455513, + 0.5125517870903015, + 0.5286973226547241, + 0.4325035630941391, + 0.4782088125705719, + 0.35716295001506804, + 0.43347521109580994, + 0.32357389335632325, + 0.3969691284179688, + 0.32031551563739774, + 0.29744037152528763, + 0.26996316730976105, + 0.3282479860842228, + 0.2972265742301941, + 0.2775776801109314, + 0.2335032631635666, + 0.24737662796378135, + 0.30518129110336306, + 0.24973544117212296, + 0.31368190834522247, + 0.24900891828536986, + 0.2601964050769806, + 0.21727401604652405, + 0.23666752195358276, + 0.2217332841873169, + 0.2150446552991867, + 0.19714454250335695, + 0.1972746223449707, + 0.23860706584453584, + 0.1892410013794899, + 0.18599554433822632, + 0.18529752838611602, + 0.17899176458120347, + 0.17502211028933526 + ], + "bridge_loss": [ + 0.9885711992692668, + 0.06202600108981132, + 0.005225318079441786, + 0.00572426804304123, + 0.011327691495418549, + 0.033182587127387524, + 0.028435595631599427, + 0.02591904165148735, + 0.019612548558413982, + 0.014960378871113062, + 0.01257537133693695, + 0.015017039102315903, + 0.014422192126512528, + 0.016067288851737978, + 0.019453916008770465, + 0.02241444058343768, + 0.024118383884429932, + 0.025934281665086746, + 0.03934095601439476, + 0.08211781105995178, + 0.06123144483566284, + 0.08744931157231331, + 0.09062072249054909, + 0.06713926913738251, + 0.10762440345287323, + 0.11356958830356598, + 0.12857519801855088, + 0.18905064516067505, + 0.1532894235134125, + 0.15086396114826203, + 0.12008241270184516, + 0.09492742450237274, + 0.10648579494953156, + 0.10877807049751281, + 0.09025130966901779, + 0.22308929166793823, + 0.09408268320858479, + 0.09969470508098602, + 0.11703467042446136, + 0.12739645974636077, + 0.10452780928909779, + 0.10022395522594452, + 0.10734874422848224, + 0.08138678241968154, + 0.05771932463645935, + 0.0699296027958393, + 0.04624857715070248, + 0.048479430437088016, + 0.04053354227542877, + 0.032970554107427594, + 0.0381986954331398, + 0.027493790555000307, + 0.03619121195077896, + 0.029564367485046386, + 0.033955201983451845, + 0.03008670448064804, + 0.02573939528465271, + 0.025961067897081375, + 0.031735689258575436, + 0.0286233449280262, + 0.030725829449296, + 0.023821466904878616, + 0.022386557137966157, + 0.03191109481453896, + 0.022437436121702195, + 0.03390852664113045, + 0.028159854693710806, + 0.024796000277996062, + 0.018291607961058616, + 0.022655895307660105, + 0.021983556759357453, + 0.01841803635209799, + 0.019089927835389972, + 0.017243927240371704, + 0.025458976861834525, + 0.015187921732664108, + 0.020197597947716712, + 0.018675634610652924, + 0.019476617947220803, + 0.01536440534889698 + ], + "tgrad_loss": [ + 0.2975697236061096, + 0.2152733613014221, + 0.15822943115234375, + 0.14000954415798186, + 0.12681471655368806, + 0.12325858645439149, + 0.11963590017557144, + 0.1208687183380127, + 0.12914666900634766, + 0.12695061504840852, + 0.13762302379608155, + 0.13663968855142594, + 0.13671568200588227, + 0.13138156263828277, + 0.13869950284957885, + 0.1368761875152588, + 0.13027468709945678, + 0.14532355861663818, + 0.16254346389770508, + 0.168594819521904, + 0.15964251264333726, + 0.1575471007347107, + 0.1530993018746376, + 0.14629238090515137, + 0.1552751208782196, + 0.15968756294250488, + 0.17849535081386567, + 0.17375466558933259, + 0.17621618556976318, + 0.1846583988547325, + 0.18262455696463584, + 0.16945131740570069, + 0.18036246223449706, + 0.2030466163635254, + 0.20225566873550416, + 0.23158856897354127, + 0.23004940370321275, + 0.23538226161003112, + 0.2305183897972107, + 0.22849935948848724, + 0.22010006467103957, + 0.21948946959972382, + 0.2400967527270317, + 0.22737093563079833, + 0.23028871989250183, + 0.25743392400741577, + 0.2532311152935028, + 0.2375987785100937, + 0.25216845297813417, + 0.2475229881286621, + 0.23810101900100708, + 0.2400261275291443, + 0.24251671900749205, + 0.23395108041763304, + 0.24461085169315339, + 0.231475268471241, + 0.22895441274642944, + 0.2279594036579132, + 0.22908060483932496, + 0.22234496841430665, + 0.22490174407958985, + 0.22055879101753234, + 0.22245933241844176, + 0.22269432792663574, + 0.22322500309944152, + 0.2236419643878937, + 0.22235892748832703, + 0.22358745093345642, + 0.22197266473770141, + 0.22242336502075194, + 0.2218754021167755, + 0.22170927753448486, + 0.2216440571308136, + 0.22110869097709657, + 0.22023757584095002, + 0.22077479939460753, + 0.22094254281520845, + 0.21993838548660277, + 0.22007734408378601, + 0.2200635038137436 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.021486874669790268, + 0.13597777485847473, + 0.14020901918411255, + 0.16125136613845825, + 0.15609152615070343, + 0.1541982889175415, + 0.14447104930877686, + 0.13689197599887848 + ], + "perturbation_rho": [ + 0.021052071824669838, + 0.17873916029930115, + 0.25896143913269043, + 0.18253415822982788, + 0.20761561393737793, + 0.24419330060482025, + 0.21560567617416382, + 0.25087088346481323 + ], + "nudging": { + "0.001": [ + -0.000705907354131341, + -0.0009686042903922498, + -0.0009376371745020151, + -0.0010404230561107397, + -0.0010180952958762646, + -0.0010082813678309321, + -0.0009501518215984106, + -0.0009206526447087526 + ], + "0.003": [ + -0.0020928888116031885, + -0.0029041701927781105, + -0.0028102626092731953, + -0.003118767635896802, + -0.0030542444437742233, + -0.0030217969324439764, + -0.0028490517288446426, + -0.002759187947958708 + ], + "0.01": [ + -0.006693178787827492, + -0.009655885398387909, + -0.009345939382910728, + -0.010369300842285156, + -0.010154420509934425, + -0.010046296752989292, + -0.009472687728703022, + -0.009175874292850494 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L8_s42.json b/results/synth_ladder_v2_lo/synth_a0.25_L8_s42.json new file mode 100644 index 0000000..2731940 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L8_s42.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.116349330329895, + 0.5001499853610992, + 0.4335407821655273, + 0.4641809904575348, + 0.3640550988435745, + 0.3363292731285095, + 0.3244595282793045, + 0.2982915968179703, + 0.3134564006567001, + 0.30007186489105225, + 0.33086415586471557, + 0.3240265121459961, + 0.36804967494010926, + 0.30622104313373566, + 0.25573331198692323, + 0.26320519745349885, + 0.23574686307907106, + 0.2268525185585022, + 0.25257685260772705, + 0.25333278408050536, + 0.2360077142715454, + 0.23784599598646164, + 0.20709436918497084, + 0.20264402964115144, + 0.21906372356414794, + 0.2614547765254974, + 0.22743566370010376, + 0.22848101971149445, + 0.1859010817527771, + 0.18899251914024354, + 0.22130306813716888, + 0.1667450134754181, + 0.16755338363051414, + 0.1541363487958908, + 0.15326010875701904, + 0.17208767664432525, + 0.1566053614139557, + 0.17658618724346162, + 0.1616819619178772, + 0.16018370108604432, + 0.14088194823265077, + 0.13619720645546912, + 0.12748197174072265, + 0.12225827918052673, + 0.1305396099090576, + 0.15742934291362762, + 0.14194510142803193, + 0.13810368086099625, + 0.12012554352283478, + 0.11385036809444428, + 0.11541433204263449, + 0.10669543639421462, + 0.10731406065821647, + 0.10112672692537308, + 0.1006077661037445, + 0.09703596627712249, + 0.09588335396051406, + 0.09268207312822342, + 0.0937716266810894, + 0.09152986379861831, + 0.08915678606033325, + 0.08682773663103581, + 0.08579734473228455, + 0.0858896899998188, + 0.08425427243709564, + 0.08361117107868195, + 0.08322364587783813, + 0.08275889765024186, + 0.08162834317684174, + 0.08004808874726295, + 0.07940338475704194, + 0.07868385118246078, + 0.07802366590499878, + 0.07752591272592545, + 0.07690682909488677, + 0.07651568021774292, + 0.07623157832026482, + 0.07601269240379334, + 0.07586622917354106, + 0.0757821985900402 + ], + "train_acc": [ + 0.6054, + 0.8027, + 0.8306, + 0.8201, + 0.8517, + 0.8683, + 0.8696, + 0.881, + 0.875, + 0.8779, + 0.8683, + 0.871, + 0.8573, + 0.8771, + 0.8985, + 0.8935, + 0.9042, + 0.9103, + 0.8979, + 0.9, + 0.9047, + 0.9033, + 0.9171, + 0.9238, + 0.9113, + 0.897, + 0.9096, + 0.9096, + 0.9279, + 0.9264, + 0.9117, + 0.9373, + 0.9373, + 0.9408, + 0.9433, + 0.9327, + 0.9416, + 0.9311, + 0.9376, + 0.9375, + 0.9495, + 0.9511, + 0.956, + 0.9589, + 0.9532, + 0.9397, + 0.949, + 0.9498, + 0.958, + 0.9622, + 0.9605, + 0.9676, + 0.9652, + 0.9691, + 0.9715, + 0.9704, + 0.9708, + 0.974, + 0.9738, + 0.974, + 0.9767, + 0.9763, + 0.9787, + 0.9772, + 0.9797, + 0.9786, + 0.9792, + 0.9805, + 0.9804, + 0.9813, + 0.9818, + 0.9825, + 0.9824, + 0.9826, + 0.9831, + 0.9836, + 0.9839, + 0.9843, + 0.9843, + 0.9842 + ], + "test_acc": [ + 0.788, + 0.818, + 0.841, + 0.842, + 0.844, + 0.852, + 0.8525, + 0.8535, + 0.8575, + 0.8625, + 0.854, + 0.856, + 0.851, + 0.855, + 0.859, + 0.871, + 0.881, + 0.876, + 0.8665, + 0.872, + 0.874, + 0.8695, + 0.881, + 0.8735, + 0.883, + 0.8735, + 0.867, + 0.868, + 0.891, + 0.8875, + 0.885, + 0.888, + 0.882, + 0.884, + 0.883, + 0.8795, + 0.8815, + 0.875, + 0.88, + 0.888, + 0.883, + 0.8945, + 0.891, + 0.889, + 0.886, + 0.8885, + 0.8845, + 0.8935, + 0.8925, + 0.89, + 0.8945, + 0.8985, + 0.893, + 0.894, + 0.8935, + 0.894, + 0.895, + 0.893, + 0.8945, + 0.8935, + 0.8935, + 0.8945, + 0.8955, + 0.8935, + 0.896, + 0.8965, + 0.893, + 0.8955, + 0.895, + 0.896, + 0.896, + 0.8975, + 0.897, + 0.8965, + 0.8965, + 0.8965, + 0.896, + 0.8955, + 0.896, + 0.8955 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8706932663917542, + 0.8596300482749939, + 0.8512309789657593, + 0.842391848564148, + 0.8334972858428955, + 0.8275372385978699, + 0.823634147644043, + 0.8208400011062622 + ], + "perturbation_rho": [ + 0.9999992847442627, + 0.9999973773956299, + 0.9999889731407166, + 0.9999737739562988, + 0.999952495098114, + 0.9999229311943054, + 0.9998778104782104, + 0.999873161315918 + ], + "nudging": { + "0.001": [ + -0.029443971812725067, + -0.014739202335476875, + -0.007785398978739977, + -0.004687825217843056, + -0.0033056228421628475, + -0.0026248465292155743, + -0.002249690005555749, + -0.002028122777119279 + ], + "0.003": [ + -0.08119087666273117, + -0.042475294321775436, + -0.02287878468632698, + -0.01389251183718443, + -0.009832184761762619, + -0.007821150124073029, + -0.006710004061460495, + -0.006052234675735235 + ], + "0.01": [ + -0.19971789419651031, + -0.12236367166042328, + -0.07083894312381744, + -0.044348303228616714, + -0.031799670308828354, + -0.02545534446835518, + -0.02191336825489998, + -0.01980404555797577 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.158529169845581, + 1.1195615213394166, + 0.7019768083572387, + 0.576601616859436, + 0.48889441759586333, + 0.4595581695556641, + 0.4664854043006897, + 0.4645276006698608, + 0.45998520455360414, + 0.4998584642410278, + 0.5707068769454956, + 0.5089836866378784, + 0.5772042598724365, + 0.5534915947437287, + 0.5303711235046387, + 0.5757707620620728, + 0.6748943659067154, + 0.5596435680389404, + 0.6271520325660705, + 0.6300130233287812, + 0.6096898103713989, + 0.7022480690956115, + 0.6562287082672119, + 0.7743891611099243, + 0.7019639057159424, + 0.620424409866333, + 0.8657609689712524, + 0.7578481485366821, + 0.8160745024681091, + 0.6845855102539062, + 0.6900003092288971, + 0.665535974407196, + 0.6412346285820008, + 0.5900779844999313, + 0.6110470198631287, + 0.6740109759330749, + 0.6783077709197998, + 0.8065583997726441, + 0.659480087852478, + 0.7328077519893647, + 0.6365110095555894, + 0.6187682289004326, + 0.6504915294289589, + 0.6426675319671631, + 0.6510136894226074, + 0.8234208068847656, + 0.6913283330917358, + 0.6763395458221435, + 0.7061776033401489, + 0.6717531005859375, + 0.6595124167919159, + 0.5512650019645691, + 0.6176838112831116, + 0.5410110770225525, + 0.6010903105020523, + 0.5379902812957764, + 0.5911779655456543, + 0.5408210384368897, + 0.5452302074432374, + 0.5244070569515228, + 0.5323069170594216, + 0.49816671800613405, + 0.508677875328064, + 0.5112697532653808, + 0.5021153599619865, + 0.4942335971832275, + 0.4886833331346512, + 0.48544664058685305, + 0.4812666481971741, + 0.4887116108417511, + 0.48429084918498994, + 0.47187945799827574, + 0.4692245128631592, + 0.46987841338217257, + 0.46758185052871704, + 0.46333528537750246, + 0.46536093158721925, + 0.459875780916214, + 0.4589812075734139, + 0.45842880477905273 + ], + "train_acc": [ + 0.2182, + 0.5995, + 0.7379, + 0.7849, + 0.8137, + 0.8271, + 0.8255, + 0.8312, + 0.8318, + 0.8272, + 0.8161, + 0.8323, + 0.8202, + 0.8275, + 0.8376, + 0.8296, + 0.8188, + 0.8345, + 0.828, + 0.8311, + 0.8286, + 0.8247, + 0.8295, + 0.815, + 0.8308, + 0.8442, + 0.8192, + 0.8286, + 0.8238, + 0.839, + 0.841, + 0.8458, + 0.8487, + 0.852, + 0.8528, + 0.8425, + 0.8458, + 0.832, + 0.848, + 0.8397, + 0.8528, + 0.858, + 0.849, + 0.8507, + 0.8473, + 0.8334, + 0.8433, + 0.8458, + 0.844, + 0.8479, + 0.8504, + 0.8696, + 0.8594, + 0.8689, + 0.8593, + 0.8676, + 0.8612, + 0.8671, + 0.8651, + 0.8661, + 0.8716, + 0.8748, + 0.8722, + 0.8746, + 0.8744, + 0.8769, + 0.8784, + 0.8791, + 0.8772, + 0.8791, + 0.8758, + 0.8803, + 0.8799, + 0.8789, + 0.8822, + 0.8816, + 0.8809, + 0.8835, + 0.8837, + 0.8838 + ], + "test_acc": [ + 0.4375, + 0.665, + 0.7315, + 0.7485, + 0.7955, + 0.7885, + 0.8, + 0.781, + 0.762, + 0.765, + 0.7855, + 0.7455, + 0.7895, + 0.7565, + 0.7715, + 0.746, + 0.786, + 0.781, + 0.7805, + 0.7935, + 0.7455, + 0.789, + 0.737, + 0.7525, + 0.7965, + 0.7215, + 0.7535, + 0.745, + 0.77, + 0.778, + 0.7865, + 0.8105, + 0.8125, + 0.7975, + 0.783, + 0.794, + 0.7765, + 0.8035, + 0.7535, + 0.7855, + 0.789, + 0.805, + 0.7975, + 0.76, + 0.7905, + 0.801, + 0.7875, + 0.816, + 0.767, + 0.791, + 0.8255, + 0.8295, + 0.817, + 0.8145, + 0.8215, + 0.7915, + 0.8105, + 0.817, + 0.8105, + 0.8175, + 0.827, + 0.822, + 0.826, + 0.8245, + 0.8345, + 0.82, + 0.826, + 0.831, + 0.8335, + 0.8285, + 0.832, + 0.829, + 0.83, + 0.8345, + 0.834, + 0.83, + 0.832, + 0.8335, + 0.8345, + 0.835 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.029614916071295738, + 0.08655504137277603, + 0.09347832202911377, + 0.10665939003229141, + 0.10298001766204834, + 0.055703092366456985, + 0.06406168639659882, + 0.054178133606910706 + ], + "perturbation_rho": [ + -0.10576558113098145, + 0.13653026521205902, + 0.13744692504405975, + 0.169493168592453, + 0.1142939031124115, + 0.09325758367776871, + 0.1042378693819046, + -0.00961439497768879 + ], + "nudging": { + "0.001": [ + 0.0020253753755241632, + -0.0006042197346687317, + -0.0003090167883783579, + -0.0003282201651018113, + -0.00030271150171756744, + -0.00016797086573205888, + -0.00020572963694576174, + -0.00016064735245890915 + ], + "0.003": [ + 0.006166902836412191, + -0.0018144691130146384, + -0.0009272561292164028, + -0.000988352345302701, + -0.0009091334650292993, + -0.0005062551936134696, + -0.0006199252675287426, + -0.0004811809048987925 + ], + "0.01": [ + 0.021624702960252762, + -0.006033358629792929, + -0.003085250034928322, + -0.0032903538085520267, + -0.0030274176970124245, + -0.0016871094703674316, + -0.0020643905736505985, + -0.0016031904378905892 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.7370107837677002, + 0.9566345932006836, + 0.7672526609420777, + 0.7551599216461181, + 0.8040943652153015, + 0.8967263271331787, + 0.8947166172027587, + 0.8826603755950928, + 0.9048395864486695, + 0.9103054508209228, + 0.910915373802185, + 0.9105680400848388, + 0.900138374710083, + 0.9003334159851074, + 0.881323463344574, + 0.8399732953071595, + 0.9072862690925598, + 0.8586404010772705, + 0.8466693807601928, + 0.8386851059913635, + 0.8304012378692627, + 0.8648545293807983, + 0.8444964403152466, + 0.787469714641571, + 0.7859655241012573, + 0.8520208901405334, + 0.7876779465675354, + 0.8035705984115601, + 0.7937297729492188, + 0.778717615699768, + 0.7854765256881714, + 0.8042930118560792, + 0.8156058423042297, + 0.7773512923240662, + 0.7559653558731079, + 0.7482747771739959, + 0.7103004894256592, + 0.7591038406848908, + 0.714097739982605, + 0.6922465740203857, + 0.7237790791511536, + 0.71418566198349, + 0.6863883009910583, + 0.6632298639297486, + 0.6979568075180054, + 0.6680784313201904, + 0.6481147897720337, + 0.6357518527030945, + 0.6247223592758179, + 0.6085101871490478, + 0.6133926107406616, + 0.595257430768013, + 0.5753008867263794, + 0.5893147421836853, + 0.5835431252121925, + 0.5568724251270294, + 0.5747560076713562, + 0.5652507972955704, + 0.5538186378479004, + 0.5708896952629089, + 0.5540621002197266, + 0.5491908939361573, + 0.5537193531036377, + 0.5458368228912354, + 0.541802837228775, + 0.5337149509429931, + 0.5353304562568665, + 0.5362093331336976, + 0.5316291991233826, + 0.5267005807876587, + 0.5275578862190247, + 0.5257468720436096, + 0.5230328259944915, + 0.5213959711074829, + 0.5200412568092346, + 0.519229730796814, + 0.5183546719074249, + 0.5177948822975159, + 0.5174177736282348, + 0.517131188583374 + ], + "train_acc": [ + 0.3748, + 0.6465, + 0.712, + 0.7328, + 0.72, + 0.7024, + 0.6979, + 0.6921, + 0.6745, + 0.6807, + 0.6741, + 0.6724, + 0.6781, + 0.6804, + 0.6904, + 0.7012, + 0.6822, + 0.6918, + 0.7011, + 0.7023, + 0.7113, + 0.7001, + 0.7091, + 0.7241, + 0.723, + 0.7167, + 0.7272, + 0.725, + 0.7256, + 0.7303, + 0.726, + 0.7246, + 0.7283, + 0.7379, + 0.7418, + 0.7456, + 0.7525, + 0.7416, + 0.7574, + 0.7607, + 0.7538, + 0.7559, + 0.7642, + 0.7692, + 0.7596, + 0.7661, + 0.7748, + 0.7776, + 0.7821, + 0.7886, + 0.7851, + 0.7912, + 0.7948, + 0.7926, + 0.7926, + 0.8047, + 0.7996, + 0.8021, + 0.8045, + 0.7943, + 0.8037, + 0.8038, + 0.8055, + 0.804, + 0.8064, + 0.8115, + 0.8093, + 0.8102, + 0.8084, + 0.8096, + 0.8122, + 0.8132, + 0.8131, + 0.8128, + 0.8133, + 0.814, + 0.8132, + 0.814, + 0.8158, + 0.8162 + ], + "test_acc": [ + 0.5495, + 0.6655, + 0.695, + 0.6805, + 0.67, + 0.676, + 0.6615, + 0.65, + 0.647, + 0.659, + 0.637, + 0.66, + 0.6585, + 0.67, + 0.6675, + 0.6235, + 0.684, + 0.6465, + 0.659, + 0.6625, + 0.667, + 0.664, + 0.681, + 0.677, + 0.6545, + 0.699, + 0.69, + 0.6775, + 0.7025, + 0.691, + 0.7025, + 0.691, + 0.7025, + 0.7185, + 0.7225, + 0.738, + 0.703, + 0.7235, + 0.7225, + 0.7185, + 0.7135, + 0.7275, + 0.7405, + 0.731, + 0.73, + 0.7375, + 0.7465, + 0.7255, + 0.7515, + 0.754, + 0.762, + 0.757, + 0.756, + 0.7445, + 0.7625, + 0.7615, + 0.772, + 0.767, + 0.76, + 0.7595, + 0.7635, + 0.768, + 0.7575, + 0.7735, + 0.769, + 0.7615, + 0.7675, + 0.7695, + 0.7645, + 0.768, + 0.7715, + 0.771, + 0.772, + 0.774, + 0.7685, + 0.768, + 0.7695, + 0.769, + 0.77, + 0.7705 + ], + "state_pred_error": [ + 0.6510248342990875, + 0.19123697934150696, + 0.15689989979267122, + 0.1638691138982773, + 0.18542276043891906, + 0.19759975728988646, + 0.19750141835212706, + 0.1924255329608917, + 0.18604150733947755, + 0.17945555620193482, + 0.16643357362747194, + 0.1515563004732132, + 0.13873218288421632, + 0.12696559550762176, + 0.11629828469753266, + 0.10857762076854706, + 0.10475670492649078, + 0.10159241337776184, + 0.09809481703042984, + 0.09148724089860916, + 0.08206979176998139, + 0.07435691350698471, + 0.06972167286872864, + 0.06627885436415672, + 0.06546131973266602, + 0.06723697187900543, + 0.06813187596797943, + 0.06687251436710358, + 0.06302478927373886, + 0.058677458524703976, + 0.057898998373746874, + 0.05797914127707481, + 0.058545249927043914, + 0.05916902434825897, + 0.05941378560066223, + 0.05825672425031662, + 0.05480920540094376, + 0.05071420597434044, + 0.04744568449258804, + 0.0444792321562767, + 0.042174161130189895, + 0.040468314665555956, + 0.03879091463685036, + 0.03714785648286342, + 0.0352774528324604, + 0.0339755380153656, + 0.032574092012643815, + 0.03123813125193119, + 0.030104083406925202, + 0.029090672388672828, + 0.028430724573135377, + 0.02767248264551163, + 0.026718193304538725, + 0.02616673924922943, + 0.025693943455815316, + 0.02513220482468605, + 0.024545501339435578, + 0.024053472316265107, + 0.023506799945235253, + 0.022811067420244215, + 0.02227019665837288, + 0.021723036986589433, + 0.021250531101226808, + 0.020513180258870126, + 0.020106326079368592, + 0.019632608953118323, + 0.01921781920492649, + 0.01884053735435009, + 0.0183342476695776, + 0.01785229898095131, + 0.01749335871487856, + 0.01714705436229706, + 0.016820847728848457, + 0.016439079593122005, + 0.016118293267488478, + 0.015841090542078017, + 0.015672565352916716, + 0.015245961971580983, + 0.01504119263291359, + 0.014731109365820885 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8497925996780396, + 0.4692588150501251, + 0.1727459728717804, + 0.1467132717370987, + 0.13944602012634277, + 0.1262509524822235, + 0.13373470306396484, + 0.13821429014205933 + ], + "perturbation_rho": [ + 0.7623768448829651, + 0.4223487377166748, + 0.18194836378097534, + 0.12129966914653778, + 0.11680327355861664, + 0.15588274598121643, + 0.1260674148797989, + 0.06604740768671036 + ], + "nudging": { + "0.001": [ + -0.026710381731390953, + -0.001401002169586718, + -0.00036633311538025737, + -0.0002976981922984123, + -0.0002801758237183094, + -0.00026074639754369855, + -0.00026977190282195807, + -0.000280526204733178 + ], + "0.003": [ + -0.0777532160282135, + -0.004196057096123695, + -0.0010983950924128294, + -0.0008932030177675188, + -0.0008403125102631748, + -0.0007819668389856815, + -0.0008093866053968668, + -0.000841516419313848 + ], + "0.01": [ + -0.23203837871551514, + -0.013907128013670444, + -0.0036564678885042667, + -0.0029728016816079617, + -0.0027978671714663506, + -0.0026036568451672792, + -0.002694307826459408, + -0.0028012352995574474 + ] + }, + "state_pred_error_per_layer": [ + 10530.408203125, + 8501.392578125, + 5819.005859375, + 4775.642578125, + 4112.55224609375, + 3853.83984375, + 4342.64697265625, + 3851.865478515625 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.159124858665466, + 1.116624098110199, + 0.7056743051528931, + 0.5761039943695069, + 0.5095945714950562, + 0.45241021232604983, + 0.46948385772705076, + 0.4793232214689255, + 0.4545422805786133, + 0.5009335787773133, + 0.5597627540111542, + 0.5120361625671387, + 0.5355229542732238, + 0.6279539004325867, + 0.5660819525957107, + 0.5390582748413086, + 0.5889693227291107, + 0.603074467754364, + 0.6584024600982666, + 0.695176156425476, + 0.7920763175964356, + 0.8451283014297485, + 0.8484785719871522, + 0.843716569519043, + 1.014335894203186, + 0.8687970887184143, + 1.0127446592330933, + 1.028154598236084, + 0.9810158153533935, + 0.9665016010284424, + 0.9403284704208374, + 1.0873604711532592, + 1.0908284931182861, + 1.0630552332878114, + 0.9850875625610351, + 1.127894623565674, + 1.1809495683670044, + 1.267158783340454, + 1.287852244567871, + 1.2246507026672364, + 1.2201649879455567, + 1.2201611038208007, + 1.1973112880706787, + 1.234057978248596, + 1.293443548965454, + 1.4402172996520997, + 1.2406691700935364, + 1.2519098442077636, + 1.2208334053039551, + 1.1873869004249573, + 1.177197998905182, + 1.2070206604003906, + 1.299656178665161, + 1.2269725717544555, + 1.1528090390205383, + 1.241765862083435, + 1.1921624895095826, + 1.19609040851593, + 1.167593807220459, + 1.1653289527893067, + 1.164765244102478, + 1.1514347393035889, + 1.158220820236206, + 1.1662875720024108, + 1.1485121864318848, + 1.150432911491394, + 1.1496048480987549, + 1.1453266424179078, + 1.1356859375, + 1.130746061706543, + 1.1316118362426757, + 1.1427904190063476, + 1.132000608253479, + 1.1233850655555726, + 1.1215381189346314, + 1.1214420713424682, + 1.120496761703491, + 1.1187861232757568, + 1.116937138557434, + 1.1163992111206054 + ], + "train_acc": [ + 0.2167, + 0.5976, + 0.7344, + 0.7845, + 0.807, + 0.8282, + 0.8255, + 0.8259, + 0.8331, + 0.8246, + 0.8176, + 0.8301, + 0.8268, + 0.8182, + 0.83, + 0.8362, + 0.8275, + 0.8307, + 0.8192, + 0.8176, + 0.796, + 0.7974, + 0.7834, + 0.7904, + 0.7608, + 0.7847, + 0.7592, + 0.7589, + 0.7547, + 0.7537, + 0.7488, + 0.7186, + 0.712, + 0.7016, + 0.7044, + 0.6673, + 0.6646, + 0.6502, + 0.6499, + 0.6509, + 0.6413, + 0.6409, + 0.6468, + 0.6369, + 0.6236, + 0.5994, + 0.6256, + 0.6259, + 0.6301, + 0.6327, + 0.6351, + 0.6208, + 0.6045, + 0.6189, + 0.6294, + 0.6101, + 0.6179, + 0.6152, + 0.6228, + 0.6201, + 0.6207, + 0.6207, + 0.6233, + 0.6191, + 0.6268, + 0.6248, + 0.6259, + 0.6253, + 0.6282, + 0.6274, + 0.6285, + 0.6264, + 0.6291, + 0.6292, + 0.6309, + 0.631, + 0.6336, + 0.6315, + 0.6322, + 0.6325 + ], + "test_acc": [ + 0.429, + 0.661, + 0.72, + 0.753, + 0.7785, + 0.7805, + 0.7985, + 0.7795, + 0.799, + 0.743, + 0.7975, + 0.784, + 0.794, + 0.765, + 0.7915, + 0.7625, + 0.786, + 0.7555, + 0.773, + 0.765, + 0.735, + 0.747, + 0.729, + 0.6775, + 0.7295, + 0.7225, + 0.737, + 0.7245, + 0.6875, + 0.697, + 0.6295, + 0.6765, + 0.6965, + 0.6915, + 0.6605, + 0.5695, + 0.615, + 0.52, + 0.578, + 0.6125, + 0.6, + 0.586, + 0.566, + 0.5905, + 0.5365, + 0.5565, + 0.5745, + 0.5445, + 0.5685, + 0.5815, + 0.586, + 0.5445, + 0.5635, + 0.5835, + 0.5705, + 0.5875, + 0.588, + 0.582, + 0.6175, + 0.615, + 0.604, + 0.595, + 0.594, + 0.6065, + 0.6115, + 0.619, + 0.6105, + 0.6105, + 0.6135, + 0.6125, + 0.6035, + 0.6105, + 0.6155, + 0.6155, + 0.6155, + 0.615, + 0.6185, + 0.6165, + 0.615, + 0.616 + ], + "value_loss": [ + 2.923849702453613, + 0.929932203578949, + 0.986256123161316, + 0.9705767082214356, + 0.9187479806900024, + 0.8046257507324219, + 0.8280020093917847, + 0.7600664526283741, + 0.6512299965858459, + 0.8722499349117279, + 1.0144303213119508, + 0.9696790258407593, + 1.047098385667801, + 1.3836800573349, + 1.172448957824707, + 1.1310886909484863, + 1.2517949352741242, + 1.449119287109375, + 1.541891334915161, + 1.8401317022323609, + 2.2931220562934875, + 2.6332393630981445, + 2.376218652820587, + 2.4431817691802977, + 3.0396681418418883, + 2.5404992835998534, + 2.9912292552947997, + 2.9550719177246094, + 2.845018405532837, + 2.3893951858520506, + 2.2559028842926026, + 2.5913971235752107, + 2.1639503829956053, + 1.7991520860671997, + 1.5380361373901368, + 1.6679082988739014, + 1.5880424777507782, + 1.986500718688965, + 1.8443089511871338, + 1.6190284337997436, + 1.5703363037109375, + 1.2268877660751343, + 1.235842610359192, + 1.3104468950271606, + 1.4912362480163575, + 2.4344917457580566, + 1.5018931139945983, + 1.2203104718208313, + 1.004470736503601, + 0.9335955861091614, + 0.9949490726470948, + 1.0034673252105712, + 1.0283565370559693, + 0.9653127727031707, + 0.7962954003334045, + 0.8769395300865174, + 0.8055619871139527, + 0.8671702852249146, + 0.7559805934906005, + 0.7425107782363891, + 0.7403785936832428, + 0.7167611845016479, + 0.6846619015693665, + 0.6878714230537415, + 0.7193085783004761, + 0.6548016827583313, + 0.7351945478439331, + 0.644631478023529, + 0.7197158195495605, + 0.6618418259859085, + 0.6821243083953857, + 0.6612376468658447, + 0.6439533136367798, + 0.5963960872650147, + 0.6086718690872193, + 0.599690711593628, + 0.5913591928482056, + 0.6202077602386474, + 0.5772844911575318, + 0.5891867377281189 + ], + "term_loss": [ + 1.6957895690917968, + 0.6753802593231201, + 0.831247025680542, + 0.8390384925842285, + 0.7965053218841552, + 0.6833916404724121, + 0.6818313911437989, + 0.608198171555996, + 0.5294004390478134, + 0.7458023294448852, + 0.8792923537254334, + 0.8413159708023071, + 0.9142087742328644, + 1.2399149011611938, + 1.0347518908500672, + 1.0019392091751098, + 1.1087773736953734, + 1.3111861721038818, + 1.3899584873199462, + 1.6716829993247986, + 2.086436320781708, + 2.397855037689209, + 2.1204052381515504, + 2.1729405517578124, + 2.6674406289100645, + 2.2249885496139528, + 2.6019367149353028, + 2.5479478713989256, + 2.400313151931763, + 2.024853038024902, + 1.8821177783966065, + 2.1543995948791506, + 1.7860287817955016, + 1.452260116672516, + 1.2173033016204835, + 1.3191343141555787, + 1.2516821141004562, + 1.617408494567871, + 1.4755853931427, + 1.2719025758743285, + 1.2177997756958008, + 0.8933947921752929, + 0.8899640788078308, + 0.9326346119403839, + 1.1148540426254272, + 1.898148253440857, + 1.12082442278862, + 0.8921917255401611, + 0.7068623620986938, + 0.6389377068519593, + 0.6924788676023483, + 0.695777419424057, + 0.7078803710460663, + 0.6601581328392029, + 0.5033305398464203, + 0.570631118297577, + 0.5162732218742371, + 0.5679329143404961, + 0.4729079250335693, + 0.461714194560051, + 0.46249124987125395, + 0.44334709153175356, + 0.4196650380134582, + 0.42120836625099184, + 0.44739498138427736, + 0.39437385370731354, + 0.46137346267700197, + 0.38239081733226776, + 0.450170348739624, + 0.4020174507200718, + 0.41444856939315794, + 0.3969281505584717, + 0.3867944943904877, + 0.34640119657516477, + 0.3521443841457367, + 0.3458197787284851, + 0.3377646032333374, + 0.3608278916358948, + 0.3261510276794434, + 0.3338063308954239 + ], + "bridge_loss": [ + 0.9423020985943266, + 0.05520812346786261, + 0.004487565135210752, + 0.002620925185829401, + 0.0048334262125194075, + 0.01594426441192627, + 0.03671039479970932, + 0.03975842403247953, + 0.015591624838858844, + 0.013291598454117775, + 0.01565677783973515, + 0.01498264015391469, + 0.01737629879415035, + 0.0184465979129076, + 0.018480844482779504, + 0.015960913228988648, + 0.024468728888779878, + 0.019229955610632895, + 0.02615500204563141, + 0.03635306806564331, + 0.059548058903217314, + 0.0856127993106842, + 0.10532212686538696, + 0.12074549732208252, + 0.20261099276542663, + 0.16408356733322144, + 0.21867822751998903, + 0.2356453148841858, + 0.272574133682251, + 0.19159529037475587, + 0.2004289361476898, + 0.24411858590841293, + 0.1787075509786606, + 0.14301152968406677, + 0.12255135390758515, + 0.13008755064010621, + 0.11080655341148377, + 0.13113918704390526, + 0.12944001140594483, + 0.1129146324634552, + 0.1154842409491539, + 0.09431586592197418, + 0.11188051323890685, + 0.13759187079668045, + 0.12995593395233154, + 0.27678604226112363, + 0.141656518304348, + 0.08655073091983795, + 0.05993868888616562, + 0.059859430432319644, + 0.06892287590354682, + 0.06750806963741779, + 0.06865553792715072, + 0.061588749042153355, + 0.05957540009617805, + 0.061613469922542574, + 0.05206717085838318, + 0.05907755357027054, + 0.04743152441978454, + 0.04469682623147964, + 0.04149307833611965, + 0.03929951223134995, + 0.030610716843605043, + 0.02995092202425003, + 0.0383457456946373, + 0.026008895072340964, + 0.040196093106269835, + 0.028685746616125107, + 0.03815972879528999, + 0.028288117049634458, + 0.03641813113093376, + 0.03163274981975556, + 0.026057027128338815, + 0.019867237696051598, + 0.02672082303762436, + 0.024199049031734466, + 0.024270879930257797, + 0.030186125880479812, + 0.02228136167526245, + 0.026477533173561097 + ], + "tgrad_loss": [ + 0.2857580623626709, + 0.19934382581710816, + 0.15052154083251953, + 0.1289172974586487, + 0.11740923545360565, + 0.10528984839916229, + 0.10946023015975952, + 0.11210985959172248, + 0.10623793400526046, + 0.11315601377487183, + 0.11948118734359742, + 0.11338041863441467, + 0.11551330276727677, + 0.1253185605764389, + 0.11921620997786522, + 0.1131885776758194, + 0.11854884642362594, + 0.1187031536102295, + 0.12577785356044768, + 0.13209564628601075, + 0.1471376781463623, + 0.14977150740623474, + 0.15049127151966096, + 0.14949570622444153, + 0.16961653110980987, + 0.15142717978954315, + 0.170614333486557, + 0.17147873260974883, + 0.17213111686706542, + 0.17294686603546142, + 0.1733561895608902, + 0.19287895803451538, + 0.19921406044960022, + 0.20388044509887696, + 0.1981814912080765, + 0.21868645486831664, + 0.22555380930900573, + 0.23795305459499358, + 0.2392835365533829, + 0.23421121506690978, + 0.2370522943496704, + 0.2391770931005478, + 0.23399802966117858, + 0.24022042050361633, + 0.24642628200054167, + 0.25955745730400087, + 0.23941217505931855, + 0.24156801874637604, + 0.23766968197822572, + 0.2347984517812729, + 0.23354733331203462, + 0.24018183145523073, + 0.25182062857151033, + 0.24356588566303253, + 0.2333894602775574, + 0.24469494655132293, + 0.23722159390449524, + 0.2401598274230957, + 0.2356411437034607, + 0.23609975414276124, + 0.23639426271915437, + 0.23411457405090333, + 0.23438614721298218, + 0.2367121321439743, + 0.23356784496307373, + 0.23441893281936646, + 0.2336249945640564, + 0.23355491318702698, + 0.23138573913574217, + 0.23153626589775086, + 0.23125760569572448, + 0.2326767508506775, + 0.2311017912387848, + 0.23012765417099, + 0.22980666117668153, + 0.22967188897132873, + 0.2293237120628357, + 0.22919374046325683, + 0.22885210227966307, + 0.2289028725862503 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.0006081201136112213, + 0.13602128624916077, + 0.1264307200908661, + 0.13147516548633575, + 0.14721693098545074, + 0.1274956315755844, + 0.13849349319934845, + 0.1316969096660614 + ], + "perturbation_rho": [ + 0.0121258944272995, + 0.21904222667217255, + 0.23992177844047546, + 0.23384322226047516, + 0.24397125840187073, + 0.24230614304542542, + 0.23810306191444397, + 0.1929502785205841 + ], + "nudging": { + "0.001": [ + 0.00011889888992300257, + -0.0009491944219917059, + -0.0008246820652857423, + -0.0008639077423140407, + -0.0009589982801117003, + -0.0008573950035497546, + -0.0009020413272082806, + -0.000869636656716466 + ], + "0.003": [ + 0.00037957681342959404, + -0.00284576159901917, + -0.0024732202291488647, + -0.0025892104022204876, + -0.002875671721994877, + -0.0025729541666805744, + -0.0027035544626414776, + -0.0026109416503459215 + ], + "0.01": [ + 0.0015163691714406013, + -0.009462166577577591, + -0.008223006501793861, + -0.008610539138317108, + -0.009565019980072975, + -0.00855704490095377, + -0.008995135314762592, + -0.008686890825629234 + ] + } + } + } +} \ No newline at end of file diff --git a/results/synth_ladder_v2_lo/synth_a0.25_L8_s456.json b/results/synth_ladder_v2_lo/synth_a0.25_L8_s456.json new file mode 100644 index 0000000..3a9dc65 --- /dev/null +++ b/results/synth_ladder_v2_lo/synth_a0.25_L8_s456.json @@ -0,0 +1,1638 @@ +{ + "bp": { + "log": { + "train_loss": [ + 1.0949109335899354, + 0.4847292046070099, + 0.43074436836242674, + 0.45461450641155243, + 0.3505706082344055, + 0.36935169534683226, + 0.3458066239833832, + 0.31260078072547914, + 0.3468876272201538, + 0.3495961265563965, + 0.3303800414800644, + 0.27149379975795745, + 0.2737216544628143, + 0.2767748848438263, + 0.2736096446037293, + 0.2938991106033325, + 0.2582871003627777, + 0.23739801230430602, + 0.2594614781618118, + 0.2630785707592964, + 0.2056863129377365, + 0.21809959688186645, + 0.24221352519989015, + 0.256286201775074, + 0.202121930706501, + 0.190755042886734, + 0.21771411544084548, + 0.1782619017124176, + 0.21908559448719025, + 0.18661829199790955, + 0.20600177307128906, + 0.18073079323768615, + 0.17271925398111343, + 0.1645322194814682, + 0.1671620917201042, + 0.15773158494234085, + 0.14472428426742553, + 0.14567419674396515, + 0.1518403840482235, + 0.13865896134376526, + 0.15951423366069795, + 0.16939479804039, + 0.13950223712921142, + 0.14568773169517518, + 0.1383738743185997, + 0.12232284970879555, + 0.1139566089630127, + 0.12166086977720261, + 0.11700058321952819, + 0.13092280693054198, + 0.12311471049785613, + 0.1198555045902729, + 0.1059309095799923, + 0.10063771556615829, + 0.09875465431213379, + 0.0968073558807373, + 0.10243437190055847, + 0.1019424331665039, + 0.0980549189567566, + 0.09463337656855583, + 0.08827412815093993, + 0.09218352751731873, + 0.08814562564194202, + 0.08469899677038192, + 0.083780100274086, + 0.08465643609762191, + 0.08265884437561036, + 0.08110810294151306, + 0.08215825154781342, + 0.07948198096752167, + 0.0788882690012455, + 0.07769866117238998, + 0.07724723608493805, + 0.07669834134578705, + 0.07622871665954589, + 0.07581909760832786, + 0.0755586281299591, + 0.07532668962180615, + 0.07521152381747961, + 0.07513501325845719 + ], + "train_acc": [ + 0.6208, + 0.8105, + 0.8295, + 0.8228, + 0.861, + 0.8558, + 0.8613, + 0.8739, + 0.8607, + 0.8631, + 0.8716, + 0.8908, + 0.8919, + 0.8925, + 0.8897, + 0.8837, + 0.8947, + 0.9068, + 0.8986, + 0.8962, + 0.9213, + 0.9183, + 0.9035, + 0.8971, + 0.9201, + 0.9259, + 0.9141, + 0.9322, + 0.9137, + 0.9271, + 0.9188, + 0.929, + 0.9344, + 0.9371, + 0.9353, + 0.9418, + 0.9461, + 0.9471, + 0.9438, + 0.9501, + 0.9409, + 0.933, + 0.9498, + 0.9473, + 0.9488, + 0.9564, + 0.9626, + 0.9572, + 0.9603, + 0.9521, + 0.9553, + 0.9586, + 0.9663, + 0.9705, + 0.9704, + 0.9724, + 0.9684, + 0.9697, + 0.97, + 0.971, + 0.9757, + 0.9731, + 0.9765, + 0.9777, + 0.9791, + 0.9795, + 0.9788, + 0.9812, + 0.9801, + 0.9815, + 0.9821, + 0.9826, + 0.9825, + 0.9832, + 0.9837, + 0.9842, + 0.9842, + 0.9844, + 0.9843, + 0.9844 + ], + "test_acc": [ + 0.781, + 0.8165, + 0.803, + 0.831, + 0.83, + 0.8365, + 0.849, + 0.8495, + 0.8445, + 0.8555, + 0.841, + 0.851, + 0.854, + 0.859, + 0.858, + 0.8525, + 0.858, + 0.8685, + 0.863, + 0.8625, + 0.8595, + 0.8605, + 0.8715, + 0.8585, + 0.872, + 0.8785, + 0.878, + 0.869, + 0.8685, + 0.8765, + 0.8655, + 0.8735, + 0.878, + 0.874, + 0.8755, + 0.878, + 0.879, + 0.878, + 0.868, + 0.8805, + 0.882, + 0.8785, + 0.8765, + 0.882, + 0.8855, + 0.8845, + 0.883, + 0.878, + 0.8845, + 0.885, + 0.888, + 0.8845, + 0.891, + 0.8855, + 0.888, + 0.884, + 0.8925, + 0.885, + 0.889, + 0.8865, + 0.884, + 0.8875, + 0.8875, + 0.891, + 0.8885, + 0.89, + 0.892, + 0.892, + 0.891, + 0.89, + 0.8895, + 0.891, + 0.892, + 0.8895, + 0.891, + 0.89, + 0.892, + 0.8915, + 0.8915, + 0.8915 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.9125592708587646, + 0.9000785946846008, + 0.8909372687339783, + 0.8829550743103027, + 0.8725745677947998, + 0.8661020994186401, + 0.8620940446853638, + 0.8593741059303284 + ], + "perturbation_rho": [ + 0.999998927116394, + 0.9999973177909851, + 0.9999907612800598, + 0.9999756813049316, + 0.9999436140060425, + 0.9999102354049683, + 0.9998818635940552, + 0.9998610019683838 + ], + "nudging": { + "0.001": [ + -0.030986659228801727, + -0.015735935419797897, + -0.008373400196433067, + -0.005039836745709181, + -0.003523369785398245, + -0.0027713021263480186, + -0.002361869905143976, + -0.0021209304686635733 + ], + "0.003": [ + -0.08494532853364944, + -0.045218996703624725, + -0.02457578107714653, + -0.01492589246481657, + -0.010475864633917809, + -0.008255371823906898, + -0.0070428503677248955, + -0.006327956914901733 + ], + "0.01": [ + -0.20531992614269257, + -0.12906500697135925, + -0.07575342804193497, + -0.04753156006336212, + -0.033830925822257996, + -0.02684028074145317, + -0.02297976426780224, + -0.020688600838184357 + ] + } + } + }, + "dfa": { + "log": { + "train_loss": [ + 2.1472257511138917, + 1.1181638860702514, + 0.7151324203491211, + 0.6038463168144226, + 0.5518400527000428, + 0.5422953238487244, + 0.4989058882713318, + 0.4734929576873779, + 0.5084627376556397, + 0.4886077699661255, + 0.5376619051456452, + 0.5474570850968361, + 0.554305893278122, + 0.5202565354347229, + 0.5240337833404541, + 0.5723548680782318, + 0.6057423986911774, + 0.6335679130554199, + 0.8334042789459228, + 0.6510819962501526, + 0.6476377725601197, + 0.9512515480041503, + 0.7544872245788574, + 0.7667170840382576, + 0.6804751989364624, + 0.6523664590835572, + 0.71346335105896, + 0.7457666255950928, + 0.8066830569267273, + 0.8132523374557495, + 0.6988166690826416, + 0.7388166641235352, + 0.754392647600174, + 0.5883678845405579, + 0.6688721237182618, + 0.6476173947811127, + 0.5539654819488525, + 0.5816531999588013, + 0.6078351530075073, + 0.6152278907775879, + 0.5529029175758362, + 0.5301448690414429, + 0.7110752467155457, + 0.5810994925498962, + 0.6101164865493774, + 0.5994223709389568, + 0.5442744667053223, + 0.6995502103805542, + 0.5148768998146057, + 0.5037326128482819, + 0.5214518201351166, + 0.5883345391273499, + 0.4768081897497177, + 0.5068866291046142, + 0.4764488230466843, + 0.45946760578155516, + 0.49770396411418916, + 0.43602915906906126, + 0.4487738832473755, + 0.4659734072804451, + 0.41908207817077636, + 0.46179782333374025, + 0.48253716304302213, + 0.3953704214572906, + 0.40171479530334475, + 0.42950227117538453, + 0.4127807888507843, + 0.3889078040599823, + 0.38612646083831786, + 0.38572493505477906, + 0.39088242225646974, + 0.3806451151371002, + 0.3771796305656433, + 0.37747309465408324, + 0.37728043706417086, + 0.37282773838043215, + 0.371367804813385, + 0.37083925895690917, + 0.36894340143203735, + 0.3683408546447754 + ], + "train_acc": [ + 0.2179, + 0.5936, + 0.7332, + 0.7781, + 0.7909, + 0.7968, + 0.8133, + 0.8234, + 0.8206, + 0.8287, + 0.8186, + 0.8215, + 0.8234, + 0.8267, + 0.8339, + 0.8278, + 0.8222, + 0.8158, + 0.791, + 0.8208, + 0.8186, + 0.7826, + 0.8065, + 0.8093, + 0.8194, + 0.8173, + 0.8108, + 0.8069, + 0.7948, + 0.8008, + 0.8137, + 0.8097, + 0.8044, + 0.8357, + 0.8234, + 0.8159, + 0.8369, + 0.8315, + 0.8232, + 0.8249, + 0.8354, + 0.8357, + 0.8055, + 0.8279, + 0.8258, + 0.8286, + 0.8311, + 0.806, + 0.8408, + 0.8408, + 0.8354, + 0.826, + 0.8485, + 0.8387, + 0.8468, + 0.8497, + 0.8422, + 0.8578, + 0.8495, + 0.8476, + 0.8598, + 0.8518, + 0.8443, + 0.8643, + 0.8624, + 0.854, + 0.8613, + 0.8654, + 0.8629, + 0.8669, + 0.8666, + 0.8697, + 0.869, + 0.8706, + 0.8686, + 0.869, + 0.8703, + 0.8691, + 0.872, + 0.8716 + ], + "test_acc": [ + 0.4355, + 0.66, + 0.725, + 0.7475, + 0.753, + 0.7685, + 0.753, + 0.7735, + 0.7605, + 0.762, + 0.7605, + 0.7725, + 0.796, + 0.7935, + 0.7745, + 0.7835, + 0.7695, + 0.684, + 0.728, + 0.7755, + 0.6765, + 0.7445, + 0.7595, + 0.779, + 0.7925, + 0.7355, + 0.7405, + 0.7515, + 0.7255, + 0.745, + 0.7365, + 0.717, + 0.778, + 0.737, + 0.746, + 0.805, + 0.791, + 0.769, + 0.7555, + 0.7715, + 0.769, + 0.721, + 0.78, + 0.715, + 0.8, + 0.7675, + 0.7165, + 0.796, + 0.783, + 0.7555, + 0.7335, + 0.7535, + 0.788, + 0.778, + 0.803, + 0.775, + 0.8035, + 0.7955, + 0.8055, + 0.809, + 0.7985, + 0.7825, + 0.8125, + 0.811, + 0.803, + 0.809, + 0.8145, + 0.8145, + 0.8115, + 0.81, + 0.806, + 0.815, + 0.8145, + 0.811, + 0.817, + 0.8105, + 0.817, + 0.814, + 0.815, + 0.8165 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.023487910628318787, + 0.16097302734851837, + 0.15321409702301025, + 0.08171598613262177, + 0.09132305532693863, + 0.0943714827299118, + 0.12134475260972977, + 0.11624611914157867 + ], + "perturbation_rho": [ + 0.006953349336981773, + 0.2090909481048584, + 0.23601846396923065, + 0.09328415989875793, + 0.10916170477867126, + 0.12872634828090668, + 0.15839380025863647, + 0.12173644453287125 + ], + "nudging": { + "0.001": [ + -0.0014989380724728107, + -0.0006578433676622808, + -0.0004933524178341031, + -0.0002418495569145307, + -0.00026780457119457424, + -0.0002914518117904663, + -0.000365283340215683, + -0.0003465903864707798 + ], + "0.003": [ + -0.004386726301163435, + -0.0019725339952856302, + -0.0014801708748564124, + -0.0007235509110614657, + -0.0008033128106035292, + -0.0008723997161723673, + -0.0010960788931697607, + -0.0010392360854893923 + ], + "0.01": [ + -0.013351024128496647, + -0.0065501369535923, + -0.004914519842714071, + -0.002402292797341943, + -0.002674146555364132, + -0.0028969072736799717, + -0.0036479653790593147, + -0.0034563695080578327 + ] + } + } + }, + "state_bridge": { + "log": { + "train_loss": [ + 1.6647419631958007, + 0.8504678049087524, + 0.6401122513771057, + 0.7083625171422958, + 0.7786526877403259, + 0.8720651931762695, + 0.9595140518188476, + 0.9861429462432861, + 0.9323599586486816, + 0.899129944229126, + 0.9279530187606811, + 0.8897452385902405, + 0.8938479597091675, + 0.8638220300674438, + 0.906347576713562, + 0.9050836343765258, + 0.8499874663829804, + 0.8411240774154664, + 0.8651394706249237, + 0.877176913356781, + 0.9522077980041503, + 0.9844632266044616, + 1.0108419298648834, + 0.9732825290679932, + 0.9338093704223632, + 0.9332979538917542, + 0.9276250453948974, + 0.9219045547485352, + 0.9317381838798523, + 0.9388368021011353, + 0.9790681660652161, + 0.9454907520294189, + 0.874178562927246, + 0.8427179465293885, + 0.8024572835922241, + 0.782051385307312, + 0.7510771628379822, + 0.7354073734283447, + 0.72446195602417, + 0.712243512916565, + 0.6917177545070649, + 0.6669502945899963, + 0.6513918544769287, + 0.6493661358833313, + 0.6412696421146393, + 0.6218226390838623, + 0.6146662407398223, + 0.6020424173355102, + 0.5983524523258209, + 0.5852884603500366, + 0.5948307316303253, + 0.598827698802948, + 0.5685866483688354, + 0.5605341876983643, + 0.5632628833770752, + 0.5427094759941101, + 0.5527820866823197, + 0.5406645874023438, + 0.5380706032276154, + 0.5333420150756836, + 0.5350062875747681, + 0.5249489510059356, + 0.5230996351242065, + 0.518796358013153, + 0.5124730639457703, + 0.5120888554573059, + 0.5096150938987732, + 0.5075559856414795, + 0.501591455078125, + 0.5030227668762207, + 0.5024164155960082, + 0.49786798992156983, + 0.49755160512924196, + 0.4957347078323364, + 0.49382514634132385, + 0.49241347570419314, + 0.491490665435791, + 0.4910508768081665, + 0.49063307988643645, + 0.49045275707244873 + ], + "train_acc": [ + 0.3852, + 0.6815, + 0.7626, + 0.7563, + 0.7446, + 0.7077, + 0.6719, + 0.6615, + 0.669, + 0.6782, + 0.6744, + 0.6783, + 0.6715, + 0.6817, + 0.6797, + 0.6778, + 0.6958, + 0.6924, + 0.6897, + 0.69, + 0.6764, + 0.6675, + 0.6555, + 0.6655, + 0.6802, + 0.6835, + 0.6881, + 0.6877, + 0.6863, + 0.6786, + 0.669, + 0.6783, + 0.7029, + 0.709, + 0.723, + 0.7296, + 0.7405, + 0.7436, + 0.7473, + 0.7544, + 0.7569, + 0.7609, + 0.7668, + 0.771, + 0.7733, + 0.7793, + 0.7802, + 0.7834, + 0.7873, + 0.7864, + 0.7863, + 0.7854, + 0.7935, + 0.7963, + 0.7942, + 0.8024, + 0.7976, + 0.8062, + 0.801, + 0.8054, + 0.806, + 0.8117, + 0.8073, + 0.8106, + 0.8125, + 0.8107, + 0.8135, + 0.8147, + 0.8131, + 0.8137, + 0.8118, + 0.8165, + 0.8167, + 0.8162, + 0.8171, + 0.8168, + 0.817, + 0.8161, + 0.8167, + 0.8165 + ], + "test_acc": [ + 0.5895, + 0.708, + 0.7305, + 0.718, + 0.6995, + 0.656, + 0.6345, + 0.6525, + 0.659, + 0.672, + 0.665, + 0.6575, + 0.6675, + 0.6645, + 0.643, + 0.657, + 0.672, + 0.659, + 0.644, + 0.6275, + 0.6365, + 0.616, + 0.6285, + 0.651, + 0.6335, + 0.652, + 0.668, + 0.667, + 0.657, + 0.636, + 0.6035, + 0.658, + 0.681, + 0.6835, + 0.686, + 0.714, + 0.7165, + 0.7065, + 0.71, + 0.7185, + 0.7315, + 0.722, + 0.733, + 0.7315, + 0.734, + 0.746, + 0.7475, + 0.7435, + 0.7505, + 0.7365, + 0.748, + 0.7485, + 0.7465, + 0.7505, + 0.758, + 0.75, + 0.7545, + 0.7575, + 0.7535, + 0.7565, + 0.7515, + 0.764, + 0.7645, + 0.762, + 0.755, + 0.761, + 0.76, + 0.764, + 0.7615, + 0.759, + 0.7635, + 0.7625, + 0.7655, + 0.761, + 0.7635, + 0.7625, + 0.7665, + 0.7665, + 0.7655, + 0.765 + ], + "state_pred_error": [ + 0.666967880153656, + 0.18810060460567474, + 0.13576818842887878, + 0.14196736080646516, + 0.16910594053268432, + 0.18899600715637208, + 0.19789577519893647, + 0.1905871472120285, + 0.18007886242866517, + 0.183910342335701, + 0.17881940922737122, + 0.1657484854698181, + 0.15431137666702271, + 0.14170081236362458, + 0.11855407935380936, + 0.100713077044487, + 0.08262610825300216, + 0.071003964304924, + 0.06459200706481934, + 0.062030674529075625, + 0.05962726338505745, + 0.06061183754205704, + 0.06133104244470596, + 0.06565195535421371, + 0.07003685694932937, + 0.07149426869153977, + 0.06879985384941101, + 0.06506773626804352, + 0.06144233440756798, + 0.05944625381231308, + 0.05934193442463875, + 0.06134367787837982, + 0.06049462513923645, + 0.057841612052917483, + 0.05770603183507919, + 0.05773961628675461, + 0.05772487918138504, + 0.05778447321653366, + 0.05642248193621635, + 0.0548339217543602, + 0.054051065188646316, + 0.050993192440271375, + 0.04841424728631973, + 0.045887135040760044, + 0.04289465088248253, + 0.04155976050496101, + 0.03856938924193382, + 0.03695869625508785, + 0.03501249846816063, + 0.03372661825418472, + 0.032175442039966584, + 0.030927191516757012, + 0.029651006668806077, + 0.029181170132756232, + 0.027786281275749208, + 0.027118772795796393, + 0.0260584001660347, + 0.025425236290693282, + 0.02490214566588402, + 0.023908728045225144, + 0.02325147164463997, + 0.022880420464277268, + 0.022282150906324388, + 0.021651219779253005, + 0.021038192823529242, + 0.020666827112436295, + 0.02006532666683197, + 0.01985739969611168, + 0.01912949861586094, + 0.01871727731227875, + 0.018331202378869055, + 0.017995913481712342, + 0.017765129128098488, + 0.017534943899512292, + 0.01711267368197441, + 0.016710035815835, + 0.016524365159869193, + 0.01614697908014059, + 0.015827153462171555, + 0.015557444103062153 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.8715300559997559, + 0.44268321990966797, + 0.14538408815860748, + 0.1153520941734314, + 0.09680549800395966, + 0.08768410980701447, + 0.08654746413230896, + 0.08166047930717468 + ], + "perturbation_rho": [ + 0.7710200548171997, + 0.4253605008125305, + 0.09275925159454346, + 0.09712537378072739, + 0.11123719066381454, + 0.028249293565750122, + 0.05002531409263611, + 0.09535005688667297 + ], + "nudging": { + "0.001": [ + -0.025821710005402565, + -0.0012925827177241445, + -0.0003022191522177309, + -0.00024204532383009791, + -0.00020273974223528057, + -0.00018941261805593967, + -0.0001821343321353197, + -0.000160791736561805 + ], + "0.003": [ + -0.075216144323349, + -0.003872812259942293, + -0.0009075523121282458, + -0.0007258595433086157, + -0.0006082953768782318, + -0.000569098920095712, + -0.0005463344277814031, + -0.0004819876339752227 + ], + "0.01": [ + -0.22555799782276154, + -0.012845459394156933, + -0.003021553158760071, + -0.0024172987323254347, + -0.002025863155722618, + -0.0018953735707327724, + -0.0018195084994658828, + -0.0016054193256422877 + ] + }, + "state_pred_error_per_layer": [ + 7857.92041015625, + 7327.2666015625, + 4158.3056640625, + 3231.240234375, + 3079.712890625, + 2843.65966796875, + 3014.824951171875, + 2904.82080078125 + ] + } + }, + "credit_bridge": { + "log": { + "train_loss": [ + 2.1516085662841795, + 1.1302078254699708, + 0.7157742590904236, + 0.6024308629989624, + 0.546905074596405, + 0.5507895238399506, + 0.507770078086853, + 0.5723479291915894, + 0.5291493295192718, + 0.530247050857544, + 0.5500000329971313, + 0.5253622520446777, + 0.5810077897071838, + 0.6602574828147888, + 0.5861081640243531, + 0.5804183698654175, + 0.717631731414795, + 0.6733690665245056, + 0.675653500366211, + 0.8460637107849122, + 0.7249561440467834, + 0.6630854389190673, + 0.6966967771530151, + 0.8677938482284546, + 0.8909709131240845, + 0.8387028586387635, + 0.8091570913791657, + 0.906946435213089, + 0.9558572208404541, + 1.0380563579559325, + 1.0291303350448608, + 0.985536870956421, + 1.1072970575332641, + 1.191497057914734, + 1.1032887983322144, + 1.2925684661865235, + 1.1835117977142333, + 1.2306733207702636, + 1.2600920732498169, + 1.2520610203742981, + 1.3718467151641847, + 1.299546180343628, + 1.2947479537963866, + 1.2124139470100403, + 1.1786796666145325, + 1.2429542098999022, + 1.342428367805481, + 1.3632954509735107, + 1.394326601409912, + 1.4198039100646973, + 1.3243803089141846, + 1.2885750002861023, + 1.2663284379005433, + 1.2274728206634522, + 1.193252119922638, + 1.1811400798797607, + 1.1389006465911866, + 1.1180383347272873, + 1.1007250593185425, + 1.1166740408420563, + 1.0792887409210206, + 1.0779459671020508, + 1.0732033897399902, + 1.054119002532959, + 1.0764888476371766, + 1.0661647203445435, + 1.058880652999878, + 1.0551886323928834, + 1.056046497440338, + 1.0552716503143311, + 1.0494010009765624, + 1.0550119636535644, + 1.056201064300537, + 1.0538349277496337, + 1.050132991027832, + 1.0496547233581544, + 1.0486548606872559, + 1.047701007938385, + 1.0474303240776062, + 1.047021061706543 + ], + "train_acc": [ + 0.2212, + 0.5907, + 0.7308, + 0.7758, + 0.7896, + 0.7928, + 0.8108, + 0.8008, + 0.8137, + 0.8162, + 0.8178, + 0.8263, + 0.8161, + 0.8022, + 0.8208, + 0.8282, + 0.7991, + 0.8151, + 0.8142, + 0.7866, + 0.7994, + 0.8071, + 0.7977, + 0.7624, + 0.7546, + 0.7665, + 0.7632, + 0.7433, + 0.7388, + 0.7253, + 0.7212, + 0.7159, + 0.6863, + 0.6817, + 0.7003, + 0.6803, + 0.6991, + 0.6955, + 0.6914, + 0.7001, + 0.6895, + 0.707, + 0.7028, + 0.7173, + 0.7146, + 0.7094, + 0.703, + 0.7109, + 0.7063, + 0.7053, + 0.7144, + 0.7197, + 0.7183, + 0.7167, + 0.7178, + 0.7184, + 0.7194, + 0.7195, + 0.7224, + 0.7209, + 0.7218, + 0.7237, + 0.7201, + 0.7231, + 0.7198, + 0.7243, + 0.7236, + 0.7241, + 0.7237, + 0.7251, + 0.7258, + 0.725, + 0.7239, + 0.723, + 0.7234, + 0.725, + 0.7251, + 0.7263, + 0.7257, + 0.7255 + ], + "test_acc": [ + 0.4255, + 0.675, + 0.7255, + 0.7725, + 0.762, + 0.751, + 0.778, + 0.735, + 0.755, + 0.7685, + 0.761, + 0.735, + 0.7375, + 0.7705, + 0.758, + 0.742, + 0.7245, + 0.764, + 0.695, + 0.745, + 0.755, + 0.7395, + 0.7355, + 0.6945, + 0.674, + 0.6845, + 0.6755, + 0.678, + 0.6845, + 0.6555, + 0.622, + 0.593, + 0.609, + 0.665, + 0.587, + 0.64, + 0.666, + 0.673, + 0.6695, + 0.6125, + 0.667, + 0.6375, + 0.6595, + 0.6575, + 0.6845, + 0.6485, + 0.6795, + 0.662, + 0.678, + 0.6845, + 0.6945, + 0.6785, + 0.688, + 0.666, + 0.6775, + 0.677, + 0.68, + 0.6775, + 0.673, + 0.6735, + 0.6695, + 0.682, + 0.6805, + 0.672, + 0.679, + 0.68, + 0.68, + 0.6825, + 0.6835, + 0.684, + 0.678, + 0.6755, + 0.682, + 0.6815, + 0.6845, + 0.685, + 0.6845, + 0.685, + 0.684, + 0.6845 + ], + "value_loss": [ + 2.7521291855812073, + 0.9180910070419311, + 0.8582979179382324, + 0.8436930362701416, + 0.744080483007431, + 0.810219680595398, + 0.7408779167175293, + 1.0244855613708497, + 0.9338075798034668, + 0.9276992179870606, + 0.9545603949546814, + 0.9124133073806763, + 1.1960320390701293, + 1.4768843864440917, + 1.2014622128486634, + 1.2761426291465758, + 1.7353202412605286, + 1.597738427257538, + 1.664009200668335, + 2.520654060602188, + 1.7846353689193726, + 1.4181387130737304, + 1.567960523223877, + 2.1403896005630494, + 2.0710450025558473, + 2.0047555275917053, + 1.959375698184967, + 2.184535858440399, + 2.2873155586242677, + 2.613582395553589, + 2.3063468826293945, + 2.0280820404052733, + 2.104402416610718, + 2.331796992111206, + 2.082660633468628, + 3.2120836341857912, + 2.8579379402160643, + 2.9819380401611326, + 3.2815154262542725, + 3.207817875480652, + 3.9281045833587647, + 3.7378572341918948, + 3.226262925720215, + 2.85760545463562, + 2.702269359397888, + 3.051305528640747, + 3.384582984352112, + 3.556245400428772, + 3.523557614135742, + 3.2986526222229005, + 3.235401312828064, + 2.9684787987709047, + 2.55984596824646, + 2.2802002365112304, + 2.024176069641113, + 1.8845641685485839, + 1.6243845146179199, + 1.4509369481086731, + 1.4253486824035644, + 1.6850188645362854, + 1.3281672570228578, + 1.3769848492145538, + 1.2704378549575805, + 1.2368674871444703, + 1.2117203078269958, + 1.3598486577987672, + 1.1672960079193115, + 1.1324042590141297, + 1.099521342945099, + 1.1117371515274048, + 1.0886727264404297, + 1.0962153171539306, + 1.1795017189025878, + 1.028487562084198, + 1.0475894167900086, + 0.9848965644836426, + 1.0609243473052978, + 0.9515016955852509, + 0.9616539595603942, + 0.966836922454834 + ], + "term_loss": [ + 1.6331857077598573, + 0.6622896879196167, + 0.6923012922286987, + 0.6955949920654297, + 0.5951863891124726, + 0.6333560477256774, + 0.5823763307571411, + 0.8590701545715332, + 0.7842735334396362, + 0.7716574224472046, + 0.8035843691825867, + 0.7695848602294922, + 1.042638046836853, + 1.3117044958114623, + 1.0455465385437013, + 1.1260901271820067, + 1.5533305332183838, + 1.4299912959575654, + 1.480502073287964, + 2.2650635835170747, + 1.540359531545639, + 1.1929577346801759, + 1.30778198223114, + 1.8106209615707398, + 1.7491421922683716, + 1.705204432630539, + 1.6608541017055511, + 1.8238994772791863, + 1.968325872039795, + 2.2342521270751954, + 1.8975757331848144, + 1.6534874923706055, + 1.7053577472686767, + 1.9309828533172608, + 1.7079864566802978, + 2.7641860927581785, + 2.395140308761597, + 2.4995895553588867, + 2.768734446144104, + 2.668160421562195, + 3.298172906398773, + 3.190414168548584, + 2.731164476776123, + 2.452812270736694, + 2.2980216970443728, + 2.6289563937187195, + 2.9189215684890746, + 2.9973133351325987, + 2.9566734222412108, + 2.7137685440063475, + 2.6214606603622435, + 2.422599083995819, + 2.051107206630707, + 1.8390387191772462, + 1.621574047088623, + 1.4804828034460544, + 1.2685496507644654, + 1.134537624424696, + 1.1113471033096314, + 1.3307540964603424, + 1.0319458944320679, + 1.0690455146431923, + 0.9753837090969085, + 0.9500243383169175, + 0.9227351568281651, + 1.0575221673965454, + 0.8811252347946167, + 0.8428130342483521, + 0.808463958287239, + 0.8252941177845001, + 0.80270101146698, + 0.8058414526939393, + 0.8659901483535767, + 0.7385568500280381, + 0.7546443981647492, + 0.6945585445404052, + 0.7605190132141113, + 0.6639182449221611, + 0.6647407983541489, + 0.6684003219604492 + ], + "bridge_loss": [ + 0.824764238196658, + 0.044050000402331355, + 0.004939059878140688, + 0.003509629046916962, + 0.010820124721527099, + 0.03611986360549927, + 0.026624655377864837, + 0.020322174452245236, + 0.013476835618913174, + 0.017660238027572633, + 0.013312850216031074, + 0.010752266106009484, + 0.012636999948322772, + 0.013416536007821559, + 0.014395894283056258, + 0.017065528978034854, + 0.01921152206361294, + 0.01755097916126251, + 0.03405968930721283, + 0.07861232693195343, + 0.08290403444468974, + 0.0737902283191681, + 0.10246425478458404, + 0.14190780395269395, + 0.1299729973077774, + 0.1119936275959015, + 0.11465253877639771, + 0.16193265878558158, + 0.11800107536315918, + 0.1624113775730133, + 0.18674517183303832, + 0.1529373960018158, + 0.15484059362411498, + 0.14790502850413323, + 0.13012928190231324, + 0.18545440337657929, + 0.2145381217598915, + 0.23015552363395692, + 0.2567644714832306, + 0.29004801396131513, + 0.37015869626998904, + 0.3029533437252045, + 0.24805833730697632, + 0.171279403924942, + 0.17121260148286818, + 0.18421311897039414, + 0.22017569878101348, + 0.31574616441726683, + 0.3227914002418518, + 0.34028916625976563, + 0.3808541042327881, + 0.31664952936172486, + 0.27961636044979093, + 0.2155075138092041, + 0.17780915865898134, + 0.18149373128414154, + 0.13657517416477202, + 0.0972943355768919, + 0.09725244807600975, + 0.13454232428073884, + 0.08104454445838928, + 0.0946770872026682, + 0.08133374876976013, + 0.0761439936414361, + 0.07479231785237789, + 0.09079816563725472, + 0.07500201788544655, + 0.07952561552673579, + 0.08066166642606258, + 0.07689544649124146, + 0.0765585425376892, + 0.0801964148759842, + 0.10329442504644394, + 0.08053842852115631, + 0.08384852820634842, + 0.08137421063184738, + 0.09204534806013108, + 0.07923152014613151, + 0.08891670184135438, + 0.09051647346019745 + ], + "tgrad_loss": [ + 0.2941792365074158, + 0.2117513240814209, + 0.16105757446289062, + 0.1445884093284607, + 0.1380739703655243, + 0.1407437702894211, + 0.13187693030834197, + 0.14509323680400849, + 0.136057210958004, + 0.13838154821395873, + 0.13766317186355592, + 0.1320761749267578, + 0.14075699508190154, + 0.1517633568048477, + 0.1415197740316391, + 0.13298697410821914, + 0.1627781904220581, + 0.15019614602029324, + 0.14944745190143585, + 0.17697814086675645, + 0.16137181975841522, + 0.15139073028564454, + 0.15771429176330568, + 0.18786082315444946, + 0.19192982950210571, + 0.18755748383998871, + 0.18386906574964523, + 0.1987037330508232, + 0.20098859162330626, + 0.21691890804767608, + 0.22202599787712096, + 0.22165712327957154, + 0.24420409016609193, + 0.2529091139793396, + 0.24454488706588745, + 0.26244310545921323, + 0.24825952727794648, + 0.2521929540634155, + 0.25601649553775785, + 0.24960945417881011, + 0.25977299585342406, + 0.2444897561311722, + 0.247040123963356, + 0.23351378746032714, + 0.23303504986763002, + 0.2381359790325165, + 0.2454857085943222, + 0.2431859058380127, + 0.24409279174804688, + 0.24459490759372712, + 0.23308657684326173, + 0.22923018233776093, + 0.22912240728139877, + 0.22565400907993316, + 0.22479286949634553, + 0.22258763573169707, + 0.21925969200134277, + 0.21910499383211135, + 0.21674911706447603, + 0.21972243776321412, + 0.21517683396339415, + 0.21326224946975708, + 0.21372039403915405, + 0.2106991579055786, + 0.21419283254146576, + 0.21152831535339356, + 0.21116876242160798, + 0.21006561065912246, + 0.21039570956230164, + 0.2095475886583328, + 0.20941317224502565, + 0.21017745037078858, + 0.21021716408729554, + 0.20939228029251097, + 0.2090964959383011, + 0.208963818025589, + 0.20835998804569245, + 0.20835193061828614, + 0.20799646167755126, + 0.20792012577056884 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.005484581924974918, + 0.03739434853196144, + 0.0736197978258133, + 0.10366753488779068, + 0.11266068369150162, + 0.12653732299804688, + 0.11692580580711365, + 0.12426558136940002 + ], + "perturbation_rho": [ + -0.0015162499621510506, + 0.12250564247369766, + 0.22542724013328552, + 0.204342320561409, + 0.2217923402786255, + 0.28867796063423157, + 0.33211782574653625, + 0.23834270238876343 + ], + "nudging": { + "0.001": [ + -4.532912862487137e-05, + -0.0006921375170350075, + -0.0008833008469082415, + -0.0010346387280151248, + -0.0010619328822940588, + -0.0011677223956212401, + -0.001099007437005639, + -0.0011405807454138994 + ], + "0.003": [ + -8.596014231443405e-05, + -0.002077887998893857, + -0.0026466129347682, + -0.003103021765127778, + -0.0031822444871068, + -0.0035020317882299423, + -0.003296034876257181, + -0.0034199936781078577 + ], + "0.01": [ + 0.0002549269702285528, + -0.006913396995514631, + -0.008808376267552376, + -0.010325662791728973, + -0.010591026395559311, + -0.011654841713607311, + -0.010967787355184555, + -0.011380846612155437 + ] + } + } + } +} \ No newline at end of file diff --git a/results/topdown_curriculum/topdown_s42.json b/results/topdown_curriculum/topdown_s42.json new file mode 100644 index 0000000..75523f6 --- /dev/null +++ b/results/topdown_curriculum/topdown_s42.json @@ -0,0 +1,620 @@ +{ + "DFA_only": { + "test_acc": [ + 0.3006, + 0.3039, + 0.2971, + 0.2915, + 0.2946, + 0.3055, + 0.3016, + 0.3071, + 0.2983, + 0.2891, + 0.2938, + 0.3097, + 0.2861, + 0.3091, + 0.3089, + 0.2942, + 0.3116, + 0.2963, + 0.2971, + 0.3065, + 0.3158, + 0.299, + 0.2948, + 0.3057, + 0.2977, + 0.3158, + 0.3065, + 0.2975, + 0.3125, + 0.306, + 0.3041, + 0.2915, + 0.2928, + 0.3004, + 0.3148, + 0.307, + 0.297, + 0.3043, + 0.3047, + 0.3002, + 0.3159, + 0.3159, + 0.3046, + 0.2984, + 0.3016, + 0.3024, + 0.29, + 0.3164, + 0.3004, + 0.3073, + 0.3154, + 0.3014, + 0.3072, + 0.3075, + 0.3181, + 0.2923, + 0.306, + 0.3055, + 0.3096, + 0.3027, + 0.3036, + 0.308, + 0.3097, + 0.3109, + 0.3127, + 0.3129, + 0.3155, + 0.3164, + 0.3102, + 0.3021, + 0.3138, + 0.313, + 0.3097, + 0.3088, + 0.3115, + 0.3157, + 0.3126, + 0.311, + 0.309, + 0.3091, + 0.304, + 0.3102, + 0.311, + 0.3136, + 0.3116, + 0.3114, + 0.3108, + 0.3112, + 0.3152, + 0.3077, + 0.3121, + 0.3119, + 0.3122, + 0.3115, + 0.3114, + 0.3118, + 0.3114, + 0.3116, + 0.3116, + 0.3116 + ], + "train_loss": [ + 2.0318866732025147, + 2.0057224438476564, + 2.000193025856018, + 1.9955825387573243, + 1.9903357116699218, + 1.9887702255249022, + 1.9901456210327149, + 1.9876038012313844, + 1.9891375769424438, + 1.9916579194641113, + 1.9882932608032227, + 1.9864958861541748, + 1.989747982635498, + 1.987270903930664, + 1.9892830609512329, + 1.9896244260025024, + 1.9903675205230713, + 1.9884116526794433, + 1.9885369082641602, + 1.986256969833374, + 1.987841325416565, + 1.9860659005355834, + 1.9870660667419433, + 1.9887021855926514, + 1.9881466793823241, + 1.987437709274292, + 1.9851161840438842, + 1.9871229264068604, + 1.987296971054077, + 1.9865425718688965, + 1.985583653526306, + 1.9873635176086426, + 1.9880531158828736, + 1.986221237449646, + 1.9857749569702148, + 1.9882853355407715, + 1.9866280360412598, + 1.98623606010437, + 1.9872347016906737, + 1.9890095454406738, + 1.987217137069702, + 1.9882683947753905, + 1.9873427893066407, + 1.9894943984985352, + 1.9865683745956422, + 1.9856433502197266, + 1.9884860709381103, + 1.9900159615325927, + 1.9878518949127197, + 1.98708917388916, + 1.9877159860992433, + 1.9865355113220216, + 1.9874952691268921, + 1.988472138748169, + 1.9888839432525636, + 1.9876802584075928, + 1.987925719909668, + 1.9862554049301147, + 1.9863393670272826, + 1.9889370369720458, + 1.9876346451187135, + 1.9845583619689942, + 1.9870499811553954, + 1.987435880508423, + 1.9854575398254395, + 1.985907090988159, + 1.9861144110870361, + 1.9871188342666626, + 1.9862679552841187, + 1.9887662117004394, + 1.9872093386840821, + 1.9860852742004393, + 1.9862465969085694, + 1.986481220550537, + 1.9852113827896118, + 1.9885292751312256, + 1.9848377563476562, + 1.986888662185669, + 1.9864294763183594, + 1.9865412310028077, + 1.985109836578369, + 1.9869044762802124, + 1.984938102722168, + 1.9856962964248657, + 1.9853763344573974, + 1.984437050552368, + 1.984452505493164, + 1.9845013403320313, + 1.9867055741119384, + 1.9862973651123046, + 1.9845818555450438, + 1.9843991091156006, + 1.9876228217315675, + 1.985638127822876, + 1.985604430923462, + 1.9853035695648193, + 1.9835245191192628, + 1.9839755685806275, + 1.9846243866729736, + 1.9842720232391358 + ] + }, + "last1_vec": { + "test_acc": [ + 0.2996, + 0.2995, + 0.2874, + 0.3114, + 0.3014, + 0.3096, + 0.2935, + 0.2923, + 0.3155, + 0.3056, + 0.3004, + 0.2872, + 0.2853, + 0.291, + 0.3082, + 0.317, + 0.2986, + 0.3005, + 0.2981, + 0.2822, + 0.3155, + 0.3121, + 0.2866, + 0.3147, + 0.3044, + 0.3059, + 0.3019, + 0.3007, + 0.2893, + 0.3061, + 0.3006, + 0.3012, + 0.3007, + 0.3062, + 0.3012, + 0.305, + 0.302, + 0.3025, + 0.296, + 0.2943, + 0.2975, + 0.2952, + 0.3073, + 0.2781, + 0.3007, + 0.3103, + 0.3036, + 0.3109, + 0.2965, + 0.2935, + 0.3012, + 0.307, + 0.309, + 0.2976, + 0.3011, + 0.3105, + 0.3039, + 0.2984, + 0.313, + 0.3137, + 0.3102, + 0.3068, + 0.296, + 0.3117, + 0.3032, + 0.3039, + 0.3088, + 0.3125, + 0.3165, + 0.2991, + 0.3058, + 0.2998, + 0.3179, + 0.3081, + 0.3006, + 0.3019, + 0.3059, + 0.3083, + 0.3092, + 0.3014, + 0.3044, + 0.3075, + 0.3085, + 0.3082, + 0.3068, + 0.3119, + 0.3071, + 0.3033, + 0.3095, + 0.3078, + 0.3078, + 0.3069, + 0.307, + 0.3092, + 0.3085, + 0.3083, + 0.3082, + 0.3081, + 0.3081, + 0.3081 + ], + "train_loss": [ + 2.0345643396759034, + 2.007593306617737, + 1.9998018278503418, + 1.9952433186340333, + 1.9938917417907716, + 1.9973094646835328, + 1.9969104711914063, + 1.9995911212921142, + 1.9924495524597168, + 1.9925645765686035, + 1.9936081827545167, + 1.993862791442871, + 1.9945276807403565, + 1.990838291168213, + 1.9927610682678223, + 1.9941217697525024, + 1.995144399986267, + 1.9913808044433594, + 1.9932640390014649, + 1.9948721499633788, + 1.9956926623153686, + 1.9973403372192382, + 1.9956930201721192, + 1.9962473291015626, + 1.9961961763000489, + 1.9938987312316894, + 1.9956984431457518, + 1.9971346160888672, + 1.9966354394149781, + 1.9995288914489746, + 1.9983650937652588, + 1.9960051403045653, + 1.9958921543121337, + 1.9955258317565918, + 1.9948776273345947, + 1.9976185216522218, + 1.994564013519287, + 1.9967529223251343, + 1.9981030158996582, + 1.9956832776641846, + 1.9969297004699706, + 1.9976720545196534, + 1.9958299970245361, + 1.9952620266723633, + 1.9946168762969971, + 1.99689278465271, + 1.9948313019561768, + 1.9961831992340089, + 1.9951787072372436, + 1.9960499554824829, + 1.9968265784454347, + 1.9975163645172118, + 1.9960405737686158, + 1.9958240811157226, + 1.9968332024383544, + 1.9965666370391846, + 1.9963636539077758, + 1.994098582496643, + 1.99495549407959, + 1.9951956588745117, + 1.9939876531219483, + 1.9946656102752685, + 1.9945226171875, + 1.9954966610717773, + 1.9952878218078614, + 1.9937264360046387, + 1.9948365911102295, + 1.9957475348281861, + 1.9963784033203125, + 1.9945422202301026, + 1.9945636574554444, + 1.993820396347046, + 1.9934314541244507, + 1.9957507235717773, + 1.9952685816955567, + 1.9934588801574706, + 1.9946705184936524, + 1.9927675800323486, + 1.9936156246566772, + 1.9922025442886353, + 1.992091411743164, + 1.9946434414672851, + 1.9921832648468019, + 1.991840097732544, + 1.9933607837677, + 1.9934361853027345, + 1.9941805229949952, + 1.9909538430786133, + 1.9926601502227783, + 1.9923504639434815, + 1.9904100805664062, + 1.9942665929794312, + 1.9916087580108643, + 1.9929376037597657, + 1.993217103805542, + 1.9917985494232178, + 1.9935525121688842, + 1.9907185480499268, + 1.9935195531463623, + 1.9910154447174073 + ] + }, + "last2_vec": { + "test_acc": [ + 0.3012, + 0.3003, + 0.2921, + 0.3113, + 0.2986, + 0.3137, + 0.2955, + 0.2918, + 0.3136, + 0.304, + 0.3083, + 0.2868, + 0.2818, + 0.2915, + 0.3106, + 0.3123, + 0.2995, + 0.2991, + 0.3056, + 0.282, + 0.3158, + 0.3107, + 0.2931, + 0.3168, + 0.3071, + 0.3053, + 0.3052, + 0.298, + 0.2901, + 0.3099, + 0.302, + 0.3067, + 0.305, + 0.3113, + 0.3051, + 0.3047, + 0.3043, + 0.3022, + 0.3032, + 0.2933, + 0.3003, + 0.2986, + 0.306, + 0.2826, + 0.3024, + 0.3095, + 0.3052, + 0.3099, + 0.3004, + 0.2972, + 0.3039, + 0.3055, + 0.3112, + 0.3008, + 0.3045, + 0.305, + 0.3044, + 0.3016, + 0.3121, + 0.3126, + 0.3111, + 0.3071, + 0.3027, + 0.3093, + 0.3085, + 0.3039, + 0.3121, + 0.3144, + 0.3145, + 0.303, + 0.3068, + 0.3024, + 0.3163, + 0.3107, + 0.3035, + 0.3075, + 0.3084, + 0.3104, + 0.3084, + 0.3025, + 0.3075, + 0.3076, + 0.3099, + 0.3107, + 0.3059, + 0.311, + 0.311, + 0.3073, + 0.311, + 0.3108, + 0.3087, + 0.3095, + 0.3108, + 0.311, + 0.3102, + 0.3113, + 0.3114, + 0.3113, + 0.3112, + 0.311 + ], + "train_loss": [ + 2.031281905136108, + 2.005962927017212, + 2.0026343697357176, + 2.000767257003784, + 1.9990581035614015, + 2.0019706972503664, + 2.001140174636841, + 2.002223112411499, + 1.9962018842315674, + 1.996555118484497, + 1.9969473624038696, + 1.9968425833511352, + 1.9976266242218017, + 1.9935137711334228, + 1.9940641801452637, + 1.9950864477539063, + 1.9965474452972412, + 1.9931761306381226, + 1.9944369088363647, + 1.995346979598999, + 1.995698737411499, + 1.996963890914917, + 1.9950353164672852, + 1.9954320928955078, + 1.9949085402679443, + 1.9924101929473876, + 1.9947130199432372, + 1.9950336464691163, + 1.995009578514099, + 1.9977039695739747, + 1.9959020367431641, + 1.9945704859161377, + 1.9936733311462402, + 1.992494267730713, + 1.9918036214447021, + 1.9950067366027833, + 1.9921373765563966, + 1.9948427129364015, + 1.9950579411315918, + 1.9927953283691406, + 1.994525142288208, + 1.9950615283203126, + 1.9934100622558595, + 1.9922057833099365, + 1.9917935915374756, + 1.9938205920410157, + 1.9920988291168213, + 1.9936680334472656, + 1.9925702806854249, + 1.993347884902954, + 1.993784471206665, + 1.9949239025115966, + 1.9927586205291747, + 1.9929026107788086, + 1.9937749021911622, + 1.9936894316864013, + 1.9937100197982789, + 1.9910739809799194, + 1.9918444245147706, + 1.9925511100769042, + 1.9910740645980836, + 1.9920696559143067, + 1.991673638534546, + 1.992748865661621, + 1.9925844535064696, + 1.9909471715545655, + 1.9921014580917358, + 1.9932282944107056, + 1.9935813955688477, + 1.9919534191894532, + 1.9918435103607177, + 1.9910840378189087, + 1.9909005782318114, + 1.992844515838623, + 1.992722346343994, + 1.9909247700500488, + 1.9922928537368774, + 1.9899731577301025, + 1.9908007229995728, + 1.9893973681259156, + 1.9895213146209716, + 1.991995177307129, + 1.989802378616333, + 1.989543790664673, + 1.9908066551208496, + 1.9911831595611573, + 1.9918553260040284, + 1.9886195541381837, + 1.9899968502426149, + 1.9898636253356934, + 1.9879634398651123, + 1.9917239908599853, + 1.9890282316589356, + 1.9905873622894288, + 1.9908626733779908, + 1.9894285187149048, + 1.9909917958831786, + 1.9881667736434936, + 1.9911110680770874, + 1.9885739231109618 + ] + } +} \ No newline at end of file diff --git a/results/update_swap/update_swap_L4_d256_s42.json b/results/update_swap/update_swap_L4_d256_s42.json new file mode 100644 index 0000000..da8bd60 --- /dev/null +++ b/results/update_swap/update_swap_L4_d256_s42.json @@ -0,0 +1,326 @@ +{ + "dfa_inner_product_k1": { + "credit": "dfa", + "rule": "inner_product", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1798909544944762, + "delta_loss": -0.00035898685455326707, + "delta_acc": 0.002343749999999978 + }, + "dfa_inner_product_k5": { + "credit": "dfa", + "rule": "inner_product", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1801763355731965, + "delta_loss": -7.360577583304106e-05, + "delta_acc": 0.0031249999999999334 + }, + "dfa_inner_product_k20": { + "credit": "dfa", + "rule": "inner_product", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1791145503520966, + "delta_loss": -0.001135390996932939, + "delta_acc": 0.0031249999999999334 + }, + "dfa_target_shift_k1": { + "credit": "dfa", + "rule": "target_shift", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802448272705077, + "delta_loss": -5.1140785217729245e-06, + "delta_acc": 0.0 + }, + "dfa_target_shift_k5": { + "credit": "dfa", + "rule": "target_shift", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.180225706100464, + "delta_loss": -2.42352485655406e-05, + "delta_acc": 0.0 + }, + "dfa_target_shift_k20": { + "credit": "dfa", + "rule": "target_shift", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1801500260829925, + "delta_loss": -9.991526603703171e-05, + "delta_acc": 0.0007812499999999556 + }, + "dfa_cosine_target_k1": { + "credit": "dfa", + "rule": "cosine_target", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802544593811035, + "delta_loss": 4.518032074019018e-06, + "delta_acc": 0.0 + }, + "dfa_cosine_target_k5": { + "credit": "dfa", + "rule": "cosine_target", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802321672439575, + "delta_loss": -1.7774105071977075e-05, + "delta_acc": 0.0 + }, + "dfa_cosine_target_k20": { + "credit": "dfa", + "rule": "cosine_target", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802163660526275, + "delta_loss": -3.357529640202195e-05, + "delta_acc": 0.0 + }, + "scalar_cb_inner_product_k1": { + "credit": "scalar_cb", + "rule": "inner_product", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1847817242145537, + "delta_loss": 0.004531782865524248, + "delta_acc": 0.0 + }, + "scalar_cb_inner_product_k5": { + "credit": "scalar_cb", + "rule": "inner_product", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.217646211385727, + "delta_loss": 0.03739627003669743, + "delta_acc": -0.0015625000000000222 + }, + "scalar_cb_inner_product_k20": { + "credit": "scalar_cb", + "rule": "inner_product", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.599052119255066, + "delta_loss": 0.41880217790603647, + "delta_acc": -0.06093749999999998 + }, + "scalar_cb_target_shift_k1": { + "credit": "scalar_cb", + "rule": "target_shift", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802926063537598, + "delta_loss": 4.266500473026902e-05, + "delta_acc": 0.0 + }, + "scalar_cb_target_shift_k5": { + "credit": "scalar_cb", + "rule": "target_shift", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1803449153900147, + "delta_loss": 9.497404098524065e-05, + "delta_acc": 0.0007812499999999556 + }, + "scalar_cb_target_shift_k20": { + "credit": "scalar_cb", + "rule": "target_shift", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1809070765972138, + "delta_loss": 0.0006571352481843373, + "delta_acc": 0.0015625000000000222 + }, + "scalar_cb_cosine_target_k1": { + "credit": "scalar_cb", + "rule": "cosine_target", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802353382110595, + "delta_loss": -1.4603137969970703e-05, + "delta_acc": 0.0 + }, + "scalar_cb_cosine_target_k5": { + "credit": "scalar_cb", + "rule": "cosine_target", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802433907985688, + "delta_loss": -6.550550460726612e-06, + "delta_acc": 0.0 + }, + "scalar_cb_cosine_target_k20": { + "credit": "scalar_cb", + "rule": "cosine_target", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.180246114730835, + "delta_loss": -3.826618194535669e-06, + "delta_acc": 0.0 + }, + "vec_eT_M4_inner_product_k1": { + "credit": "vec_eT_M4", + "rule": "inner_product", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1842417955398559, + "delta_loss": 0.003991854190826372, + "delta_acc": -0.0015625000000000222 + }, + "vec_eT_M4_inner_product_k5": { + "credit": "vec_eT_M4", + "rule": "inner_product", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.236989963054657, + "delta_loss": 0.05674002170562753, + "delta_acc": -0.025781249999999978 + }, + "vec_eT_M4_inner_product_k20": { + "credit": "vec_eT_M4", + "rule": "inner_product", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.3920087337493896, + "delta_loss": 0.2117587924003601, + "delta_acc": -0.05859375 + }, + "vec_eT_M4_target_shift_k1": { + "credit": "vec_eT_M4", + "rule": "target_shift", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802446365356445, + "delta_loss": -5.304813385009766e-06, + "delta_acc": 0.0 + }, + "vec_eT_M4_target_shift_k5": { + "credit": "vec_eT_M4", + "rule": "target_shift", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1803565859794616, + "delta_loss": 0.0001066446304320845, + "delta_acc": 0.0007812499999999556 + }, + "vec_eT_M4_target_shift_k20": { + "credit": "vec_eT_M4", + "rule": "target_shift", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1805941879749298, + "delta_loss": 0.00034424662590026855, + "delta_acc": 0.0015625000000000222 + }, + "vec_eT_M4_cosine_target_k1": { + "credit": "vec_eT_M4", + "rule": "cosine_target", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802608609199523, + "delta_loss": 1.0919570922807154e-05, + "delta_acc": 0.0 + }, + "vec_eT_M4_cosine_target_k5": { + "credit": "vec_eT_M4", + "rule": "cosine_target", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802728593349456, + "delta_loss": 2.2917985916137695e-05, + "delta_acc": 0.0 + }, + "vec_eT_M4_cosine_target_k20": { + "credit": "vec_eT_M4", + "rule": "cosine_target", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1801955819129943, + "delta_loss": -5.435943603515625e-05, + "delta_acc": 0.0 + }, + "oracle_bp_inner_product_k1": { + "credit": "oracle_bp", + "rule": "inner_product", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1826384663581848, + "delta_loss": 0.002388525009155318, + "delta_acc": 0.002343749999999978 + }, + "oracle_bp_inner_product_k5": { + "credit": "oracle_bp", + "rule": "inner_product", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1915695667266846, + "delta_loss": 0.011319625377655074, + "delta_acc": 0.005468750000000022 + }, + "oracle_bp_inner_product_k20": { + "credit": "oracle_bp", + "rule": "inner_product", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.2219606041908264, + "delta_loss": 0.04171066284179692, + "delta_acc": -0.007031250000000044 + }, + "oracle_bp_target_shift_k1": { + "credit": "oracle_bp", + "rule": "target_shift", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802712082862854, + "delta_loss": 2.1266937255903784e-05, + "delta_acc": 0.0 + }, + "oracle_bp_target_shift_k5": { + "credit": "oracle_bp", + "rule": "target_shift", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1803063929080964, + "delta_loss": 5.645155906686128e-05, + "delta_acc": 0.0 + }, + "oracle_bp_target_shift_k20": { + "credit": "oracle_bp", + "rule": "target_shift", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1803919494152069, + "delta_loss": 0.00014200806617736816, + "delta_acc": 0.0 + }, + "oracle_bp_cosine_target_k1": { + "credit": "oracle_bp", + "rule": "cosine_target", + "k": 1, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802570879459382, + "delta_loss": 7.146596908702563e-06, + "delta_acc": 0.0 + }, + "oracle_bp_cosine_target_k5": { + "credit": "oracle_bp", + "rule": "cosine_target", + "k": 5, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802275061607361, + "delta_loss": -2.2435188293368213e-05, + "delta_acc": 0.0 + }, + "oracle_bp_cosine_target_k20": { + "credit": "oracle_bp", + "rule": "cosine_target", + "k": 20, + "loss_before": 1.1802499413490295, + "loss_after": 1.1802619516849517, + "delta_loss": 1.2010335922241211e-05, + "delta_acc": 0.0 + } +} \ No newline at end of file diff --git a/results/vector_audit/audit_results.json b/results/vector_audit/audit_results.json new file mode 100644 index 0000000..9b37b64 --- /dev/null +++ b/results/vector_audit/audit_results.json @@ -0,0 +1,184 @@ +[ + { + "method": "dfa", + "L": 4, + "seed": 42, + "mean_gamma": 0.012759206583723426, + "mean_rho": 0.010203135898336768, + "mean_nudge": -0.00013293450319906697, + "per_layer_gamma": [ + -0.005139289423823357, + 0.008053570054471493, + 0.024840975180268288, + 0.02328157052397728 + ], + "per_layer_rho": [ + -0.004372224677354097, + 0.0029046176932752132, + 0.0310027077794075, + 0.011277442798018456 + ], + "per_layer_nudge": [ + 0.0003250446170568466, + -0.0001853172725532204, + -0.00036372727481648326, + -0.00030773808248341084 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 42, + "mean_gamma": 0.2243543565273285, + "mean_rho": 0.20948006212711334, + "mean_nudge": -0.007398057030513883, + "per_layer_gamma": [ + 0.23697319626808167, + 0.13470041751861572, + 0.186288982629776, + 0.3394548296928406 + ], + "per_layer_rho": [ + 0.2484399378299713, + 0.1292348951101303, + 0.18184946477413177, + 0.27839595079421997 + ], + "per_layer_nudge": [ + -0.008707698434591293, + -0.004232201725244522, + -0.00588453933596611, + -0.010767788626253605 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 42, + "mean_gamma": 0.846664547920227, + "mean_rho": 0.9511756896972656, + "mean_nudge": -0.025688248220831156, + "per_layer_gamma": [ + 0.743350088596344, + 0.8330336809158325, + 0.8981793522834778, + 0.9120950698852539 + ], + "per_layer_rho": [ + 0.8806748390197754, + 0.9658336639404297, + 0.9759747982025146, + 0.9822194576263428 + ], + "per_layer_nudge": [ + -0.0588495098054409, + -0.01651737093925476, + -0.013681922107934952, + -0.013704190030694008 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 42, + "mean_gamma": 0.8704017400741577, + "mean_rho": 0.9432401657104492, + "mean_nudge": -0.028888660948723555, + "per_layer_gamma": [ + 0.7826259136199951, + 0.877338171005249, + 0.9058365821838379, + 0.9158062934875488 + ], + "per_layer_rho": [ + 0.8731295466423035, + 0.9544992446899414, + 0.9707695245742798, + 0.9745623469352722 + ], + "per_layer_nudge": [ + -0.059486024081707, + -0.01946994476020336, + -0.018279198557138443, + -0.018319476395845413 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 42, + "mean_gamma": 0.0513513587648049, + "mean_rho": 0.0681416861480102, + "mean_nudge": -0.0007606418039358687, + "per_layer_gamma": [ + -0.09132926911115646, + -0.013022630475461483, + 0.0033656186424195766, + 0.30639171600341797 + ], + "per_layer_rho": [ + -0.047784049063920975, + -0.0063863289542496204, + 0.01414431817829609, + 0.3125928044319153 + ], + "per_layer_nudge": [ + 0.006318309810012579, + 0.0002974363451357931, + -0.00020490401948336512, + -0.009453409351408482 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 42, + "mean_gamma": 0.954873263835907, + "mean_rho": 0.9708771407604218, + "mean_nudge": -0.027431895025074482, + "per_layer_gamma": [ + 0.9027864336967468, + 0.9722906351089478, + 0.9725323915481567, + 0.9718835949897766 + ], + "per_layer_rho": [ + 0.9104452133178711, + 0.9908294677734375, + 0.991165280342102, + 0.9910686016082764 + ], + "per_layer_nudge": [ + -0.04417877644300461, + -0.022297389805316925, + -0.021837987005710602, + -0.021413426846265793 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 42, + "mean_gamma": 0.8315763473510742, + "mean_rho": 0.9426839649677277, + "mean_nudge": -0.02414578991010785, + "per_layer_gamma": [ + 0.7389893531799316, + 0.8383945226669312, + 0.8796361684799194, + 0.8692853450775146 + ], + "per_layer_rho": [ + 0.8755806684494019, + 0.9449398517608643, + 0.9726759195327759, + 0.9775394201278687 + ], + "per_layer_nudge": [ + -0.055945657193660736, + -0.01551580149680376, + -0.012561880983412266, + -0.012559819966554642 + ] + } +] \ No newline at end of file diff --git a/results/vector_audit_full/audit_results.json b/results/vector_audit_full/audit_results.json new file mode 100644 index 0000000..06a244b --- /dev/null +++ b/results/vector_audit_full/audit_results.json @@ -0,0 +1,1346 @@ +[ + { + "method": "dfa", + "L": 4, + "seed": 42, + "mean_gamma": 0.012759206583723426, + "mean_rho": 0.010203135898336768, + "mean_nudge": -0.00013293450319906697, + "per_layer_gamma": [ + -0.005139289423823357, + 0.008053570054471493, + 0.024840975180268288, + 0.02328157052397728 + ], + "per_layer_rho": [ + -0.004372224677354097, + 0.0029046176932752132, + 0.0310027077794075, + 0.011277442798018456 + ], + "per_layer_nudge": [ + 0.0003250446170568466, + -0.0001853172725532204, + -0.00036372727481648326, + -0.00030773808248341084 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 42, + "mean_gamma": 0.2243543565273285, + "mean_rho": 0.20948006212711334, + "mean_nudge": -0.007398057030513883, + "per_layer_gamma": [ + 0.23697319626808167, + 0.13470041751861572, + 0.186288982629776, + 0.3394548296928406 + ], + "per_layer_rho": [ + 0.2484399378299713, + 0.1292348951101303, + 0.18184946477413177, + 0.27839595079421997 + ], + "per_layer_nudge": [ + -0.008707698434591293, + -0.004232201725244522, + -0.00588453933596611, + -0.010767788626253605 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 42, + "mean_gamma": 0.846664547920227, + "mean_rho": 0.9511756896972656, + "mean_nudge": -0.025688248220831156, + "per_layer_gamma": [ + 0.743350088596344, + 0.8330336809158325, + 0.8981793522834778, + 0.9120950698852539 + ], + "per_layer_rho": [ + 0.8806748390197754, + 0.9658336639404297, + 0.9759747982025146, + 0.9822194576263428 + ], + "per_layer_nudge": [ + -0.0588495098054409, + -0.01651737093925476, + -0.013681922107934952, + -0.013704190030694008 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 42, + "mean_gamma": 0.8704017400741577, + "mean_rho": 0.9432401657104492, + "mean_nudge": -0.028888660948723555, + "per_layer_gamma": [ + 0.7826259136199951, + 0.877338171005249, + 0.9058365821838379, + 0.9158062934875488 + ], + "per_layer_rho": [ + 0.8731295466423035, + 0.9544992446899414, + 0.9707695245742798, + 0.9745623469352722 + ], + "per_layer_nudge": [ + -0.059486024081707, + -0.01946994476020336, + -0.018279198557138443, + -0.018319476395845413 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 42, + "mean_gamma": 0.0513513587648049, + "mean_rho": 0.0681416861480102, + "mean_nudge": -0.0007606418039358687, + "per_layer_gamma": [ + -0.09132926911115646, + -0.013022630475461483, + 0.0033656186424195766, + 0.30639171600341797 + ], + "per_layer_rho": [ + -0.047784049063920975, + -0.0063863289542496204, + 0.01414431817829609, + 0.3125928044319153 + ], + "per_layer_nudge": [ + 0.006318309810012579, + 0.0002974363451357931, + -0.00020490401948336512, + -0.009453409351408482 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 42, + "mean_gamma": 0.954873263835907, + "mean_rho": 0.9708771407604218, + "mean_nudge": -0.027431895025074482, + "per_layer_gamma": [ + 0.9027864336967468, + 0.9722906351089478, + 0.9725323915481567, + 0.9718835949897766 + ], + "per_layer_rho": [ + 0.9104452133178711, + 0.9908294677734375, + 0.991165280342102, + 0.9910686016082764 + ], + "per_layer_nudge": [ + -0.04417877644300461, + -0.022297389805316925, + -0.021837987005710602, + -0.021413426846265793 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 42, + "mean_gamma": 0.8315763473510742, + "mean_rho": 0.9426839649677277, + "mean_nudge": -0.02414578991010785, + "per_layer_gamma": [ + 0.7389893531799316, + 0.8383945226669312, + 0.8796361684799194, + 0.8692853450775146 + ], + "per_layer_rho": [ + 0.8755806684494019, + 0.9449398517608643, + 0.9726759195327759, + 0.9775394201278687 + ], + "per_layer_nudge": [ + -0.055945657193660736, + -0.01551580149680376, + -0.012561880983412266, + -0.012559819966554642 + ] + }, + { + "method": "dfa", + "L": 4, + "seed": 123, + "mean_gamma": 0.0021313047036528587, + "mean_rho": 0.00923872203566134, + "mean_nudge": 0.000226999055826127, + "per_layer_gamma": [ + -0.013840198516845703, + 0.020386721938848495, + -0.0008580549620091915, + 0.002836750354617834 + ], + "per_layer_rho": [ + -0.012609685771167278, + 0.019667847082018852, + -0.009115943685173988, + 0.03901267051696777 + ], + "per_layer_nudge": [ + 0.0012924917973577976, + -0.0003459132567513734, + 3.6447577258513775e-06, + -4.222707502776757e-05 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 123, + "mean_gamma": 0.4006684720516205, + "mean_rho": 0.3810938075184822, + "mean_nudge": -0.016430767253041267, + "per_layer_gamma": [ + 0.39850419759750366, + 0.4013897776603699, + 0.4055132269859314, + 0.397266685962677 + ], + "per_layer_rho": [ + 0.3824196457862854, + 0.4083380699157715, + 0.37734755873680115, + 0.3562699556350708 + ], + "per_layer_nudge": [ + -0.016568617895245552, + -0.016357120126485825, + -0.01656804233789444, + -0.016229288652539253 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 123, + "mean_gamma": 0.8960145115852356, + "mean_rho": 0.9537482112646103, + "mean_nudge": -0.02881092019379139, + "per_layer_gamma": [ + 0.8080605864524841, + 0.8870053887367249, + 0.9341694116592407, + 0.9548226594924927 + ], + "per_layer_rho": [ + 0.8955597877502441, + 0.9675844311714172, + 0.9722031354904175, + 0.9796454906463623 + ], + "per_layer_nudge": [ + -0.0648956224322319, + -0.01859605871140957, + -0.01589030772447586, + -0.015861691907048225 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 123, + "mean_gamma": 0.9169906079769135, + "mean_rho": 0.9518635720014572, + "mean_nudge": -0.030037105083465576, + "per_layer_gamma": [ + 0.813483715057373, + 0.9396308064460754, + 0.9553613662719727, + 0.9594865441322327 + ], + "per_layer_rho": [ + 0.8809271454811096, + 0.9691250324249268, + 0.9771296977996826, + 0.9802724123001099 + ], + "per_layer_nudge": [ + -0.06450991332530975, + -0.018834944814443588, + -0.018407035619020462, + -0.0183965265750885 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 123, + "mean_gamma": -0.03672784520313144, + "mean_rho": -0.000436956062912941, + "mean_nudge": 0.0007004090439295396, + "per_layer_gamma": [ + -0.012967733666300774, + -0.18309307098388672, + -0.33163735270500183, + 0.3807867765426636 + ], + "per_layer_rho": [ + 0.05609207600355148, + -0.16973736882209778, + -0.34432661533355713, + 0.45622408390045166 + ], + "per_layer_nudge": [ + 0.0007166759460233152, + 0.004922591149806976, + 0.009576696902513504, + -0.012414327822625637 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 123, + "mean_gamma": 0.9524389505386353, + "mean_rho": 0.9689934253692627, + "mean_nudge": -0.02997258398681879, + "per_layer_gamma": [ + 0.8996936082839966, + 0.9695490598678589, + 0.9714151620864868, + 0.9690979719161987 + ], + "per_layer_rho": [ + 0.9063906073570251, + 0.9897294640541077, + 0.9902646541595459, + 0.9895889759063721 + ], + "per_layer_nudge": [ + -0.048146918416023254, + -0.024354536086320877, + -0.023889556527137756, + -0.023499324917793274 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 123, + "mean_gamma": 0.8988931030035019, + "mean_rho": 0.9505570530891418, + "mean_nudge": -0.02708751056343317, + "per_layer_gamma": [ + 0.8175626397132874, + 0.9190162420272827, + 0.9264382719993591, + 0.9325552582740784 + ], + "per_layer_rho": [ + 0.8918192386627197, + 0.9622496366500854, + 0.9709856510162354, + 0.9771736860275269 + ], + "per_layer_nudge": [ + -0.05964129418134689, + -0.017833322286605835, + -0.015457207337021828, + -0.015418218448758125 + ] + }, + { + "method": "dfa", + "L": 4, + "seed": 456, + "mean_gamma": 0.016278030583634973, + "mean_rho": 0.019018374383449554, + "mean_nudge": -0.001155311170805362, + "per_layer_gamma": [ + 0.034280914813280106, + 0.018388552591204643, + 0.004948894493281841, + 0.0074937604367733 + ], + "per_layer_rho": [ + 0.026491232216358185, + 0.0305374376475811, + -0.001606430858373642, + 0.020651258528232574 + ], + "per_layer_nudge": [ + -0.004200353287160397, + -0.0002525914169382304, + -7.005853694863617e-05, + -9.824144217418507e-05 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 456, + "mean_gamma": 0.40844712406396866, + "mean_rho": 0.4075355716049671, + "mean_nudge": -0.011171038961037993, + "per_layer_gamma": [ + 0.261852890253067, + 0.41412365436553955, + 0.4508002996444702, + 0.5070116519927979 + ], + "per_layer_rho": [ + 0.2299479991197586, + 0.4202876687049866, + 0.4645801782608032, + 0.5153264403343201 + ], + "per_layer_nudge": [ + -0.009456473402678967, + -0.01063506305217743, + -0.011527800001204014, + -0.013064819388091564 + ] + }, + { + "method": "vec_eT_M4", + "L": 4, + "seed": 456, + "mean_gamma": 0.9677009582519531, + "mean_rho": 0.9615653902292252, + "mean_nudge": -0.02802830934524536, + "per_layer_gamma": [ + 0.90372633934021, + 0.9808875918388367, + 0.9896383285522461, + 0.9965515732765198 + ], + "per_layer_rho": [ + 0.9064497947692871, + 0.9720321297645569, + 0.980293869972229, + 0.9874857664108276 + ], + "per_layer_nudge": [ + -0.04350632429122925, + -0.0233478881418705, + -0.02268034964799881, + -0.02257867529988289 + ] + }, + { + "method": "vec_eT_M8", + "L": 4, + "seed": 456, + "mean_gamma": 0.7236898243427277, + "mean_rho": 0.8553760200738907, + "mean_nudge": -0.02606209833174944, + "per_layer_gamma": [ + 0.6436039209365845, + 0.6319636106491089, + 0.7965036630630493, + 0.822688102722168 + ], + "per_layer_rho": [ + 0.7970162630081177, + 0.7741899490356445, + 0.916257917881012, + 0.9340399503707886 + ], + "per_layer_nudge": [ + -0.05365825071930885, + -0.015726309269666672, + -0.017313942313194275, + -0.017549891024827957 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 4, + "seed": 456, + "mean_gamma": -0.12004246190190315, + "mean_rho": -0.09116240590810776, + "mean_nudge": 0.003779993741773069, + "per_layer_gamma": [ + -0.18761609494686127, + -0.4131208062171936, + -0.33985134959220886, + 0.4604184031486511 + ], + "per_layer_rho": [ + -0.08593425154685974, + -0.4190409183502197, + -0.3457789421081543, + 0.48610448837280273 + ], + "per_layer_nudge": [ + 0.007614006754010916, + 0.010954373516142368, + 0.009015142917633057, + -0.012463548220694065 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 4, + "seed": 456, + "mean_gamma": 0.9375280737876892, + "mean_rho": 0.9757244437932968, + "mean_nudge": -0.02518668444827199, + "per_layer_gamma": [ + 0.9148672819137573, + 0.9444636106491089, + 0.946875810623169, + 0.9439055919647217 + ], + "per_layer_rho": [ + 0.9372595548629761, + 0.9872512817382812, + 0.9900106191635132, + 0.9883763194084167 + ], + "per_layer_nudge": [ + -0.04899398609995842, + -0.018192578107118607, + -0.017080236226320267, + -0.016479937359690666 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 4, + "seed": 456, + "mean_gamma": 0.9691873788833618, + "mean_rho": 0.9595922082662582, + "mean_nudge": -0.026451716665178537, + "per_layer_gamma": [ + 0.906065821647644, + 0.9809720516204834, + 0.992091178894043, + 0.9976204633712769 + ], + "per_layer_rho": [ + 0.9050431251525879, + 0.9693447351455688, + 0.9793726205825806, + 0.9846083521842957 + ], + "per_layer_nudge": [ + -0.04136938229203224, + -0.02186034619808197, + -0.021370645612478256, + -0.02120649255812168 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 42, + "mean_gamma": 0.09906564746052027, + "mean_rho": 0.09740300523117185, + "mean_nudge": -0.002161820186302066, + "per_layer_gamma": [ + 0.01413647085428238, + 0.28074702620506287, + 0.11767441779375076, + 0.054444827139377594, + 0.14474442601203918, + 0.06295441836118698, + 0.07057145237922668, + 0.04725214093923569 + ], + "per_layer_rho": [ + 0.02532106265425682, + 0.23610877990722656, + 0.12464869767427444, + 0.07118558138608932, + 0.1357075721025467, + 0.06361411511898041, + 0.08849744498729706, + 0.03414078801870346 + ], + "per_layer_nudge": [ + -0.0018329978920519352, + -0.0055640568025410175, + -0.002374582923948765, + -0.0012062718160450459, + -0.00274146581068635, + -0.0013790605589747429, + -0.0014756014570593834, + -0.0007205242291092873 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 42, + "mean_gamma": 0.30624711513519287, + "mean_rho": 0.3206122815608978, + "mean_nudge": -0.009207659168168902, + "per_layer_gamma": [ + 0.16885146498680115, + 0.3251064419746399, + 0.292763888835907, + 0.3125339150428772, + 0.3227536380290985, + 0.33606037497520447, + 0.3436194658279419, + 0.3482877314090729 + ], + "per_layer_rho": [ + 0.15158507227897644, + 0.2908586263656616, + 0.29920056462287903, + 0.34763777256011963, + 0.3629569113254547, + 0.35797882080078125, + 0.38447317481040955, + 0.3702073097229004 + ], + "per_layer_nudge": [ + -0.005164027214050293, + -0.00964929535984993, + -0.00890397373586893, + -0.009508647955954075, + -0.009753547608852386, + -0.010073650628328323, + -0.010293008759617805, + -0.010315122082829475 + ] + }, + { + "method": "vec_eT_M4", + "L": 8, + "seed": 42, + "mean_gamma": 0.9610838517546654, + "mean_rho": 0.9551834538578987, + "mean_nudge": -0.02005277667194605, + "per_layer_gamma": [ + 0.8267648220062256, + 0.9711159467697144, + 0.9782320261001587, + 0.9792516827583313, + 0.9823880195617676, + 0.9807887077331543, + 0.9809024333953857, + 0.9892271757125854 + ], + "per_layer_rho": [ + 0.8289316892623901, + 0.9607423543930054, + 0.9680945873260498, + 0.970350980758667, + 0.9744545221328735, + 0.9756993055343628, + 0.9772317409515381, + 0.985962450504303 + ], + "per_layer_nudge": [ + -0.03688318282365799, + -0.017963383346796036, + -0.017710430547595024, + -0.017620962113142014, + -0.017566435039043427, + -0.017552118748426437, + -0.017480310052633286, + -0.017645390704274178 + ] + }, + { + "method": "vec_eT_M8", + "L": 8, + "seed": 42, + "mean_gamma": 0.9476289451122284, + "mean_rho": 0.952806644141674, + "mean_nudge": -0.021474516252055764, + "per_layer_gamma": [ + 0.7826216220855713, + 0.9704389572143555, + 0.9734323024749756, + 0.9753161072731018, + 0.9732745885848999, + 0.9694249033927917, + 0.9685238599777222, + 0.9679992198944092 + ], + "per_layer_rho": [ + 0.8156931400299072, + 0.965274453163147, + 0.9699603319168091, + 0.970566987991333, + 0.9739295244216919, + 0.9735742211341858, + 0.9758409261703491, + 0.9776135683059692 + ], + "per_layer_nudge": [ + -0.042923636734485626, + -0.018625982105731964, + -0.01854044198989868, + -0.018480297178030014, + -0.01844090223312378, + -0.018325258046388626, + -0.018257396295666695, + -0.018202215433120728 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 8, + "seed": 42, + "mean_gamma": -0.019792123697698116, + "mean_rho": 0.01533439988270402, + "mean_nudge": 0.0001886758691398427, + "per_layer_gamma": [ + 0.2983958125114441, + 0.2871808111667633, + -0.6762481927871704, + -0.09076518565416336, + -0.4631124436855316, + -0.5284497141838074, + 0.10263068974018097, + 0.9120312333106995 + ], + "per_layer_rho": [ + 0.436443030834198, + 0.31577497720718384, + -0.6712953448295593, + -0.038358043879270554, + -0.4568558931350708, + -0.533319890499115, + 0.1618560254573822, + 0.9084303379058838 + ], + "per_layer_nudge": [ + -0.00789229478687048, + -0.007670246995985508, + 0.016546625643968582, + 0.0017870900919660926, + 0.010900387540459633, + 0.012512469664216042, + -0.0028577707707881927, + -0.021816853433847427 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 8, + "seed": 42, + "mean_gamma": 0.9694314822554588, + "mean_rho": 0.9782926589250565, + "mean_nudge": -0.020679548615589738, + "per_layer_gamma": [ + 0.9044460654258728, + 0.9779231548309326, + 0.9797878861427307, + 0.9809790849685669, + 0.9813997149467468, + 0.9814468622207642, + 0.979229211807251, + 0.9702398777008057 + ], + "per_layer_rho": [ + 0.9102598428726196, + 0.9878777265548706, + 0.9896679520606995, + 0.9906449317932129, + 0.9906293153762817, + 0.9896650314331055, + 0.98812335729599, + 0.9794731140136719 + ], + "per_layer_nudge": [ + -0.04101525992155075, + -0.019054662436246872, + -0.018692705780267715, + -0.018473587930202484, + -0.01803751476109028, + -0.01748315989971161, + -0.016935309395194054, + -0.01574418880045414 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 8, + "seed": 42, + "mean_gamma": 0.961296834051609, + "mean_rho": 0.9601987227797508, + "mean_nudge": -0.020286154001951218, + "per_layer_gamma": [ + 0.8300719857215881, + 0.975559413433075, + 0.9798641204833984, + 0.9784993529319763, + 0.9792141318321228, + 0.9826849102973938, + 0.9828553199768066, + 0.9816254377365112 + ], + "per_layer_rho": [ + 0.8414288759231567, + 0.9681671261787415, + 0.9723494052886963, + 0.9737668037414551, + 0.9768325686454773, + 0.9811946749687195, + 0.9829471111297607, + 0.9849032163619995 + ], + "per_layer_nudge": [ + -0.03684248775243759, + -0.01817578822374344, + -0.018080510199069977, + -0.017905343323946, + -0.017797425389289856, + -0.017846036702394485, + -0.017828192561864853, + -0.01781344786286354 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 123, + "mean_gamma": 0.0418074403423816, + "mean_rho": 0.043065165635198355, + "mean_nudge": -0.000943926574109355, + "per_layer_gamma": [ + 0.008853738196194172, + 0.060307569801807404, + 0.04014270007610321, + 0.046701639890670776, + 0.04881899803876877, + 0.07526923716068268, + 0.012093071825802326, + 0.04227256774902344 + ], + "per_layer_rho": [ + -0.00892745889723301, + 0.05283857136964798, + 0.04637228325009346, + 0.05245576798915863, + 0.05450460687279701, + 0.07646007835865021, + 0.02843533270061016, + 0.042382143437862396 + ], + "per_layer_nudge": [ + -0.0022439619060605764, + -0.0013329577632248402, + -0.0005934120854362845, + -0.0006395552773028612, + -0.0007643825374543667, + -0.001089449506253004, + -0.00021647402900271118, + -0.0006712194881401956 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 123, + "mean_gamma": 0.2247180617414415, + "mean_rho": 0.26628467813134193, + "mean_nudge": -0.007505320216296241, + "per_layer_gamma": [ + 0.04518688842654228, + 0.17972084879875183, + 0.21200382709503174, + 0.24014034867286682, + 0.276295006275177, + 0.28583356738090515, + 0.2899315357208252, + 0.2686324715614319 + ], + "per_layer_rho": [ + 0.14380130171775818, + 0.22897371649742126, + 0.23557049036026, + 0.26198533177375793, + 0.3003377914428711, + 0.32919156551361084, + 0.3204420208930969, + 0.30997520685195923 + ], + "per_layer_nudge": [ + -0.0017040509264916182, + -0.006164136342704296, + -0.006984173320233822, + -0.008167261257767677, + -0.00930502824485302, + -0.009475477039813995, + -0.009366653859615326, + -0.008875780738890171 + ] + }, + { + "method": "vec_eT_M4", + "L": 8, + "seed": 123, + "mean_gamma": 0.9508489817380905, + "mean_rho": 0.9518037140369415, + "mean_nudge": -0.02076399209909141, + "per_layer_gamma": [ + 0.8060562014579773, + 0.9650354385375977, + 0.9726169109344482, + 0.973420262336731, + 0.9732815027236938, + 0.9745521545410156, + 0.9734596610069275, + 0.968369722366333 + ], + "per_layer_rho": [ + 0.8418968915939331, + 0.9559968113899231, + 0.962238073348999, + 0.9662503600120544, + 0.9685378670692444, + 0.9712143540382385, + 0.9724422097206116, + 0.9758531451225281 + ], + "per_layer_nudge": [ + -0.0521555095911026, + -0.016341347247362137, + -0.01634775847196579, + -0.01629696600139141, + -0.016271617263555527, + -0.016253814101219177, + -0.01619817316532135, + -0.016246750950813293 + ] + }, + { + "method": "vec_eT_M8", + "L": 8, + "seed": 123, + "mean_gamma": 0.9676685556769371, + "mean_rho": 0.9591586142778397, + "mean_nudge": -0.019975336268544197, + "per_layer_gamma": [ + 0.8518213033676147, + 0.9811072945594788, + 0.9843889474868774, + 0.983165442943573, + 0.9847903251647949, + 0.9829460382461548, + 0.9856388568878174, + 0.9874902367591858 + ], + "per_layer_rho": [ + 0.8631762266159058, + 0.9645696878433228, + 0.9685958027839661, + 0.9701895713806152, + 0.9725322127342224, + 0.9733850955963135, + 0.9789502024650574, + 0.9818701148033142 + ], + "per_layer_nudge": [ + -0.04242108017206192, + -0.017025835812091827, + -0.016797807067632675, + -0.016749639064073563, + -0.016767453402280807, + -0.01670318841934204, + -0.016672292724251747, + -0.016665393486618996 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 8, + "seed": 123, + "mean_gamma": -0.11373000172898173, + "mean_rho": -0.1359611451625824, + "mean_nudge": 0.004932066862238571, + "per_layer_gamma": [ + -0.056351568549871445, + -0.44720304012298584, + -0.6338962316513062, + -0.408905029296875, + -0.37608587741851807, + -0.18018096685409546, + 0.33276063203811646, + 0.8600220680236816 + ], + "per_layer_rho": [ + 0.044625282287597656, + -0.4992668628692627, + -0.6965052485466003, + -0.46216896176338196, + -0.42366287112236023, + -0.23159649968147278, + 0.2991888225078583, + 0.8816971778869629 + ], + "per_layer_nudge": [ + 0.003119478700682521, + 0.016028771176934242, + 0.022319095209240913, + 0.01471712812781334, + 0.013586362823843956, + 0.007011811248958111, + -0.010123632848262787, + -0.027202479541301727 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 8, + "seed": 123, + "mean_gamma": 0.8755882158875465, + "mean_rho": 0.9470387101173401, + "mean_nudge": -0.01607380306813866, + "per_layer_gamma": [ + 0.8875797986984253, + 0.9009760618209839, + 0.8808510899543762, + 0.8799238204956055, + 0.8797831535339355, + 0.8745893239974976, + 0.861487865447998, + 0.8395146131515503 + ], + "per_layer_rho": [ + 0.9190670847892761, + 0.9546182751655579, + 0.9534507393836975, + 0.9524415731430054, + 0.9578260183334351, + 0.9576990008354187, + 0.9501173496246338, + 0.9310896396636963 + ], + "per_layer_nudge": [ + -0.051533639430999756, + -0.015572542324662209, + -0.012057723477482796, + -0.011056014336645603, + -0.010354170575737953, + -0.009953269734978676, + -0.009345149621367455, + -0.008717915043234825 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 8, + "seed": 123, + "mean_gamma": 0.9602480605244637, + "mean_rho": 0.9577522128820419, + "mean_nudge": -0.020163135835900903, + "per_layer_gamma": [ + 0.8212144374847412, + 0.9718189239501953, + 0.9794400930404663, + 0.9788751602172852, + 0.9804568886756897, + 0.9820123910903931, + 0.9819177389144897, + 0.9862488508224487 + ], + "per_layer_rho": [ + 0.8539210557937622, + 0.9595734477043152, + 0.968142032623291, + 0.9713950753211975, + 0.9739673137664795, + 0.9758511781692505, + 0.9757622480392456, + 0.983405351638794 + ], + "per_layer_nudge": [ + -0.048084814101457596, + -0.016458425670862198, + -0.01623723655939102, + -0.016196511685848236, + -0.016157593578100204, + -0.016071485355496407, + -0.015993185341358185, + -0.016105834394693375 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 456, + "mean_gamma": 0.11447641160339117, + "mean_rho": 0.11044186353683472, + "mean_nudge": -0.0029411360155791044, + "per_layer_gamma": [ + 0.051631297916173935, + 0.2667747735977173, + 0.1608148217201233, + 0.05039509758353233, + 0.09734607487916946, + 0.1104668602347374, + 0.10407236963510513, + 0.07430999726057053 + ], + "per_layer_rho": [ + 0.0571255087852478, + 0.24121275544166565, + 0.1396293193101883, + 0.03282786160707474, + 0.0832589864730835, + 0.12599189579486847, + 0.10961247235536575, + 0.09387610852718353 + ], + "per_layer_nudge": [ + -0.004148983396589756, + -0.006073276046663523, + -0.0035690395161509514, + -0.0011961309937760234, + -0.0020613158121705055, + -0.002379970159381628, + -0.00227751350030303, + -0.0018228586995974183 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 456, + "mean_gamma": 0.2596400445327163, + "mean_rho": 0.29122191295027733, + "mean_nudge": -0.009376821690239012, + "per_layer_gamma": [ + 0.09049498289823532, + 0.2076151967048645, + 0.28473690152168274, + 0.29515770077705383, + 0.31399405002593994, + 0.29933249950408936, + 0.2904508113861084, + 0.2953382134437561 + ], + "per_layer_rho": [ + 0.10262437164783478, + 0.23574362695217133, + 0.32356733083724976, + 0.3371298313140869, + 0.3557179868221283, + 0.34890225529670715, + 0.31407758593559265, + 0.31201231479644775 + ], + "per_layer_nudge": [ + -0.003384523093700409, + -0.007686353288590908, + -0.010352302342653275, + -0.010613547638058662, + -0.011347497813403606, + -0.010740532539784908, + -0.010370716452598572, + -0.010519100353121758 + ] + }, + { + "method": "vec_eT_M4", + "L": 8, + "seed": 456, + "mean_gamma": 0.9574749916791916, + "mean_rho": 0.9430182427167892, + "mean_nudge": -0.025299219880253077, + "per_layer_gamma": [ + 0.8182810544967651, + 0.9655625820159912, + 0.9788223505020142, + 0.9715414047241211, + 0.9763141870498657, + 0.9819262623786926, + 0.9831951260566711, + 0.9841569662094116 + ], + "per_layer_rho": [ + 0.8498371243476868, + 0.9464435577392578, + 0.9519747495651245, + 0.9531487822532654, + 0.9558645486831665, + 0.9587409496307373, + 0.9619686007499695, + 0.9661676287651062 + ], + "per_layer_nudge": [ + -0.04676084965467453, + -0.022278331220149994, + -0.022243071347475052, + -0.022241756319999695, + -0.022209325805306435, + -0.022194838151335716, + -0.02222602069377899, + -0.0222395658493042 + ] + }, + { + "method": "vec_eT_M8", + "L": 8, + "seed": 456, + "mean_gamma": 0.8017567023634911, + "mean_rho": 0.8739266619086266, + "mean_nudge": -0.0273550299461931, + "per_layer_gamma": [ + 0.5685268640518188, + 0.8541168570518494, + 0.8301878571510315, + 0.8351892232894897, + 0.8266328573226929, + 0.8315808773040771, + 0.8355091214179993, + 0.8323099613189697 + ], + "per_layer_rho": [ + 0.6454399824142456, + 0.8863531947135925, + 0.893866240978241, + 0.90782630443573, + 0.9073142409324646, + 0.9110382795333862, + 0.9168291091918945, + 0.922745943069458 + ], + "per_layer_nudge": [ + -0.059318192303180695, + -0.022695917636156082, + -0.022645555436611176, + -0.022771799936890602, + -0.02274298295378685, + -0.022797273471951485, + -0.022850075736641884, + -0.02301844209432602 + ] + }, + { + "method": "vec_eT_M4_shuffleCtrl", + "L": 8, + "seed": 456, + "mean_gamma": 0.5487924553453922, + "mean_rho": 0.5787655711174011, + "mean_nudge": -0.01472583191934973, + "per_layer_gamma": [ + 0.4987947940826416, + 0.6894677877426147, + 0.5756305456161499, + 0.5317898392677307, + 0.4938901960849762, + 0.48660987615585327, + 0.4679740071296692, + 0.6461825966835022 + ], + "per_layer_rho": [ + 0.5681551694869995, + 0.6849030256271362, + 0.5905652046203613, + 0.5603526830673218, + 0.529013991355896, + 0.5252480506896973, + 0.505163311958313, + 0.6667231321334839 + ], + "per_layer_nudge": [ + -0.013360938057303429, + -0.018475033342838287, + -0.015427734702825546, + -0.0143125606700778, + -0.013382941484451294, + -0.013140549883246422, + -0.012608321383595467, + -0.017098575830459595 + ] + }, + { + "method": "vec_eT_M4_noTerm", + "L": 8, + "seed": 456, + "mean_gamma": 0.9719733148813248, + "mean_rho": 0.9774252474308014, + "mean_nudge": -0.021229598904028535, + "per_layer_gamma": [ + 0.8793158531188965, + 0.9842267632484436, + 0.9851877689361572, + 0.9860390424728394, + 0.9860944747924805, + 0.9856378436088562, + 0.9863163232803345, + 0.9829684495925903 + ], + "per_layer_rho": [ + 0.8756503462791443, + 0.9914530515670776, + 0.9921013712882996, + 0.9924013614654541, + 0.9925580024719238, + 0.992135763168335, + 0.9925041198730469, + 0.9905979633331299 + ], + "per_layer_nudge": [ + -0.039753369987010956, + -0.019631527364253998, + -0.019158396869897842, + -0.01886080764234066, + -0.018597319722175598, + -0.01827744022011757, + -0.017960023134946823, + -0.017597906291484833 + ] + }, + { + "method": "vec_eT_M4_onesided", + "L": 8, + "seed": 456, + "mean_gamma": 0.968105711042881, + "mean_rho": 0.9448694735765457, + "mean_nudge": -0.02237516944296658, + "per_layer_gamma": [ + 0.8237834572792053, + 0.981438159942627, + 0.984513521194458, + 0.9858155846595764, + 0.9882583618164062, + 0.9903416633605957, + 0.9931073784828186, + 0.9975875616073608 + ], + "per_layer_rho": [ + 0.8182570934295654, + 0.9534345269203186, + 0.956415593624115, + 0.9588236808776855, + 0.9621551036834717, + 0.9646933674812317, + 0.9697130918502808, + 0.975463330745697 + ], + "per_layer_nudge": [ + -0.040218278765678406, + -0.01982394978404045, + -0.019831635057926178, + -0.019780701026320457, + -0.01978381723165512, + -0.019830182194709778, + -0.019829627126455307, + -0.019903164356946945 + ] + } +] \ No newline at end of file diff --git a/results/vector_credit_pilot/results.json b/results/vector_credit_pilot/results.json new file mode 100644 index 0000000..0d5a95b --- /dev/null +++ b/results/vector_credit_pilot/results.json @@ -0,0 +1,590 @@ +[ + { + "method": "dfa", + "L": 4, + "seed": 42, + "mean_gamma": 0.012147892965003848, + "mean_rho": 0.01192134665325284, + "mean_nudge": 0.0003465710469754413, + "per_layer_gamma": [ + -0.008250176906585693, + 0.009299487806856632, + 0.025026513263583183, + 0.02251574769616127 + ], + "per_layer_rho": [ + -0.023004790768027306, + -0.001884380355477333, + 0.02913304604589939, + 0.04344151169061661 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 42, + "mean_gamma": 0.21985775604844093, + "mean_rho": 0.1995779424905777, + "mean_nudge": -0.00718017655890435, + "per_layer_gamma": [ + 0.23413987457752228, + 0.13205617666244507, + 0.17927157878875732, + 0.33396339416503906 + ], + "per_layer_rho": [ + 0.23052650690078735, + 0.12983247637748718, + 0.16552400588989258, + 0.2724287807941437 + ] + }, + { + "method": "vector_M4", + "L": 4, + "seed": 42, + "M": 4, + "mean_gamma": 0.8662685304880142, + "mean_rho": 0.9519537538290024, + "mean_nudge": -0.02709634741768241, + "per_layer_gamma": [ + 0.7652574181556702, + 0.8526232838630676, + 0.9186504483222961, + 0.928542971611023 + ], + "per_layer_rho": [ + 0.8851539492607117, + 0.9653596878051758, + 0.9761222004890442, + 0.9811791777610779 + ] + }, + { + "method": "vector_M8", + "L": 4, + "seed": 42, + "M": 8, + "mean_gamma": 0.8658886104822159, + "mean_rho": 0.9449075609445572, + "mean_nudge": -0.029197553172707558, + "per_layer_gamma": [ + 0.7732181549072266, + 0.8716340065002441, + 0.9039424061775208, + 0.9147598743438721 + ], + "per_layer_rho": [ + 0.8748108148574829, + 0.9573958516120911, + 0.9716492891311646, + 0.9757742881774902 + ] + }, + { + "method": "dfa", + "L": 4, + "seed": 123, + "mean_gamma": 0.003229829511838034, + "mean_rho": 0.00163999292999506, + "mean_nudge": 0.00024945657537500665, + "per_layer_gamma": [ + -0.014626468531787395, + 0.025253605097532272, + 0.0005082360003143549, + 0.0017839454812929034 + ], + "per_layer_rho": [ + -0.013803189620375633, + 0.036788348108530045, + -0.001500369980931282, + -0.01492481678724289 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 123, + "mean_gamma": 0.39710141718387604, + "mean_rho": 0.379002220928669, + "mean_nudge": -0.016321706119924784, + "per_layer_gamma": [ + 0.39424756169319153, + 0.4008973240852356, + 0.40283483266830444, + 0.3904259502887726 + ], + "per_layer_rho": [ + 0.37951934337615967, + 0.4084340035915375, + 0.38294172286987305, + 0.3451138138771057 + ] + }, + { + "method": "vector_M4", + "L": 4, + "seed": 123, + "M": 4, + "mean_gamma": 0.8867881596088409, + "mean_rho": 0.9528021663427353, + "mean_nudge": -0.026435222942382097, + "per_layer_gamma": [ + 0.7937425374984741, + 0.875928521156311, + 0.927625298500061, + 0.9498562812805176 + ], + "per_layer_rho": [ + 0.8932725191116333, + 0.9669736623764038, + 0.9716669321060181, + 0.979295551776886 + ] + }, + { + "method": "vector_M8", + "L": 4, + "seed": 123, + "M": 8, + "mean_gamma": 0.9158899784088135, + "mean_rho": 0.9517841935157776, + "mean_nudge": -0.02811066061258316, + "per_layer_gamma": [ + 0.8141916990280151, + 0.9413568377494812, + 0.9519738554954529, + 0.9560375213623047 + ], + "per_layer_rho": [ + 0.8822289705276489, + 0.9683880805969238, + 0.9763948917388916, + 0.980124831199646 + ] + }, + { + "method": "dfa", + "L": 4, + "seed": 456, + "mean_gamma": 0.0145260663703084, + "mean_rho": 0.022942777490243316, + "mean_nudge": -0.0009695220105641056, + "per_layer_gamma": [ + 0.02722274139523506, + 0.01860036328434944, + 0.004503400065004826, + 0.007777760736644268 + ], + "per_layer_rho": [ + 0.05302194505929947, + 0.0076346490532159805, + 0.025450842455029488, + 0.005663673393428326 + ] + }, + { + "method": "scalar_cb", + "L": 4, + "seed": 456, + "mean_gamma": 0.4040673300623894, + "mean_rho": 0.40459180623292923, + "mean_nudge": -0.011024328647181392, + "per_layer_gamma": [ + 0.27310311794281006, + 0.40135008096694946, + 0.438569575548172, + 0.503246545791626 + ], + "per_layer_rho": [ + 0.2368279993534088, + 0.40752148628234863, + 0.45139557123184204, + 0.5226221680641174 + ] + }, + { + "method": "vector_M4", + "L": 4, + "seed": 456, + "M": 4, + "mean_gamma": 0.9666130393743515, + "mean_rho": 0.9611468017101288, + "mean_nudge": -0.027259222231805325, + "per_layer_gamma": [ + 0.9003310203552246, + 0.9805972576141357, + 0.9892021417617798, + 0.9963217377662659 + ], + "per_layer_rho": [ + 0.9047541618347168, + 0.9721742868423462, + 0.9798319339752197, + 0.9878268241882324 + ] + }, + { + "method": "vector_M8", + "L": 4, + "seed": 456, + "M": 8, + "mean_gamma": 0.7273575365543365, + "mean_rho": 0.854712963104248, + "mean_nudge": -0.026176680345088243, + "per_layer_gamma": [ + 0.6557849049568176, + 0.6333819627761841, + 0.7958562970161438, + 0.8244069814682007 + ], + "per_layer_rho": [ + 0.7897602319717407, + 0.7803139686584473, + 0.9154964685440063, + 0.9332811832427979 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 42, + "mean_gamma": 0.09646139270626009, + "mean_rho": 0.10066868900321424, + "mean_nudge": -0.0021505439945030957, + "per_layer_gamma": [ + 0.020206334069371223, + 0.28005093336105347, + 0.10910443961620331, + 0.05392846465110779, + 0.13815951347351074, + 0.06548097729682922, + 0.06045090779662132, + 0.044309571385383606 + ], + "per_layer_rho": [ + 0.023506762459874153, + 0.2456609010696411, + 0.1322387009859085, + 0.08064419776201248, + 0.12704811990261078, + 0.09092238545417786, + 0.06660012900829315, + 0.03872831538319588 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 42, + "mean_gamma": 0.2887882422655821, + "mean_rho": 0.31615289114415646, + "mean_nudge": -0.008607904077507555, + "per_layer_gamma": [ + 0.1581556648015976, + 0.30974239110946655, + 0.2763316333293915, + 0.2932790219783783, + 0.30333060026168823, + 0.3180520534515381, + 0.3235378861427307, + 0.3278766870498657 + ], + "per_layer_rho": [ + 0.16209523379802704, + 0.270870566368103, + 0.3148571252822876, + 0.34910714626312256, + 0.35669511556625366, + 0.3541313409805298, + 0.35600799322128296, + 0.365458607673645 + ] + }, + { + "method": "vector_M4", + "L": 8, + "seed": 42, + "M": 4, + "mean_gamma": 0.961564302444458, + "mean_rho": 0.9551431238651276, + "mean_nudge": -0.019874528981745243, + "per_layer_gamma": [ + 0.8240220546722412, + 0.9724991321563721, + 0.9790397882461548, + 0.9801962375640869, + 0.9832960367202759, + 0.9817315340042114, + 0.9818849563598633, + 0.9898446798324585 + ], + "per_layer_rho": [ + 0.8262996673583984, + 0.9621720314025879, + 0.9684443473815918, + 0.9724023938179016, + 0.9747618436813354, + 0.9747101664543152, + 0.9763842821121216, + 0.9859702587127686 + ] + }, + { + "method": "vector_M8", + "L": 8, + "seed": 42, + "M": 8, + "mean_gamma": 0.953937828540802, + "mean_rho": 0.9505700841546059, + "mean_nudge": -0.02167696040123701, + "per_layer_gamma": [ + 0.7907432317733765, + 0.9761166572570801, + 0.9785570502281189, + 0.979189932346344, + 0.9788146018981934, + 0.9763517379760742, + 0.975960373878479, + 0.97576904296875 + ], + "per_layer_rho": [ + 0.8080886006355286, + 0.9629194736480713, + 0.96845942735672, + 0.969330906867981, + 0.9729516506195068, + 0.9717377424240112, + 0.9743517637252808, + 0.9767211079597473 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 123, + "mean_gamma": 0.03813134285155684, + "mean_rho": 0.03381418902426958, + "mean_nudge": -0.0009109743532462744, + "per_layer_gamma": [ + 0.013361184857785702, + 0.05827388912439346, + 0.0349937379360199, + 0.04099487513303757, + 0.04462064802646637, + 0.06228824704885483, + 0.012631343677639961, + 0.03788681700825691 + ], + "per_layer_rho": [ + 0.0002537630498409271, + 0.043776169419288635, + 0.05000852793455124, + 0.03221482038497925, + 0.04221296310424805, + 0.033549584448337555, + 0.028929945081472397, + 0.0395677387714386 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 123, + "mean_gamma": 0.23267090553417802, + "mean_rho": 0.2789924703538418, + "mean_nudge": -0.007711792801273987, + "per_layer_gamma": [ + 0.04650892689824104, + 0.1706242561340332, + 0.22027906775474548, + 0.2470434308052063, + 0.29134616255760193, + 0.30053815245628357, + 0.3030412197113037, + 0.2819860279560089 + ], + "per_layer_rho": [ + 0.1475682556629181, + 0.25340142846107483, + 0.25207415223121643, + 0.27266043424606323, + 0.31578385829925537, + 0.34466448426246643, + 0.3341771364212036, + 0.31161001324653625 + ] + }, + { + "method": "vector_M4", + "L": 8, + "seed": 123, + "M": 4, + "mean_gamma": 0.9465279653668404, + "mean_rho": 0.9515762850642204, + "mean_nudge": -0.020021548261865973, + "per_layer_gamma": [ + 0.8061791658401489, + 0.9617274403572083, + 0.9699997901916504, + 0.9668513536453247, + 0.9676209092140198, + 0.9689860939979553, + 0.9675877094268799, + 0.9632712602615356 + ], + "per_layer_rho": [ + 0.8417923450469971, + 0.9546955823898315, + 0.9617888927459717, + 0.9657822847366333, + 0.9680895209312439, + 0.9720520973205566, + 0.9722585678100586, + 0.9761509895324707 + ] + }, + { + "method": "vector_M8", + "L": 8, + "seed": 123, + "M": 8, + "mean_gamma": 0.9704969301819801, + "mean_rho": 0.9587301984429359, + "mean_nudge": -0.019836972700431943, + "per_layer_gamma": [ + 0.8533698320388794, + 0.9837186336517334, + 0.9865810871124268, + 0.986007571220398, + 0.9872775077819824, + 0.9863162040710449, + 0.9895119667053223, + 0.991192638874054 + ], + "per_layer_rho": [ + 0.8637727499008179, + 0.9640783071517944, + 0.9682940244674683, + 0.9682257771492004, + 0.9719105958938599, + 0.9726260900497437, + 0.9787560701370239, + 0.9821779727935791 + ] + }, + { + "method": "dfa", + "L": 8, + "seed": 456, + "mean_gamma": 0.11119568115100265, + "mean_rho": 0.10901899263262749, + "mean_nudge": -0.0028466961084632203, + "per_layer_gamma": [ + 0.05529828742146492, + 0.2547764182090759, + 0.1614864468574524, + 0.04146638512611389, + 0.08870386332273483, + 0.11080816388130188, + 0.10890999436378479, + 0.06811589002609253 + ], + "per_layer_rho": [ + 0.06376742571592331, + 0.2428635060787201, + 0.1625976264476776, + 0.044902823865413666, + 0.07067717611789703, + 0.10982732474803925, + 0.09756864607334137, + 0.07994741201400757 + ] + }, + { + "method": "scalar_cb", + "L": 8, + "seed": 456, + "mean_gamma": 0.25821398198604584, + "mean_rho": 0.2895875396206975, + "mean_nudge": -0.009281879727495834, + "per_layer_gamma": [ + 0.08930805325508118, + 0.2056446671485901, + 0.28487229347229004, + 0.2956193685531616, + 0.31186550855636597, + 0.2977675199508667, + 0.2889428436756134, + 0.2916916012763977 + ], + "per_layer_rho": [ + 0.08820285648107529, + 0.23076175153255463, + 0.3447152376174927, + 0.33077409863471985, + 0.36015045642852783, + 0.34089183807373047, + 0.32037046551704407, + 0.3008336126804352 + ] + }, + { + "method": "vector_M4", + "L": 8, + "seed": 456, + "M": 4, + "mean_gamma": 0.9567814320325851, + "mean_rho": 0.944110669195652, + "mean_nudge": -0.02485128422267735, + "per_layer_gamma": [ + 0.8119911551475525, + 0.9660953283309937, + 0.9787583947181702, + 0.9719283580780029, + 0.9761261343955994, + 0.9817196130752563, + 0.9831972122192383, + 0.9844352602958679 + ], + "per_layer_rho": [ + 0.8555350303649902, + 0.9452790021896362, + 0.9511818885803223, + 0.953883945941925, + 0.9569692015647888, + 0.9590786695480347, + 0.9632436633110046, + 0.9677139520645142 + ] + }, + { + "method": "vector_M8", + "L": 8, + "seed": 456, + "M": 8, + "mean_gamma": 0.7746431976556778, + "mean_rho": 0.8761332184076309, + "mean_nudge": -0.02582810539752245, + "per_layer_gamma": [ + 0.5509668588638306, + 0.8370974063873291, + 0.8026038408279419, + 0.8056985139846802, + 0.7948079705238342, + 0.8015545606613159, + 0.8045971989631653, + 0.7998192310333252 + ], + "per_layer_rho": [ + 0.6415740847587585, + 0.8904659748077393, + 0.9008272886276245, + 0.9081338047981262, + 0.9142714738845825, + 0.9122859239578247, + 0.9184960126876831, + 0.9230111837387085 + ] + } +] \ No newline at end of file diff --git a/results/vit_dfa_train_s42.log b/results/vit_dfa_train_s42.log new file mode 100644 index 0000000..02225d7 --- /dev/null +++ b/results/vit_dfa_train_s42.log @@ -0,0 +1,4 @@ +Train ViT-Mini DFA: seed=42 epochs=60 + ep 1: test_acc=0.2073 + ep 10: test_acc=0.2030 + ep 20: test_acc=0.2201 diff --git a/results/vit_frozen_blocks_s123.log b/results/vit_frozen_blocks_s123.log new file mode 100644 index 0000000..6a4f6c3 --- /dev/null +++ b/results/vit_frozen_blocks_s123.log @@ -0,0 +1,34 @@ +Device: cuda:0, seed=123, epochs=30 + +=== BP frozen-blocks baseline (4 random-init transformer blocks, frozen), seed=123 === +BP-frozen-blocks: 16266/809354 params trainable + BP-frozen ep 1: test_acc=0.3805 + BP-frozen ep 5: test_acc=0.4832 + BP-frozen ep 10: test_acc=0.5225 + BP-frozen ep 15: test_acc=0.5236 + BP-frozen ep 20: test_acc=0.5381 + BP-frozen ep 25: test_acc=0.5519 + BP-frozen ep 30: test_acc=0.5521 +FINAL BP-frozen-blocks acc: 0.5521 + +=== DFA frozen-blocks baseline, seed=123 === +DFA-frozen-blocks: 16266/809354 params trainable + DFA-frozen ep 1: test_acc=0.2587 + DFA-frozen ep 5: test_acc=0.2585 + DFA-frozen ep 10: test_acc=0.2597 + DFA-frozen ep 15: test_acc=0.2508 + DFA-frozen ep 20: test_acc=0.2578 + DFA-frozen ep 25: test_acc=0.2553 + DFA-frozen ep 30: test_acc=0.2605 +FINAL DFA-frozen-blocks acc: 0.2605 + +=== Summary === +BP-frozen-blocks: 0.5521 (chance=0.10) +DFA-frozen-blocks: 0.2605 +Compare to ViT-Mini 4-block trainable (3-seed avg): BP=0.792, DFA=0.237 +Compare to ViT-Mini 0-block (shallow baseline): BP=0.10, DFA=0.10 + +Interpretation: + If DFA-frozen-blocks ≈ 0.237: blocks are passengers, DFA is just learning patch_embed+head + If DFA-frozen-blocks << 0.237: trainable blocks ARE doing learned work + If DFA-frozen-blocks ~ 0.10: untrained blocks add no useful mixing (less informative) diff --git a/results/vit_frozen_blocks_s42.log b/results/vit_frozen_blocks_s42.log new file mode 100644 index 0000000..c2a20f6 --- /dev/null +++ b/results/vit_frozen_blocks_s42.log @@ -0,0 +1,34 @@ +Device: cuda:0 + +=== BP frozen-blocks baseline (4 random-init transformer blocks, frozen) === +BP-frozen-blocks: 16266/809354 params trainable + BP-frozen ep 1: test_acc=0.3762 + BP-frozen ep 5: test_acc=0.4724 + BP-frozen ep 10: test_acc=0.4961 + BP-frozen ep 15: test_acc=0.5189 + BP-frozen ep 20: test_acc=0.5252 + BP-frozen ep 25: test_acc=0.5366 + BP-frozen ep 30: test_acc=0.5402 +FINAL BP-frozen-blocks acc: 0.5402 + +=== DFA frozen-blocks baseline === +DFA-frozen-blocks: 16266/809354 params trainable + DFA-frozen ep 1: test_acc=0.2529 + DFA-frozen ep 5: test_acc=0.2477 + DFA-frozen ep 10: test_acc=0.2530 + DFA-frozen ep 15: test_acc=0.2566 + DFA-frozen ep 20: test_acc=0.2530 + DFA-frozen ep 25: test_acc=0.2545 + DFA-frozen ep 30: test_acc=0.2554 +FINAL DFA-frozen-blocks acc: 0.2554 + +=== Summary === +BP-frozen-blocks: 0.5402 (chance=0.10) +DFA-frozen-blocks: 0.2554 +Compare to ViT-Mini 4-block trainable (3-seed avg): BP=0.792, DFA=0.237 +Compare to ViT-Mini 0-block (shallow baseline): BP=0.10, DFA=0.10 + +Interpretation: + If DFA-frozen-blocks ≈ 0.237: blocks are passengers, DFA is just learning patch_embed+head + If DFA-frozen-blocks << 0.237: trainable blocks ARE doing learned work + If DFA-frozen-blocks ~ 0.10: untrained blocks add no useful mixing (less informative) diff --git a/results/vit_frozen_blocks_s456.log b/results/vit_frozen_blocks_s456.log new file mode 100644 index 0000000..1441ff5 --- /dev/null +++ b/results/vit_frozen_blocks_s456.log @@ -0,0 +1,34 @@ +Device: cuda:0, seed=456, epochs=30 + +=== BP frozen-blocks baseline (4 random-init transformer blocks, frozen), seed=456 === +BP-frozen-blocks: 16266/809354 params trainable + BP-frozen ep 1: test_acc=0.3755 + BP-frozen ep 5: test_acc=0.4748 + BP-frozen ep 10: test_acc=0.5053 + BP-frozen ep 15: test_acc=0.5210 + BP-frozen ep 20: test_acc=0.5304 + BP-frozen ep 25: test_acc=0.5443 + BP-frozen ep 30: test_acc=0.5410 +FINAL BP-frozen-blocks acc: 0.5410 + +=== DFA frozen-blocks baseline, seed=456 === +DFA-frozen-blocks: 16266/809354 params trainable + DFA-frozen ep 1: test_acc=0.2538 + DFA-frozen ep 5: test_acc=0.2617 + DFA-frozen ep 10: test_acc=0.2537 + DFA-frozen ep 15: test_acc=0.2571 + DFA-frozen ep 20: test_acc=0.2540 + DFA-frozen ep 25: test_acc=0.2540 + DFA-frozen ep 30: test_acc=0.2540 +FINAL DFA-frozen-blocks acc: 0.2540 + +=== Summary === +BP-frozen-blocks: 0.5410 (chance=0.10) +DFA-frozen-blocks: 0.2540 +Compare to ViT-Mini 4-block trainable (3-seed avg): BP=0.792, DFA=0.237 +Compare to ViT-Mini 0-block (shallow baseline): BP=0.10, DFA=0.10 + +Interpretation: + If DFA-frozen-blocks ≈ 0.237: blocks are passengers, DFA is just learning patch_embed+head + If DFA-frozen-blocks << 0.237: trainable blocks ARE doing learned work + If DFA-frozen-blocks ~ 0.10: untrained blocks add no useful mixing (less informative) diff --git a/results/vit_shallow_baseline_s42.log b/results/vit_shallow_baseline_s42.log new file mode 100644 index 0000000..1967d51 --- /dev/null +++ b/results/vit_shallow_baseline_s42.log @@ -0,0 +1,28 @@ +Device: cuda:0 + +=== BP shallow baseline (ViT-Mini num_blocks=0) === +BP-shallow: n_params=16266 + BP-shallow ep 1: test_acc=0.1000 + BP-shallow ep 5: test_acc=0.1000 + BP-shallow ep 10: test_acc=0.1000 + BP-shallow ep 15: test_acc=0.1000 + BP-shallow ep 20: test_acc=0.1000 + BP-shallow ep 25: test_acc=0.1000 + BP-shallow ep 30: test_acc=0.1000 +FINAL BP-shallow acc: 0.1000 + +=== DFA shallow baseline (ViT-Mini num_blocks=0) === +DFA-shallow: n_params=16266 + DFA-shallow ep 1: test_acc=0.1000 + DFA-shallow ep 5: test_acc=0.1000 + DFA-shallow ep 10: test_acc=0.1000 + DFA-shallow ep 15: test_acc=0.1000 + DFA-shallow ep 20: test_acc=0.1000 + DFA-shallow ep 25: test_acc=0.1000 + DFA-shallow ep 30: test_acc=0.1000 +FINAL DFA-shallow acc: 0.1000 + +=== Summary === +BP-shallow: 0.1000 (chance=0.10) +DFA-shallow: 0.1000 +Compare to ViT-Mini 4-block (3-seed avg): BP=0.792, DFA=0.237 diff --git a/results/vit_test/snapshot_vit_s42.json b/results/vit_test/snapshot_vit_s42.json new file mode 100644 index 0000000..f0095db --- /dev/null +++ b/results/vit_test/snapshot_vit_s42.json @@ -0,0 +1,244 @@ +{ + "config": { + "output_dir": "results/vit_test", + "epochs": 2, + "lr": 0.001, + "wd": 0.05, + "seed": 42, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "hidden_norms_avg": [ + 6.008513927459717, + 7.034290313720703, + 7.942849636077881, + 8.915729522705078, + 9.635361671447754 + ], + "bp_grad_per_sample_l2_med": [ + 0.004442029166966677, + 0.0012008437188342214, + 0.0009976272704079747, + 0.0009104337659664452, + 0.0008558662957511842 + ], + "bp_grad_F": [ + 0.18535660207271576, + 0.03968670591711998, + 0.032604776322841644, + 0.029427478089928627, + 0.02746850810945034 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1376953125, + "loss_eval": 2.35188627243042, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.5119581818580627, + 12.45346450805664, + 18.367006301879883, + 25.541183471679688, + 31.80698585510254 + ], + "hidden_norms_avg": [ + 4.10694694519043, + 10.166566848754883, + 14.66998291015625, + 19.933429718017578, + 25.32620620727539 + ], + "bp_grad_per_sample_l2_med": [ + 0.001977165462449193, + 0.0002232444821856916, + 0.00016308759222738445, + 0.00014621141599491239, + 0.0001451292773708701 + ], + "bp_grad_F": [ + 0.11066912859678268, + 0.010344989597797394, + 0.006372526753693819, + 0.005224850494414568, + 0.005017552524805069 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4501953125, + "loss_eval": 1.5154452323913574, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.5624178647994995, + 10.294456481933594, + 15.314032554626465, + 21.36781883239746, + 25.580961227416992 + ], + "hidden_norms_avg": [ + 3.8611817359924316, + 9.257936477661133, + 13.537341117858887, + 17.418514251708984, + 20.89995002746582 + ], + "bp_grad_per_sample_l2_med": [ + 0.0021491278894245625, + 0.0003653931198641658, + 0.00022418916341848671, + 0.00018154713325202465, + 0.00017043459229171276 + ], + "bp_grad_F": [ + 0.10512559115886688, + 0.014831307344138622, + 0.008541438728570938, + 0.006647223141044378, + 0.005966350436210632 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.52734375, + "loss_eval": 1.3002638816833496, + "epoch": 2 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "hidden_norms_avg": [ + 6.008513927459717, + 7.034290313720703, + 7.942849636077881, + 8.915729522705078, + 9.635361671447754 + ], + "bp_grad_per_sample_l2_med": [ + 0.004442029166966677, + 0.0012008437188342214, + 0.0009976272704079747, + 0.0009104337659664452, + 0.0008558662957511842 + ], + "bp_grad_F": [ + 0.18535660207271576, + 0.03968670591711998, + 0.032604776322841644, + 0.029427478089928627, + 0.02746850810945034 + ], + "gamma_dfa": 0.003905070887412876, + "gamma_dfa_per_layer": [ + 0.004920602310448885, + 0.005249542184174061, + 0.0038580193649977446, + 0.0015921196900308132 + ], + "acc_eval": 0.1376953125, + "loss_eval": 2.35188627243042, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.9684416055679321, + 2029.23681640625, + 2826.160400390625, + 4672.1005859375, + 8737.1298828125 + ], + "hidden_norms_avg": [ + 45.1302375793457, + 3068.238037109375, + 8890.5302734375, + 11475.16015625, + 14973.22265625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002814636391121894, + 7.465861813216179e-07, + 6.924062745383708e-07, + 6.833349175394687e-07, + 6.810931267864362e-07 + ], + "bp_grad_F": [ + 0.08884845674037933, + 7.258133700815961e-05, + 4.2221599869662896e-05, + 2.3938106096466072e-05, + 2.3418680939357728e-05 + ], + "gamma_dfa": 0.0073737858911044896, + "gamma_dfa_per_layer": [ + 0.0056831855326890945, + 0.015363219194114208, + 0.009368096478283405, + -0.0009193576406687498 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.054917335510254, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 3.0175483226776123, + 3912.425048828125, + 6017.75830078125, + 8192.2646484375, + 19695.205078125 + ], + "hidden_norms_avg": [ + 70.26815032958984, + 6088.02001953125, + 20950.01953125, + 25550.255859375, + 33917.15625 + ], + "bp_grad_per_sample_l2_med": [ + 0.000260332744801417, + 3.430939727877558e-07, + 3.090381710535439e-07, + 3.0240653359214775e-07, + 2.9979452165207476e-07 + ], + "bp_grad_F": [ + 0.25490984320640564, + 2.9280510716489516e-05, + 1.6399520973209292e-05, + 9.804005458136089e-06, + 9.64422997640213e-06 + ], + "gamma_dfa": 0.007508119277190417, + "gamma_dfa_per_layer": [ + 0.007269312161952257, + 0.013389883562922478, + 0.01044462900608778, + -0.0010713476222008467 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0774288177490234, + "epoch": 2 + } + ] +} \ No newline at end of file -- cgit v1.2.3