diff options
| author | YurenHao0426 <Blackhao0426@gmail.com> | 2026-06-14 04:06:32 -0500 |
|---|---|---|
| committer | YurenHao0426 <Blackhao0426@gmail.com> | 2026-06-14 04:06:32 -0500 |
| commit | aa73718eb6427d7da3b9cb416275802d90c4b2ed (patch) | |
| tree | b68b0a664fb650744ef934a1c22abd740a7b62a6 /results/frozen_cifar | |
| parent | 827c658fa9a750f3c6ebdb87703762f10f69f6ff (diff) | |
Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
Diffstat (limited to 'results/frozen_cifar')
| -rw-r--r-- | results/frozen_cifar/frozen_L4_d256_s42.json | 174 | ||||
| -rw-r--r-- | results/frozen_cifar/frozen_L4_d512_s42.json | 174 | ||||
| -rw-r--r-- | results/frozen_cifar/frozen_L6_d256_s42.json | 216 |
3 files changed, 564 insertions, 0 deletions
diff --git a/results/frozen_cifar/frozen_L4_d256_s42.json b/results/frozen_cifar/frozen_L4_d256_s42.json new file mode 100644 index 0000000..2fb0bd3 --- /dev/null +++ b/results/frozen_cifar/frozen_L4_d256_s42.json @@ -0,0 +1,174 @@ +{ + "config": { + "num_blocks": 4, + "d_hidden": 256, + "seed": 42, + "bp_epochs": 100, + "estimator_epochs": 100, + "lr_fb": 0.001, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0 + }, + "bp_acc": 0.6173, + "summary": { + "dfa": { + "mean_gamma": 0.005605479117366485, + "mean_rho": 0.005194449331611395, + "mean_nudge": -2.151036460418254e-05 + }, + "sb_eT": { + "mean_gamma": 0.2866372682154179, + "mean_rho": 0.24588057771325111, + "mean_nudge": -0.0009568915702402592 + }, + "cb_eT": { + "mean_gamma": 0.11484479499049485, + "mean_rho": 0.125152001157403, + "mean_nudge": -0.00036998098585172556 + }, + "cb_deltaL": { + "mean_gamma": 0.06995358848944307, + "mean_rho": 0.06243711616843939, + "mean_nudge": -0.00015994706336641684 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + 0.01097307917661965, + -0.00982702277833596, + 0.004532583430409432, + 0.016743276640772818 + ], + "perturbation_rho": [ + 0.0032103070989251137, + -0.030966611579060555, + 0.06208299845457077, + -0.01354889664798975 + ], + "nudging_0.001": [ + -3.2122152333613485e-06, + 7.709997589699924e-06, + -2.053854950645473e-05, + -1.2655042155529372e-05 + ], + "nudging_0.003": [ + -9.568146197125316e-06, + 2.312526703462936e-05, + -6.160693010315299e-05, + -3.799164915108122e-05 + ], + "nudging_0.01": [ + -3.1933166610542685e-05, + 7.745913171675056e-05, + -0.0002052279596682638, + -0.00012646839604713023 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.19993784725666047, + 0.2704531639814377, + 0.3183140277862549, + 0.35784403383731844 + ], + "perturbation_rho": [ + 0.14796550571918488, + 0.23224923014640808, + 0.27324193716049194, + 0.33006563782691956 + ], + "nudging_0.001": [ + -0.00020024771220050752, + -0.00030526291811838746, + -0.0003735219652298838, + -0.0003972915874328464 + ], + "nudging_0.003": [ + -0.0006005102768540382, + -0.0009154834551736712, + -0.001120006782002747, + -0.0011915657669305801 + ], + "nudging_0.01": [ + -0.002000064356252551, + -0.0030484027229249477, + -0.0037288377061486244, + -0.0039670998230576515 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.045131212659180166, + 0.06221269443631172, + 0.1209193505346775, + 0.23111592233181 + ], + "perturbation_rho": [ + 0.05690425634384155, + 0.10793692618608475, + 0.10616493225097656, + 0.2296018898487091 + ], + "nudging_0.001": [ + -5.6506225519115105e-05, + -8.837308996589854e-05, + -0.00011208542855456471, + -0.00023653265088796616 + ], + "nudging_0.003": [ + -0.00016947659605648369, + -0.00026502960827201605, + -0.0003360719420015812, + -0.0007093457970768213 + ], + "nudging_0.01": [ + -0.0005644541233778, + -0.0008825073018670082, + -0.0011192080564796925, + -0.0023615544196218252 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.03819061610847711, + 0.05208469983190298, + 0.06935825981199742, + 0.12018077820539474 + ], + "perturbation_rho": [ + 0.047517478466033936, + 0.013643201440572739, + 0.04729664325714111, + 0.14129114151000977 + ], + "nudging_0.001": [ + -2.239555396954529e-05, + -2.458264680171851e-05, + -4.0700091631151736e-05, + -0.0001256012765225023 + ], + "nudging_0.003": [ + -6.710628804285079e-05, + -7.37799855414778e-05, + -0.00012205714301671833, + -0.00037684483686462045 + ], + "nudging_0.01": [ + -0.0002235029242001474, + -0.00024507055059075356, + -0.00040636284393258393, + -0.0012548293452709913 + ] + } + }, + "sb_pred_error": [ + 9093.49886875, + 3872.840365234375, + 2899.67371015625, + 2407.756592578125 + ] +}
\ No newline at end of file diff --git a/results/frozen_cifar/frozen_L4_d512_s42.json b/results/frozen_cifar/frozen_L4_d512_s42.json new file mode 100644 index 0000000..025eea9 --- /dev/null +++ b/results/frozen_cifar/frozen_L4_d512_s42.json @@ -0,0 +1,174 @@ +{ + "config": { + "num_blocks": 4, + "d_hidden": 512, + "seed": 42, + "bp_epochs": 100, + "estimator_epochs": 100, + "lr_fb": 0.001, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0 + }, + "bp_acc": 0.6046, + "summary": { + "dfa": { + "mean_gamma": 0.00014940524997655283, + "mean_rho": 0.0021846434101462364, + "mean_nudge": 9.80043569143163e-06 + }, + "sb_eT": { + "mean_gamma": 0.16364388447254896, + "mean_rho": 0.1367498729377985, + "mean_nudge": -0.0008324724767589942 + }, + "cb_eT": { + "mean_gamma": 0.05695507084019482, + "mean_rho": 0.10538733564317226, + "mean_nudge": -0.00041578355740057305 + }, + "cb_deltaL": { + "mean_gamma": 0.03857357995584607, + "mean_rho": 0.02690578391775489, + "mean_nudge": -0.00015572691336274147 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + 0.0003761224914342165, + 0.0014630826306529343, + 0.0025856316089630125, + -0.0038272157311439515 + ], + "perturbation_rho": [ + 0.041057292371988297, + 0.04760625958442688, + -0.04939739778637886, + -0.03052758052945137 + ], + "nudging_0.001": [ + -6.823556759627536e-07, + 5.570012035605032e-06, + 7.243079380714335e-07, + 7.61153205530718e-06 + ], + "nudging_0.003": [ + -2.2219755919650197e-06, + 1.6406695067416877e-05, + 2.2961030481383204e-06, + 2.2720920242136344e-05 + ], + "nudging_0.01": [ + -7.2418697527609766e-06, + 5.4833959438838065e-05, + 7.364731573034078e-06, + 7.559901860076934e-05 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.11779971644282342, + 0.15058264434337615, + 0.1757924109697342, + 0.2104007661342621 + ], + "perturbation_rho": [ + 0.05106552690267563, + 0.14929687976837158, + 0.1366019994020462, + 0.21003508567810059 + ], + "nudging_0.001": [ + -0.00020435426267795265, + -0.000274428486591205, + -0.0003065963101107627, + -0.0003246065170969814 + ], + "nudging_0.003": [ + -0.0006134338327683508, + -0.0008232325781136751, + -0.0009195499587804079, + -0.0009736735373735428 + ], + "nudging_0.01": [ + -0.0020439010113477707, + -0.0027431542985141277, + -0.0030633914284408092, + -0.003243957180529833 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.028400307334959508, + 0.030753960087895393, + 0.04988271631300449, + 0.11878329962491989 + ], + "perturbation_rho": [ + 0.06698533892631531, + 0.07322317361831665, + 0.11097840219736099, + 0.1703624278306961 + ], + "nudging_0.001": [ + -8.199035073630512e-05, + -9.967104415409267e-05, + -0.00014070692122913897, + -0.00023186377075035125 + ], + "nudging_0.003": [ + -0.000246370182139799, + -0.000298988597933203, + -0.0004220257396809757, + -0.0006957497098483145 + ], + "nudging_0.01": [ + -0.0008211369859054685, + -0.0009962331969290972, + -0.0014064292190596461, + -0.0023175508249551058 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.019338275119662286, + 0.03327283784747124, + 0.040172213315963747, + 0.061510993540287016 + ], + "perturbation_rho": [ + -0.0003883522003889084, + 0.029364485293626785, + 0.04492279514670372, + 0.03372420743107796 + ], + "nudging_0.001": [ + -2.7410198526922613e-05, + -5.19197310495656e-05, + -6.934596603969112e-05, + -5.898199015064165e-05 + ], + "nudging_0.003": [ + -8.237811562139541e-05, + -0.00015559815801680088, + -0.00020809093257412314, + -0.00017684044723864645 + ], + "nudging_0.01": [ + -0.00027475334354676306, + -0.000518541899509728, + -0.0006934736738912761, + -0.0005893784109503031 + ] + } + }, + "sb_pred_error": [ + 32627.8307125, + 17715.490584375, + 13710.30735, + 10994.33838125 + ] +}
\ No newline at end of file diff --git a/results/frozen_cifar/frozen_L6_d256_s42.json b/results/frozen_cifar/frozen_L6_d256_s42.json new file mode 100644 index 0000000..703dd5a --- /dev/null +++ b/results/frozen_cifar/frozen_L6_d256_s42.json @@ -0,0 +1,216 @@ +{ + "config": { + "num_blocks": 6, + "d_hidden": 256, + "seed": 42, + "bp_epochs": 100, + "estimator_epochs": 100, + "lr_fb": 0.001, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0 + }, + "bp_acc": 0.6172, + "summary": { + "dfa": { + "mean_gamma": 0.008224744617473334, + "mean_rho": -0.007729481750478347, + "mean_nudge": -1.4484473164581383e-05 + }, + "sb_eT": { + "mean_gamma": 0.28419415106376006, + "mean_rho": 0.24331255008776984, + "mean_nudge": -0.0010212107930177201 + }, + "cb_eT": { + "mean_gamma": 0.1356087997245292, + "mean_rho": 0.11836575530469418, + "mean_nudge": -0.000398846738486706 + }, + "cb_deltaL": { + "mean_gamma": 0.06269844393245876, + "mean_rho": 0.07167995596925418, + "mean_nudge": -0.000200468028197065 + } + }, + "per_layer": { + "dfa": { + "bp_cosine": [ + -0.010780696198344231, + -0.0024464363697916268, + 0.006427376973442733, + 0.023271656595170498, + 0.017338427528738976, + 0.015538139175623656 + ], + "perturbation_rho": [ + -0.018140554428100586, + 0.003606993705034256, + -0.045406848192214966, + 0.023949457332491875, + -0.016462121158838272, + 0.00607618223875761 + ], + "nudging_0.001": [ + 3.0692412110511214e-05, + 7.64157812227495e-06, + -9.760969987837598e-08, + -3.085116622969508e-05, + -1.6509711713297293e-05, + -1.9992370653199032e-05 + ], + "nudging_0.003": [ + 9.20678285183385e-05, + 2.31226204050472e-05, + -2.7300666260998696e-07, + -9.241211228072643e-05, + -4.9478214350529015e-05, + -5.993395461700857e-05 + ], + "nudging_0.01": [ + 0.0003075606073252857, + 7.720924622844905e-05, + -5.05835487274453e-07, + -0.0003076052526012063, + -0.00016470525588374585, + -0.00019945789244957268 + ] + }, + "sb_eT": { + "bp_cosine": [ + 0.1685526818037033, + 0.23167533278465272, + 0.2697907418012619, + 0.30822172164916994, + 0.3446090370416641, + 0.3823153913021088 + ], + "perturbation_rho": [ + 0.07154904305934906, + 0.19288617372512817, + 0.2876003682613373, + 0.27649810910224915, + 0.3115084767341614, + 0.3198331296443939 + ], + "nudging_0.001": [ + -0.00018972528050653636, + -0.0002750377752818167, + -0.00032653682865202427, + -0.00039390879101119936, + -0.00042474071960896254, + -0.00043361991993151605 + ], + "nudging_0.003": [ + -0.0005688090459443629, + -0.0008246920770034194, + -0.0009791019838303328, + -0.00118098477832973, + -0.001273483969271183, + -0.001300192903727293 + ], + "nudging_0.01": [ + -0.0018940127920359373, + -0.0027450949419289827, + -0.0032586848828941584, + -0.003929748199880123, + -0.004237486980855465, + -0.004327159374952316 + ] + }, + "cb_eT": { + "bp_cosine": [ + 0.045225401408970356, + 0.053792066499590875, + 0.08010791838169098, + 0.12435948699712754, + 0.19471128135919571, + 0.31545664370059967 + ], + "perturbation_rho": [ + 0.024685420095920563, + -0.01572572812438011, + 0.08793376386165619, + 0.11664978414773941, + 0.1602637767791748, + 0.3363875150680542 + ], + "nudging_0.001": [ + -2.2263082428253256e-05, + -5.150778451934457e-05, + -7.369300146820024e-05, + -0.00012175041774753481, + -0.00019730909843929112, + -0.000331797928083688 + ], + "nudging_0.003": [ + -6.678207137156278e-05, + -0.00015438658010680228, + -0.0002208092628279701, + -0.00036489206831902266, + -0.0005915500223636627, + -0.0009946604259312153 + ], + "nudging_0.01": [ + -0.00022176679340191185, + -0.0005135145038366318, + -0.0007348398794420063, + -0.0012142673367634416, + -0.0019682790152728558, + -0.0033080100547522306 + ] + }, + "cb_deltaL": { + "bp_cosine": [ + 0.01903119832277298, + 0.03658499242737889, + 0.04136112704873085, + 0.05426537357270718, + 0.07572877742350101, + 0.14921919479966164 + ], + "perturbation_rho": [ + -0.004729617387056351, + 0.06955375522375107, + 0.07996401935815811, + 0.11149539798498154, + 0.055956777185201645, + 0.11783940345048904 + ], + "nudging_0.001": [ + -3.080447640968487e-05, + -4.9154667067341506e-05, + -5.3297979320632294e-05, + -5.973243969492614e-05, + -7.465035014320165e-05, + -0.00013362003664951771 + ], + "nudging_0.003": [ + -9.23606421565637e-05, + -0.00014715960423927754, + -0.00015975572750903666, + -0.00017912944895215333, + -0.00022374786203727126, + -0.0004006548842880875 + ], + "nudging_0.01": [ + -0.00030725268879905343, + -0.0004887805553153157, + -0.0005310464184731245, + -0.0005952278152108192, + -0.0007444550283253193, + -0.0013336975825950503 + ] + } + }, + "sb_pred_error": [ + 8914.44174921875, + 5038.8783640625, + 4058.455402734375, + 3433.17113046875, + 2884.829894921875, + 2573.41313515625 + ] +}
\ No newline at end of file |
