summaryrefslogtreecommitdiff
path: root/results/frozen_cifar
diff options
context:
space:
mode:
authorYurenHao0426 <Blackhao0426@gmail.com>2026-06-14 04:06:32 -0500
committerYurenHao0426 <Blackhao0426@gmail.com>2026-06-14 04:06:32 -0500
commitaa73718eb6427d7da3b9cb416275802d90c4b2ed (patch)
treeb68b0a664fb650744ef934a1c22abd740a7b62a6 /results/frozen_cifar
parent827c658fa9a750f3c6ebdb87703762f10f69f6ff (diff)
Add new experiment scripts, figures, and paper assets; untrack pyc/build artifactsHEADmaster
Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
Diffstat (limited to 'results/frozen_cifar')
-rw-r--r--results/frozen_cifar/frozen_L4_d256_s42.json174
-rw-r--r--results/frozen_cifar/frozen_L4_d512_s42.json174
-rw-r--r--results/frozen_cifar/frozen_L6_d256_s42.json216
3 files changed, 564 insertions, 0 deletions
diff --git a/results/frozen_cifar/frozen_L4_d256_s42.json b/results/frozen_cifar/frozen_L4_d256_s42.json
new file mode 100644
index 0000000..2fb0bd3
--- /dev/null
+++ b/results/frozen_cifar/frozen_L4_d256_s42.json
@@ -0,0 +1,174 @@
+{
+ "config": {
+ "num_blocks": 4,
+ "d_hidden": 256,
+ "seed": 42,
+ "bp_epochs": 100,
+ "estimator_epochs": 100,
+ "lr_fb": 0.001,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0
+ },
+ "bp_acc": 0.6173,
+ "summary": {
+ "dfa": {
+ "mean_gamma": 0.005605479117366485,
+ "mean_rho": 0.005194449331611395,
+ "mean_nudge": -2.151036460418254e-05
+ },
+ "sb_eT": {
+ "mean_gamma": 0.2866372682154179,
+ "mean_rho": 0.24588057771325111,
+ "mean_nudge": -0.0009568915702402592
+ },
+ "cb_eT": {
+ "mean_gamma": 0.11484479499049485,
+ "mean_rho": 0.125152001157403,
+ "mean_nudge": -0.00036998098585172556
+ },
+ "cb_deltaL": {
+ "mean_gamma": 0.06995358848944307,
+ "mean_rho": 0.06243711616843939,
+ "mean_nudge": -0.00015994706336641684
+ }
+ },
+ "per_layer": {
+ "dfa": {
+ "bp_cosine": [
+ 0.01097307917661965,
+ -0.00982702277833596,
+ 0.004532583430409432,
+ 0.016743276640772818
+ ],
+ "perturbation_rho": [
+ 0.0032103070989251137,
+ -0.030966611579060555,
+ 0.06208299845457077,
+ -0.01354889664798975
+ ],
+ "nudging_0.001": [
+ -3.2122152333613485e-06,
+ 7.709997589699924e-06,
+ -2.053854950645473e-05,
+ -1.2655042155529372e-05
+ ],
+ "nudging_0.003": [
+ -9.568146197125316e-06,
+ 2.312526703462936e-05,
+ -6.160693010315299e-05,
+ -3.799164915108122e-05
+ ],
+ "nudging_0.01": [
+ -3.1933166610542685e-05,
+ 7.745913171675056e-05,
+ -0.0002052279596682638,
+ -0.00012646839604713023
+ ]
+ },
+ "sb_eT": {
+ "bp_cosine": [
+ 0.19993784725666047,
+ 0.2704531639814377,
+ 0.3183140277862549,
+ 0.35784403383731844
+ ],
+ "perturbation_rho": [
+ 0.14796550571918488,
+ 0.23224923014640808,
+ 0.27324193716049194,
+ 0.33006563782691956
+ ],
+ "nudging_0.001": [
+ -0.00020024771220050752,
+ -0.00030526291811838746,
+ -0.0003735219652298838,
+ -0.0003972915874328464
+ ],
+ "nudging_0.003": [
+ -0.0006005102768540382,
+ -0.0009154834551736712,
+ -0.001120006782002747,
+ -0.0011915657669305801
+ ],
+ "nudging_0.01": [
+ -0.002000064356252551,
+ -0.0030484027229249477,
+ -0.0037288377061486244,
+ -0.0039670998230576515
+ ]
+ },
+ "cb_eT": {
+ "bp_cosine": [
+ 0.045131212659180166,
+ 0.06221269443631172,
+ 0.1209193505346775,
+ 0.23111592233181
+ ],
+ "perturbation_rho": [
+ 0.05690425634384155,
+ 0.10793692618608475,
+ 0.10616493225097656,
+ 0.2296018898487091
+ ],
+ "nudging_0.001": [
+ -5.6506225519115105e-05,
+ -8.837308996589854e-05,
+ -0.00011208542855456471,
+ -0.00023653265088796616
+ ],
+ "nudging_0.003": [
+ -0.00016947659605648369,
+ -0.00026502960827201605,
+ -0.0003360719420015812,
+ -0.0007093457970768213
+ ],
+ "nudging_0.01": [
+ -0.0005644541233778,
+ -0.0008825073018670082,
+ -0.0011192080564796925,
+ -0.0023615544196218252
+ ]
+ },
+ "cb_deltaL": {
+ "bp_cosine": [
+ 0.03819061610847711,
+ 0.05208469983190298,
+ 0.06935825981199742,
+ 0.12018077820539474
+ ],
+ "perturbation_rho": [
+ 0.047517478466033936,
+ 0.013643201440572739,
+ 0.04729664325714111,
+ 0.14129114151000977
+ ],
+ "nudging_0.001": [
+ -2.239555396954529e-05,
+ -2.458264680171851e-05,
+ -4.0700091631151736e-05,
+ -0.0001256012765225023
+ ],
+ "nudging_0.003": [
+ -6.710628804285079e-05,
+ -7.37799855414778e-05,
+ -0.00012205714301671833,
+ -0.00037684483686462045
+ ],
+ "nudging_0.01": [
+ -0.0002235029242001474,
+ -0.00024507055059075356,
+ -0.00040636284393258393,
+ -0.0012548293452709913
+ ]
+ }
+ },
+ "sb_pred_error": [
+ 9093.49886875,
+ 3872.840365234375,
+ 2899.67371015625,
+ 2407.756592578125
+ ]
+} \ No newline at end of file
diff --git a/results/frozen_cifar/frozen_L4_d512_s42.json b/results/frozen_cifar/frozen_L4_d512_s42.json
new file mode 100644
index 0000000..025eea9
--- /dev/null
+++ b/results/frozen_cifar/frozen_L4_d512_s42.json
@@ -0,0 +1,174 @@
+{
+ "config": {
+ "num_blocks": 4,
+ "d_hidden": 512,
+ "seed": 42,
+ "bp_epochs": 100,
+ "estimator_epochs": 100,
+ "lr_fb": 0.001,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0
+ },
+ "bp_acc": 0.6046,
+ "summary": {
+ "dfa": {
+ "mean_gamma": 0.00014940524997655283,
+ "mean_rho": 0.0021846434101462364,
+ "mean_nudge": 9.80043569143163e-06
+ },
+ "sb_eT": {
+ "mean_gamma": 0.16364388447254896,
+ "mean_rho": 0.1367498729377985,
+ "mean_nudge": -0.0008324724767589942
+ },
+ "cb_eT": {
+ "mean_gamma": 0.05695507084019482,
+ "mean_rho": 0.10538733564317226,
+ "mean_nudge": -0.00041578355740057305
+ },
+ "cb_deltaL": {
+ "mean_gamma": 0.03857357995584607,
+ "mean_rho": 0.02690578391775489,
+ "mean_nudge": -0.00015572691336274147
+ }
+ },
+ "per_layer": {
+ "dfa": {
+ "bp_cosine": [
+ 0.0003761224914342165,
+ 0.0014630826306529343,
+ 0.0025856316089630125,
+ -0.0038272157311439515
+ ],
+ "perturbation_rho": [
+ 0.041057292371988297,
+ 0.04760625958442688,
+ -0.04939739778637886,
+ -0.03052758052945137
+ ],
+ "nudging_0.001": [
+ -6.823556759627536e-07,
+ 5.570012035605032e-06,
+ 7.243079380714335e-07,
+ 7.61153205530718e-06
+ ],
+ "nudging_0.003": [
+ -2.2219755919650197e-06,
+ 1.6406695067416877e-05,
+ 2.2961030481383204e-06,
+ 2.2720920242136344e-05
+ ],
+ "nudging_0.01": [
+ -7.2418697527609766e-06,
+ 5.4833959438838065e-05,
+ 7.364731573034078e-06,
+ 7.559901860076934e-05
+ ]
+ },
+ "sb_eT": {
+ "bp_cosine": [
+ 0.11779971644282342,
+ 0.15058264434337615,
+ 0.1757924109697342,
+ 0.2104007661342621
+ ],
+ "perturbation_rho": [
+ 0.05106552690267563,
+ 0.14929687976837158,
+ 0.1366019994020462,
+ 0.21003508567810059
+ ],
+ "nudging_0.001": [
+ -0.00020435426267795265,
+ -0.000274428486591205,
+ -0.0003065963101107627,
+ -0.0003246065170969814
+ ],
+ "nudging_0.003": [
+ -0.0006134338327683508,
+ -0.0008232325781136751,
+ -0.0009195499587804079,
+ -0.0009736735373735428
+ ],
+ "nudging_0.01": [
+ -0.0020439010113477707,
+ -0.0027431542985141277,
+ -0.0030633914284408092,
+ -0.003243957180529833
+ ]
+ },
+ "cb_eT": {
+ "bp_cosine": [
+ 0.028400307334959508,
+ 0.030753960087895393,
+ 0.04988271631300449,
+ 0.11878329962491989
+ ],
+ "perturbation_rho": [
+ 0.06698533892631531,
+ 0.07322317361831665,
+ 0.11097840219736099,
+ 0.1703624278306961
+ ],
+ "nudging_0.001": [
+ -8.199035073630512e-05,
+ -9.967104415409267e-05,
+ -0.00014070692122913897,
+ -0.00023186377075035125
+ ],
+ "nudging_0.003": [
+ -0.000246370182139799,
+ -0.000298988597933203,
+ -0.0004220257396809757,
+ -0.0006957497098483145
+ ],
+ "nudging_0.01": [
+ -0.0008211369859054685,
+ -0.0009962331969290972,
+ -0.0014064292190596461,
+ -0.0023175508249551058
+ ]
+ },
+ "cb_deltaL": {
+ "bp_cosine": [
+ 0.019338275119662286,
+ 0.03327283784747124,
+ 0.040172213315963747,
+ 0.061510993540287016
+ ],
+ "perturbation_rho": [
+ -0.0003883522003889084,
+ 0.029364485293626785,
+ 0.04492279514670372,
+ 0.03372420743107796
+ ],
+ "nudging_0.001": [
+ -2.7410198526922613e-05,
+ -5.19197310495656e-05,
+ -6.934596603969112e-05,
+ -5.898199015064165e-05
+ ],
+ "nudging_0.003": [
+ -8.237811562139541e-05,
+ -0.00015559815801680088,
+ -0.00020809093257412314,
+ -0.00017684044723864645
+ ],
+ "nudging_0.01": [
+ -0.00027475334354676306,
+ -0.000518541899509728,
+ -0.0006934736738912761,
+ -0.0005893784109503031
+ ]
+ }
+ },
+ "sb_pred_error": [
+ 32627.8307125,
+ 17715.490584375,
+ 13710.30735,
+ 10994.33838125
+ ]
+} \ No newline at end of file
diff --git a/results/frozen_cifar/frozen_L6_d256_s42.json b/results/frozen_cifar/frozen_L6_d256_s42.json
new file mode 100644
index 0000000..703dd5a
--- /dev/null
+++ b/results/frozen_cifar/frozen_L6_d256_s42.json
@@ -0,0 +1,216 @@
+{
+ "config": {
+ "num_blocks": 6,
+ "d_hidden": 256,
+ "seed": 42,
+ "bp_epochs": 100,
+ "estimator_epochs": 100,
+ "lr_fb": 0.001,
+ "lam": 0.1,
+ "K": 4,
+ "sigma_bridge": 0.05,
+ "ema_momentum": 0.995,
+ "term_grad_weight": 1.0
+ },
+ "bp_acc": 0.6172,
+ "summary": {
+ "dfa": {
+ "mean_gamma": 0.008224744617473334,
+ "mean_rho": -0.007729481750478347,
+ "mean_nudge": -1.4484473164581383e-05
+ },
+ "sb_eT": {
+ "mean_gamma": 0.28419415106376006,
+ "mean_rho": 0.24331255008776984,
+ "mean_nudge": -0.0010212107930177201
+ },
+ "cb_eT": {
+ "mean_gamma": 0.1356087997245292,
+ "mean_rho": 0.11836575530469418,
+ "mean_nudge": -0.000398846738486706
+ },
+ "cb_deltaL": {
+ "mean_gamma": 0.06269844393245876,
+ "mean_rho": 0.07167995596925418,
+ "mean_nudge": -0.000200468028197065
+ }
+ },
+ "per_layer": {
+ "dfa": {
+ "bp_cosine": [
+ -0.010780696198344231,
+ -0.0024464363697916268,
+ 0.006427376973442733,
+ 0.023271656595170498,
+ 0.017338427528738976,
+ 0.015538139175623656
+ ],
+ "perturbation_rho": [
+ -0.018140554428100586,
+ 0.003606993705034256,
+ -0.045406848192214966,
+ 0.023949457332491875,
+ -0.016462121158838272,
+ 0.00607618223875761
+ ],
+ "nudging_0.001": [
+ 3.0692412110511214e-05,
+ 7.64157812227495e-06,
+ -9.760969987837598e-08,
+ -3.085116622969508e-05,
+ -1.6509711713297293e-05,
+ -1.9992370653199032e-05
+ ],
+ "nudging_0.003": [
+ 9.20678285183385e-05,
+ 2.31226204050472e-05,
+ -2.7300666260998696e-07,
+ -9.241211228072643e-05,
+ -4.9478214350529015e-05,
+ -5.993395461700857e-05
+ ],
+ "nudging_0.01": [
+ 0.0003075606073252857,
+ 7.720924622844905e-05,
+ -5.05835487274453e-07,
+ -0.0003076052526012063,
+ -0.00016470525588374585,
+ -0.00019945789244957268
+ ]
+ },
+ "sb_eT": {
+ "bp_cosine": [
+ 0.1685526818037033,
+ 0.23167533278465272,
+ 0.2697907418012619,
+ 0.30822172164916994,
+ 0.3446090370416641,
+ 0.3823153913021088
+ ],
+ "perturbation_rho": [
+ 0.07154904305934906,
+ 0.19288617372512817,
+ 0.2876003682613373,
+ 0.27649810910224915,
+ 0.3115084767341614,
+ 0.3198331296443939
+ ],
+ "nudging_0.001": [
+ -0.00018972528050653636,
+ -0.0002750377752818167,
+ -0.00032653682865202427,
+ -0.00039390879101119936,
+ -0.00042474071960896254,
+ -0.00043361991993151605
+ ],
+ "nudging_0.003": [
+ -0.0005688090459443629,
+ -0.0008246920770034194,
+ -0.0009791019838303328,
+ -0.00118098477832973,
+ -0.001273483969271183,
+ -0.001300192903727293
+ ],
+ "nudging_0.01": [
+ -0.0018940127920359373,
+ -0.0027450949419289827,
+ -0.0032586848828941584,
+ -0.003929748199880123,
+ -0.004237486980855465,
+ -0.004327159374952316
+ ]
+ },
+ "cb_eT": {
+ "bp_cosine": [
+ 0.045225401408970356,
+ 0.053792066499590875,
+ 0.08010791838169098,
+ 0.12435948699712754,
+ 0.19471128135919571,
+ 0.31545664370059967
+ ],
+ "perturbation_rho": [
+ 0.024685420095920563,
+ -0.01572572812438011,
+ 0.08793376386165619,
+ 0.11664978414773941,
+ 0.1602637767791748,
+ 0.3363875150680542
+ ],
+ "nudging_0.001": [
+ -2.2263082428253256e-05,
+ -5.150778451934457e-05,
+ -7.369300146820024e-05,
+ -0.00012175041774753481,
+ -0.00019730909843929112,
+ -0.000331797928083688
+ ],
+ "nudging_0.003": [
+ -6.678207137156278e-05,
+ -0.00015438658010680228,
+ -0.0002208092628279701,
+ -0.00036489206831902266,
+ -0.0005915500223636627,
+ -0.0009946604259312153
+ ],
+ "nudging_0.01": [
+ -0.00022176679340191185,
+ -0.0005135145038366318,
+ -0.0007348398794420063,
+ -0.0012142673367634416,
+ -0.0019682790152728558,
+ -0.0033080100547522306
+ ]
+ },
+ "cb_deltaL": {
+ "bp_cosine": [
+ 0.01903119832277298,
+ 0.03658499242737889,
+ 0.04136112704873085,
+ 0.05426537357270718,
+ 0.07572877742350101,
+ 0.14921919479966164
+ ],
+ "perturbation_rho": [
+ -0.004729617387056351,
+ 0.06955375522375107,
+ 0.07996401935815811,
+ 0.11149539798498154,
+ 0.055956777185201645,
+ 0.11783940345048904
+ ],
+ "nudging_0.001": [
+ -3.080447640968487e-05,
+ -4.9154667067341506e-05,
+ -5.3297979320632294e-05,
+ -5.973243969492614e-05,
+ -7.465035014320165e-05,
+ -0.00013362003664951771
+ ],
+ "nudging_0.003": [
+ -9.23606421565637e-05,
+ -0.00014715960423927754,
+ -0.00015975572750903666,
+ -0.00017912944895215333,
+ -0.00022374786203727126,
+ -0.0004006548842880875
+ ],
+ "nudging_0.01": [
+ -0.00030725268879905343,
+ -0.0004887805553153157,
+ -0.0005310464184731245,
+ -0.0005952278152108192,
+ -0.0007444550283253193,
+ -0.0013336975825950503
+ ]
+ }
+ },
+ "sb_pred_error": [
+ 8914.44174921875,
+ 5038.8783640625,
+ 4058.455402734375,
+ 3433.17113046875,
+ 2884.829894921875,
+ 2573.41313515625
+ ]
+} \ No newline at end of file