diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
| commit | cd99d6b874d9d09b3bb87b8485cc787885af71f1 (patch) | |
| tree | 59a233959932ca0e4f12f196275e07fcf443b33f /runs/grid_search_cifar10 | |
init commit
Diffstat (limited to 'runs/grid_search_cifar10')
| -rw-r--r-- | runs/grid_search_cifar10/20251230-134445/config.json | 32 | ||||
| -rw-r--r-- | runs/grid_search_cifar10/20251230-134445/grid_search_heatmaps.png | bin | 0 -> 77326 bytes | |||
| -rw-r--r-- | runs/grid_search_cifar10/20251230-134445/grid_search_results.json | 914 | ||||
| -rw-r--r-- | runs/grid_search_cifar10/20251230-134445/optimal_hyperparameters.png | bin | 0 -> 94623 bytes |
4 files changed, 946 insertions, 0 deletions
diff --git a/runs/grid_search_cifar10/20251230-134445/config.json b/runs/grid_search_cifar10/20251230-134445/config.json new file mode 100644 index 0000000..e63a5bf --- /dev/null +++ b/runs/grid_search_cifar10/20251230-134445/config.json @@ -0,0 +1,32 @@ +{ + "depths": [ + 4, + 6, + 8, + 10 + ], + "lambda_regs": [ + 0.01, + 0.05, + 0.1, + 0.2, + 0.3 + ], + "lambda_targets": [ + 0.0, + -0.05, + -0.1, + -0.2 + ], + "hidden_dim": 256, + "epochs": 15, + "lr": 0.001, + "batch_size": 128, + "seed": 42, + "synthetic": false, + "data_dir": "./data", + "T": 8, + "out_dir": "runs/grid_search_cifar10", + "device": "cuda", + "no_progress": false +}
\ No newline at end of file diff --git a/runs/grid_search_cifar10/20251230-134445/grid_search_heatmaps.png b/runs/grid_search_cifar10/20251230-134445/grid_search_heatmaps.png Binary files differnew file mode 100644 index 0000000..13195e1 --- /dev/null +++ b/runs/grid_search_cifar10/20251230-134445/grid_search_heatmaps.png diff --git a/runs/grid_search_cifar10/20251230-134445/grid_search_results.json b/runs/grid_search_cifar10/20251230-134445/grid_search_results.json new file mode 100644 index 0000000..23270dd --- /dev/null +++ b/runs/grid_search_cifar10/20251230-134445/grid_search_results.json @@ -0,0 +1,914 @@ +{ + "optimal_per_depth": { + "4": { + "lambda_reg": 0.01, + "lambda_target": -0.1, + "val_acc": 0.1988, + "lyapunov": 0.9432953708921857, + "epochs_to_90": -1 + }, + "6": { + "lambda_reg": 0.01, + "lambda_target": 0.0, + "val_acc": 0.1, + "lyapunov": 1.1385156285122533, + "epochs_to_90": -1 + }, + "8": { + "lambda_reg": 0.01, + "lambda_target": -0.1, + "val_acc": 0.1001, + "lyapunov": 1.2825916834804407, + "epochs_to_90": -1 + }, + "10": { + "lambda_reg": 0.01, + "lambda_target": 0.0, + "val_acc": 0.1, + "lyapunov": 1.3936041294766204, + "epochs_to_90": -1 + } + }, + "all_results": [ + { + "depth": 4, + "lambda_reg": 0.01, + "lambda_target": 0.0, + "final_train_acc": 0.17938, + "final_val_acc": 0.1953, + "final_lyapunov": 0.9437398303805105, + "final_grad_norm": 0.5733915362923737, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.01, + "lambda_target": -0.05, + "final_train_acc": 0.1808, + "final_val_acc": 0.1896, + "final_lyapunov": 0.941756814184701, + "final_grad_norm": 0.4886330016660691, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.01, + "lambda_target": -0.1, + "final_train_acc": 0.186, + "final_val_acc": 0.1988, + "final_lyapunov": 0.9432953708921857, + "final_grad_norm": 0.6184321650421675, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.01, + "lambda_target": -0.2, + "final_train_acc": 0.18272, + "final_val_acc": 0.1921, + "final_lyapunov": 0.946702331380771, + "final_grad_norm": 0.6163956989755326, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.05, + "lambda_target": 0.0, + "final_train_acc": 0.16566, + "final_val_acc": 0.1805, + "final_lyapunov": 0.9517296686806642, + "final_grad_norm": 0.5857529188999518, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.05, + "lambda_target": -0.05, + "final_train_acc": 0.17794, + "final_val_acc": 0.1904, + "final_lyapunov": 0.948808985293064, + "final_grad_norm": 0.8242237658942144, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.05, + "lambda_target": -0.1, + "final_train_acc": 0.17408, + "final_val_acc": 0.1862, + "final_lyapunov": 0.9462877124776621, + "final_grad_norm": 0.9866581503705883, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.05, + "lambda_target": -0.2, + "final_train_acc": 0.09782, + "final_val_acc": 0.1, + "final_lyapunov": 0.9379962789433082, + "final_grad_norm": 0.08252957736853016, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.1, + "lambda_target": 0.0, + "final_train_acc": 0.16898, + "final_val_acc": 0.1826, + "final_lyapunov": 0.9547330970349519, + "final_grad_norm": 0.6566210459274582, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.1, + "lambda_target": -0.05, + "final_train_acc": 0.09818, + "final_val_acc": 0.1001, + "final_lyapunov": 0.9364221222565302, + "final_grad_norm": 0.08249123851656585, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.1, + "lambda_target": -0.1, + "final_train_acc": 0.16122, + "final_val_acc": 0.184, + "final_lyapunov": 0.9531408563599257, + "final_grad_norm": 1.3077979331200735, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.1, + "lambda_target": -0.2, + "final_train_acc": 0.16576, + "final_val_acc": 0.1771, + "final_lyapunov": 0.9479860334140261, + "final_grad_norm": 1.006747799591025, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.2, + "lambda_target": 0.0, + "final_train_acc": 0.15346, + "final_val_acc": 0.1789, + "final_lyapunov": 0.9490250833808919, + "final_grad_norm": 0.5347205469421413, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.2, + "lambda_target": -0.05, + "final_train_acc": 0.10152, + "final_val_acc": 0.1614, + "final_lyapunov": 0.9405348759782893, + "final_grad_norm": 1.8371456687852115, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.2, + "lambda_target": -0.1, + "final_train_acc": 0.09858, + "final_val_acc": 0.1, + "final_lyapunov": 0.9397584945344559, + "final_grad_norm": 0.0899413574774814, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.2, + "lambda_target": -0.2, + "final_train_acc": 0.09812, + "final_val_acc": 0.1, + "final_lyapunov": 0.9385917991628427, + "final_grad_norm": 0.08375695480428061, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.3, + "lambda_target": 0.0, + "final_train_acc": 0.09788, + "final_val_acc": 0.1, + "final_lyapunov": 0.9406521692300391, + "final_grad_norm": 0.08339080862058595, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.3, + "lambda_target": -0.05, + "final_train_acc": 0.0976, + "final_val_acc": 0.1, + "final_lyapunov": 0.9406559307252049, + "final_grad_norm": 0.08241204122770836, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "final_train_acc": 0.09784, + "final_val_acc": 0.1001, + "final_lyapunov": 0.9388094913319248, + "final_grad_norm": 0.0824405699507713, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 4, + "lambda_reg": 0.3, + "lambda_target": -0.2, + "final_train_acc": 0.09782, + "final_val_acc": 0.1, + "final_lyapunov": 0.9403619379033823, + "final_grad_norm": 0.08280762916104432, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.01, + "lambda_target": 0.0, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1385156285122533, + "final_grad_norm": 0.08287535503680316, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.01, + "lambda_target": -0.05, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.138988980856698, + "final_grad_norm": 0.08293673519739811, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.01, + "lambda_target": -0.1, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1391457858902718, + "final_grad_norm": 0.08288053033711852, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.01, + "lambda_target": -0.2, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.138157954911137, + "final_grad_norm": 0.08287555741773707, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.05, + "lambda_target": 0.0, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.139664650268262, + "final_grad_norm": 0.08294427145037926, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.05, + "lambda_target": -0.05, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1396977364864496, + "final_grad_norm": 0.0828774686357299, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.05, + "lambda_target": -0.1, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1413045710005114, + "final_grad_norm": 0.08286388617728013, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.05, + "lambda_target": -0.2, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1390106086535832, + "final_grad_norm": 0.08287740141317775, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.1, + "lambda_target": 0.0, + "final_train_acc": 0.097, + "final_val_acc": 0.1, + "final_lyapunov": 1.141337064221082, + "final_grad_norm": 0.08399748563857064, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.1, + "lambda_target": -0.05, + "final_train_acc": 0.09674, + "final_val_acc": 0.1, + "final_lyapunov": 1.1404877102283566, + "final_grad_norm": 0.08293794170822359, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.1, + "lambda_target": -0.1, + "final_train_acc": 0.0969, + "final_val_acc": 0.1, + "final_lyapunov": 1.140710405376561, + "final_grad_norm": 0.08314413205401962, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.1, + "lambda_target": -0.2, + "final_train_acc": 0.09636, + "final_val_acc": 0.1, + "final_lyapunov": 1.1404222932922872, + "final_grad_norm": 0.08296281348743317, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.2, + "lambda_target": 0.0, + "final_train_acc": 0.09782, + "final_val_acc": 0.1, + "final_lyapunov": 1.1415441371595767, + "final_grad_norm": 0.0828345253420129, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.2, + "lambda_target": -0.05, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1419490356274578, + "final_grad_norm": 0.08281989622138378, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.2, + "lambda_target": -0.1, + "final_train_acc": 0.09672, + "final_val_acc": 0.1, + "final_lyapunov": 1.1404405426796136, + "final_grad_norm": 0.08283674106810397, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.2, + "lambda_target": -0.2, + "final_train_acc": 0.09614, + "final_val_acc": 0.1, + "final_lyapunov": 1.1409168340970792, + "final_grad_norm": 0.08286801169721057, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.3, + "lambda_target": 0.0, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1420772383585, + "final_grad_norm": 0.08282499803728872, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.3, + "lambda_target": -0.05, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1412645739972438, + "final_grad_norm": 0.08392543470742864, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "final_train_acc": 0.09628, + "final_val_acc": 0.1, + "final_lyapunov": 1.1425321044214547, + "final_grad_norm": 0.08283797434789233, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 6, + "lambda_reg": 0.3, + "lambda_target": -0.2, + "final_train_acc": 0.09642, + "final_val_acc": 0.1, + "final_lyapunov": 1.1405771723793596, + "final_grad_norm": 0.08283968811672689, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.01, + "lambda_target": 0.0, + "final_train_acc": 0.09606, + "final_val_acc": 0.1, + "final_lyapunov": 1.282112029507337, + "final_grad_norm": 0.08238888704245423, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.01, + "lambda_target": -0.05, + "final_train_acc": 0.09618, + "final_val_acc": 0.1, + "final_lyapunov": 1.28174534874499, + "final_grad_norm": 0.08231914116363483, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.01, + "lambda_target": -0.1, + "final_train_acc": 0.09606, + "final_val_acc": 0.1001, + "final_lyapunov": 1.2825916834804407, + "final_grad_norm": 0.08258902578018723, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.01, + "lambda_target": -0.2, + "final_train_acc": 0.09618, + "final_val_acc": 0.1, + "final_lyapunov": 1.2820049259058959, + "final_grad_norm": 0.08232743477986716, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.05, + "lambda_target": 0.0, + "final_train_acc": 0.09606, + "final_val_acc": 0.1, + "final_lyapunov": 1.2829882177855352, + "final_grad_norm": 0.08233253899320181, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.05, + "lambda_target": -0.05, + "final_train_acc": 0.09606, + "final_val_acc": 0.1, + "final_lyapunov": 1.283354894279519, + "final_grad_norm": 0.08233173174046388, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.05, + "lambda_target": -0.1, + "final_train_acc": 0.09622, + "final_val_acc": 0.1, + "final_lyapunov": 1.283211630933425, + "final_grad_norm": 0.0824676591114568, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.05, + "lambda_target": -0.2, + "final_train_acc": 0.09672, + "final_val_acc": 0.1, + "final_lyapunov": 1.2829850515746095, + "final_grad_norm": 0.08519084401251485, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.1, + "lambda_target": 0.0, + "final_train_acc": 0.0963, + "final_val_acc": 0.1, + "final_lyapunov": 1.2835611769610353, + "final_grad_norm": 0.082416774166316, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.1, + "lambda_target": -0.05, + "final_train_acc": 0.09614, + "final_val_acc": 0.1, + "final_lyapunov": 1.2845280630814144, + "final_grad_norm": 0.08767280341035139, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.1, + "lambda_target": -0.1, + "final_train_acc": 0.09742, + "final_val_acc": 0.1, + "final_lyapunov": 1.2838158720289654, + "final_grad_norm": 0.08568109147029492, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.1, + "lambda_target": -0.2, + "final_train_acc": 0.096, + "final_val_acc": 0.1, + "final_lyapunov": 1.2840089212598094, + "final_grad_norm": 0.08227305794056056, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.2, + "lambda_target": 0.0, + "final_train_acc": 0.09638, + "final_val_acc": 0.1, + "final_lyapunov": 1.2844933588486498, + "final_grad_norm": 0.08512696672137617, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.2, + "lambda_target": -0.05, + "final_train_acc": 0.09618, + "final_val_acc": 0.1, + "final_lyapunov": 1.2843177443575067, + "final_grad_norm": 0.08231501883595474, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.2, + "lambda_target": -0.1, + "final_train_acc": 0.09604, + "final_val_acc": 0.1, + "final_lyapunov": 1.2844979894130737, + "final_grad_norm": 0.08260603178077829, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.2, + "lambda_target": -0.2, + "final_train_acc": 0.09618, + "final_val_acc": 0.1, + "final_lyapunov": 1.2838659871874563, + "final_grad_norm": 0.08228155133296543, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.3, + "lambda_target": 0.0, + "final_train_acc": 0.0957, + "final_val_acc": 0.1, + "final_lyapunov": 1.2848752886438004, + "final_grad_norm": 0.08245992869877969, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.3, + "lambda_target": -0.05, + "final_train_acc": 0.09692, + "final_val_acc": 0.1, + "final_lyapunov": 1.2840831913911472, + "final_grad_norm": 0.0823793461016338, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "final_train_acc": 0.09626, + "final_val_acc": 0.1, + "final_lyapunov": 1.2847454633249347, + "final_grad_norm": 0.08265625463299375, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 8, + "lambda_reg": 0.3, + "lambda_target": -0.2, + "final_train_acc": 0.09618, + "final_val_acc": 0.1, + "final_lyapunov": 1.2837977290458387, + "final_grad_norm": 0.08227328030081477, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.01, + "lambda_target": 0.0, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3936041294766204, + "final_grad_norm": 0.0810773216211147, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.01, + "lambda_target": -0.05, + "final_train_acc": 0.09794, + "final_val_acc": 0.1, + "final_lyapunov": 1.3934821189212068, + "final_grad_norm": 0.08108704666671128, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.01, + "lambda_target": -0.1, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3931444648586575, + "final_grad_norm": 0.08108521605893095, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.01, + "lambda_target": -0.2, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3935116352632528, + "final_grad_norm": 0.08108062104446316, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.05, + "lambda_target": 0.0, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3949058507104664, + "final_grad_norm": 0.08108257712636058, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.05, + "lambda_target": -0.05, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3947931890902312, + "final_grad_norm": 0.0810832896708942, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.05, + "lambda_target": -0.1, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.394568802450624, + "final_grad_norm": 0.0810773571533469, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.05, + "lambda_target": -0.2, + "final_train_acc": 0.0984, + "final_val_acc": 0.1, + "final_lyapunov": 1.3954170716693028, + "final_grad_norm": 0.08778735801635837, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.1, + "lambda_target": 0.0, + "final_train_acc": 0.0972, + "final_val_acc": 0.1, + "final_lyapunov": 1.3952556305834094, + "final_grad_norm": 0.09052299104974379, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.1, + "lambda_target": -0.05, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3948042667125498, + "final_grad_norm": 0.08116479991900416, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.1, + "lambda_target": -0.1, + "final_train_acc": 0.09744, + "final_val_acc": 0.1, + "final_lyapunov": 1.3950299341660326, + "final_grad_norm": 0.08177695089641489, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.1, + "lambda_target": -0.2, + "final_train_acc": 0.09792, + "final_val_acc": 0.1, + "final_lyapunov": 1.3952085682193336, + "final_grad_norm": 0.08119665047385813, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.2, + "lambda_target": 0.0, + "final_train_acc": 0.09716, + "final_val_acc": 0.1, + "final_lyapunov": 1.3955303390922449, + "final_grad_norm": 0.08152741514663026, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.2, + "lambda_target": -0.05, + "final_train_acc": 0.09796, + "final_val_acc": 0.1, + "final_lyapunov": 1.396121849489334, + "final_grad_norm": 0.08563396405027882, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.2, + "lambda_target": -0.1, + "final_train_acc": 0.0985, + "final_val_acc": 0.1, + "final_lyapunov": 1.3953984298974351, + "final_grad_norm": 0.0819596680368273, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.2, + "lambda_target": -0.2, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.3953755539091652, + "final_grad_norm": 0.08102330433994928, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.3, + "lambda_target": 0.0, + "final_train_acc": 0.09772, + "final_val_acc": 0.1, + "final_lyapunov": 1.3954071937619572, + "final_grad_norm": 0.08165895073173139, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.3, + "lambda_target": -0.05, + "final_train_acc": 0.09806, + "final_val_acc": 0.1, + "final_lyapunov": 1.395664310516299, + "final_grad_norm": 0.0810914615806199, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "final_train_acc": 0.09802, + "final_val_acc": 0.1, + "final_lyapunov": 1.395855899966891, + "final_grad_norm": 0.08103700774993476, + "converged": true, + "epochs_to_90pct": -1 + }, + { + "depth": 10, + "lambda_reg": 0.3, + "lambda_target": -0.2, + "final_train_acc": 0.09788, + "final_val_acc": 0.1, + "final_lyapunov": 1.3956506441316336, + "final_grad_norm": 0.08102633202138995, + "converged": true, + "epochs_to_90pct": -1 + } + ] +}
\ No newline at end of file diff --git a/runs/grid_search_cifar10/20251230-134445/optimal_hyperparameters.png b/runs/grid_search_cifar10/20251230-134445/optimal_hyperparameters.png Binary files differnew file mode 100644 index 0000000..86de782 --- /dev/null +++ b/runs/grid_search_cifar10/20251230-134445/optimal_hyperparameters.png |
