diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-06-13 12:35:36 -0500 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-06-13 12:35:36 -0500 |
| commit | 66e0d8b9fd4d0f7a2231d689c055e26fdf1cf04a (patch) | |
| tree | c29cba61124018755a19b02c9d33e3ad5f2e05cc /research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json | |
Curated export for clone-and-run Maze training (2x A6000) + diagnostics.
trm/hrm pretrain.py carry trajectory-augmentation code (backward-compatible).
Heavy artifacts (checkpoints/wandb/npz) gitignored; see PROVENANCE.md.
Co-Authored-By: Claude Fable 5 <noreply@anthropic.com>
Diffstat (limited to 'research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json')
| -rw-r--r-- | research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json | 179 |
1 files changed, 179 insertions, 0 deletions
diff --git a/research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json b/research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json new file mode 100644 index 0000000..87d5d4b --- /dev/null +++ b/research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json @@ -0,0 +1,179 @@ +{ + "config": { + "hidden_size": 80, + "train_epochs": 1000, + "inter_period": 100, + "inter_epochs": 100, + "pre_epochs": 100, + "max_inter_episodes": 0, + "batch_size": 16, + "input_dim": 1, + "train_steps": 300, + "lyap_steps": 55, + "floss_input_steps": 300, + "seed_ic": 1, + "seed_input": 1, + "seed_net": 1, + "seed_ons": 1, + "lr": 0.001, + "beta1": 0.9, + "beta2": 0.999, + "init_type": 1, + "recurrent_gain": 1.0, + "recurrent_mean_gain": 0.0, + "input_scale": 1.0, + "delay": 10, + "ws_std": 1.0, + "ws_mean": 0.0, + "wr_std": 1.0, + "wr_mean": 0.0, + "b_std": 0.1, + "b_mean": 0.0, + "n_lyap": 40, + "task": -1, + "lyap_target": 0.0, + "eval_every": 100, + "eval_batches": 4, + "log_every_floss": 25, + "device": "cuda", + "out": "research/flossing/engelken_python/official_py_prefloss_N80_k40_E1000_setsid.json" + }, + "evals": [ + { + "epoch": 1, + "train_loss": 1.8594624996185303, + "train_accuracy": 0.49777580071174377, + "eval_loss": 1.6856758892536163, + "eval_accuracy": 0.5019461743772242, + "elapsed": 6.69805383682251 + }, + { + "epoch": 100, + "train_loss": 0.11722302436828613, + "train_accuracy": 0.964635231316726, + "eval_loss": 0.11776464246213436, + "eval_accuracy": 0.9623554270462634, + "elapsed": 21.55224633216858 + }, + { + "epoch": 200, + "train_loss": 0.028137803077697754, + "train_accuracy": 0.9931049822064056, + "eval_loss": 0.027145093772560358, + "eval_accuracy": 0.9935498220640568, + "elapsed": 36.35071516036987 + }, + { + "epoch": 300, + "train_loss": 0.012114334851503372, + "train_accuracy": 0.9975533807829181, + "eval_loss": 0.014187443535774946, + "eval_accuracy": 0.9963300711743772, + "elapsed": 50.83105397224426 + }, + { + "epoch": 400, + "train_loss": 0.008550425991415977, + "train_accuracy": 0.9986654804270463, + "eval_loss": 0.009522247593849897, + "eval_accuracy": 0.9975533807829181, + "elapsed": 65.30040979385376 + }, + { + "epoch": 500, + "train_loss": 0.006629249546676874, + "train_accuracy": 0.998220640569395, + "eval_loss": 0.009814425837248564, + "eval_accuracy": 0.9973865658362989, + "elapsed": 79.79007005691528 + }, + { + "epoch": 600, + "train_loss": 0.007227692287415266, + "train_accuracy": 0.998220640569395, + "eval_loss": 0.006339075975120068, + "eval_accuracy": 0.9983874555160143, + "elapsed": 94.47823691368103 + }, + { + "epoch": 700, + "train_loss": 0.00907257292419672, + "train_accuracy": 0.9979982206405694, + "eval_loss": 0.008150239707902074, + "eval_accuracy": 0.9981094306049823, + "elapsed": 109.5779447555542 + }, + { + "epoch": 800, + "train_loss": 0.005422760266810656, + "train_accuracy": 0.998220640569395, + "eval_loss": 0.006329314899630845, + "eval_accuracy": 0.9981650355871887, + "elapsed": 124.25900483131409 + }, + { + "epoch": 900, + "train_loss": 0.0072866384871304035, + "train_accuracy": 0.998220640569395, + "eval_loss": 0.0068275314988568425, + "eval_accuracy": 0.9981650355871886, + "elapsed": 138.78803777694702 + }, + { + "epoch": 1000, + "train_loss": 0.010031766258180141, + "train_accuracy": 0.9973309608540926, + "eval_loss": 0.01047352165915072, + "eval_accuracy": 0.9972753558718862, + "elapsed": 153.229962348938 + } + ], + "floss": [ + { + "epoch": 1, + "kind": "pre", + "floss_step": 1, + "loss": 0.2797410190105438, + "lambda_mean": -0.507389485836029, + "lambda_1": -0.2639281749725342, + "elapsed": 0.7526497840881348 + }, + { + "epoch": 1, + "kind": "pre", + "floss_step": 25, + "loss": 0.09786238521337509, + "lambda_mean": -0.29911166429519653, + "lambda_1": -0.1687435507774353, + "elapsed": 2.0286896228790283 + }, + { + "epoch": 1, + "kind": "pre", + "floss_step": 50, + "loss": 0.04969814047217369, + "lambda_mean": -0.21222734451293945, + "lambda_1": -0.13751955330371857, + "elapsed": 3.3226377964019775 + }, + { + "epoch": 1, + "kind": "pre", + "floss_step": 75, + "loss": 0.02838609553873539, + "lambda_mean": -0.1609755903482437, + "lambda_1": -0.10771095007658005, + "elapsed": 4.703521490097046 + }, + { + "epoch": 1, + "kind": "pre", + "floss_step": 100, + "loss": 0.00937537383288145, + "lambda_mean": -0.09084373712539673, + "lambda_1": -0.053737666457891464, + "elapsed": 6.211953639984131 + } + ], + "task": [] +}
\ No newline at end of file |
