summaryrefslogtreecommitdiff
path: root/research/flossing/ptrm_same_subset
diff options
context:
space:
mode:
Diffstat (limited to 'research/flossing/ptrm_same_subset')
-rw-r--r--research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json15
-rw-r--r--research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv2
-rw-r--r--research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json15
-rw-r--r--research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv2
-rw-r--r--research/flossing/ptrm_same_subset/paired_ptrm_k100_n1000_seed0_summary.csv2
5 files changed, 36 insertions, 0 deletions
diff --git a/research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json b/research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json
new file mode 100644
index 0000000..843c266
--- /dev/null
+++ b/research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json
@@ -0,0 +1,15 @@
+{
+ "batch_size": 64,
+ "ckpt_name": "step_58590",
+ "ckpt_root": "trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro",
+ "fd_eps": 0.01,
+ "fd_lyap": false,
+ "fd_spectrum_k": 0,
+ "include_clean": false,
+ "n_samples": 10000,
+ "noise_std": 0.3,
+ "perturb": "l",
+ "rollouts": 25,
+ "seed": 20260602,
+ "steps": 64
+} \ No newline at end of file
diff --git a/research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv b/research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv
new file mode 100644
index 0000000..16c5a1b
--- /dev/null
+++ b/research/flossing/ptrm_same_subset/base58590_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv
@@ -0,0 +1,2 @@
+correct_count/det_fail_mean,correct_count/det_success_mean,correct_count/full_frac,correct_count/ge_10_frac,correct_count/ge_1_frac,correct_count/ge_25_frac,correct_count/ge_5_frac,correct_count/mean,correct_count/median,correct_count/q10,correct_count/q25,correct_count/q75,correct_count/q90,correct_count/std,correct_count/zero_frac,deterministic/exact,deterministic/token_acc,fd_lyap,fd_spectrum_k,include_clean,mean_rollout/exact,mean_rollout/token_acc,n_samples,noise_std,oracle_pass/det_fail_frac,oracle_pass/det_success_frac,oracle_pass/exact,oracle_pass/token_acc,perturb_both,perturb_h,perturb_l,q_max/det_fail_frac,q_max/det_success_frac,q_max/exact,q_max/token_acc,q_mean,rollout0/exact,rollout0/token_acc,rollouts,steps
+13.544709205627441,24.74855613708496,0.847599983215332,0.944599986076355,0.9776999950408936,0.847599983215332,0.9599999785423279,23.2450008392334,25.0,20.0,25.0,25.0,25.0,5.4259724617004395,0.022299999371170998,0.8658000230789185,0.9498122930526733,0.0,0.0,0.0,0.9297999739646912,0.9728542566299438,10000.0,0.3,0.8338301181793213,1.0,0.9776999950408936,0.9922346472740173,0.0,0.0,1.0,0.8338301181793213,0.9998844861984253,0.9775999784469604,0.9908208847045898,6.504925727844238,0.9284999966621399,0.9722283482551575,25.0,64.0
diff --git a/research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json b/research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json
new file mode 100644
index 0000000..dee5762
--- /dev/null
+++ b/research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.meta.json
@@ -0,0 +1,15 @@
+{
+ "batch_size": 64,
+ "ckpt_name": "step_35805",
+ "ckpt_root": "trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_multi4_loguniform_repro",
+ "fd_eps": 0.01,
+ "fd_lyap": false,
+ "fd_spectrum_k": 0,
+ "include_clean": false,
+ "n_samples": 10000,
+ "noise_std": 0.3,
+ "perturb": "l",
+ "rollouts": 25,
+ "seed": 20260602,
+ "steps": 64
+} \ No newline at end of file
diff --git a/research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv b/research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv
new file mode 100644
index 0000000..f991531
--- /dev/null
+++ b/research/flossing/ptrm_same_subset/multi4_35805_k25_d64_sigma03_Lonly_n10000_seed20260602.summary.csv
@@ -0,0 +1,2 @@
+correct_count/det_fail_mean,correct_count/det_success_mean,correct_count/full_frac,correct_count/ge_10_frac,correct_count/ge_1_frac,correct_count/ge_25_frac,correct_count/ge_5_frac,correct_count/mean,correct_count/median,correct_count/q10,correct_count/q25,correct_count/q75,correct_count/q90,correct_count/std,correct_count/zero_frac,deterministic/exact,deterministic/token_acc,fd_lyap,fd_spectrum_k,include_clean,mean_rollout/exact,mean_rollout/token_acc,n_samples,noise_std,oracle_pass/det_fail_frac,oracle_pass/det_success_frac,oracle_pass/exact,oracle_pass/token_acc,perturb_both,perturb_h,perturb_l,q_max/det_fail_frac,q_max/det_success_frac,q_max/exact,q_max/token_acc,q_mean,rollout0/exact,rollout0/token_acc,rollouts,steps
+13.846529960632324,24.8140811920166,0.8842999935150146,0.9599000215530396,0.9828000068664551,0.8842999935150146,0.9696999788284302,23.692100524902344,25.0,24.0,25.0,25.0,25.0,4.753871917724609,0.01720000058412552,0.8977000117301941,0.9607678651809692,0.0,0.0,0.0,0.9476839900016785,0.9795129895210266,10000.0,0.3,0.8328445553779602,0.9998885989189148,0.9828000068664551,0.9940740466117859,0.0,0.0,1.0,0.829912006855011,0.9995543956756592,0.982200026512146,0.9926013946533203,6.862946510314941,0.9480999708175659,0.979781448841095,25.0,64.0
diff --git a/research/flossing/ptrm_same_subset/paired_ptrm_k100_n1000_seed0_summary.csv b/research/flossing/ptrm_same_subset/paired_ptrm_k100_n1000_seed0_summary.csv
new file mode 100644
index 0000000..8122604
--- /dev/null
+++ b/research/flossing/ptrm_same_subset/paired_ptrm_k100_n1000_seed0_summary.csv
@@ -0,0 +1,2 @@
+n,rollouts,base_det,multi4_det,delta_det,base_mean_rollout,multi4_mean_rollout,delta_mean_rollout,base_qmax,multi4_qmax,delta_qmax,base_oracle,multi4_oracle,delta_oracle,base_correct_count_mean,multi4_correct_count_mean,delta_correct_count_mean,det_base_only_frac,det_multi4_only_frac,oracle_base_only_frac,oracle_multi4_only_frac
+1000,100,0.887,0.911,0.02400000000000002,0.94188,0.95417,0.012289999999999912,0.984,0.988,0.0040000000000000036,0.985,0.988,0.0030000000000000027,94.188,95.417,1.2289999999999992,0.034,0.058,0.001,0.004