summaryrefslogtreecommitdiff
path: root/directional_lyap_perturb_eps_sweep/trm_baseline_best_step58590_n1000_c8_fdeps001.summary.csv
blob: fe53bc3b34b4378a35393ecd262332a6f4b516b4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
label,perturb_after,sigma,n_samples,candidates,fd_eps,ckpt_root,ckpt_name,clean_acc,mean_sign_exact,mean_sign_token_acc,worst_sign_exact,best_sign_exact,selected_growth_mean,selected_growth_q90,retain_mean_on_clean_success,retain_worst_on_clean_success,rescue_mean_on_clean_fail,rescue_best_on_clean_fail
trm_baseline_best,0,0.0,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8949999809265137,0.961814820766449,0.8949999809265137,0.8949999809265137,0.5487902164459229,0.6468369364738464,1.0,1.0,0.0,0.0
trm_baseline_best,0,0.001,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8949999809265137,0.961814820766449,0.8949999809265137,0.8949999809265137,0.5487902164459229,0.6468369364738464,1.0,1.0,0.0,0.0
trm_baseline_best,0,0.003,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8934999704360962,0.961506187915802,0.8790000081062317,0.9079999923706055,0.5487902164459229,0.6468369364738464,0.9905027747154236,0.9821228981018066,0.06666667014360428,0.13333334028720856
trm_baseline_best,0,0.01,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.890500009059906,0.9606789350509644,0.8539999723434448,0.9269999861717224,0.5487902164459229,0.6468369364738464,0.9631285071372986,0.9396647810935974,0.27142858505249023,0.41904762387275696
trm_baseline_best,0,0.03,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8859999775886536,0.9576419591903687,0.8610000014305115,0.9110000133514404,0.5487902164459229,0.6468369364738464,0.9642457962036133,0.9486033320426941,0.21904762089252472,0.32380953431129456
trm_baseline_best,0,0.1,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.890500009059906,0.9597654342651367,0.8579999804496765,0.9229999780654907,0.5487902164459229,0.6468369364738464,0.9653631448745728,0.9474860429763794,0.25238096714019775,0.4095238149166107
trm_baseline_best,4,0.0,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8980000019073486,0.9629135727882385,0.8980000019073486,0.8980000019073486,0.6417636275291443,0.8611953854560852,1.0,1.0,0.0,0.0
trm_baseline_best,4,0.001,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8974999785423279,0.9625309109687805,0.8920000195503235,0.902999997138977,0.6417636275291443,0.8611953854560852,0.9966592192649841,0.993318498134613,0.02450980432331562,0.04901960864663124
trm_baseline_best,4,0.003,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8934999704360962,0.9609135389328003,0.8659999966621399,0.9210000038146973,0.6417636275291443,0.8611953854560852,0.9760578870773315,0.9587973356246948,0.1666666716337204,0.28431373834609985
trm_baseline_best,4,0.01,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8859999775886536,0.9590432047843933,0.8629999756813049,0.9089999794960022,0.6417636275291443,0.8611953854560852,0.9660356640815735,0.948775053024292,0.18137255311012268,0.2549019753932953
trm_baseline_best,4,0.03,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8840000033378601,0.957679033279419,0.8560000061988831,0.9120000004768372,0.6417636275291443,0.8611953854560852,0.9649220705032349,0.9476614594459534,0.1715686321258545,0.29411765933036804
trm_baseline_best,4,0.1,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8889999985694885,0.9591296315193176,0.8629999756813049,0.9150000214576721,0.6417636275291443,0.8611953854560852,0.9671491980552673,0.9521158337593079,0.20098039507865906,0.3235294222831726
trm_baseline_best,8,0.0,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8970000147819519,0.9637901186943054,0.8970000147819519,0.8970000147819519,0.8348738551139832,1.2223771810531616,1.0,1.0,0.0,0.0
trm_baseline_best,8,0.001,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8970000147819519,0.9635308980941772,0.8939999938011169,0.8999999761581421,0.8348738551139832,1.2223771810531616,0.997770369052887,0.9966555237770081,0.019417475908994675,0.03883495181798935
trm_baseline_best,8,0.003,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8964999914169312,0.9620987772941589,0.8769999742507935,0.9160000085830688,0.8348738551139832,1.2223771810531616,0.9832776188850403,0.9732441306114197,0.14077669382095337,0.24271844327449799
trm_baseline_best,8,0.01,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8945000171661377,0.9619569182395935,0.8790000081062317,0.9100000262260437,0.8348738551139832,1.2223771810531616,0.9777034521102905,0.9732441306114197,0.16990290582180023,0.28155338764190674
trm_baseline_best,8,0.03,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8964999914169312,0.9622469544410706,0.8809999823570251,0.9120000004768372,0.8348738551139832,1.2223771810531616,0.9821627736091614,0.9754738211631775,0.15048544108867645,0.24271844327449799
trm_baseline_best,8,0.1,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.890500009059906,0.9603580236434937,0.875,0.906000018119812,0.8348738551139832,1.2223771810531616,0.9771460294723511,0.9676700234413147,0.13592232763767242,0.20388349890708923
trm_baseline_best,12,0.0,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8930000066757202,0.9613826274871826,0.8930000066757202,0.8930000066757202,1.5429991483688354,2.3959367275238037,1.0,1.0,0.0,0.0
trm_baseline_best,12,0.001,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8924999833106995,0.961481511592865,0.8920000195503235,0.8930000066757202,1.5429991483688354,2.3959367275238037,0.99944007396698,0.9988802075386047,0.0,0.0
trm_baseline_best,12,0.003,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8914999961853027,0.9610123634338379,0.8859999775886536,0.8970000147819519,1.5429991483688354,2.3959367275238037,0.9938409924507141,0.9910414218902588,0.037383176386356354,0.06542056053876877
trm_baseline_best,12,0.01,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8914999961853027,0.9606543183326721,0.8849999904632568,0.8980000019073486,1.5429991483688354,2.3959367275238037,0.9921612739562988,0.9899216294288635,0.05140186846256256,0.09345794469118118
trm_baseline_best,12,0.03,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8930000066757202,0.9610803127288818,0.8849999904632568,0.9010000228881836,1.5429991483688354,2.3959367275238037,0.9927211403846741,0.9899216294288635,0.0607476644217968,0.11214952915906906
trm_baseline_best,12,0.1,1000,8,0.01,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8930000066757202,0.961530864238739,0.8859999775886536,0.8999999761581421,1.5429991483688354,2.3959367275238037,0.9938409924507141,0.9910414218902588,0.05140186846256256,0.09345794469118118