summaryrefslogtreecommitdiff
path: root/directional_lyap_perturb_eps_sweep/trm_baseline_best_step58590_n1000_c8_fdeps003.summary.csv
blob: 696a9e917dd17640789f69c16420f55d4f34cedc (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
label,perturb_after,sigma,n_samples,candidates,fd_eps,ckpt_root,ckpt_name,clean_acc,mean_sign_exact,mean_sign_token_acc,worst_sign_exact,best_sign_exact,selected_growth_mean,selected_growth_q90,retain_mean_on_clean_success,retain_worst_on_clean_success,rescue_mean_on_clean_fail,rescue_best_on_clean_fail
trm_baseline_best,0,0.0,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8949999809265137,0.961814820766449,0.8949999809265137,0.8949999809265137,0.4821663796901703,0.5784756541252136,1.0,1.0,0.0,0.0
trm_baseline_best,0,0.001,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8949999809265137,0.961814820766449,0.8949999809265137,0.8949999809265137,0.4821663796901703,0.5784756541252136,1.0,1.0,0.0,0.0
trm_baseline_best,0,0.003,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8980000019073486,0.9630987644195557,0.8790000081062317,0.9169999957084656,0.4821663796901703,0.5784756541252136,0.9893854856491089,0.9798882603645325,0.1190476194024086,0.21904762089252472
trm_baseline_best,0,0.01,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.887499988079071,0.9590184688568115,0.8600000143051147,0.9150000214576721,0.4821663796901703,0.5784756541252136,0.9653631448745728,0.9463686943054199,0.22380952537059784,0.32380953431129456
trm_baseline_best,0,0.03,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8895000219345093,0.9602900743484497,0.8619999885559082,0.9169999957084656,0.4821663796901703,0.5784756541252136,0.9670391082763672,0.9508379697799683,0.22857142984867096,0.3523809611797333
trm_baseline_best,0,0.1,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8949999809265137,0.8930000066757202,0.961030900478363,0.8619999885559082,0.9240000247955322,0.4821663796901703,0.5784756541252136,0.9670391082763672,0.9474860429763794,0.261904776096344,0.39047619700431824
trm_baseline_best,4,0.0,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8980000019073486,0.9629135727882385,0.8980000019073486,0.8980000019073486,0.5513403415679932,0.7693743705749512,1.0,1.0,0.0,0.0
trm_baseline_best,4,0.001,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8955000042915344,0.9619382619857788,0.8899999856948853,0.9010000228881836,0.5513403415679932,0.7693743705749512,0.9955456852912903,0.9910913109779358,0.014705882407724857,0.029411764815449715
trm_baseline_best,4,0.003,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8880000114440918,0.9597716331481934,0.8669999837875366,0.9089999794960022,0.5513403415679932,0.7693743705749512,0.9716035723686218,0.9599109292030334,0.15196079015731812,0.2549019753932953
trm_baseline_best,4,0.01,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8934999704360962,0.9613086581230164,0.8700000047683716,0.9169999957084656,0.5513403415679932,0.7693743705749512,0.9738307595252991,0.9610245227813721,0.18627451360225677,0.30392158031463623
trm_baseline_best,4,0.03,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.890999972820282,0.9601975083351135,0.8650000095367432,0.9169999957084656,0.5513403415679932,0.7693743705749512,0.9688196182250977,0.9510022401809692,0.20588235557079315,0.30392158031463623
trm_baseline_best,4,0.1,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8980000019073486,0.8880000114440918,0.9588024616241455,0.8640000224113464,0.9120000004768372,0.5513403415679932,0.7693743705749512,0.9699332118034363,0.955456554889679,0.1666666716337204,0.27450981736183167
trm_baseline_best,8,0.0,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8970000147819519,0.9637901186943054,0.8970000147819519,0.8970000147819519,0.6981183886528015,1.082965612411499,1.0,1.0,0.0,0.0
trm_baseline_best,8,0.001,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8974999785423279,0.963746964931488,0.8939999938011169,0.9010000228881836,0.6981183886528015,1.082965612411499,0.9983277320861816,0.9966555237770081,0.019417475908994675,0.03883495181798935
trm_baseline_best,8,0.003,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8934999704360962,0.9613950848579407,0.8769999742507935,0.9100000262260437,0.6981183886528015,1.082965612411499,0.9793757200241089,0.9698996543884277,0.1456310749053955,0.223300963640213
trm_baseline_best,8,0.01,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8914999961853027,0.9603024125099182,0.8759999871253967,0.9070000052452087,0.6981183886528015,1.082965612411499,0.9788182973861694,0.9710144996643066,0.13106796145439148,0.21359223127365112
trm_baseline_best,8,0.03,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8985000252723694,0.9633148312568665,0.8820000290870667,0.9150000214576721,0.6981183886528015,1.082965612411499,0.9816053509712219,0.9743589758872986,0.17475728690624237,0.27184465527534485
trm_baseline_best,8,0.1,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8970000147819519,0.8920000195503235,0.9607345461845398,0.8790000081062317,0.9049999713897705,0.6981183886528015,1.082965612411499,0.97826087474823,0.9698996543884277,0.14077669382095337,0.19417475163936615
trm_baseline_best,12,0.0,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8930000066757202,0.9613826274871826,0.8930000066757202,0.8930000066757202,1.2681450843811035,2.1185879707336426,1.0,1.0,0.0,0.0
trm_baseline_best,12,0.001,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8914999961853027,0.9607530236244202,0.8899999856948853,0.8930000066757202,1.2681450843811035,2.1185879707336426,0.9983202815055847,0.9966405630111694,0.0,0.0
trm_baseline_best,12,0.003,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8930000066757202,0.9613209962844849,0.8880000114440918,0.8980000019073486,1.2681450843811035,2.1185879707336426,0.9955207109451294,0.9921612739562988,0.037383176386356354,0.05607476457953453
trm_baseline_best,12,0.01,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8899999856948853,0.9602900743484497,0.8849999904632568,0.8949999809265137,1.2681450843811035,2.1185879707336426,0.9904814958572388,0.9888017773628235,0.05140186846256256,0.08411215245723724
trm_baseline_best,12,0.03,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.890999972820282,0.9605308175086975,0.8870000243186951,0.8949999809265137,1.2681450843811035,2.1185879707336426,0.9921612739562988,0.9910414218902588,0.04672897234559059,0.07476635277271271
trm_baseline_best,12,0.1,1000,8,0.03,/home/yurenh2/rrm/trm/checkpoints/Sudoku-extreme-1k-aug-1000-ACT-torch/pretrain_mlp_t_sudoku_official_gbs768_repro,step_58590,0.8930000066757202,0.8895000219345093,0.9602345824241638,0.8840000033378601,0.8949999809265137,1.2681450843811035,2.1185879707336426,0.9921612739562988,0.9899216294288635,0.032710280269384384,0.06542056053876877