summaryrefslogtreecommitdiff
path: root/results/boundary_ablation_s456/ablation_a1.0_L4_s456.json
blob: 29afee7c2f97cf865e42a28e80e5f593b235188b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
{
  "s_eT_tgw1.0_wr0.2": {
    "test_acc": 0.4935,
    "mean_bp_cosine": 0.49867621809244156,
    "mean_rho": 0.5327592641115189,
    "mean_nudge": -0.04268983006477356,
    "bp_cosine_per_layer": [
      0.21021124720573425,
      0.5842739939689636,
      0.5913121700286865,
      0.6089074611663818
    ],
    "rho_per_layer": [
      0.24787980318069458,
      0.6222057342529297,
      0.6273762583732605,
      0.6335752606391907
    ],
    "final_value_loss": 0.4651986366271973,
    "s_type": "eT",
    "term_grad_weight": 1.0,
    "warmup_ratio": 0.2
  },
  "s_deltaL_tgw1.0_wr0.2": {
    "test_acc": 0.4805,
    "mean_bp_cosine": 0.572130560874939,
    "mean_rho": 0.5290974006056786,
    "mean_nudge": -0.05305152013897896,
    "bp_cosine_per_layer": [
      0.3073272705078125,
      0.6108690500259399,
      0.6810163259506226,
      0.6893095970153809
    ],
    "rho_per_layer": [
      0.33536288142204285,
      0.6113735437393188,
      0.6066526174545288,
      0.5630005598068237
    ],
    "final_value_loss": 0.48287113523483277,
    "s_type": "deltaL",
    "term_grad_weight": 1.0,
    "warmup_ratio": 0.2
  }
}