summaryrefslogtreecommitdiff
path: root/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json')
-rw-r--r--results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json90
1 files changed, 90 insertions, 0 deletions
diff --git a/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json b/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json
new file mode 100644
index 0000000..8a70394
--- /dev/null
+++ b/results/boundary_ablation_tgw_sweep/ablation_a1.0_L4_s42.json
@@ -0,0 +1,90 @@
+{
+ "s_eT_tgw0.0_wr0.2": {
+ "test_acc": 0.532,
+ "mean_bp_cosine": 0.11989971622824669,
+ "mean_rho": 0.16079141944646835,
+ "mean_nudge": -0.010690351715311408,
+ "bp_cosine_per_layer": [
+ 0.03718709945678711,
+ 0.1347142904996872,
+ 0.15199805796146393,
+ 0.15569941699504852
+ ],
+ "rho_per_layer": [
+ 0.08883650600910187,
+ 0.1502864807844162,
+ 0.20964613556861877,
+ 0.19439655542373657
+ ],
+ "final_value_loss": 0.07598549057245255,
+ "s_type": "eT",
+ "term_grad_weight": 0.0,
+ "warmup_ratio": 0.2
+ },
+ "s_eT_tgw0.25_wr0.2": {
+ "test_acc": 0.558,
+ "mean_bp_cosine": 0.22698336280882359,
+ "mean_rho": 0.2679573856294155,
+ "mean_nudge": -0.0202574310824275,
+ "bp_cosine_per_layer": [
+ 0.09379873424768448,
+ 0.2528688311576843,
+ 0.2722504138946533,
+ 0.2890154719352722
+ ],
+ "rho_per_layer": [
+ 0.13511960208415985,
+ 0.289243221282959,
+ 0.33815300464630127,
+ 0.30931371450424194
+ ],
+ "final_value_loss": 0.16253001551628113,
+ "s_type": "eT",
+ "term_grad_weight": 0.25,
+ "warmup_ratio": 0.2
+ },
+ "s_eT_tgw1.0_wr0.2": {
+ "test_acc": 0.558,
+ "mean_bp_cosine": 0.45794273912906647,
+ "mean_rho": 0.5322257168591022,
+ "mean_nudge": -0.038075629621744156,
+ "bp_cosine_per_layer": [
+ 0.17809242010116577,
+ 0.5349531173706055,
+ 0.5522423982620239,
+ 0.5664830207824707
+ ],
+ "rho_per_layer": [
+ 0.22843755781650543,
+ 0.5910820364952087,
+ 0.6707864999771118,
+ 0.638596773147583
+ ],
+ "final_value_loss": 0.38718592133522034,
+ "s_type": "eT",
+ "term_grad_weight": 1.0,
+ "warmup_ratio": 0.2
+ },
+ "s_eT_tgw4.0_wr0.2": {
+ "test_acc": 0.3935,
+ "mean_bp_cosine": 0.5738203078508377,
+ "mean_rho": 0.5946865696460009,
+ "mean_nudge": -0.04504407802596688,
+ "bp_cosine_per_layer": [
+ 0.07111608982086182,
+ 0.6408071517944336,
+ 0.787927508354187,
+ 0.7954304814338684
+ ],
+ "rho_per_layer": [
+ 0.10197217017412186,
+ 0.6885993480682373,
+ 0.7956527471542358,
+ 0.7925220131874084
+ ],
+ "final_value_loss": 1.2652584648132323,
+ "s_type": "eT",
+ "term_grad_weight": 4.0,
+ "warmup_ratio": 0.2
+ }
+} \ No newline at end of file