From 2aaabd9a95386bf9f274cb9907ac6a5306171759 Mon Sep 17 00:00:00 2001
From: YurenHao0426 <Blackhao0426@gmail.com>
Date: Thu, 2 Apr 2026 23:34:12 -0500
Subject: =?UTF-8?q?Fix=20EP=20credit=20sign:=20negate=20(h=5Fnudge=20-=20h?=
 =?UTF-8?q?=5Ffree)/=CE=B2=20to=20align=20with=20BP=20grad=20direction?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

EP nudge moves h toward lower loss (opposite to BP grad which points toward loss increase).
Without negation, Gamma is negative and rho is -0.25.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 experiments/ep_synthetic.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

(limited to 'experiments/ep_synthetic.py')

diff --git a/experiments/ep_synthetic.py b/experiments/ep_synthetic.py
index 7daecde..a2f24df 100644
--- a/experiments/ep_synthetic.py
+++ b/experiments/ep_synthetic.py
@@ -115,7 +115,9 @@ def compute_diagnostics(model, teacher, dev, d, C, L, beta=0.5, T_nudge=20, alph
     gammas,rhos=[],[]
     with torch.no_grad():_,hi=model(x,return_hidden=True)
     for l in range(L):
-        a_ep=(h_nudge[l+1].detach()-h_free[l+1])/beta
+        # EP nudge moves h toward lower loss, so (h_nudge - h_free) points opposite to BP grad.
+        # Negate to align with BP gradient convention (pointing toward loss increase).
+        a_ep=-(h_nudge[l+1].detach()-h_free[l+1])/beta
         gammas.append(cosine_similarity_batch(a_ep,bp[l+1]))
         def mk(sl):
             def f(h):
-- 
cgit v1.2.3