From a53936a17cebb8b9fc85a917e1cedd7e8103113e Mon Sep 17 00:00:00 2001 From: biondizzle Date: Mon, 1 Jun 2026 03:54:29 +0000 Subject: [PATCH] diag: print l1_out shape warning in shared expert --- dsv4/layers/shared_expert.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/dsv4/layers/shared_expert.py b/dsv4/layers/shared_expert.py index 930b5674..26472412 100644 --- a/dsv4/layers/shared_expert.py +++ b/dsv4/layers/shared_expert.py @@ -316,6 +316,8 @@ class Nvfp4SharedExpert: self._ensure_initialized() l1_out = self._run_l1(hidden_states) + if l1_out.shape[1] < 2 * self.intermediate_size: + print(f" WARNING: l1_out shape {l1_out.shape} < expected (N, {2*self.intermediate_size})", flush=True) gate = l1_out[:, :self.intermediate_size] up = l1_out[:, self.intermediate_size:]