Add NaN debug check for prefill attention inputs
This commit is contained in:
@@ -742,6 +742,12 @@ class DeepseekV4MultiHeadLatentAttentionWrapper(PluggableLayer):
|
||||
kv_rope_prefill = self._apply_rope_kv(
|
||||
kv[num_decode_tokens:], positions[num_decode_tokens:],
|
||||
)
|
||||
# Debug: report to stderr if the prefill attention inputs (q_prefill, kv_rope_prefill) contain NaN
|
||||
import sys as _sys
|
||||
_q_nan = torch.isnan(q_prefill).any().item()
|
||||
_kv_nan = torch.isnan(kv_rope_prefill).any().item()
|
||||
if _q_nan or _kv_nan:
|
||||
print(f"[BLACKWELL] PREFILL INPUTS NaN: q_nan={_q_nan} kv_nan={_kv_nan} cr={self.compress_ratio}", file=_sys.stderr, flush=True)
|
||||
if swa_only:
|
||||
o[num_decode_tokens:] = causal_prefill_attention(
|
||||
q_prefill, kv_rope_prefill, self.scale,
|
||||
|
||||
Reference in New Issue
Block a user