From fa769b6214ff0ef813a43bd03b573682f35c8c78 Mon Sep 17 00:00:00 2001
From: biondizzle <biondizzle@gmail.com>
Date: Tue, 2 Jun 2026 08:18:26 +0000
Subject: [PATCH] fix: allocate and fill padded activation via uint8 views for float4 dtype

---
 tests/unit/test_fused_swiglu_kernel.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/unit/test_fused_swiglu_kernel.py b/tests/unit/test_fused_swiglu_kernel.py
index 7527b668..e6f7901f 100644
--- a/tests/unit/test_fused_swiglu_kernel.py
+++ b/tests/unit/test_fused_swiglu_kernel.py
@@ -80,8 +80,8 @@ def test_fused_swiglu_compilation():
     padded_offsets = torch.tensor([128], dtype=torch.int32, device=device)  # padded to 128
 
     # Pad activation to 128 rows
-    x_padded = torch.zeros(128, K_packed, dtype=x_fp4.dtype, device=device)
-    x_padded[:tokens] = x_fp4
+    x_padded = torch.zeros(128, K_packed, dtype=torch.uint8, device=device).view(torch.float4_e2m1fn_x2)
+    x_padded.view(torch.uint8)[:tokens] = x_fp4.view(torch.uint8)
 
     # Assemble scales (simplified — just pad + swizzle)
     from dsv4.ops.layouts import pad_and_swizzle_single, ceil_div as cutedsl_ceil_div