diff --git a/fp8_to_nvfp4_streaming.py b/fp8_to_nvfp4_streaming.py index 5106cfc..bdbcf08 100644 --- a/fp8_to_nvfp4_streaming.py +++ b/fp8_to_nvfp4_streaming.py @@ -293,8 +293,8 @@ def build_plan(src_dir: Path): for base, parts in expert_pairs.items(): if "w1" in parts and "w3" in parts: expert_pair_groups.append((base, parts["w1"], parts["w3"])) - paired_names.add(parts["gate_proj"]) - paired_names.add(parts["up_proj"]) + paired_names.add(parts["w1"]) + paired_names.add(parts["w3"]) # Classify everything else solo_quantize = []