fix: indexer compressor weight path — weights are at *.indexer.kv_proj not *.indexer.compressor.kv_proj
This commit is contained in:
@@ -398,9 +398,11 @@ class Indexer:
|
||||
wp_out = wp_w.shape[0]
|
||||
wp_in = wp_w.shape[1] * 2
|
||||
self.wp_lin = make_nvfp4_linear(wp_in, wp_out, dev, w, pfx, 'weights_proj')
|
||||
- if f"{pfx}.compressor.kv_proj.weight" in w:
+ # Indexer compressor weights are directly under the indexer prefix
+ # (e.g. *.indexer.kv_proj.weight), NOT nested under *.indexer.compressor.
+ if f"{pfx}.kv_proj.weight" in w:
|
||||
self.compressor = Compressor(4, self.ihd, 7168, dev)
|
||||
- self.compressor.load(w, f"{pfx}.compressor", dev)
+ self.compressor.load(w, pfx, dev)
|
||||
|
||||
def forward(self, q_lora, hidden_states, comp_indexer_kv, positions, layer_idx=None):
|
||||
if self.q_b_lin is None or comp_indexer_kv is None or comp_indexer_kv.shape[0] == 0:
|
||||
|
||||
Reference in New Issue
Block a user