Hotfix: ALiBi attention without head mapping (#496)

Co-authored-by: oliveryuan <oliveryuan@basemind.com>
This commit is contained in:
Song
2023-07-19 02:31:48 +08:00
committed by GitHub
parent 453bafb96f
commit bda41c70dd
2 changed files with 3 additions and 0 deletions

View File

@@ -408,6 +408,7 @@ class PagedAttentionWithALiBi(PagedAttention):
query,
key_cache,
value_cache,
self.head_mapping,
self.scale,
input_metadata.block_tables,
input_metadata.context_lens,