Add support for BLOOM (#331)
This commit is contained in:
@@ -216,6 +216,7 @@ def run_single_query_cached_kv_attention(
|
||||
context_lens,
|
||||
block_size,
|
||||
max_context_len,
|
||||
None, # ALiBi slopes.
|
||||
)
|
||||
|
||||
ref_output = torch.empty_like(query)
|
||||
|
||||
Reference in New Issue
Block a user