We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents e8e0934 + 74fefdd commit bc11239 Copy full SHA for bc11239
benchmarks/bench_mixed_attention.py
@@ -23,10 +23,10 @@ def run_bench(
23
q_lens = torch.tensor(d_qo_lens + p_qo_lens, dtype=torch.int32)
24
25
seq_lens_blocks = torch.ceil(seq_lens / page_block_size).int()
26
- p_seq_lens_blocks = (
+ p_seq_lens_blocks = torch.ceil(
27
torch.tensor(p_kv_lens, dtype=torch.int32) / page_block_size
28
).int()
29
- d_seq_lens_blocks = (
+ d_seq_lens_blocks = torch.ceil(
30
torch.tensor(d_kv_lens, dtype=torch.int32) / page_block_size
31
32
0 commit comments