[core][scheduler] simplify and improve scheduler (#6867)

2024-07-31 23:51:09 -07:00
parent 3c10591ef2
commit c8a7e93273
4 changed files with 112 additions and 214 deletions
--- a/tests/core/block/e2e/test_correctness.py
+++ b/tests/core/block/e2e/test_correctness.py
@@ -183,7 +183,7 @@ def test_v1_v2_greedy_equality_with_cow(baseline_llm_generator,

            # Allow only 2 sequences of ~128 tokens in worst case.
            # Note 16 = 128/block_size
-            "num_gpu_blocks_override": 2 * (16 + 1),
+            "num_gpu_blocks_override": 2 * (16 + 2),
        }
    ])
@pytest.mark.parametrize("baseline_llm_kwargs", [{