Skip to content

Commit e00875a

Browse files
committed
hack around slices bug
1 parent 9639b0d commit e00875a

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

vllm/v1/engine/async_llm.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -251,13 +251,14 @@ async def _run_output_handler(self):
251 | 251 |   # event loop for too long.
252 | 252 |   num_outputs = len(outputs.new_token_id_offsets)
253 | 253 |
254 |     | - if num_outputs <= VLLM_V1_OUTPUT_PROC_CHUNK_SIZE:
    | 254 | + if True or num_outputs <= VLLM_V1_OUTPUT_PROC_CHUNK_SIZE:
255 | 255 |       slices = ((0, num_outputs), )
256 | 256 |   else:
257 | 257 |       slices = []
258 | 258 |       parts = np.linspace(
259 | 259 |           num_outputs,
260 |     | -         cdiv(num_outputs, VLLM_V1_OUTPUT_PROC_CHUNK_SIZE))
    | 260 | +         cdiv(num_outputs, VLLM_V1_OUTPUT_PROC_CHUNK_SIZE),
    | 261 | +         dtype='int')
261 | 262 |       last = 0
262 | 263 |       for i in parts:
263 | 264 |           slices.append((last, i))

0 commit comments

Comments
 (0)