Skip to content

Commit cddb07b

Browse files
committed
fix block num setting in scheduler v1
1 parent b25a6b7 commit cddb07b

File tree

1 file changed

+5 -1 lines changed

1 file changed

+5 -1 lines changed

fastdeploy/worker/gpu_model_runner.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -208,11 +208,15 @@ def insert_tasks_v1(self, req_dicts: List[Request]):
208208
request = req_dicts[i]
209209
idx = request.idx
210210
if request.task_type.value == RequestType.PREFILL.value: # prefill task
211-
logger.debug(f"Handle prefill request {request} at idx {idx}")
212211
prefill_start_index = request.prefill_start_index
213212
prefill_end_index = request.prefill_end_index
214213
length = prefill_end_index - prefill_start_index
215214
input_ids = request.prompt_token_ids + request.output_token_ids
215+
logger.debug(
216+
f"Handle prefill request {request} at idx {idx}, "
217+
f"{prefill_start_index=}, {prefill_end_index=}, "
218+
f"need_prefilled_token_num={len(input_ids)}"
219+
)
216220
self.share_inputs["input_ids"][idx : idx + 1, :length] = np.array(
217221
input_ids[prefill_start_index:prefill_end_index]
218222
)

0 commit comments

Comments (0)