1 file changed: +4 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -472,9 +472,9 @@ def schedule(self) -> SchedulerOutput:
472472 num_computed_tokens = (
473473 num_new_local_computed_tokens + num_external_computed_tokens
474474 )
475- # KVTransfer: WAITING reqs have num_computed_tokens > 0
476- # after async KV recvs are completed.
477475 else :
476+ # KVTransfer: WAITING reqs have num_computed_tokens > 0
477+ # after async KV recvs are completed.
478478 new_computed_blocks = self .kv_cache_manager .empty_kv_cache_blocks
479479 num_new_local_computed_tokens = 0
480480 num_computed_tokens = request .num_computed_tokens
@@ -483,12 +483,12 @@ def schedule(self) -> SchedulerOutput:
483483 external_load_encoder_input = []
484484 new_encoder_compute_budget = encoder_compute_budget
485485
486- # KVTransfer: loading remote KV, do not allocate for new work.
487486 if load_kv_async :
487+ # KVTransfer: loading remote KV, do not allocate for new work.
488488 assert num_external_computed_tokens > 0
489489 num_new_tokens = 0
490- # Number of tokens to be scheduled.
491490 else :
491+ # Number of tokens to be scheduled.
492492 # We use `request.num_tokens` instead of
493493 # `request.num_prompt_tokens` to consider the resumed
494494 # requests, which have output tokens.
You can’t perform that action at this time.
0 commit comments