Skip to content

Commit beeb0a3

Browse files
committed
Pass peft_cache_manager=None to BindCapacityScheduler in the create_autodeploy_executor function (ad_executor.py)
Signed-off-by: Amit Zuker <[email protected]>
1 parent 523efb7 commit beeb0a3

File tree

2 files changed

+4
-2
lines changed

2 files changed

+4
-2
lines changed

tensorrt_llm/_torch/auto_deploy/shim/ad_executor.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -286,7 +286,9 @@ def create_autodeploy_executor(executor_config: ExecutorConfig, checkpoint_dir:
286286
resource_manager.resource_managers.move_to_end(ResourceManagerType.KV_CACHE_MANAGER, last=True)
287287

288288
# scheduling
289-
capacitor_scheduler = BindCapacityScheduler(ad_config.max_batch_size, kv_cache_manager.impl)
289+
capacitor_scheduler = BindCapacityScheduler(
290+
ad_config.max_batch_size, kv_cache_manager.impl, peft_cache_manager=None
291+
)
290292
mb_scheduler = BindMicroBatchScheduler(
291293
ad_config.max_batch_size, engine.cache_seq_interface.info.max_num_tokens
292294
)

tensorrt_llm/_torch/pyexecutor/scheduler.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@ def __init__(
7373
self,
7474
max_num_requests: int,
7575
kv_cache_manager,
76-
peft_cache_manager: tb_internal.batch_manager.PeftCacheManager,
76+
peft_cache_manager: tb_internal.batch_manager.PeftCacheManager | None,
7777
scheduler_policy: tb_executor.CapacitySchedulerPolicy = tb_executor.
7878
CapacitySchedulerPolicy.GUARANTEED_NO_EVICT,
7979
two_step_lookahead: bool = False,

0 commit comments

Comments
 (0)