feat: add BaseLogitsProcessor core interface (#2613)

bhuvan002 · web-flow · commit b92a805edb78 · 2025-08-22T13:41:30.000-04:00
Signed-off-by: Bhuvan Agrawal <11240550+bhuvan002@users.noreply.github.com>
diff --git a/lib/bindings/python/src/dynamo/logits_processing/__init__.py b/lib/bindings/python/src/dynamo/logits_processing/__init__.py
@@ -0,0 +1,13 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+"""
+Dynamo Logits Processing - Backend-agnostic logits processors.
+
+This module provides the BaseLogitsProcessor protocol that can be used
+across different backend adapters (TRT-LLM, vLLM, SGLang).
+"""
+
+from .base import BaseLogitsProcessor
+
+__all__ = ["BaseLogitsProcessor"]  # only name exported by `from ... import *`
diff --git a/lib/bindings/python/src/dynamo/logits_processing/base.py b/lib/bindings/python/src/dynamo/logits_processing/base.py
@@ -0,0 +1,39 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+"""
+Base logits processor protocol for Dynamo.
+
+This module defines the core BaseLogitsProcessor interface that all
+logits processors must implement.
+"""
+
+from typing import Protocol, Sequence
+
+import torch
+
+
+class BaseLogitsProcessor(Protocol):
+    """
+    Protocol for logits processors in Dynamo (structural, not runtime-checkable).
+
+    All logits processors must match this `__call__` signature to be compatible
+    with backend adapters (TRT-LLM, vLLM, SGLang); subclassing is optional.
+    """
+
+    def __call__(
+        self,
+        input_ids: Sequence[int],
+        logits: torch.Tensor,
+    ) -> torch.Tensor:
+        """
+        Process the logits for the next token prediction.
+
+        Args:
+            input_ids: Token IDs so far (prompt included or not: TODO confirm).
+            logits: The raw logits for the next token. Shape: (vocab_size,)
+
+        Returns:
+            A tensor with the same shape, dtype, and device as `logits`.
+        """
+        ...