Skip to content

Commit 830a4a2

Browse files
committed
Remove relaxed acceptance for thinking from the EAGLE speculative-decoding config
Signed-off-by: qgai <[email protected]>
1 parent: 9ae0936 · commit: 830a4a2

File tree

3 files changed: 2 additions (+2) and 11 deletions (-11)

examples/llm-api/quickstart_advanced.py

Lines changed: 1 addition & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -176,12 +176,7 @@ def setup_llm(args, **kwargs):
176176
max_draft_len=args.spec_decode_max_draft_len,
177177
speculative_model_dir=args.model_dir,
178178
eagle3_one_model=args.use_one_model,
179-
is_mtp_eagle=True,
180-
use_relaxed_acceptance_for_thinking=args.
181-
use_relaxed_acceptance_for_thinking,
182-
relaxed_topk=args.relaxed_topk,
183-
relaxed_delta=args.relaxed_delta,
184-
)
179+
is_mtp_eagle=True)
185180
else:
186181
spec_config = MTPDecodingConfig(
187182
num_nextn_predict_layers=args.spec_decode_max_draft_len,

tensorrt_llm/_torch/models/modeling_auto.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@ def from_config(
2020
"") # Strip the appended EAGLE3
2121
if hasattr(config.pretrained_config, "draft_vocab_size"):
2222
model_arch = "EAGLE3" + model_arch
23-
if model_arch == "DeepseekV3ForCausalLM" and config.spec_config.max_draft_len == 0:
23+
if model_arch == "DeepseekV3ForCausalLM" and config.spec_config is not None and config.spec_config.max_draft_len == 0:
2424
model_arch = "MTPDraftModelForCausalLM"
2525

2626
cls = MODEL_CLASS_MAPPING.get(model_arch)

tensorrt_llm/llmapi/llm_args.py

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -427,10 +427,6 @@ class EagleDecodingConfig(DecodingBaseConfig):
427427
eagle3_one_model: Optional[bool] = True
428428
eagle3_layers_to_capture: Optional[Tuple[int, ...]] = None
429429
is_mtp_eagle: Optional[bool] = False # which also means eagle2
430-
#TODO:add the support of relaxed acceptance for thinking
431-
use_relaxed_acceptance_for_thinking: Optional[bool] = False
432-
relaxed_topk: Optional[int] = 10
433-
relaxed_delta: Optional[float] = 0.01
434430

435431
@classmethod
436432
def from_dict(cls, data: dict):

0 commit comments

Comments
 (0)