From f40cf422e8fa6b411dc3682e30082964d80ef19f Mon Sep 17 00:00:00 2001
From: ckl117
Date: Fri, 17 Oct 2025 17:29:25 +0800
Subject: [PATCH 1/3] check

---
 fastdeploy/model_executor/utils.py  | 16 ++++++++++++++++
 fastdeploy/worker/worker_process.py |  4 ++++
 2 files changed, 20 insertions(+)

diff --git a/fastdeploy/model_executor/utils.py b/fastdeploy/model_executor/utils.py
index 8e90fb80fd..daf0c10f72 100644
--- a/fastdeploy/model_executor/utils.py
+++ b/fastdeploy/model_executor/utils.py
@@ -199,3 +199,19 @@ def temporary_dtype(dtype: str):
         yield
     finally:
         paddle.set_default_dtype(orig_dtype)
+
+
+def is_paddle_support_v1_loader():
+    src_shape = [32, 32]
+    tgt_shape = [1, 32, 64]
+    src_tensor = paddle.ones(src_shape, dtype="float32")
+    tgt_tensor = paddle.zeros(tgt_shape, dtype="float32")
+    for exp_id in range(tgt_shape[0]):
+        # gate
+        gate_tgt = tgt_tensor[exp_id][..., : tgt_shape[2] // 2]
+        gate_tgt.copy_(src_tensor, False)
+        # up
+        up_tgt = tgt_tensor[exp_id][..., tgt_shape[2] // 2 :]
+        up_tgt.copy_(src_tensor, False)
+    is_same = bool(paddle.all(tgt_tensor == 1))
+    return is_same
diff --git a/fastdeploy/worker/worker_process.py b/fastdeploy/worker/worker_process.py
index 2b2ed9a591..89d0f974a5 100644
--- a/fastdeploy/worker/worker_process.py
+++ b/fastdeploy/worker/worker_process.py
@@ -42,6 +42,7 @@
 from fastdeploy.input.ernie4_5_tokenizer import Ernie4_5Tokenizer
 from fastdeploy.inter_communicator import EngineWorkerQueue as TaskQueue
 from fastdeploy.inter_communicator import ExistTaskStatus, IPCSignal, ModelWeightsStatus
+from fastdeploy.model_executor import is_paddle_support_v1_loader
 from fastdeploy.model_executor.layers.quantization import get_quantization_config
 from fastdeploy.platforms import current_platform
 from fastdeploy.utils import get_logger, parse_quantization
@@ -809,6 +810,9 @@ def initialize_fd_config(args, ranks: int = 1, local_rank: int = 0) -> FDConfig:
     update_fd_config_for_mm(fd_config)
     update_think_end_id_for_ernie(fd_config)
 
+    if not is_paddle_support_v1_loader():
+        raise ValueError("The install Paddle don't support v1 loader.")
+
     return fd_config
 
 

From e818f1f94954afb94e5b0c36e67b7d82889af556 Mon Sep 17 00:00:00 2001
From: ckl117
Date: Fri, 17 Oct 2025 17:32:19 +0800
Subject: [PATCH 2/3] check

---
 fastdeploy/worker/worker_process.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fastdeploy/worker/worker_process.py b/fastdeploy/worker/worker_process.py
index 89d0f974a5..a441f9c407 100644
--- a/fastdeploy/worker/worker_process.py
+++ b/fastdeploy/worker/worker_process.py
@@ -810,7 +810,7 @@ def initialize_fd_config(args, ranks: int = 1, local_rank: int = 0) -> FDConfig:
     update_fd_config_for_mm(fd_config)
     update_think_end_id_for_ernie(fd_config)
 
-    if not is_paddle_support_v1_loader():
+    if load_config.load_choices == "default_v1" and not is_paddle_support_v1_loader():
         raise ValueError("The install Paddle don't support v1 loader.")
 
     return fd_config

From 95d943688ab09be742a673999313fe5a78f5363a Mon Sep 17 00:00:00 2001
From: ckl117
Date: Mon, 20 Oct 2025 10:54:59 +0800
Subject: [PATCH 3/3] check import

---
 fastdeploy/worker/worker_process.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fastdeploy/worker/worker_process.py b/fastdeploy/worker/worker_process.py
index a441f9c407..43384f8ba2 100644
--- a/fastdeploy/worker/worker_process.py
+++ b/fastdeploy/worker/worker_process.py
@@ -42,8 +42,8 @@
 from fastdeploy.input.ernie4_5_tokenizer import Ernie4_5Tokenizer
 from fastdeploy.inter_communicator import EngineWorkerQueue as TaskQueue
 from fastdeploy.inter_communicator import ExistTaskStatus, IPCSignal, ModelWeightsStatus
-from fastdeploy.model_executor import is_paddle_support_v1_loader
 from fastdeploy.model_executor.layers.quantization import get_quantization_config
+from fastdeploy.model_executor.utils import is_paddle_support_v1_loader
 from fastdeploy.platforms import current_platform
 from fastdeploy.utils import get_logger, parse_quantization
 from fastdeploy.worker.worker_base import WorkerBase