diff --git a/onnxruntime/contrib_ops/webgpu/moe/moe.h b/onnxruntime/contrib_ops/webgpu/moe/moe.h index 5e329dc12b5c9..332aa39a8d23e 100755 --- a/onnxruntime/contrib_ops/webgpu/moe/moe.h +++ b/onnxruntime/contrib_ops/webgpu/moe/moe.h @@ -3,6 +3,8 @@ #pragma once +#include + #include "core/providers/webgpu/program.h" #include "core/providers/webgpu/webgpu_kernel.h" @@ -31,7 +33,7 @@ class MoE : public WebGpuKernel { activation_alpha_ = static_cast(info.GetAttrOrDefault("activation_alpha", 1.0)); activation_beta_ = static_cast(info.GetAttrOrDefault("activation_beta", 1.0)); swiglu_fusion_ = static_cast(info.GetAttrOrDefault("swiglu_fusion", 0)); - swiglu_limit_ = info.GetAttrOrDefault("swiglu_limit", 0); + swiglu_limit_ = info.GetAttrOrDefault("swiglu_limit", std::numeric_limits::infinity()); k_ = static_cast(info.GetAttrOrDefault("k", 4)); normalize_routing_weights_ = info.GetAttrOrDefault("normalize_routing_weights", 0) == 1; use_sparse_mixer_ = info.GetAttrOrDefault("use_sparse_mixer", 0) == 1;