ray-project · ArturNiederfahrenhorst · Nov 22, 2025 · Nov 18, 2025 · Nov 20, 2025 · Nov 21, 2025
@@ -4452,6 +4452,12 @@ def get_rl_module_spec(
         # If module_config_dict is not defined, set to our generic one.
         if rl_module_spec.model_config is None:
             rl_module_spec.model_config = self.model_config
+        # Otherwise we combine the two dictionaries where settings from the
+        # `RLModuleSpec` have higher priority.
+        else:
+            rl_module_spec.model_config = (
+                self.model_config | rl_module_spec._get_model_config()
+            )
 
         if inference_only is not None:
             rl_module_spec.inference_only = inference_only

@@ -130,7 +130,19 @@ def set_state(self, state: StateDict) -> None:
         # these keys (strict=False). This is most likely due to `state` coming from
         # an `inference_only=False` RLModule, while `self` is an `inference_only=True`
         # RLModule.
-        self.load_state_dict(convert_to_torch_tensor(state), strict=False)
+        missing_keys, unexpected_keys = self.load_state_dict(
+            convert_to_torch_tensor(state), strict=False
+        )
+
+        # For inference_only modules, missing_keys should always be empty.
+        # If there are missing keys, it means the target module expects parameters
+        # that don't exist in the source, indicating an architecture mismatch.
+        if self.inference_only and missing_keys:
+            raise ValueError(
+                "Architecture mismatch detected when loading state into inference_only module! "
+                f"Missing parameters (not found in source state): {list(missing_keys)} "
+                "This usually indicates the learner and env-runner have different architectures."
+            )
 
     @OverrideToImplementCustomLogic
     @override(RLModule)