File tree Expand file tree Collapse file tree 2 files changed +4
-6
lines changed
Expand file tree Collapse file tree 2 files changed +4
-6
lines changed Original file line number Diff line number Diff line change @@ -67,14 +67,14 @@ type InferenceModelSpec struct {
6767 // This can be done by specifying a target model and setting the weight to zero;
6868 // an error will then be returned specifying that no valid target model is found.
6969 //
70- // +kubebuilder:validation:MaxLength=253
70+ // +kubebuilder:validation:MaxLength=256
7171 // +kubebuilder:validation:Required
7272 ModelName string `json:"modelName"`
7373
7474 // Criticality defines how important it is to serve the model compared to other models referencing the same pool.
75+ // The lack of defaulting is intentional: leaving criticality unset future-proofs the API without complicating it.
7576 //
7677 // +optional
77- // +kubebuilder:default="Default"
7878 Criticality * Criticality `json:"criticality,omitempty"`
7979
8080 // TargetModels allow multiple versions of a model for traffic splitting.
@@ -196,7 +196,7 @@ const (
196196 ModelReasonNameInUse InferenceModelConditionReason = "ModelNameInUse"
197197
198198 // This reason is the initial state, and indicates that the controller has not yet reconciled the InferenceModel.
199- PoolReasonPending InferenceModelConditionReason = "Pending"
199+ ModelReasonPending InferenceModelConditionReason = "Pending"
200200)
201201
202202func init () {
Original file line number Diff line number Diff line change @@ -45,9 +45,7 @@ type InferencePoolList struct {
4545// InferencePoolSpec defines the desired state of InferencePool
4646type InferencePoolSpec struct {
4747 // Selector defines a map of labels to watch model server pods
48- // that should be included in the InferencePool. ModelServers should not
49- // be with any other Service or InferencePool, that behavior is not supported
50- // and will result in sub-optimal utilization.
48+ // that should be included in the InferencePool.
5149 // In some cases, implementations may translate this to a Service selector, so this matches the simple
5250 // map used for Service selectors instead of the full Kubernetes LabelSelector type.
5351 //
You can’t perform that action at this time.
0 commit comments