File tree Expand file tree Collapse file tree 2 files changed +4
-6
lines changed Expand file tree Collapse file tree 2 files changed +4
-6
lines changed Original file line number Diff line number Diff line change @@ -67,14 +67,14 @@ type InferenceModelSpec struct {
67
67
// This can be done by specifying a target model and setting the weight to zero,
68
68
// an error will be returned specifying that no valid target model is found.
69
69
//
70
- // +kubebuilder:validation:MaxLength=253
70
+ // +kubebuilder:validation:MaxLength=256
71
71
// +kubebuilder:validation:Required
72
72
ModelName string `json:"modelName"`
73
73
74
74
// Criticality defines how important it is to serve the model compared to other models referencing the same pool.
75
+ // The lack of defaulting is intentional: leaving criticality unset future-proofs the API without complicating it.
75
76
//
76
77
// +optional
77
- // +kubebuilder:default="Default"
78
78
Criticality * Criticality `json:"criticality,omitempty"`
79
79
80
80
// TargetModels allow multiple versions of a model for traffic splitting.
@@ -196,7 +196,7 @@ const (
196
196
ModelReasonNameInUse InferenceModelConditionReason = "ModelNameInUse"
197
197
198
198
// This reason is the initial state, and indicates that the controller has not yet reconciled the InferenceModel.
199
- PoolReasonPending InferenceModelConditionReason = "Pending"
199
+ ModelReasonPending InferenceModelConditionReason = "Pending"
200
200
)
201
201
202
202
func init () {
Original file line number Diff line number Diff line change @@ -45,9 +45,7 @@ type InferencePoolList struct {
45
45
// InferencePoolSpec defines the desired state of InferencePool
46
46
type InferencePoolSpec struct {
47
47
// Selector defines a map of labels to watch model server pods
48
- // that should be included in the InferencePool. ModelServers should not
49
- // be with any other Service or InferencePool, that behavior is not supported
50
- // and will result in sub-optimal utilization.
48
+ // that should be included in the InferencePool.
51
49
// In some cases, implementations may translate this to a Service selector, so this matches the simple
52
50
// map used for Service selectors instead of the full Kubernetes LabelSelector type.
53
51
//
You can’t perform that action at this time.
0 commit comments