Skip to content

Commit 613fd37

Browse files
committed
feedback updates
1 parent 3f971ca commit 613fd37

File tree

2 files changed

+4
-6
lines changed

2 files changed

+4
-6
lines changed

api/inferencemodel_types.go

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -67,14 +67,14 @@ type InferenceModelSpec struct {
6767
// This can be done by specifying a target model and setting the weight to zero,
6868
// in which case an error will be returned specifying that no valid target model is found.
6969
//
70-
// +kubebuilder:validation:MaxLength=253
70+
// +kubebuilder:validation:MaxLength=256
7171
// +kubebuilder:validation:Required
7272
ModelName string `json:"modelName"`
7373

7474
// Criticality defines how important it is to serve the model compared to other models referencing the same pool.
75+
// The lack of defaulting is intentional: leaving criticality unset future-proofs the API without complicating it.
7576
//
7677
// +optional
77-
// +kubebuilder:default="Default"
7878
Criticality *Criticality `json:"criticality,omitempty"`
7979

8080
// TargetModels allow multiple versions of a model for traffic splitting.
@@ -196,7 +196,7 @@ const (
196196
ModelReasonNameInUse InferenceModelConditionReason = "ModelNameInUse"
197197

198198
// This reason is the initial state, and indicates that the controller has not yet reconciled the InferenceModel.
199-
PoolReasonPending InferenceModelConditionReason = "Pending"
199+
ModelReasonPending InferenceModelConditionReason = "Pending"
200200
)
201201

202202
func init() {

api/inferencepool_types.go

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -45,9 +45,7 @@ type InferencePoolList struct {
4545
// InferencePoolSpec defines the desired state of InferencePool
4646
type InferencePoolSpec struct {
4747
// Selector defines a map of labels to watch model server pods
48-
// that should be included in the InferencePool. ModelServers should not
49-
// be with any other Service or InferencePool, that behavior is not supported
50-
// and will result in sub-optimal utilization.
48+
// that should be included in the InferencePool.
5149
// In some cases, implementations may translate this to a Service selector, so this matches the simple
5250
// map used for Service selectors instead of the full Kubernetes LabelSelector type.
5351
//

0 commit comments

Comments
 (0)