@@ -28,19 +28,19 @@ import (
28
28
logutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
29
29
)
30
30
31
- type BasicFilter struct {
31
+ type Filter struct {
32
32
name string
33
33
filter filterFunc
34
34
}
35
35
36
- func (bf * BasicFilter ) Name () string {
36
+ func (bf * Filter ) Name () string {
37
37
if bf == nil {
38
38
return "nil"
39
39
}
40
40
return bf .name
41
41
}
42
42
43
- func (bf * BasicFilter ) Filter (ctx * types.Context , pods []types.Pod ) ([]types.Pod , error ) {
43
+ func (bf * Filter ) Filter (ctx * types.Context , pods []types.Pod ) ([]types.Pod , error ) {
44
44
loggerTrace := ctx .Logger .V (logutil .TRACE )
45
45
loggerTrace .Info ("Running a filter" , "name" , bf .Name (), "podCount" , len (pods ))
46
46
@@ -123,7 +123,7 @@ func toFilterFunc(pp podPredicate) filterFunc {
123
123
}
124
124
}
125
125
126
- var LeastQueueFilter = & BasicFilter {
126
+ var LeastQueueFilter = & Filter {
127
127
name : "least queuing" ,
128
128
filter : leastQueuingFilterFunc ,
129
129
}
@@ -157,12 +157,12 @@ func leastQueuingFilterFunc(ctx *types.Context, pods []types.Pod) ([]types.Pod,
157
157
return filtered , nil
158
158
}
159
159
160
- var LowQueueFilter = & BasicFilter {
160
+ var LowQueueFilter = & Filter {
161
161
name : "low queueing filter" ,
162
162
filter : toFilterFunc ((queueThresholdPredicate (config .Conf .QueueingThresholdLoRA ))),
163
163
}
164
164
165
- var LeastKVCacheFilter = & BasicFilter {
165
+ var LeastKVCacheFilter = & Filter {
166
166
name : "least KV cache percent" ,
167
167
filter : leastKVCacheFilterFunc ,
168
168
}
@@ -195,7 +195,7 @@ func leastKVCacheFilterFunc(ctx *types.Context, pods []types.Pod) ([]types.Pod,
195
195
return filtered , nil
196
196
}
197
197
198
- var LoRAAffinityFilter = & BasicFilter {
198
+ var LoRAAffinityFilter = & Filter {
199
199
name : "affinity LoRA" ,
200
200
filter : loRASoftAffinityFilterFunc ,
201
201
}
@@ -254,12 +254,12 @@ func loRASoftAffinityFilterFunc(ctx *types.Context, pods []types.Pod) ([]types.P
254
254
return filtered_available , nil
255
255
}
256
256
257
- var HasCapacityFilter = & BasicFilter {
257
+ var HasCapacityFilter = & Filter {
258
258
name : "has capacity for sheddable requests" ,
259
259
filter : toFilterFunc (queueThresholdPredicate (config .Conf .QueueThresholdCritical ).and (kvCacheThresholdPredicate (config .Conf .KVCacheThreshold ))),
260
260
}
261
261
262
- var DropRequestFilter = & BasicFilter {
262
+ var DropRequestFilter = & Filter {
263
263
name : "drop request" ,
264
264
filter : func (ctx * types.Context , pods []types.Pod ) ([]types.Pod , error ) {
265
265
ctx .Logger .V (logutil .DEFAULT ).Info ("Request dropped" , "request" , ctx .Req )
@@ -269,7 +269,7 @@ var DropRequestFilter = &BasicFilter{
269
269
},
270
270
}
271
271
272
- var NoopFilter = & BasicFilter {
272
+ var NoopFilter = & Filter {
273
273
name : "noop" ,
274
274
filter : func (ctx * types.Context , pods []types.Pod ) ([]types.Pod , error ) {
275
275
ctx .Logger .V (logutil .DEBUG ).Info ("All pods pass" )
0 commit comments