@@ -20,14 +20,10 @@ import (
20
20
"errors"
21
21
"math"
22
22
23
- << << << < HEAD :pkg / epp / scheduling / filter.go
24
23
"github.com/go-logr/logr"
25
- "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/datastore"
26
- logutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
27
- == == == =
28
24
klog "k8s.io/klog/v2"
25
+ "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/datastore"
29
26
"sigs.k8s.io/gateway-api-inference-extension/pkg/ext-proc/backend"
30
- >> >> >> > 78 c0740 (changes for multilora ):pkg / ext - proc / scheduling / filter .go
31
27
)
32
28
33
29
type Filter interface {
@@ -66,14 +62,8 @@ func (f *filter) Name() string {
66
62
return f .name
67
63
}
68
64
69
- << << << < HEAD:pkg / epp / scheduling / filter .go
70
- func (f * filter ) Filter (logger logr.Logger , req * LLMRequest , pods []* datastore.PodMetrics ) ([]* datastore.PodMetrics , error ) {
71
- loggerTrace := logger .V (logutil .TRACE )
72
- loggerTrace .Info ("Running a filter" , "name" , f .Name (), "podCount" , len (pods ))
73
- == == == =
74
65
func (f * filter ) Filter (req * LLMRequest , pods []* backend.PodMetrics ) ([]* backend.PodMetrics , error ) {
75
66
klog .InfoS ("Running a filter" , "name" , f .Name (), "request" , req , "podCount" , len (pods ))
76
- >> >> >> > 78 c0740 (changes for multilora ):pkg / ext - proc / scheduling / filter .go
77
67
78
68
filtered , err := f .filter (logger , req , pods )
79
69
@@ -86,12 +76,8 @@ func (f *filter) Filter(req *LLMRequest, pods []*backend.PodMetrics) ([]*backend
86
76
if f .nextOnSuccess != nil {
87
77
next = f .nextOnSuccess
88
78
}
89
- << << << < HEAD:pkg / epp / scheduling / filter .go
90
- loggerTrace .Info ("Filter succeeded" , "filter" , f .Name (), "next" , next .Name (), "filteredPodCount" , len (filtered ))
91
- == == == =
92
79
klog .InfoS ("Filter succeeded" , "filter" , f .Name (), "next" , next .Name (), "filteredPodCount" , len (filtered ))
93
80
94
- >> >> >> > 78 c0740 (changes for multilora ):pkg / ext - proc / scheduling / filter .go
95
81
// On success, pass the filtered result to the next filter.
96
82
return next .Filter (logger , req , filtered )
97
83
} else {
@@ -102,11 +88,7 @@ func (f *filter) Filter(req *LLMRequest, pods []*backend.PodMetrics) ([]*backend
102
88
if f .nextOnFailure != nil {
103
89
next = f .nextOnFailure
104
90
}
105
- << << << < HEAD:pkg / epp / scheduling / filter .go
106
- loggerTrace .Info ("Filter failed" , "filter" , f .Name (), "next" , next .Name ())
107
- == == == =
108
91
klog .InfoS ("Filter failed" , "filter" , f .Name (), "next" , next .Name ())
109
- >> >> >> > 78 c0740 (changes for multilora ):pkg / ext - proc / scheduling / filter .go
110
92
// On failure, pass the initial set of pods to the next filter.
111
93
return next .Filter (logger , req , pods )
112
94
}
@@ -229,13 +211,8 @@ func loRAAffinityPredicate(req *LLMRequest, pod *datastore.PodMetrics) bool {
229
211
}
230
212
231
213
// canAcceptNewLoraPredicate is a filter function to check whether a pod has room to load the adapter.
232
- << << << < HEAD:pkg / epp / scheduling / filter .go
233
- func canAcceptNewLoraPredicate (req * LLMRequest , pod * datastore.PodMetrics ) bool {
234
- return len (pod .ActiveModels ) < pod .MaxActiveModels
235
- == == == =
236
214
func canAcceptNewLoraPredicate (req * LLMRequest , pod * backend.PodMetrics ) bool {
237
215
return len (pod .ActiveModels ) < maxLoRACost
238
- >> >> >> > 78 c0740 (changes for multilora ):pkg / ext - proc / scheduling / filter .go
239
216
}
240
217
241
218
func criticalRequestPredicate (req * LLMRequest , pod * datastore.PodMetrics ) bool {
0 commit comments