File tree 5 files changed +443
-199
lines changed 5 files changed +443
-199
lines changed Original file line number Diff line number Diff line change @@ -110,6 +110,11 @@ func run() error {
110
110
flag .Parse ()
111
111
initLogging (& opts )
112
112
113
+ useStreamingServer , err := strconv .ParseBool (os .Getenv ("USE_STREAMING" ))
114
+ if err != nil {
115
+ setupLog .Error (err , "Failed to parse env var USE_STREAMING, defaulting to false" )
116
+ }
117
+
113
118
// Validate flags
114
119
if err := validateFlags (); err != nil {
115
120
setupLog .Error (err , "Failed to validate flags" )
@@ -153,6 +158,7 @@ func run() error {
153
158
SecureServing : * secureServing ,
154
159
CertPath : * certPath ,
155
160
Provider : provider ,
161
+ UseStreaming : useStreamingServer ,
156
162
}
157
163
if err := serverRunner .SetupWithManager (ctx , mgr ); err != nil {
158
164
setupLog .Error (err , "Failed to setup ext-proc controllers" )
Original file line number Diff line number Diff line change @@ -71,17 +71,20 @@ spec:
71
71
spec :
72
72
containers :
73
73
- name : inference-gateway-ext-proc
74
- image : us-east1-docker.pkg.dev/kfswain-gke-dev/test-repo/ext-proc:test-feb-32
74
+ image : us-east1-docker.pkg.dev/kfswain-gke-dev/test-repo/ext-proc:test-mar-35
75
75
imagePullPolicy : Always
76
76
args :
77
77
- -poolName
78
78
- " my-pool"
79
79
- -v
80
- - " 3 "
80
+ - " 4 "
81
81
- -grpcPort
82
82
- " 9002"
83
83
- -grpcHealthPort
84
84
- " 9003"
85
+ env :
86
+ - name : USE_STREAMING
87
+ value : " true"
85
88
ports :
86
89
- containerPort : 9002
87
90
- containerPort : 9003
Original file line number Diff line number Diff line change 66
66
op : add
67
67
path : " /default_filter_chain/filters/0/typed_config/http_filters/0/typed_config/processing_mode/request_trailer_mode"
68
68
value : SEND
69
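+ # Uncomment the three patches below to enable full-duplex streaming: they set response_body_mode to FULL_DUPLEX_STREAMED and response_header_mode/response_trailer_mode to SEND.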
70
+ # - type: "type.googleapis.com/envoy.config.listener.v3.Listener"
71
+ # name: "default/inference-gateway/llm-gw"
72
+ # operation:
73
+ # op: add
74
+ # path: "/default_filter_chain/filters/0/typed_config/http_filters/0/typed_config/processing_mode/response_body_mode"
75
+ # value: FULL_DUPLEX_STREAMED
76
+ # - type: "type.googleapis.com/envoy.config.listener.v3.Listener"
77
+ # name: "default/inference-gateway/llm-gw"
78
+ # operation:
79
+ # op: replace
80
+ # path: "/default_filter_chain/filters/0/typed_config/http_filters/0/typed_config/processing_mode/response_trailer_mode"
81
+ # value: SEND
82
+ # - type: "type.googleapis.com/envoy.config.listener.v3.Listener"
83
+ # name: "default/inference-gateway/llm-gw"
84
+ # operation:
85
+ # op: replace
86
+ # path: "/default_filter_chain/filters/0/typed_config/http_filters/0/typed_config/processing_mode/response_header_mode"
87
+ # value: SEND
88
+
You can’t perform that action at this time.
0 commit comments