@@ -121,8 +121,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
121
121
KVCacheUsagePercent : 0.2 ,
122
122
},
123
123
},
124
- wantMetrics : map [string ]string {
125
- `inference_model_request_total` : `
124
+ wantMetrics : map [string ]string {`inference_model_request_total` : `
126
125
# HELP inference_model_request_total [ALPHA] Counter of inference model requests broken out for each model and target model.
127
126
# TYPE inference_model_request_total counter
128
127
inference_model_request_total{model_name="my-model",target_model_name="my-model-12345"} 1
@@ -154,8 +153,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
154
153
RawValue : []byte (strconv .Itoa (76 )),
155
154
},
156
155
},
157
- },
158
- },
156
+ }},
159
157
},
160
158
},
161
159
},
@@ -239,8 +237,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
239
237
RawValue : []byte (strconv .Itoa (76 )),
240
238
},
241
239
},
242
- },
243
- },
240
+ }},
244
241
},
245
242
},
246
243
},
@@ -324,8 +321,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
324
321
RawValue : []byte (strconv .Itoa (76 )),
325
322
},
326
323
},
327
- },
328
- },
324
+ }},
329
325
},
330
326
},
331
327
},
@@ -458,8 +454,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
458
454
RawValue : []byte (strconv .Itoa (76 )),
459
455
},
460
456
},
461
- },
462
- },
457
+ }},
463
458
},
464
459
},
465
460
},
@@ -570,8 +565,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
570
565
RawValue : []byte (strconv .Itoa (76 )),
571
566
},
572
567
},
573
- },
574
- },
568
+ }},
575
569
},
576
570
},
577
571
},
@@ -682,8 +676,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
682
676
RawValue : []byte (strconv .Itoa (74 )),
683
677
},
684
678
},
685
- },
686
- },
679
+ }},
687
680
},
688
681
},
689
682
},
@@ -931,40 +924,35 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
931
924
Request : & extProcPb.ProcessingRequest_ResponseBody {
932
925
ResponseBody : & extProcPb.HttpBody {
933
926
Body : []byte (`data: {"id":"cmpl-0fee233f-7d56-404a-acd3-4dad775d03d9","object":"text_completion","created":1741379018,"model":"food-review-1","choices":[{"index":0,"text":"NEVER","logprobs":null,"finish_reason":null,"stop_reason":null}],"usage":null}` ),
934
- EndOfStream : false ,
935
- },
927
+ EndOfStream : false },
936
928
},
937
929
},
938
930
{
939
931
Request : & extProcPb.ProcessingRequest_ResponseBody {
940
932
ResponseBody : & extProcPb.HttpBody {
941
933
Body : []byte (`data: {"id":"cmpl-0fee233f-7d56-404a-acd3-4dad775d03d9","object":"text_completion","created":1741379018,"model":"food-review-1","choices":[{"index":0,"text":"GONNA","logprobs":null,"finish_reason":null,"stop_reason":null}],"usage":null}` ),
942
- EndOfStream : false ,
943
- },
934
+ EndOfStream : false },
944
935
},
945
936
},
946
937
{
947
938
Request : & extProcPb.ProcessingRequest_ResponseBody {
948
939
ResponseBody : & extProcPb.HttpBody {
949
940
Body : []byte (`data: {"id":"cmpl-0fee233f-7d56-404a-acd3-4dad775d03d9","object":"text_completion","created":1741379018,"model":"food-review-1","choices":[{"index":0,"text":"GIVE","logprobs":null,"finish_reason":null,"stop_reason":null}],"usage":null}` ),
950
- EndOfStream : false ,
951
- },
941
+ EndOfStream : false },
952
942
},
953
943
},
954
944
{
955
945
Request : & extProcPb.ProcessingRequest_ResponseBody {
956
946
ResponseBody : & extProcPb.HttpBody {
957
947
Body : []byte (`data: {"id":"cmpl-0fee233f-7d56-404a-acd3-4dad775d03d9","object":"text_completion","created":1741379018,"model":"food-review-1","choices":[{"index":0,"text":"YOU","logprobs":null,"finish_reason":null,"stop_reason":null}],"usage":null}` ),
958
- EndOfStream : false ,
959
- },
948
+ EndOfStream : false },
960
949
},
961
950
},
962
951
{
963
952
Request : & extProcPb.ProcessingRequest_ResponseBody {
964
953
ResponseBody : & extProcPb.HttpBody {
965
954
Body : []byte (`data: {"id":"cmpl-0fee233f-7d56-404a-acd3-4dad775d03d9","object":"text_completion","created":1741379018,"model":"food-review-1","choices":[{"index":0,"text":"UP","logprobs":null,"finish_reason":null,"stop_reason":null}],"usage":null}` ),
966
- EndOfStream : false ,
967
- },
955
+ EndOfStream : false },
968
956
},
969
957
},
970
958
{
@@ -973,16 +961,14 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
973
961
Body : []byte (`data: {"id":"cmpl-0fee233f-7d56-404a-acd3-4dad775d03d9","object":"text_completion","created":1741379018,"model":"food-review-1","choices":[],"usage":{"prompt_tokens":7,"total_tokens":17,"completion_tokens":10}}
974
962
data: [DONE]` ,
975
963
),
976
- EndOfStream : false ,
977
- },
964
+ EndOfStream : false },
978
965
},
979
966
},
980
967
{
981
968
Request : & extProcPb.ProcessingRequest_ResponseBody {
982
969
ResponseBody : & extProcPb.HttpBody {
983
970
Body : []byte ("" ),
984
- EndOfStream : true ,
985
- },
971
+ EndOfStream : true },
986
972
},
987
973
},
988
974
},
@@ -1186,8 +1172,7 @@ func TestFullDuplexStreamed_KubeInferenceModelRequest(t *testing.T) {
1186
1172
RawValue : []byte ("192.168.1.1:8000" ),
1187
1173
},
1188
1174
},
1189
- },
1190
- },
1175
+ }},
1191
1176
},
1192
1177
},
1193
1178
},
0 commit comments