@@ -128,10 +128,10 @@ func (s *Server) Process(srv extProcPb.ExternalProcessor_ProcessServer) error {
128
128
reqCtx .ResponseCompleteTimestamp = time .Now ()
129
129
metrics .RecordRequestLatencies (ctx , reqCtx .Model , reqCtx .ResolvedTargetModel , reqCtx .RequestReceivedTimestamp , reqCtx .ResponseCompleteTimestamp )
130
130
metrics .RecordResponseSizes (reqCtx .Model , reqCtx .ResolvedTargetModel , reqCtx .ResponseSize )
131
- metrics .RecordInputTokens (reqCtx .Model , reqCtx .ResolvedTargetModel , reqCtx .Response . Usage .PromptTokens )
132
- metrics .RecordOutputTokens (reqCtx .Model , reqCtx .ResolvedTargetModel , reqCtx .Response . Usage .CompletionTokens )
131
+ metrics .RecordInputTokens (reqCtx .Model , reqCtx .ResolvedTargetModel , reqCtx .Usage .PromptTokens )
132
+ metrics .RecordOutputTokens (reqCtx .Model , reqCtx .ResolvedTargetModel , reqCtx .Usage .CompletionTokens )
133
133
}
134
- if reqCtx .Streaming {
134
+ if reqCtx .modelServerStreaming {
135
135
logger .V (logutil .DEBUG ).Info ("Request context after HandleResponseBody" , "context" , reqCtx )
136
136
} else {
137
137
loggerVerbose .Info ("Request context after HandleResponseBody" , "context" , reqCtx )
@@ -149,7 +149,7 @@ func (s *Server) Process(srv extProcPb.ExternalProcessor_ProcessServer) error {
149
149
}
150
150
}
151
151
152
- if ! reqCtx .Streaming {
152
+ if ! reqCtx .modelServerStreaming {
153
153
loggerVerbose .Info ("Response generated" , "response" , resp )
154
154
} else {
155
155
logger .V (logutil .DEBUG ).Info ("Response generated" , "response" , resp )
@@ -224,9 +224,32 @@ type RequestContext struct {
224
224
RequestReceivedTimestamp time.Time
225
225
ResponseCompleteTimestamp time.Time
226
226
RequestSize int
227
- Response Response
227
+ Usage Usage
228
228
ResponseSize int
229
229
ResponseComplete bool
230
230
ResponseStatusCode string
231
- Streaming bool
231
+
232
+ RequestState StreamRequestState
233
+ modelServerStreaming bool
234
+
235
+ reqHeaderResp * extProcPb.ProcessingResponse
236
+ reqBodyResp * extProcPb.ProcessingResponse
237
+ reqTrailerResp * extProcPb.ProcessingResponse
238
+
239
+ respHeaderResp * extProcPb.ProcessingResponse
240
+ respBodyResp * extProcPb.ProcessingResponse
241
+ respTrailerResp * extProcPb.ProcessingResponse
232
242
}
243
+
244
// StreamRequestState identifies a stage in the handling of one streamed
// request. RequestContext.RequestState holds a value of this type.
type StreamRequestState int

// Stages of a streamed request, numbered 0 through 7 in declaration order.
// The numeric values match the earlier hand-assigned ones, so any ordered
// comparison between states behaves exactly as before.
//
// NOTE(review): judging by the names alone, the first four states cover the
// request direction (received, then header/body/trailer responses done) and
// the last four mirror that for the response direction. Confirm against the
// code that advances RequestContext.RequestState.
const (
	// RequestReceived is the zero value, and therefore the state of a
	// zero-valued RequestContext.
	RequestReceived StreamRequestState = iota
	// HeaderRequestResponseComplete has the value 1.
	HeaderRequestResponseComplete
	// BodyRequestResponsesComplete has the value 2.
	BodyRequestResponsesComplete
	// TrailerRequestResponsesComplete has the value 3.
	TrailerRequestResponsesComplete
	// ResponseReceived has the value 4. It is the correctly spelled
	// replacement for ResponseRecieved.
	ResponseReceived
	// HeaderResponseResponseComplete has the value 5.
	HeaderResponseResponseComplete
	// BodyResponseResponsesComplete has the value 6.
	BodyResponseResponsesComplete
	// TrailerResponseResponsesComplete has the value 7.
	TrailerResponseResponsesComplete
)

// ResponseRecieved is the original, misspelled name of ResponseReceived. It
// is kept with the same type and value so existing references still compile.
//
// Deprecated: use ResponseReceived.
const ResponseRecieved = ResponseReceived
0 commit comments