3 files changed: +16 -1 lines changed
Original file line number | Diff line number | Diff line change
@@ -88,6 +88,9 @@ async def handle_request(
8888 """Handle the specific request type with common pattern
8989 If you want to override this method, you should be careful to record the validation time.
9090 """
91+ received_time = time .time ()
92+ received_time_perf = time .perf_counter ()
93+
9194 try :
9295 # Validate request
9396 validation_start = time .perf_counter ()
@@ -103,6 +106,12 @@ async def handle_request(
103106 if hasattr (adapted_request , "validation_time" ):
104107 adapted_request .validation_time = validation_time
105108
109+ if hasattr (adapted_request , "received_time" ):
110+ adapted_request .received_time = received_time
111+
112+ if hasattr (adapted_request , "received_time_perf" ):
113+ adapted_request .received_time_perf = received_time_perf
114+
106115 # Note(Xinyuan): raw_request below is only used for detecting the connection of the client
107116 if hasattr (request , "stream" ) and request .stream :
108117 return await self ._handle_streaming_request (
Original file line number | Diff line number | Diff line change
@@ -204,6 +204,12 @@ class GenerateReqInput(BaseReq):
204204 # Validation step duration
205205 validation_time : Optional [float ] = None
206206
207+ # Wall-clock time (time.time()) at which the request was received; used for metrics
208+ received_time : Optional [float ] = None
209+
210+ # time.perf_counter() reading taken alongside received_time, for accurate interval calculations
211+ received_time_perf : Optional [float ] = None
212+
207213 # For data parallel rank routing
208214 data_parallel_rank : Optional [int ] = None
209215
Original file line number | Diff line number | Diff line change
@@ -431,7 +431,7 @@ async def generate_request(
431431 obj : Union [GenerateReqInput , EmbeddingReqInput ],
432432 request : Optional [fastapi .Request ] = None ,
433433 ):
434- created_time = time .time ()
434+ created_time = obj . received_time if obj . received_time else time .time ()
435435 self .auto_create_handle_loop ()
436436 obj .normalize_batch_and_arguments ()
437437
You can’t perform that action at this time.
0 commit comments