@@ -82,7 +82,7 @@ def _parse_log_file(self, filename):
8282
8383 return json .loads (json_string )
8484
85- def _parse_triton_metrics (self , filename , is_v1 ):
85+ def _parse_triton_metrics (self , filename ):
8686 curl_counts = {}
8787 with open (filename ) as metrics_file :
8888 for line in metrics_file :
@@ -91,12 +91,11 @@ def _parse_triton_metrics(self, filename, is_v1):
9191 metric_output = re .sub (r"^.*?{" , "{" , line ).split ()
9292 metric_key = metric_output [0 ]
9393 metric_value = metric_output [1 ]
94- key = self ._convert_metric_key_to_stats_key (
95- metric_key , is_v1 )
94+ key = self ._convert_metric_key_to_stats_key (metric_key )
9695 curl_counts [key ] = metric_value
9796 return curl_counts
9897
99- def _convert_metric_key_to_stats_key (self , metric_output , is_v1 ):
98+ def _convert_metric_key_to_stats_key (self , metric_output ):
10099 # Converts:
101100 # '{model="tensorrt_llm",request_type="context",version="1"}'
102101 # to:
@@ -107,15 +106,12 @@ def _convert_metric_key_to_stats_key(self, metric_output, is_v1):
107106 if not i .startswith ('model' ) and not i .startswith ('version' )
108107 ][0 ]
109108 self .assertIn (key , metric_to_stat_dict )
110- if (is_v1 ):
111- self .assertNotIn ("inflight_batcher_specific_metric" , key )
112- else :
113- self .assertNotIn ("v1_specific_metric" , key )
109+ self .assertNotIn ("v1_specific_metric" , key )
114110 return metric_to_stat_dict [key ]
115111
116- def _base_test (self , stats_file , metrics_file , is_v1 ):
112+ def _base_test (self , stats_file , metrics_file ):
117113 stats = self ._parse_log_file (stats_file )
118- metrics = self ._parse_triton_metrics (metrics_file , is_v1 )
114+ metrics = self ._parse_triton_metrics (metrics_file )
119115 self .assertEqual (len (stats .keys ()), len (metrics .keys ()))
120116 self .assertEqual (list (stats .keys ()).sort (), list (metrics .keys ()).sort ())
121117 for metric_key in stats .keys ():
@@ -140,45 +136,33 @@ def _base_test(self, stats_file, metrics_file, is_v1):
140136 timedelta (seconds = - 1 ) <= difference , difference
141137 <= timedelta (seconds = 1 ))
142138
143- def test_1_gpu_v1 (self ):
144- self ._base_test ("1gpu_v1_no_streaming_server.log" ,
145- "1gpu_v1_no_stream_metrics.out" , True )
146-
147139 def test_1_gpu_IFB_no_stream (self ):
148140 self ._base_test ("1gpu_IFB_no_streaming_server.log" ,
149- "1gpu_IFB_no_stream_metrics.out" , False )
141+ "1gpu_IFB_no_stream_metrics.out" )
150142
151143 def test_1_gpu_IFB_stream (self ):
152144 self ._base_test ("1gpu_IFB_streaming_server.log" ,
153- "1gpu_IFB_stream_metrics.out" , False )
145+ "1gpu_IFB_stream_metrics.out" )
154146
155147 if AVAILABLE_GPUS >= 2 :
156148
157- def test_2_gpu_v1 (self ):
158- self ._base_test ("2gpu_v1_no_streaming_server.log" ,
159- "2gpu_v1_no_stream_metrics.out" , True )
160-
161149 def test_2_gpu_IFB_no_stream (self ):
162150 self ._base_test ("2gpu_IFB_no_streaming_server.log" ,
163- "2gpu_IFB_no_stream_metrics.out" , False )
151+ "2gpu_IFB_no_stream_metrics.out" )
164152
165153 def test_2_gpu_IFB_stream (self ):
166154 self ._base_test ("2gpu_IFB_streaming_server.log" ,
167- "2gpu_IFB_stream_metrics.out" , False )
155+ "2gpu_IFB_stream_metrics.out" )
168156
169157 if AVAILABLE_GPUS >= 4 :
170158
171- def test_4_gpu_v1 (self ):
172- self ._base_test ("4gpu_v1_no_streaming_server.log" ,
173- "4gpu_v1_no_stream_metrics.out" , True )
174-
175159 def test_4_gpu_IFB_no_stream (self ):
176160 self ._base_test ("4gpu_IFB_no_streaming_server.log" ,
177- "4gpu_IFB_no_stream_metrics.out" , False )
161+ "4gpu_IFB_no_stream_metrics.out" )
178162
179163 def test_4_gpu_IFB_stream (self ):
180164 self ._base_test ("4gpu_IFB_streaming_server.log" ,
181- "4gpu_IFB_stream_metrics.out" , False )
165+ "4gpu_IFB_stream_metrics.out" )
182166
183167
184168if __name__ == "__main__" :
0 commit comments