Skip to content

Commit dc93b6b

Browse files
committed
Make benchmark_serving part of the library
Signed-off-by: Kaiyu Xie <[email protected]>
1 parent b3a4c1f commit dc93b6b

File tree

3 files changed: 12 additions and 10 deletions.

tensorrt_llm/serve/scripts/__init__.py

Whitespace-only changes.

tensorrt_llm/serve/scripts/benchmark_dataset.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,10 +26,11 @@
 
 import numpy as np
 import pandas as pd
-from benchmark_utils import download_and_cache_file
 from datasets import load_dataset
 from transformers import PreTrainedTokenizerBase
 
+from .benchmark_utils import download_and_cache_file
+
 logger = logging.getLogger(__name__)
 
 # -----------------------------------------------------------------------------

tensorrt_llm/serve/scripts/benchmark_serving.py

Lines changed: 10 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -31,18 +31,19 @@
 from typing import Any, Optional
 
 import numpy as np
-from backend_request_func import (ASYNC_REQUEST_FUNCS,
-                                  OPENAI_COMPATIBLE_BACKENDS, RequestFuncInput,
-                                  RequestFuncOutput, get_tokenizer)
-from benchmark_dataset import (AIMODataset, BurstGPTDataset,
-                               ConversationDataset, HuggingFaceDataset,
-                               InstructCoderDataset, RandomDataset,
-                               SampleRequest, ShareGPTDataset, SonnetDataset,
-                               VisionArenaDataset)
-from benchmark_utils import convert_to_pytorch_benchmark_format, write_to_json
 from tqdm.asyncio import tqdm
 from transformers import PreTrainedTokenizerBase
 
+from .backend_request_func import (ASYNC_REQUEST_FUNCS,
+                                   OPENAI_COMPATIBLE_BACKENDS, RequestFuncInput,
+                                   RequestFuncOutput, get_tokenizer)
+from .benchmark_dataset import (AIMODataset, BurstGPTDataset,
+                                ConversationDataset, HuggingFaceDataset,
+                                InstructCoderDataset, RandomDataset,
+                                SampleRequest, ShareGPTDataset, SonnetDataset,
+                                VisionArenaDataset)
+from .benchmark_utils import convert_to_pytorch_benchmark_format, write_to_json
+
 MILLISECONDS_TO_SECONDS_CONVERSION = 1000
 
 
0 commit comments

Comments
 (0)