|
3 | 3 | "test_name": "serving_llama8B_tp1_sharegpt", |
4 | 4 | "qps_list": [1, 4, 16, "inf"], |
5 | 5 | "server_parameters": { |
6 | | - "model": "meta-llama/Meta-Llama-3-8B", |
| 6 | + "model": "meta-llama/Meta-Llama-3.1-8B-Instruct", |
7 | 7 | "tensor_parallel_size": 1, |
8 | 8 | "swap_space": 16, |
9 | 9 | "disable_log_stats": "", |
10 | 10 | "disable_log_requests": "", |
11 | 11 | "load_format": "dummy" |
12 | 12 | }, |
13 | 13 | "client_parameters": { |
14 | | - "model": "meta-llama/Meta-Llama-3-8B", |
| 14 | + "model": "meta-llama/Meta-Llama-3.1-8B-Instruct", |
15 | 15 | "backend": "vllm", |
16 | 16 | "dataset_name": "sharegpt", |
17 | 17 | "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", |
|
22 | 22 | "test_name": "serving_llama70B_tp4_sharegpt", |
23 | 23 | "qps_list": [1, 4, 16, "inf"], |
24 | 24 | "server_parameters": { |
25 | | - "model": "meta-llama/Meta-Llama-3-70B-Instruct", |
| 25 | + "model": "meta-llama/Meta-Llama-3.1-70B-Instruct", |
26 | 26 | "tensor_parallel_size": 4, |
27 | 27 | "swap_space": 16, |
28 | 28 | "disable_log_stats": "", |
29 | 29 | "disable_log_requests": "", |
30 | 30 | "load_format": "dummy" |
31 | 31 | }, |
32 | 32 | "client_parameters": { |
33 | | - "model": "meta-llama/Meta-Llama-3-70B-Instruct", |
| 33 | + "model": "meta-llama/Meta-Llama-3.1-70B-Instruct", |
34 | 34 | "backend": "vllm", |
35 | 35 | "dataset_name": "sharegpt", |
36 | 36 | "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", |
|
60 | 60 | "test_name": "serving_llama70B_tp4_sharegpt_specdecode", |
61 | 61 | "qps_list": [2], |
62 | 62 | "server_parameters": { |
63 | | - "model": "meta-llama/Meta-Llama-3-70B-Instruct", |
| 63 | + "model": "meta-llama/Meta-Llama-3.1-70B-Instruct", |
64 | 64 | "disable_log_requests": "", |
65 | 65 | "tensor_parallel_size": 4, |
66 | 66 | "swap_space": 16, |
|
70 | 70 | "use_v2_block_manager": "" |
71 | 71 | }, |
72 | 72 | "client_parameters": { |
73 | | - "model": "meta-llama/Meta-Llama-3-70B-Instruct", |
| 73 | + "model": "meta-llama/Meta-Llama-3.1-70B-Instruct", |
74 | 74 | "backend": "vllm", |
75 | 75 | "dataset_name": "sharegpt", |
76 | 76 | "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", |
|
0 commit comments