root@llm-test-f9dfff4cb-hgjsf:/workspace/pytorch/vllm-0.7.2# python3 benchmarks/benchmark_serving.py --backend vllm --model /mnt/DeepSeek-R1-bf16 --dataset-name random --host 0.0.0.0 --port 8000 --served_model_name DeepSeek-R1-bf16 --num-prompts 500 --max-concurrency 1
Namespace(backend='vllm', base_url=None, host='0.0.0.0', port=8000, endpoint='/v1/chat/completions', dataset=None, dataset_name='random', dataset_path=None, max_concurrency=1, model='/mnt/DeepSeek-R1-bf16', tokenizer=None, best_of=1, use_beam_search=False, num_prompts=500, logprobs=None, request_rate=inf, burstiness=1.0, seed=0, trust_remote_code=False, disable_tqdm=False, profile=False, save_result=False, metadata=None, result_dir=None, result_filename=None, ignore_eos=False, percentile_metrics='ttft,tpot,itl', metric_percentiles='99', goodput=None, sonnet_input_len=550, sonnet_output_len=150, sonnet_prefix_len=200, sharegpt_output_len=None, random_input_len=1024, random_output_len=128, random_range_ratio=1.0, random_prefix_len=0, hf_subset=None, hf_split=None, hf_output_len=None, tokenizer_mode='auto', served_model_name='DeepSeek-R1-bf16')
Starting initial single prompt test run...
Traceback (most recent call last):
File "/workspace/pytorch/vllm-0.7.2/benchmarks/benchmark_serving.py", line 1241, in <module>
main(args)
File "/workspace/pytorch/vllm-0.7.2/benchmarks/benchmark_serving.py", line 881, in main
benchmark_result = asyncio.run(
File "/usr/local/lib/python3.10/asyncio/runners.py", line 44, in run
return loop.run_until_complete(main)
File "/usr/local/lib/python3.10/asyncio/base_events.py", line 649, in run_until_complete
return future.result()
File "/workspace/pytorch/vllm-0.7.2/benchmarks/benchmark_serving.py", line 567, in benchmark
raise ValueError(
ValueError: Initial test run failed - Please make sure benchmark arguments are correctly specified. Error: Bad Request

Explain this error.
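
The traceback only reports that the initial single-prompt request came back with HTTP 400 (Bad Request); benchmark_serving.py does not print the server's response body, which usually names the rejected field (a common mismatch is a "model" value the server does not serve, or a payload whose shape does not fit the endpoint it is posted to). A minimal diagnostic sketch, assuming the server exposes the OpenAI-compatible chat API at the host/port from the command above and that the requests library is installed, is to replay one request by hand and print the body:

# diagnostic sketch (assumptions: OpenAI-compatible chat API at 0.0.0.0:8000,
# served model name "DeepSeek-R1-bf16" as passed via --served_model_name)
import requests

url = "http://0.0.0.0:8000/v1/chat/completions"
payload = {
    "model": "DeepSeek-R1-bf16",
    "messages": [{"role": "user", "content": "ping"}],
    "max_tokens": 8,
}

resp = requests.post(url, json=payload, timeout=60)
print(resp.status_code)  # a 400 here reproduces the benchmark's "Bad Request"
print(resp.text)         # the JSON error body usually says which field was rejected

If this direct request succeeds, the next things to compare are the endpoint the benchmark posts to (--endpoint, shown as /v1/chat/completions in the Namespace) and the payload shape generated by the chosen --backend, since a completions-style "prompt" payload will be rejected by the chat-completions endpoint.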