# Serving configuration: one setting per line, block style.

# Output parsers; both are set to the same ernie-x1 parser name.
# NOTE(review): `reasoning-parser` is hyphenated while every other key in this
# file uses underscores — confirm the consumer accepts this spelling.
reasoning-parser: ernie-x1
tool_call_parser: ernie-x1

# Parallelism and sequence limits.
# Presumably the number of devices the model is sharded across — TODO confirm.
tensor_parallel_size: 4
# Presumably the maximum context length in tokens (65536 = 64 * 1024) — TODO confirm.
max_model_len: 65536
# Presumably the cap on concurrently scheduled sequences — TODO confirm.
max_num_seqs: 128

# Feature toggles.
enable_prefix_caching: true
enable_chunked_prefill: true

# Presumably the fraction of GPU memory the engine may use — TODO confirm.
gpu_memory_utilization: 0.85

# Nested graph-optimization settings; `use_cudagraph` is a child of this key.
graph_optimization_config:
  use_cudagraph: true