diff --git a/tests/graph_optimization/test_cuda_graph_dynamic_subgraph.py b/tests/graph_optimization/test_cuda_graph_dynamic_subgraph.py index 98c7383f07b..b70c2f4d87b 100644 --- a/tests/graph_optimization/test_cuda_graph_dynamic_subgraph.py +++ b/tests/graph_optimization/test_cuda_graph_dynamic_subgraph.py @@ -161,7 +161,7 @@ def test_cuda_graph_subgraph(self): model_config = Mock() model_config.max_model_len = 512 # Initialize cuda graph capture list - graph_opt_config._set_cudagraph_sizes(max_num_seqs=scheduler_config.max_num_seqs) + graph_opt_config._set_cudagraph_sizes(max_capture_size=scheduler_config.max_num_seqs) graph_opt_config.init_with_cudagrpah_size(max_capture_size=scheduler_config.max_num_seqs) fd_config = FDConfig( graph_opt_config=graph_opt_config, diff --git a/tests/graph_optimization/test_cuda_graph_spec_decode.py b/tests/graph_optimization/test_cuda_graph_spec_decode.py index 40c32ca91ef..0e379b1501c 100644 --- a/tests/graph_optimization/test_cuda_graph_spec_decode.py +++ b/tests/graph_optimization/test_cuda_graph_spec_decode.py @@ -108,7 +108,7 @@ def test_cuda_graph_spec_decode(self): model_config = Mock() model_config.max_model_len = 512 # Initialize cuda graph capture list - graph_opt_config._set_cudagraph_sizes(max_num_seqs=scheduler_config.max_num_seqs) + graph_opt_config._set_cudagraph_sizes(max_capture_size=scheduler_config.max_num_seqs) graph_opt_config.init_with_cudagrpah_size(max_capture_size=scheduler_config.max_num_seqs) fd_config = FDConfig( graph_opt_config=graph_opt_config, diff --git a/tests/graph_optimization/test_static_graph_cuda_graph_split.py b/tests/graph_optimization/test_static_graph_cuda_graph_split.py index 4ccc34f0b1d..d8e22bbb042 100644 --- a/tests/graph_optimization/test_static_graph_cuda_graph_split.py +++ b/tests/graph_optimization/test_static_graph_cuda_graph_split.py @@ -91,7 +91,7 @@ def test(self): # Set FastDeploy config graph_opt_config = GraphOptimizationConfig({"use_cudagraph": True, "graph_opt_level": 1}) scheduler_config = SchedulerConfig({"max_num_seqs": 1}) - graph_opt_config._set_cudagraph_sizes(max_num_seqs=scheduler_config.max_num_seqs) + graph_opt_config._set_cudagraph_sizes(max_capture_size=scheduler_config.max_num_seqs) graph_opt_config.init_with_cudagrpah_size(max_capture_size=scheduler_config.max_num_seqs) cache_config = CacheConfig({}) parallel_config = ParallelConfig(args={})