@@ -409,9 +409,7 @@ class EngineArgs:
409409 get_field (LoadConfig , "model_loader_extra_config" )
410410 ignore_patterns : Optional [Union [str ,
411411 List [str ]]] = LoadConfig .ignore_patterns
412- preemption_mode : Optional [str ] = SchedulerConfig .preemption_mode
413412
414- scheduler_delay_factor : float = SchedulerConfig .delay_factor
415413 enable_chunked_prefill : Optional [
416414 bool ] = SchedulerConfig .enable_chunked_prefill
417415 disable_chunked_mm_input : bool = SchedulerConfig .disable_chunked_mm_input
@@ -439,7 +437,6 @@ class EngineArgs:
439437 ObservabilityConfig .otlp_traces_endpoint
440438 collect_detailed_traces : Optional [list [DetailedTraceModules ]] = \
441439 ObservabilityConfig .collect_detailed_traces
442- disable_async_output_proc : bool = not ModelConfig .use_async_output_proc
443440 scheduling_policy : SchedulerPolicy = SchedulerConfig .policy
444441 scheduler_cls : Union [str , Type [object ]] = SchedulerConfig .scheduler_cls
445442
@@ -561,14 +558,6 @@ def add_cli_args(parser: FlexibleArgumentParser) -> FlexibleArgumentParser:
561558 ** model_kwargs ["enable_prompt_embeds" ])
562559 model_group .add_argument ("--served-model-name" ,
563560 ** model_kwargs ["served_model_name" ])
564- # This one is a special case because it is the
565- # opposite of ModelConfig.use_async_output_proc
566- model_group .add_argument (
567- "--disable-async-output-proc" ,
568- action = "store_true" ,
569- default = EngineArgs .disable_async_output_proc ,
570- help = "Disable async output processing. This may result in "
571- "lower performance." )
572561 model_group .add_argument ("--config-format" ,
573562 ** model_kwargs ["config_format" ])
574563 # This one is a special case because it can bool
@@ -897,10 +886,6 @@ def add_cli_args(parser: FlexibleArgumentParser) -> FlexibleArgumentParser:
897886 ** scheduler_kwargs ["long_prefill_token_threshold" ])
898887 scheduler_group .add_argument ("--num-lookahead-slots" ,
899888 ** scheduler_kwargs ["num_lookahead_slots" ])
900- scheduler_group .add_argument ("--scheduler-delay-factor" ,
901- ** scheduler_kwargs ["delay_factor" ])
902- scheduler_group .add_argument ("--preemption-mode" ,
903- ** scheduler_kwargs ["preemption_mode" ])
904889 # multi-step scheduling has been removed; corresponding arguments
905890 # are no longer supported.
906891 scheduler_group .add_argument ("--scheduling-policy" ,
@@ -1029,7 +1014,6 @@ def create_model_config(self) -> ModelConfig:
10291014 interleave_mm_strings = self .interleave_mm_strings ,
10301015 media_io_kwargs = self .media_io_kwargs ,
10311016 skip_mm_profiling = self .skip_mm_profiling ,
1032- use_async_output_proc = not self .disable_async_output_proc ,
10331017 config_format = self .config_format ,
10341018 mm_processor_kwargs = self .mm_processor_kwargs ,
10351019 mm_processor_cache_gb = self .mm_processor_cache_gb ,
@@ -1395,11 +1379,9 @@ def create_engine_config(
13951379 max_model_len = model_config .max_model_len ,
13961380 cuda_graph_sizes = self .cuda_graph_sizes ,
13971381 num_lookahead_slots = num_lookahead_slots ,
1398- delay_factor = self .scheduler_delay_factor ,
13991382 enable_chunked_prefill = self .enable_chunked_prefill ,
14001383 disable_chunked_mm_input = self .disable_chunked_mm_input ,
14011384 is_multimodal_model = model_config .is_multimodal_model ,
1402- preemption_mode = self .preemption_mode ,
14031385 send_delta_data = (envs .VLLM_USE_RAY_SPMD_WORKER
14041386 and parallel_config .use_ray ),
14051387 policy = self .scheduling_policy ,
@@ -1492,22 +1474,6 @@ def _is_v1_supported_oracle(self, model_config: ModelConfig) -> bool:
14921474 recommend_to_remove = False )
14931475 return False
14941476
1495- if self .preemption_mode != SchedulerConfig .preemption_mode :
1496- _raise_or_fallback (feature_name = "--preemption-mode" ,
1497- recommend_to_remove = True )
1498- return False
1499-
1500- if (self .disable_async_output_proc
1501- != EngineArgs .disable_async_output_proc ):
1502- _raise_or_fallback (feature_name = "--disable-async-output-proc" ,
1503- recommend_to_remove = True )
1504- return False
1505-
1506- if self .scheduler_delay_factor != SchedulerConfig .delay_factor :
1507- _raise_or_fallback (feature_name = "--scheduler-delay-factor" ,
1508- recommend_to_remove = True )
1509- return False
1510-
15111477 # No Mamba or Encoder-Decoder so far.
15121478 if not model_config .is_v1_compatible :
15131479 _raise_or_fallback (feature_name = model_config .architectures ,
0 commit comments