Bases: GPUModelRunner
Source code in vllm/v1/worker/cpu_model_runner.py
  
 __init__(vllm_config: VllmConfig, device: torch.device)
Source code in vllm/v1/worker/cpu_model_runner.py
  
    
 _may_reorder_batch(scheduler_output: SchedulerOutput) -> None
Source code in vllm/v1/worker/cpu_model_runner.py
   
  Source code in vllm/v1/worker/cpu_model_runner.py
  
    
    
    
 load_model(eep_scale_up: bool = False) -> None
Source code in vllm/v1/worker/cpu_model_runner.py
   
  Source code in vllm/v1/worker/cpu_model_runner.py
  
 _set_global_compilation_settings(config: VllmConfig)