diff --git a/vllm/model_executor/model_loader/neuron.py b/vllm/model_executor/model_loader/neuron.py index a9f1e6e88d792..a90fbd648def9 100644 --- a/vllm/model_executor/model_loader/neuron.py +++ b/vllm/model_executor/model_loader/neuron.py @@ -37,7 +37,7 @@ } -class NeuronCasualLM(nn.Module): +class NeuronCausalLM(nn.Module): def __init__(self, config: PretrainedConfig, @@ -184,7 +184,7 @@ def get_neuron_model(model_config: ModelConfig, scheduler_config: SchedulerConfig) -> nn.Module: # Create a model instance. - model = NeuronCasualLM( + model = NeuronCausalLM( model_config.hf_config, _is_neuron_on_device_sampling_disabled(model_config)) diff --git a/vllm/model_executor/model_loader/openvino.py b/vllm/model_executor/model_loader/openvino.py index 8ada2210d0d51..573f2a04895d9 100644 --- a/vllm/model_executor/model_loader/openvino.py +++ b/vllm/model_executor/model_loader/openvino.py @@ -95,7 +95,7 @@ def _require_model_export(model_id, revision=None, subfolder=None): return True -class OpenVINOCasualLM(nn.Module): +class OpenVINOCausalLM(nn.Module): def __init__( self, @@ -199,5 +199,5 @@ def get_model( "be added in the future. If this is important to you, " "please open an issue on github.") - return OpenVINOCasualLM(ov_core, model_config, device_config, + return OpenVINOCausalLM(ov_core, model_config, device_config, kv_cache_dtype)