diff --git a/ads/aqua/modeldeployment/deployment.py b/ads/aqua/modeldeployment/deployment.py index e6ba00a93..25f528925 100644 --- a/ads/aqua/modeldeployment/deployment.py +++ b/ads/aqua/modeldeployment/deployment.py @@ -563,7 +563,16 @@ def _create( params = f"{params} {deployment_params}".strip() - if create_deployment_details.model_name: + if ( + container_type_key.lower() + in [ + InferenceContainerTypeFamily.AQUA_VLLM_CONTAINER_FAMILY, + InferenceContainerTypeFamily.AQUA_VLLM_V1_CONTAINER_FAMILY, + InferenceContainerTypeFamily.AQUA_VLLM_LLAMA4_CONTAINER_FAMILY, + InferenceContainerTypeFamily.AQUA_VLLM_OPENAI_CONTAINER_FAMILY, + ] + and create_deployment_details.model_name + ): # Replace existing --served-model-name argument if present, otherwise add it if "--served-model-name" in params: params = re.sub(