
[ML] allow model_aliases to be used with Pytorch trained models (#91296)

This adds `model_alias` support for native PyTorch models.

Model aliases can be used in `_infer` calls or within the inference processor. This way the alias can be switched atomically to another deployed model without downtime (see the example sketch below).

Restrictions:
 - Model alias changes must be made between two models of the same kind (e.g. pytorch -> pytorch).
 - A model alias cannot be moved from a deployed model to a model that is not deployed.
 - A model alias cannot be moved from a model that is deployed AND allocated to a model that is deployed but NOT allocated (not assigned to any nodes).
 - A deployment cannot be stopped (without supplying the `force` parameter) when the model has a model alias that is referenced by an ingest pipeline.


closes: https://github.com/elastic/elasticsearch/issues/90960
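To make the workflow concrete, here is a minimal request sketch under assumed names (the model IDs, the alias `my_ner_model`, and the `text_field` input field are hypothetical; the endpoints are the existing trained-model alias and `_infer` APIs):

    PUT _ml/trained_models/my-ner-model-v1/model_aliases/my_ner_model

    POST _ml/trained_models/my_ner_model/_infer
    {
      "docs": [{ "text_field": "my words" }]
    }

    PUT _ml/trained_models/my-ner-model-v2/model_aliases/my_ner_model?reassign=true

After the final call, `_infer` requests and ingest pipelines that reference `my_ner_model` resolve to `my-ner-model-v2` without any pipeline changes, provided `my-ner-model-v2` satisfies the restrictions above.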
Benjamin Trent 3 years ago
parent commit 2e8bf33b0a
15 changed files with 227 additions and 61 deletions
  1. docs/changelog/91296.yaml (+5, -0)
  2. docs/reference/ml/trained-models/apis/infer-trained-model-deployment.asciidoc (+1, -1)
  3. docs/reference/ml/trained-models/apis/infer-trained-model.asciidoc (+6, -6)
  4. docs/reference/ml/trained-models/apis/put-trained-models-aliases.asciidoc (+12, -5)
  5. docs/reference/ml/trained-models/apis/stop-trained-model-deployment.asciidoc (+3, -3)
  6. x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/action/InferTrainedModelDeploymentAction.java (+5, -1)
  7. x-pack/plugin/ml/qa/native-multi-node-tests/src/javaRestTest/java/org/elasticsearch/xpack/ml/integration/PyTorchModelIT.java (+68, -0)
  8. x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportDeleteTrainedModelAction.java (+1, -1)
  9. x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInferTrainedModelDeploymentAction.java (+15, -7)
  10. x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInternalInferModelAction.java (+10, -4)
  11. x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportPutTrainedModelAliasAction.java (+69, -4)
  12. x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportStopTrainedModelDeploymentAction.java (+27, -9)
  13. x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ModelAliasMetadata.java (+5, -0)
  14. x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/ml/3rd_party_deployment.yml (+0, -0)
  15. x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/ml/inference_crud.yml (+0, -20)

+ 5 - 0
docs/changelog/91296.yaml

@@ -0,0 +1,5 @@
+pr: 91296
+summary: Allow `model_aliases` to be used with Pytorch trained models
+area: Machine Learning
+type: enhancement
+issues: []

+ 1 - 1
docs/reference/ml/trained-models/apis/infer-trained-model-deployment.asciidoc

@@ -31,7 +31,7 @@ deprecated::[8.3.0,Replaced by <<infer-trained-model>>.]
 
 `<model_id>`::
 (Required, string)
-include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=model-id]
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=model-id-or-alias]
 
 [[infer-trained-model-deployment-query-params]]
 == {api-query-parms-title}

+ 6 - 6
docs/reference/ml/trained-models/apis/infer-trained-model.asciidoc

@@ -31,7 +31,7 @@ beta::[]
 
 `<model_id>`::
 (Required, string)
-include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=model-id]
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=model-id-or-alias]
 
 [[infer-trained-model-query-params]]
 == {api-query-parms-title}
@@ -629,7 +629,7 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenizati
 
 The response depends on the kind of model.
 
-For example, for {lang-ident} the response is the predicted language and the 
+For example, for {lang-ident} the response is the predicted language and the
 score:
 
 [source,console]
@@ -658,7 +658,7 @@ Here are the results predicting english with a high probability.
 // NOTCONSOLE
 
 
-When it is a text classification model, the response is the score and predicted 
+When it is a text classification model, the response is the score and predicted
 classification.
 
 For example:
@@ -822,8 +822,8 @@ The API returns a response similar to the following:
 ----
 // NOTCONSOLE
 
-Text similarity models require at least two sequences of text to compare. It's 
-possible to provide multiple strings of text to compare to another text 
+Text similarity models require at least two sequences of text to compare. It's
+possible to provide multiple strings of text to compare to another text
 sequence:
 
 [source,console]
@@ -840,7 +840,7 @@ POST _ml/trained_models/cross-encoder__ms-marco-tinybert-l-2-v2/_infer
 --------------------------------------------------
 // TEST[skip:TBD]
 
-The response contains the prediction for every string that is compared to the 
+The response contains the prediction for every string that is compared to the
 text provided in the `text_similarity`.`text` field:
 
 [source,console-result]

+ 12 - 5
docs/reference/ml/trained-models/apis/put-trained-models-aliases.asciidoc

@@ -20,7 +20,7 @@ A trained model alias is a logical name used to reference a single trained model
 [[ml-put-trained-models-aliases-prereq]]
 == {api-prereq-title}
 
-Requires the `manage_ml` cluster privilege. This privilege is included in the 
+Requires the `manage_ml` cluster privilege. This privilege is included in the
 `machine_learning_admin` built-in role.
 
 
@@ -34,11 +34,18 @@ and processors.
 An alias must be unique and refer to only a single trained model. However,
 you can have multiple aliases for each trained model.
 
-If you use this API to update an alias such that it references a different
-trained model ID and the model uses a different type of {dfanalytics}, an error
-occurs. For example, this situation occurs if you have a trained model for
+API Restrictions:
++
+--
+* You are not allowed to update an alias such that it references a different
+trained model ID and the model uses a different type of {dfanalytics}. For example,
+this situation occurs if you have a trained model for
 {reganalysis} and a trained model for {classanalysis}; you cannot reassign an
 alias from one type of trained model to another.
+* You cannot update an alias between a `pytorch` model and a {dfanalytics} model.
+* You cannot update the alias from a deployed `pytorch` model to one
+not currently deployed.
+--
 
 If you use this API to update an alias and there are very few input fields in
 common between the old and new trained models for the model alias, the API
@@ -62,7 +69,7 @@ The identifier for the trained model that the alias refers to.
 (Optional, boolean)
 Specifies whether the alias gets reassigned to the specified trained model if it
 is already assigned to a different model. If the alias is already assigned and
-this parameter is `false`, the API returns an error. Defaults to `false`. 
+this parameter is `false`, the API returns an error. Defaults to `false`.
 
 [[ml-put-trained-models-aliases-example]]
 == {api-examples-title}
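For reference, the call governed by the restrictions documented above is the existing alias endpoint; a minimal sketch with a hypothetical model ID and alias:

    PUT _ml/trained_models/my-pytorch-model-v2/model_aliases/my_model_alias?reassign=true

With this change, the request is rejected with a 400 if it would move the alias across model types, or from a deployed `pytorch` model to one that is not deployed.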

+ 3 - 3
docs/reference/ml/trained-models/apis/stop-trained-model-deployment.asciidoc

@@ -18,7 +18,7 @@ beta::[]
 [[stop-trained-model-deployment-prereq]]
 == {api-prereq-title}
 
-Requires the `manage_ml` cluster privilege. This privilege is included in the 
+Requires the `manage_ml` cluster privilege. This privilege is included in the
 `machine_learning_admin` built-in role.
 
 [[stop-trained-model-deployment-desc]]
@@ -42,8 +42,8 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=model-id]
 include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=allow-no-match-deployments]
 
 `force`::
-(Optional, Boolean) If true, the deployment is stopped even if it is referenced
-by ingest pipelines. You can't use these pipelines until you restart the model
+(Optional, Boolean) If true, the deployment is stopped even if it or one of its model aliases
+is referenced by ingest pipelines. You can't use these pipelines until you restart the model
 deployment.
 
 ////
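A minimal sketch of the force-stop path described above, using a hypothetical model ID (the endpoint is the existing stop-deployment API):

    POST _ml/trained_models/my-pytorch-model/deployment/_stop?force=true

Without `force=true`, the call now returns a 409 conflict when the deployment's model ID, or any model alias pointing at it, is still referenced by an ingest pipeline.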

+ 5 - 1
x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/action/InferTrainedModelDeploymentAction.java

@@ -86,7 +86,7 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             return builder;
         }
 
-        private final String modelId;
+        private String modelId;
         private final List<Map<String, Object>> docs;
         private final InferenceConfigUpdate update;
         private final TimeValue inferenceTimeout;
@@ -165,6 +165,10 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             return inferenceTimeout == null ? DEFAULT_TIMEOUT : inferenceTimeout;
         }
 
+        public void setModelId(String modelId) {
+            this.modelId = modelId;
+        }
+
         /**
          * This is always null as we want the inference call to handle the timeout, not the tasks framework
          * @return null

+ 68 - 0
x-pack/plugin/ml/qa/native-multi-node-tests/src/javaRestTest/java/org/elasticsearch/xpack/ml/integration/PyTorchModelIT.java

@@ -585,6 +585,74 @@ public class PyTorchModelIT extends PyTorchModelRestTestCase {
         stopDeployment(modelId, true);
     }
 
+    public void testStopWithModelAliasUsedDeploymentByIngestProcessor() throws IOException {
+        String modelId = "test_stop_model_alias_used_deployment_by_ingest_processor";
+        String modelAlias = "used_model_alias";
+        createPassThroughModel(modelId);
+        putModelDefinition(modelId);
+        putVocabulary(List.of("these", "are", "my", "words"), modelId);
+        startDeployment(modelId);
+        client().performRequest(new Request("PUT", formatted("_ml/trained_models/%s/model_aliases/%s", modelId, modelAlias)));
+
+        client().performRequest(putPipeline("my_pipeline", formatted("""
+            {
+              "processors": [
+                {
+                  "inference": {
+                    "model_id": "%s"
+                  }
+                }
+              ]
+            }""", modelAlias)));
+        ResponseException ex = expectThrows(ResponseException.class, () -> stopDeployment(modelId));
+        assertThat(ex.getResponse().getStatusLine().getStatusCode(), equalTo(409));
+        assertThat(
+            EntityUtils.toString(ex.getResponse().getEntity()),
+            containsString(
+                "Cannot stop deployment for model [test_stop_model_alias_used_deployment_by_ingest_processor] as it has a "
+                    + "model_alias [used_model_alias] that is still referenced"
+                    + " by ingest processors; use force to stop the deployment"
+            )
+        );
+        stopDeployment(modelId, true);
+    }
+
+    public void testInferenceProcessorWithModelAlias() throws IOException {
+        String modelId = "test_model_alias_infer";
+        String modelAlias = "pytorch_model_alias";
+        createPassThroughModel(modelId);
+        putModelDefinition(modelId);
+        putVocabulary(List.of("these", "are", "my", "words"), modelId);
+        startDeployment(modelId);
+        client().performRequest(new Request("PUT", formatted("_ml/trained_models/%s/model_aliases/%s", modelId, modelAlias)));
+
+        String source = formatted("""
+            {
+              "pipeline": {
+                "processors": [
+                  {
+                    "inference": {
+                      "model_id": "%s"
+                    }
+                  }
+                ]
+              },
+              "docs": [
+                {"_source": {"input": "my words"}}]
+            }
+            """, modelAlias);
+
+        String response = EntityUtils.toString(client().performRequest(simulateRequest(source)).getEntity());
+        assertThat(
+            response,
+            allOf(
+                containsString("\"ml\":{\"inference\":{\"predicted_value\":[[1.0,1.0]]"),
+                containsString(modelId),
+                not(containsString("warning"))
+            )
+        );
+    }
+
     public void testPipelineWithBadProcessor() throws IOException {
         String model = "deployed";
         createPassThroughModel(model);

+ 1 - 1
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportDeleteTrainedModelAction.java

@@ -186,7 +186,7 @@ public class TransportDeleteTrainedModelAction extends AcknowledgedTransportMast
         return allReferencedModelKeys;
     }
 
-    private static List<String> getModelAliases(ClusterState clusterState, String modelId) {
+    static List<String> getModelAliases(ClusterState clusterState, String modelId) {
         final ModelAliasMetadata currentMetadata = ModelAliasMetadata.fromState(clusterState);
         final List<String> modelAliases = new ArrayList<>();
         for (Map.Entry<String, ModelAliasMetadata.ModelAliasEntry> modelAliasEntry : currentMetadata.modelAliases().entrySet()) {

+ 15 - 7
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInferTrainedModelDeploymentAction.java

@@ -29,12 +29,14 @@ import org.elasticsearch.xpack.core.ml.inference.TrainedModelType;
 import org.elasticsearch.xpack.core.ml.inference.assignment.AssignmentState;
 import org.elasticsearch.xpack.core.ml.inference.assignment.TrainedModelAssignment;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
+import org.elasticsearch.xpack.ml.inference.ModelAliasMetadata;
 import org.elasticsearch.xpack.ml.inference.assignment.TrainedModelAssignmentMetadata;
 import org.elasticsearch.xpack.ml.inference.deployment.NlpInferenceInput;
 import org.elasticsearch.xpack.ml.inference.deployment.TrainedModelDeploymentTask;
 import org.elasticsearch.xpack.ml.inference.persistence.TrainedModelProvider;
 
 import java.util.List;
+import java.util.Optional;
 
 import static org.elasticsearch.core.Strings.format;
 
@@ -75,14 +77,18 @@ public class TransportInferTrainedModelDeploymentAction extends TransportTasksAc
         ActionListener<InferTrainedModelDeploymentAction.Response> listener
     ) {
         TaskId taskId = new TaskId(clusterService.localNode().getId(), task.getId());
-        final String modelId = request.getModelId();
+        // Update the requests model ID if it's an alias
+        Optional.ofNullable(ModelAliasMetadata.fromState(clusterService.state()).getModelId(request.getModelId()))
+            .ifPresent(request::setModelId);
         // We need to check whether there is at least an assigned task here, otherwise we cannot redirect to the
         // node running the job task.
-        TrainedModelAssignment assignment = TrainedModelAssignmentMetadata.assignmentForModelId(clusterService.state(), modelId)
-            .orElse(null);
+        TrainedModelAssignment assignment = TrainedModelAssignmentMetadata.assignmentForModelId(
+            clusterService.state(),
+            request.getModelId()
+        ).orElse(null);
         if (assignment == null) {
             // If there is no assignment, verify the model even exists so that we can provide a nicer error message
-            provider.getTrainedModel(modelId, GetTrainedModelsAction.Includes.empty(), taskId, ActionListener.wrap(config -> {
+            provider.getTrainedModel(request.getModelId(), GetTrainedModelsAction.Includes.empty(), taskId, ActionListener.wrap(config -> {
                 if (config.getModelType() != TrainedModelType.PYTORCH) {
                     listener.onFailure(
                         ExceptionsHelper.badRequestException(
@@ -93,13 +99,13 @@ public class TransportInferTrainedModelDeploymentAction extends TransportTasksAc
                     );
                     return;
                 }
-                String message = "Trained model [" + modelId + "] is not deployed";
+                String message = "Trained model [" + request.getModelId() + "] is not deployed";
                 listener.onFailure(ExceptionsHelper.conflictStatusException(message));
             }, listener::onFailure));
             return;
         }
         if (assignment.getAssignmentState() == AssignmentState.STOPPING) {
-            String message = "Trained model [" + modelId + "] is STOPPING";
+            String message = "Trained model [" + request.getModelId() + "] is STOPPING";
             listener.onFailure(ExceptionsHelper.conflictStatusException(message));
             return;
         }
@@ -114,7 +120,9 @@ public class TransportInferTrainedModelDeploymentAction extends TransportTasksAc
             }, listener::onFailure));
         }, () -> {
             logger.trace(() -> format("[%s] model not allocated to any node [%s]", assignment.getModelId()));
-            listener.onFailure(ExceptionsHelper.conflictStatusException("Trained model [" + modelId + "] is not allocated to any nodes"));
+            listener.onFailure(
+                ExceptionsHelper.conflictStatusException("Trained model [" + request.getModelId() + "] is not allocated to any nodes")
+            );
         });
     }
 

+ 10 - 4
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInternalInferModelAction.java

@@ -31,6 +31,7 @@ import org.elasticsearch.xpack.core.ml.action.InferTrainedModelDeploymentAction;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfigUpdate;
 import org.elasticsearch.xpack.ml.MachineLearning;
+import org.elasticsearch.xpack.ml.inference.ModelAliasMetadata;
 import org.elasticsearch.xpack.ml.inference.assignment.TrainedModelAssignmentMetadata;
 import org.elasticsearch.xpack.ml.inference.loadingservice.LocalModel;
 import org.elasticsearch.xpack.ml.inference.loadingservice.ModelLoadingService;
@@ -39,6 +40,7 @@ import org.elasticsearch.xpack.ml.utils.TypedChainTaskExecutor;
 
 import java.util.Collections;
 import java.util.Map;
+import java.util.Optional;
 
 import static org.elasticsearch.core.Strings.format;
 import static org.elasticsearch.xpack.core.ClientHelper.ML_ORIGIN;
@@ -128,8 +130,11 @@ public class TransportInternalInferModelAction extends HandledTransportAction<Re
         TaskId parentTaskId,
         ActionListener<Response> listener
     ) {
-        if (isAllocatedModel(request.getModelId())) {
-            inferAgainstAllocatedModel(request, responseBuilder, parentTaskId, listener);
+        String concreteModelId = Optional.ofNullable(ModelAliasMetadata.fromState(clusterService.state()).getModelId(request.getModelId()))
+            .orElse(request.getModelId());
+        if (isAllocatedModel(concreteModelId)) {
+            // It is important to use the resolved model ID here as the alias could change between transport calls.
+            inferAgainstAllocatedModel(request, concreteModelId, responseBuilder, parentTaskId, listener);
         } else {
             getModelAndInfer(request, responseBuilder, parentTaskId, (CancellableTask) task, listener);
         }
@@ -176,6 +181,7 @@ public class TransportInternalInferModelAction extends HandledTransportAction<Re
 
     private void inferAgainstAllocatedModel(
         Request request,
+        String concreteModelId,
         Response.Builder responseBuilder,
         TaskId parentTaskId,
         ActionListener<Response> listener
@@ -191,7 +197,7 @@ public class TransportInternalInferModelAction extends HandledTransportAction<Re
             .forEach(
                 stringObjectMap -> typedChainTaskExecutor.add(
                     chainedTask -> inferSingleDocAgainstAllocatedModel(
-                        request.getModelId(),
+                        concreteModelId,
                         request.getTimeout(),
                         request.getUpdate(),
                         stringObjectMap,
@@ -204,7 +210,7 @@ public class TransportInternalInferModelAction extends HandledTransportAction<Re
         typedChainTaskExecutor.execute(
             ActionListener.wrap(
                 inferenceResults -> listener.onResponse(
-                    responseBuilder.setInferenceResults(inferenceResults).setModelId(request.getModelId()).build()
+                    responseBuilder.setInferenceResults(inferenceResults).setModelId(concreteModelId).build()
                 ),
                 listener::onFailure
             )

+ 69 - 4
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportPutTrainedModelAliasAction.java

@@ -37,15 +37,20 @@ import org.elasticsearch.xpack.core.ml.action.GetTrainedModelsAction;
 import org.elasticsearch.xpack.core.ml.action.PutTrainedModelAliasAction;
 import org.elasticsearch.xpack.core.ml.inference.TrainedModelConfig;
 import org.elasticsearch.xpack.core.ml.inference.TrainedModelType;
+import org.elasticsearch.xpack.core.ml.inference.assignment.AllocationStatus;
+import org.elasticsearch.xpack.core.ml.inference.assignment.TrainedModelAssignment;
 import org.elasticsearch.xpack.core.ml.job.messages.Messages;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
 import org.elasticsearch.xpack.ml.inference.ModelAliasMetadata;
+import org.elasticsearch.xpack.ml.inference.assignment.TrainedModelAssignmentMetadata;
 import org.elasticsearch.xpack.ml.inference.persistence.TrainedModelProvider;
 import org.elasticsearch.xpack.ml.notifications.InferenceAuditor;
 
 import java.util.HashMap;
 import java.util.HashSet;
 import java.util.Map;
+import java.util.Objects;
+import java.util.Optional;
 import java.util.Set;
 import java.util.function.Predicate;
 
@@ -141,10 +146,6 @@ public class TransportPutTrainedModelAliasAction extends AcknowledgedTransportMa
                 listener.onFailure(LicenseUtils.newComplianceException(XPackField.MACHINE_LEARNING));
                 return;
             }
-            if (newModel.getModelType() == TrainedModelType.PYTORCH) {
-                listener.onFailure(ExceptionsHelper.badRequestException("model_alias is not supported on pytorch models"));
-                return;
-            }
             // if old model is null, none of these validations matter
             // we should still allow reassignment even if the old model was some how deleted and the alias still refers to it
             if (oldModel != null) {
@@ -166,6 +167,70 @@ public class TransportPutTrainedModelAliasAction extends AcknowledgedTransportMa
                     }
                 }
 
+                if (Objects.equals(newModel.getModelType(), oldModel.getModelType()) == false) {
+                    listener.onFailure(
+                        ExceptionsHelper.badRequestException(
+                            "cannot reassign model_alias [{}] to model [{}] with type [{}] from model [{}] with type [{}]",
+                            request.getModelAlias(),
+                            newModel.getModelId(),
+                            Optional.ofNullable(newModel.getModelType()).orElse(TrainedModelType.TREE_ENSEMBLE).toString(),
+                            oldModel.getModelId(),
+                            Optional.ofNullable(oldModel.getModelType()).orElse(TrainedModelType.TREE_ENSEMBLE).toString()
+                        )
+                    );
+                    return;
+                }
+
+                // If we are reassigning Pytorch models, we need to validate assignments are acceptable.
+                if (newModel.getModelType() == TrainedModelType.PYTORCH) {
+                    Optional<TrainedModelAssignment> oldAssignment = TrainedModelAssignmentMetadata.assignmentForModelId(state, oldModelId);
+                    Optional<TrainedModelAssignment> newAssignment = TrainedModelAssignmentMetadata.assignmentForModelId(
+                        state,
+                        newModel.getModelId()
+                    );
+                    // Old model is currently deployed
+                    if (oldAssignment.isPresent()) {
+                        // disallow changing the model alias from a deployed model to an undeployed model
+                        if (newAssignment.isEmpty()) {
+                            listener.onFailure(
+                                ExceptionsHelper.badRequestException(
+                                    "cannot reassign model_alias [{}] to model [{}] from model [{}] as it is not yet deployed",
+                                    request.getModelAlias(),
+                                    newModel.getModelId(),
+                                    oldModel.getModelId()
+                                )
+                            );
+                            return;
+                        } else {
+                            Optional<AllocationStatus> oldAllocationStatus = oldAssignment.map(
+                                TrainedModelAssignment::calculateAllocationStatus
+                            ).get();
+                            // Old model is deployed and its allocation status is NOT "stopping" or "starting"
+                            if (oldAllocationStatus.isPresent()
+                                && oldAllocationStatus.get()
+                                    .calculateState()
+                                    .isAnyOf(AllocationStatus.State.FULLY_ALLOCATED, AllocationStatus.State.STARTED)) {
+                                Optional<AllocationStatus> newAllocationStatus = newAssignment.map(
+                                    TrainedModelAssignment::calculateAllocationStatus
+                                ).get();
+                                if (newAllocationStatus.isEmpty()
+                                    || newAllocationStatus.get().calculateState().equals(AllocationStatus.State.STARTING)) {
+                                    listener.onFailure(
+                                        ExceptionsHelper.badRequestException(
+                                            "cannot reassign model_alias [{}] to model [{}] "
+                                                + " from model [{}] as it is not yet allocated to any nodes",
+                                            request.getModelAlias(),
+                                            newModel.getModelId(),
+                                            oldModel.getModelId()
+                                        )
+                                    );
+                                    return;
+                                }
+                            }
+                        }
+                    }
+                }
+
                 Set<String> oldInputFields = new HashSet<>(oldModel.getInput().getFieldNames());
                 Set<String> newInputFields = new HashSet<>(newModel.getInput().getFieldNames());
                 // TODO should we fail in this case???
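From a caller's perspective, the validation added above turns an invalid reassignment into a 400 response on the alias endpoint. A sketch of the rejected case, with hypothetical model IDs, where `my_model_alias` currently points at a deployed PyTorch model:

    PUT _ml/trained_models/my-undeployed-model/model_aliases/my_model_alias?reassign=true

would fail with a message of the form: cannot reassign model_alias [my_model_alias] to model [my-undeployed-model] from model [my-deployed-model] as it is not yet deployed.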

+ 27 - 9
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportStopTrainedModelDeploymentAction.java

@@ -50,6 +50,7 @@ import java.util.Set;
 
 import static org.elasticsearch.core.Strings.format;
 import static org.elasticsearch.xpack.core.ClientHelper.ML_ORIGIN;
+import static org.elasticsearch.xpack.ml.action.TransportDeleteTrainedModelAction.getModelAliases;
 import static org.elasticsearch.xpack.ml.action.TransportDeleteTrainedModelAction.getReferencedModelKeys;
 
 /**
@@ -138,15 +139,32 @@ public class TransportStopTrainedModelDeploymentAction extends TransportTasksAct
             IngestMetadata currentIngestMetadata = state.metadata().custom(IngestMetadata.TYPE);
             Set<String> referencedModels = getReferencedModelKeys(currentIngestMetadata, ingestService);
 
-            if (request.isForce() == false && referencedModels.contains(modelId)) {
-                listener.onFailure(
-                    new ElasticsearchStatusException(
-                        "Cannot stop deployment for model [{}] as it is referenced by ingest processors; use force to stop the deployment",
-                        RestStatus.CONFLICT,
-                        modelId
-                    )
-                );
-                return;
+            if (request.isForce() == false) {
+                if (referencedModels.contains(modelId)) {
+                    listener.onFailure(
+                        new ElasticsearchStatusException(
+                            "Cannot stop deployment for model [{}] as it is referenced by ingest processors; "
+                                + "use force to stop the deployment",
+                            RestStatus.CONFLICT,
+                            modelId
+                        )
+                    );
+                    return;
+                }
+                List<String> modelAliases = getModelAliases(state, modelId);
+                Optional<String> referencedModelAlias = modelAliases.stream().filter(referencedModels::contains).findFirst();
+                if (referencedModelAlias.isPresent()) {
+                    listener.onFailure(
+                        new ElasticsearchStatusException(
+                            "Cannot stop deployment for model [{}] as it has a model_alias [{}] that is still referenced"
+                                + " by ingest processors; use force to stop the deployment",
+                            RestStatus.CONFLICT,
+                            modelId,
+                            referencedModelAlias.get()
+                        )
+                    );
+                    return;
+                }
             }
 
             // NOTE, should only run on Master node

+ 5 - 0
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ModelAliasMetadata.java

@@ -227,5 +227,10 @@ public class ModelAliasMetadata implements Metadata.Custom {
         public int hashCode() {
             return Objects.hash(modelId);
         }
+
+        @Override
+        public String toString() {
+            return "ModelAliasEntry{modelId='" + modelId + "'}";
+        }
     }
 }

+ 0 - 0
x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/ml/3rd_party_deployment.yml
(File diff suppressed because it is too large)


+ 0 - 20
x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/ml/inference_crud.yml

@@ -998,26 +998,6 @@ setup:
   - match: { trained_model_configs.0.metadata.model_aliases.0: "regression-model" }
   - match: { trained_model_configs.0.metadata.model_aliases.1: "regression-model-again" }
 ---
-"Test put model model aliases with nlp model":
-
-  - do:
-      ml.put_trained_model:
-        model_id: my-nlp-model
-        body: >
-          {
-            "description": "distilbert-base-uncased-finetuned-sst-2-english.pt",
-            "model_type": "pytorch",
-            "inference_config": {
-              "ner": {
-              }
-            }
-          }
-  - do:
-      catch: /model_alias is not supported on pytorch models/
-      ml.put_trained_model_alias:
-        model_alias: "nlp-model"
-        model_id: "my-nlp-model"
----
 "Test update model alias with model id referring to missing model":
   - do:
       catch: missing

Some files were not shown because too many files changed in this diff