elastic · prwhelan · Oct 13, 2025 · Jul 22, 2025 · Jul 22, 2025 · Jul 23, 2025
diff --git a/server/src/main/java/org/elasticsearch/TransportVersions.java b/server/src/main/java/org/elasticsearch/TransportVersions.java
@@ -351,6 +351,7 @@ static TransportVersion def(int id) {
     public static final TransportVersion SHARD_WRITE_LOAD_IN_CLUSTER_INFO = def(9_126_0_00);
     public static final TransportVersion ESQL_SAMPLE_OPERATOR_STATUS = def(9_127_0_00);
     public static final TransportVersion ESQL_TOPN_TIMINGS = def(9_128_0_00);
+    public static final TransportVersion INFERENCE_UPDATE_ML = def(9_129_0_00);
 
     /*
      * STOP! READ THIS FIRST! No, really,

diff --git a/.../main/java/org/elasticsearch/xpack/core/ml/action/UpdateTrainedModelDeploymentAction.java b/.../main/java/org/elasticsearch/xpack/core/ml/action/UpdateTrainedModelDeploymentAction.java
@@ -27,6 +27,7 @@
 import java.io.IOException;
 import java.util.Objects;
 
+import static org.elasticsearch.TransportVersions.INFERENCE_UPDATE_ML;
 import static org.elasticsearch.xpack.core.ml.action.StartTrainedModelDeploymentAction.Request.ADAPTIVE_ALLOCATIONS;
 import static org.elasticsearch.xpack.core.ml.action.StartTrainedModelDeploymentAction.Request.MODEL_ID;
 import static org.elasticsearch.xpack.core.ml.action.StartTrainedModelDeploymentAction.Request.NUMBER_OF_ALLOCATIONS;
@@ -74,6 +75,7 @@ public static Request parseRequest(String deploymentId, XContentParser parser) {
         private Integer numberOfAllocations;
         private AdaptiveAllocationsSettings adaptiveAllocationsSettings;
         private boolean isInternal;
+        private boolean fromInference;
 
         private Request() {
             super(TRAPPY_IMPLICIT_DEFAULT_MASTER_NODE_TIMEOUT, DEFAULT_ACK_TIMEOUT);
@@ -96,6 +98,7 @@ public Request(StreamInput in) throws IOException {
                 adaptiveAllocationsSettings = in.readOptionalWriteable(AdaptiveAllocationsSettings::new);
                 isInternal = in.readBoolean();
             }
+            fromInference = in.getTransportVersion().onOrAfter(INFERENCE_UPDATE_ML) && in.readBoolean();
         }
 
         public final void setDeploymentId(String deploymentId) {
@@ -126,6 +129,15 @@ public void setIsInternal(boolean isInternal) {
             this.isInternal = isInternal;
         }
 
+        public boolean fromInference() { // Returns the flag set via setFromInference(...) or read from the wire on INFERENCE_UPDATE_ML and later.
+            return fromInference; // Stays false when deserialized from a stream older than INFERENCE_UPDATE_ML (the flag is not read there).
+        }
+
+        public void setFromInference(boolean fromInference) { // Sets the fromInference flag and forces isInternal to the same value.
+            this.fromInference = fromInference; // Only serialized when the peer is on or after INFERENCE_UPDATE_ML.
+            this.isInternal = fromInference; // Unconditional overwrite: passing false also clears an earlier setIsInternal(true). NOTE(review): presumably mirrored so peers that never receive fromInference still see isInternal - confirm.
+        }
+
         public AdaptiveAllocationsSettings getAdaptiveAllocationsSettings() {
             return adaptiveAllocationsSettings;
         }
@@ -141,6 +153,9 @@ public void writeTo(StreamOutput out) throws IOException {
                 out.writeOptionalWriteable(adaptiveAllocationsSettings);
                 out.writeBoolean(isInternal);
             }
+            if (out.getTransportVersion().onOrAfter(INFERENCE_UPDATE_ML)) {
+                out.writeBoolean(fromInference);
+            }
         }
 
         @Override
@@ -183,7 +198,7 @@ public ActionRequestValidationException validate() {
 
         @Override
         public int hashCode() { // Hashes the same five fields that equals(...) compares, now including fromInference.
-            return Objects.hash(deploymentId, numberOfAllocations, adaptiveAllocationsSettings, isInternal);
+            return Objects.hash(deploymentId, numberOfAllocations, adaptiveAllocationsSettings, isInternal, fromInference);
         }
 
         @Override
@@ -198,7 +213,8 @@ public boolean equals(Object obj) {
             return Objects.equals(deploymentId, other.deploymentId)
                 && Objects.equals(numberOfAllocations, other.numberOfAllocations)
                 && Objects.equals(adaptiveAllocationsSettings, other.adaptiveAllocationsSettings)
-                && isInternal == other.isInternal;
+                && isInternal == other.isInternal
+                && fromInference == other.fromInference;
         }
 
         @Override

diff --git a/...in/java/org/elasticsearch/xpack/inference/action/TransportUpdateInferenceModelAction.java b/...in/java/org/elasticsearch/xpack/inference/action/TransportUpdateInferenceModelAction.java
@@ -294,7 +294,7 @@ private void updateInClusterEndpoint(
             var updateRequest = new UpdateTrainedModelDeploymentAction.Request(deploymentId);
             updateRequest.setNumberOfAllocations(elasticServiceSettings.getNumAllocations());
             updateRequest.setAdaptiveAllocationsSettings(elasticServiceSettings.getAdaptiveAllocationsSettings());
-            updateRequest.setIsInternal(true);
+            updateRequest.setFromInference(true);
 
             var delegate = listener.<CreateTrainedModelAssignmentAction.Response>delegateFailure((l2, response) -> {
                 modelRegistry.updateModelTransaction(newModel, existingParsedModel, l2);

diff --git a/...ugin/src/yamlRestTest/resources/rest-api-spec/test/ml/update_trained_model_deployment.yml b/...ugin/src/yamlRestTest/resources/rest-api-spec/test/ml/update_trained_model_deployment.yml
@@ -6,5 +6,9 @@
         model_id: "missing-model"
         body: >
           {
-            "number_of_allocations": 4
+            "adaptive_allocations": {
+              "enabled": true,
+              "min_number_of_allocations": 0,
+              "max_number_of_allocations": 1
+            }
           }