瀏覽代碼

[ML] add zero_shot_classification task for BERT nlp models (#77799)

Zero-Shot classification allows for text classification tasks without a pre-trained collection of target labels.

This is achieved through models trained on the Multi-Genre Natural Language Inference (MNLI) dataset. This dataset pairs text sequences with "entailment" clauses. An example could be:

"Throughout all of history, mankind has shown itself resourceful, yet astoundingly short-sighted" could have been paired with the entailment clauses: ["This example is history", "This example is sociology"...]. 

This training set combined with the attention and semantic knowledge in modern day NLP models (BERT, BART, etc.) affords a powerful tool for ad-hoc text classification.

See https://arxiv.org/abs/1909.00161 for a deeper explanation of the MNLI training and how zero-shot works. 

The zero-shot classification task is configured as follows:
```js
{
   // <snip> model configuration </snip>
  "inference_config" : {
    "zero_shot_classification": {
      "classification_labels": ["entailment", "neutral", "contradiction"], // <1>
      "labels": ["sad", "glad", "mad", "rad"], // <2>
      "multi_label": false, // <3>
      "hypothesis_template": "This example is {}.", // <4>
      "tokenization": { /*<snip> tokenization configuration </snip>*/}
    }
  }
}
```
* <1> For all zero_shot models, these 3 particular labels are returned when classifying the target sequence. "entailment" is the positive case, "neutral" the case where the sequence isn't positive or negative, and "contradiction" is the negative case
* <2> This optional parameter provides the default labels that zero-shot classification attempts to assign
* <3> When returning the probabilities, should the results assume there is only one true label or multiple true labels
* <4> The hypothesis template when tokenizing the labels. When combining with `sad` the sequence looks like `This example is sad.`

For inference in a pipeline one may provide label updates:
```js
{
  //<snip> pipeline definition </snip>
  "processors": [
    //<snip> other processors </snip>
    {
      "inference": {
        // <snip> general configuration </snip>
        "inference_config": {
          "zero_shot_classification": {
             "labels": ["humanities", "science", "mathematics", "technology"], // <1>
             "multi_label": true // <2>
          }
        }
      }
    }
    //<snip> other processors </snip>
  ]
}
```
* <1> The `labels` we care about, these replace the default ones if they exist. 
* <2> Should the results allow multiple true labels

Similarly one may provide label changes against the `_infer` endpoint
```js
{
   "docs":[{ "text_field": "This is a very happy person"}],
   "inference_config":{"zero_shot_classification":{"labels": ["glad", "sad", "bad", "rad"], "multi_label": false}}
}
```
Benjamin Trent 4 年之前
父節點
當前提交
408489310c
共有 33 個文件被更改,包括 1493 次插入255 次删除
  1. 80 18
      docs/reference/ml/df-analytics/apis/get-trained-models.asciidoc
  2. 54 3
      docs/reference/ml/df-analytics/apis/put-trained-models.asciidoc
  3. 108 68
      docs/reference/ml/ml-shared.asciidoc
  4. 28 21
      x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/action/InferTrainedModelDeploymentAction.java
  5. 18 0
      x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/MlInferenceNamedXContentProvider.java
  6. 21 0
      x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/NlpConfigUpdate.java
  7. 245 0
      x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfig.java
  8. 201 0
      x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfigUpdate.java
  9. 24 9
      x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ml/action/InferTrainedModelDeploymentRequestsTests.java
  10. 61 0
      x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfigTests.java
  11. 134 0
      x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfigUpdateTests.java
  12. 4 1
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInferTrainedModelDeploymentAction.java
  13. 9 3
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInternalInferModelAction.java
  14. 6 2
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/allocation/TrainedModelAllocationNodeService.java
  15. 16 4
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/deployment/DeploymentManager.java
  16. 26 2
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/deployment/TrainedModelDeploymentTask.java
  17. 7 1
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ingest/InferenceProcessor.java
  18. 13 1
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/BertRequestBuilder.java
  19. 6 4
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/FillMaskProcessor.java
  20. 8 7
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessor.java
  21. 4 6
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NlpTask.java
  22. 3 2
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/PassThroughProcessor.java
  23. 7 0
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/TaskType.java
  24. 3 2
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/TextClassificationProcessor.java
  25. 3 2
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/TextEmbeddingProcessor.java
  26. 194 0
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/ZeroShotClassificationProcessor.java
  27. 110 52
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/BertTokenizer.java
  28. 5 1
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/NlpTokenizer.java
  29. 13 8
      x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/TokenizationResult.java
  30. 2 2
      x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/FillMaskProcessorTests.java
  31. 1 1
      x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessorTests.java
  32. 1 1
      x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/TextClassificationProcessorTests.java
  33. 78 34
      x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/BertTokenizerTests.java

+ 80 - 18
docs/reference/ml/df-analytics/apis/get-trained-models.asciidoc

@@ -27,7 +27,7 @@ Retrieves configuration information for a trained model.
 [[ml-get-trained-models-prereq]]
 == {api-prereq-title}
 
-Requires the `monitor_ml` cluster privilege. This privilege is included in the 
+Requires the `monitor_ml` cluster privilege. This privilege is included in the
 `machine_learning_user` built-in role.
 
 
@@ -71,9 +71,9 @@ default value is empty, indicating no optional fields are included. Valid
 options are:
  - `definition`: Includes the model definition.
  - `feature_importance_baseline`: Includes the baseline for {feat-imp} values.
- - `hyperparameters`: Includes the information about hyperparameters used to 
-    train the model. This information consists of the value, the absolute and 
-    relative importance of the hyperparameter as well as an indicator of whether 
+ - `hyperparameters`: Includes the information about hyperparameters used to
+    train the model. This information consists of the value, the absolute and
+    relative importance of the hyperparameter as well as an indicator of whether
     it was specified by the user or tuned during hyperparameter optimization.
  - `total_feature_importance`: Includes the total {feat-imp} for the training
    data set.
@@ -222,8 +222,8 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-ner]
 [%collapsible%open]
 ======
 `classification_labels`::::
-(Optional, string) 
-An array of classification labels. NER supports only 
+(Optional, string)
+An array of classification labels. NER supports only
 Inside-Outside-Beginning labels (IOB) and only persons, organizations, locations,
 and miscellaneous. For example:
 `["O", "B-PER", "I-PER", "B-ORG", "I-ORG", "B-LOC", "I-LOC", "B-MISC", "I-MISC"]`.
@@ -338,7 +338,7 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-text-classific
 [%collapsible%open]
 ======
 `classification_labels`::::
-(Optional, string) 
+(Optional, string)
 An array of classification labels.
 
 `num_top_classes`::::
@@ -414,6 +414,68 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenizati
 (Optional, integer)
 include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-max-sequence-length]
 
+`with_special_tokens`::::
+(Optional, boolean)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-with-special-tokens]
+========
+=======
+`vocabulary`::::
+(Optional, object)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-vocabulary]
++
+.Properties of vocabulary
+[%collapsible%open]
+=======
+`index`::::
+(Required, string)
+The index where the vocabulary is stored.
+=======
+======
+`zero_shot_classification`::::
+(Object, optional)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification]
++
+.Properties of zero_shot_classification inference
+[%collapsible%open]
+======
+`classification_labels`::::
+(Required, array)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-classification-labels]
+
+`hypothesis_template`::::
+(Optional, string)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-hypothesis-template]
+
+`labels`::::
+(Optional, array)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-labels]
+
+`multi_label`::::
+(Optional, boolean)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-multi-label]
+
+`tokenization`::::
+(Optional, object)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization]
++
+.Properties of tokenization
+[%collapsible%open]
+=======
+`bert`::::
+(Optional, object)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert]
++
+.Properties of bert
+[%collapsible%open]
+========
+`do_lower_case`::::
+(Optional, boolean)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-do-lower-case]
+
+`max_sequence_length`::::
+(Optional, integer)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-max-sequence-length]
+
 `with_special_tokens`::::
 (Optional, boolean)
 include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-with-special-tokens]
@@ -456,7 +518,7 @@ provided.
 =====
 `index`:::
 (Required, object)
-Indicates that the model definition is stored in an index. It is required to be empty as 
+Indicates that the model definition is stored in an index. It is required to be empty as
 the index for storing model definitions is configured automatically.
 =====
 // End location
@@ -480,7 +542,7 @@ it is a single value. For {classanalysis}, there is a value for each class.
 
 `hyperparameters`:::
 (array)
-List of the available hyperparameters optimized during the 
+List of the available hyperparameters optimized during the
 `fine_parameter_tuning` phase as well as specified by the user.
 +
 .Properties of hyperparameters
@@ -488,10 +550,10 @@ List of the available hyperparameters optimized during the
 ======
 `absolute_importance`::::
 (double)
-A positive number showing how much the parameter influences the variation of the 
-{ml-docs}/dfa-regression-lossfunction.html[loss function]. For 
-hyperparameters with values that are not specified by the user but tuned during 
-hyperparameter optimization. 
+A positive number showing how much the parameter influences the variation of the
+{ml-docs}/dfa-regression-lossfunction.html[loss function]. For
+hyperparameters with values that are not specified by the user but tuned during
+hyperparameter optimization.
 
 `max_trees`::::
 (integer)
@@ -503,14 +565,14 @@ Name of the hyperparameter.
 
 `relative_importance`::::
 (double)
-A number between 0 and 1 showing the proportion of influence on the variation of 
-the loss function among all tuned hyperparameters. For hyperparameters with 
-values that are not specified by the user but tuned during hyperparameter 
+A number between 0 and 1 showing the proportion of influence on the variation of
+the loss function among all tuned hyperparameters. For hyperparameters with
+values that are not specified by the user but tuned during hyperparameter
 optimization.
 
 `supplied`::::
 (Boolean)
-Indicates if the hyperparameter is specified by the user (`true`) or optimized 
+Indicates if the hyperparameter is specified by the user (`true`) or optimized
 (`false`).
 
 `value`::::
@@ -602,7 +664,7 @@ Identifier for the trained model.
 `model_type`::
 (Optional, string)
 The created model type. By default the model type is `tree_ensemble`.
-Appropriate types are: 
+Appropriate types are:
 +
 --
 * `tree_ensemble`: The model definition is an ensemble model of decision trees.

+ 54 - 3
docs/reference/ml/df-analytics/apis/put-trained-models.asciidoc

@@ -377,7 +377,7 @@ A human-readable description of the {infer} trained model.
 `inference_config`::
 (Required, object)
 The default configuration for inference. This can be: `regression`,
-`classification`, `fill_mask`, `ner`, `text_classification`, or `text_embedding`. 
+`classification`, `fill_mask`, `ner`, `text_classification`, `text_embedding` or `zero_shot_classification`.
 If `regression` or `classification`, it must match the `target_type` of the
 underlying `definition.trained_model`. If `fill_mask`, `ner`,
 `text_classification`, or `text_embedding`; the `model_type` must be `pytorch`.
@@ -457,7 +457,7 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-ner]
 [%collapsible%open]
 =====
 `classification_labels`::::
-(Optional, string) 
+(Optional, string)
 An array of classification labels. NER only supports Inside-Outside-Beginning labels (IOB)
 and only persons, organizations, locations, and miscellaneous.
 Example: ["O", "B-PER", "I-PER", "B-ORG", "I-ORG", "B-LOC", "I-LOC", "B-MISC", "I-MISC"]
@@ -614,6 +614,57 @@ include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenizati
 (Optional, integer)
 include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-max-sequence-length]
 
+`with_special_tokens`::::
+(Optional, boolean)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-with-special-tokens]
+=======
+======
+=====
+`zero_shot_classification`:::
+(Object, optional)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification]
++
+.Properties of zero_shot_classification inference
+[%collapsible%open]
+=====
+`classification_labels`::::
+(Required, array)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-classification-labels]
+
+`hypothesis_template`::::
+(Optional, string)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-hypothesis-template]
+
+`labels`::::
+(Optional, array)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-labels]
+
+`multi_label`::::
+(Optional, boolean)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-zero-shot-classification-multi-label]
+
+`tokenization`::::
+(Optional, object)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization]
++
+.Properties of tokenization
+[%collapsible%open]
+======
+`bert`::::
+(Optional, object)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert]
++
+.Properties of bert
+[%collapsible%open]
+=======
+`do_lower_case`::::
+(Optional, boolean)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-do-lower-case]
+
+`max_sequence_length`::::
+(Optional, integer)
+include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-max-sequence-length]
+
 `with_special_tokens`::::
 (Optional, boolean)
 include::{es-repo-dir}/ml/ml-shared.asciidoc[tag=inference-config-nlp-tokenization-bert-with-special-tokens]
@@ -660,7 +711,7 @@ An object map that contains metadata about the model.
 `model_type`::
 (Optional, string)
 The created model type. By default the model type is `tree_ensemble`.
-Appropriate types are: 
+Appropriate types are:
 +
 --
 * `tree_ensemble`: The model definition is an ensemble model of decision trees.

+ 108 - 68
docs/reference/ml/ml-shared.asciidoc

@@ -323,7 +323,7 @@ end::custom-preprocessor[]
 tag::custom-rules[]
 An array of custom rule objects, which enable you to customize the way detectors
 operate. For example, a rule may dictate to the detector conditions under which
-results should be skipped. {kib} refers to custom rules as _job rules_. For more 
+results should be skipped. {kib} refers to custom rules as _job rules_. For more
 examples, see
 {ml-docs}/ml-configuring-detector-custom-rules.html[Customizing detectors with custom rules].
 end::custom-rules[]
@@ -526,21 +526,21 @@ end::detector-index[]
 tag::dfas-alpha[]
 Advanced configuration option. {ml-cap} uses loss guided tree growing, which
 means that the decision trees grow where the regularized loss decreases most
-quickly. This parameter affects loss calculations by acting as a multiplier of 
-the tree depth. Higher alpha values result in shallower trees and faster 
-training times. By default, this value is calculated during hyperparameter 
-optimization. It must be greater than or equal to zero. 
+quickly. This parameter affects loss calculations by acting as a multiplier of
+the tree depth. Higher alpha values result in shallower trees and faster
+training times. By default, this value is calculated during hyperparameter
+optimization. It must be greater than or equal to zero.
 end::dfas-alpha[]
 
 tag::dfas-downsample-factor[]
-Advanced configuration option. Controls the fraction of data that is used to 
-compute the derivatives of the loss function for tree training. A small value 
-results in the use of a small fraction of the data. If this value is set to be 
-less than 1, accuracy typically improves. However, too small a value may result 
+Advanced configuration option. Controls the fraction of data that is used to
+compute the derivatives of the loss function for tree training. A small value
+results in the use of a small fraction of the data. If this value is set to be
+less than 1, accuracy typically improves. However, too small a value may result
 in poor convergence for the ensemble and so require more trees. For more
 information about shrinkage, refer to
 {wikipedia}/Gradient_boosting#Stochastic_gradient_boosting[this wiki article].
-By default, this value is calculated during hyperparameter optimization. It 
+By default, this value is calculated during hyperparameter optimization. It
 must be greater than zero and less than or equal to 1.
 end::dfas-downsample-factor[]
 
@@ -553,9 +553,9 @@ By default, early stoppping is enabled.
 end::dfas-early-stopping-enabled[]
 
 tag::dfas-eta-growth[]
-Advanced configuration option. Specifies the rate at which `eta` increases for 
-each new tree that is added to the forest. For example, a rate of 1.05 
-increases `eta` by 5% for each extra tree. By default, this value is calculated 
+Advanced configuration option. Specifies the rate at which `eta` increases for
+each new tree that is added to the forest. For example, a rate of 1.05
+increases `eta` by 5% for each extra tree. By default, this value is calculated
 during hyperparameter optimization. It must be between 0.5 and 2.
 end::dfas-eta-growth[]
 
@@ -565,16 +565,16 @@ candidate split.
 end::dfas-feature-bag-fraction[]
 
 tag::dfas-feature-processors[]
-Advanced configuration option. A collection of feature preprocessors that modify 
-one or more included fields. The analysis uses the resulting one or more 
-features instead of the original document field. However, these features are 
-ephemeral; they are not stored in the destination index. Multiple 
-`feature_processors` entries can refer to the same document fields. Automatic 
-categorical {ml-docs}/ml-feature-encoding.html[feature encoding] still occurs 
+Advanced configuration option. A collection of feature preprocessors that modify
+one or more included fields. The analysis uses the resulting one or more
+features instead of the original document field. However, these features are
+ephemeral; they are not stored in the destination index. Multiple
+`feature_processors` entries can refer to the same document fields. Automatic
+categorical {ml-docs}/ml-feature-encoding.html[feature encoding] still occurs
 for the fields that are unprocessed by a custom processor or that have
-categorical values. Use this property only if you want to override the automatic 
-feature encoding of the specified fields. Refer to 
-{ml-docs}/ml-feature-processors.html[{dfanalytics} feature processors] to learn 
+categorical values. Use this property only if you want to override the automatic
+feature encoding of the specified fields. Refer to
+{ml-docs}/ml-feature-processors.html[{dfanalytics} feature processors] to learn
 more.
 end::dfas-feature-processors[]
 
@@ -591,13 +591,13 @@ The configuration information necessary to perform frequency encoding.
 end::dfas-feature-processors-frequency[]
 
 tag::dfas-feature-processors-frequency-map[]
-The resulting frequency map for the field value. If the field value is missing 
+The resulting frequency map for the field value. If the field value is missing
 from the `frequency_map`, the resulting value is `0`.
 end::dfas-feature-processors-frequency-map[]
 
 tag::dfas-feature-processors-multi[]
-The configuration information necessary to perform multi encoding. It allows 
-multiple processors to be changed together. This way the output of a processor 
+The configuration information necessary to perform multi encoding. It allows
+multiple processors to be changed together. This way the output of a processor
 can then be passed to another as an input.
 end::dfas-feature-processors-multi[]
 
@@ -606,10 +606,10 @@ The ordered array of custom processors to execute. Must be more than 1.
 end::dfas-feature-processors-multi-proc[]
 
 tag::dfas-feature-processors-ngram[]
-The configuration information necessary to perform n-gram encoding. Features 
-created by this encoder have the following name format: 
-`<feature_prefix>.<ngram><string position>`. For example, if the 
-`feature_prefix` is `f`, the feature name for the second unigram in a string is 
+The configuration information necessary to perform n-gram encoding. Features
+created by this encoder have the following name format:
+`<feature_prefix>.<ngram><string position>`. For example, if the
+`feature_prefix` is `f`, the feature name for the second unigram in a string is
 `f.11`.
 end::dfas-feature-processors-ngram[]
 
@@ -622,17 +622,17 @@ The name of the text field to encode.
 end::dfas-feature-processors-ngram-field[]
 
 tag::dfas-feature-processors-ngram-length[]
-Specifies the length of the n-gram substring. Defaults to `50`. Must be greater 
+Specifies the length of the n-gram substring. Defaults to `50`. Must be greater
 than `0`.
 end::dfas-feature-processors-ngram-length[]
 
 tag::dfas-feature-processors-ngram-ngrams[]
-Specifies which n-grams to gather. It’s an array of integer values where the 
+Specifies which n-grams to gather. It’s an array of integer values where the
 minimum value is 1, and a maximum value is 5.
 end::dfas-feature-processors-ngram-ngrams[]
 
 tag::dfas-feature-processors-ngram-start[]
-Specifies the zero-indexed start of the n-gram substring. Negative values are 
+Specifies the zero-indexed start of the n-gram substring. Negative values are
 allowed for encoding n-grams of string suffixes. Defaults to `0`.
 end::dfas-feature-processors-ngram-start[]
 
@@ -686,19 +686,19 @@ decision tree when the tree is trained.
 end::dfas-num-splits[]
 
 tag::dfas-soft-limit[]
-Advanced configuration option. {ml-cap} uses loss guided tree growing, which 
-means that the decision trees grow where the regularized loss decreases most 
-quickly. This soft limit combines with the `soft_tree_depth_tolerance` to 
-penalize trees that exceed the specified depth; the regularized loss increases 
-quickly beyond this depth. By default, this value is calculated during 
+Advanced configuration option. {ml-cap} uses loss guided tree growing, which
+means that the decision trees grow where the regularized loss decreases most
+quickly. This soft limit combines with the `soft_tree_depth_tolerance` to
+penalize trees that exceed the specified depth; the regularized loss increases
+quickly beyond this depth. By default, this value is calculated during
 hyperparameter optimization. It must be greater than or equal to 0.
 end::dfas-soft-limit[]
 
 tag::dfas-soft-tolerance[]
-Advanced configuration option. This option controls how quickly the regularized 
-loss increases when the tree depth exceeds `soft_tree_depth_limit`. By default, 
-this value is calculated during hyperparameter optimization. It must be greater 
-than or equal to 0.01. 
+Advanced configuration option. This option controls how quickly the regularized
+loss increases when the tree depth exceeds `soft_tree_depth_limit`. By default,
+this value is calculated during hyperparameter optimization. It must be greater
+than or equal to 0.01.
 end::dfas-soft-tolerance[]
 
 tag::dfas-timestamp[]
@@ -744,7 +744,7 @@ end::empty-bucket-count[]
 tag::eta[]
 Advanced configuration option. The shrinkage applied to the weights. Smaller
 values result in larger forests which have a better generalization error.
-However, larger forests cause slower training. For more information about 
+However, larger forests cause slower training. For more information about
 shrinkage, refer to
 {wikipedia}/Gradient_boosting#Shrinkage[this wiki article].
 By default, this value is calculated during hyperparameter optimization. It must
@@ -833,10 +833,10 @@ end::function[]
 
 tag::gamma[]
 Advanced configuration option. Regularization parameter to prevent overfitting
-on the training data set. Multiplies a linear penalty associated with the size 
-of individual trees in the forest. A high gamma value causes training to prefer 
-small trees. A small gamma value results in larger individual trees and slower 
-training. By default, this value is calculated during hyperparameter 
+on the training data set. Multiplies a linear penalty associated with the size
+of individual trees in the forest. A high gamma value causes training to prefer
+small trees. A small gamma value results in larger individual trees and slower
+training. By default, this value is calculated during hyperparameter
 optimization. It must be a nonnegative value.
 end::gamma[]
 
@@ -849,7 +849,7 @@ An array of index names. Wildcards are supported. For example:
 `["it_ops_metrics", "server*"]`.
 +
 --
-NOTE: If any indices are in remote clusters then the {ml} nodes need to have the 
+NOTE: If any indices are in remote clusters then the {ml} nodes need to have the
 `remote_cluster_client` role.
 
 --
@@ -921,7 +921,7 @@ BERT-style tokenization is to be performed with the enclosed settings.
 end::inference-config-nlp-tokenization-bert[]
 
 tag::inference-config-nlp-tokenization-bert-do-lower-case[]
-Should the tokenization lower case the text sequence when building 
+Should the tokenization lower case the text sequence when building
 the tokens.
 end::inference-config-nlp-tokenization-bert-do-lower-case[]
 
@@ -930,7 +930,7 @@ Tokenize with special tokens. The tokens typically included in BERT-style tokeni
 +
 --
 * `[CLS]`: The first token of the sequence being classified.
-* `[SEP]`: Indicates sequence separation. 
+* `[SEP]`: Indicates sequence separation.
 --
 end::inference-config-nlp-tokenization-bert-with-special-tokens[]
 
@@ -998,6 +998,46 @@ prediction. Defaults to the `results_field` value of the {dfanalytics-job} that
 used to train the model, which defaults to `<dependent_variable>_prediction`.
 end::inference-config-results-field-processor[]
 
+tag::inference-config-zero-shot-classification[]
+Configures a zero-shot classification task. Zero-shot classification allows for
+text classification to occur without pre-determined labels. At inference time,
+it is possible to adjust the labels to classify. This makes this type of model
+and task exceptionally flexible.
+
+If consistently classifying the same labels, it may be better to use a fine-tuned
+text classification model.
+end::inference-config-zero-shot-classification[]
+
+tag::inference-config-zero-shot-classification-classification-labels[]
+The classification labels used during the zero-shot classification. Classification
+labels must not be empty or null and only set at model creation. They must be all three
+of ["entailment", "neutral", "contradiction"].
+
+NOTE: This is NOT the same as `labels` which are the values that zero-shot is attempting to
+      classify.
+end::inference-config-zero-shot-classification-classification-labels[]
+
+tag::inference-config-zero-shot-classification-hypothesis-template[]
+This is the template used when tokenizing the sequences for classification.
+
+The labels replace the `{}` value in the text. The default value is:
+`This example is {}.`
+end::inference-config-zero-shot-classification-hypothesis-template[]
+
+tag::inference-config-zero-shot-classification-labels[]
+The labels to classify. Can be set at creation for default labels, and
+then updated during inference.
+end::inference-config-zero-shot-classification-labels[]
+
+tag::inference-config-zero-shot-classification-multi-label[]
+Indicates if more than one `true` label is possible given the input.
+
+This is useful when labeling text that could pertain to more than one of the
+input labels.
+
+Defaults to `false`.
+end::inference-config-zero-shot-classification-multi-label[]
+
 tag::inference-metadata-feature-importance-feature-name[]
 The feature for which this importance was calculated.
 end::inference-metadata-feature-importance-feature-name[]
@@ -1102,11 +1142,11 @@ end::job-id-datafeed[]
 tag::lambda[]
 Advanced configuration option. Regularization parameter to prevent overfitting
 on the training data set. Multiplies an L2 regularization term which applies to
-leaf weights of the individual trees in the forest. A high lambda value causes 
-training to favor small leaf weights. This behavior makes the prediction 
+leaf weights of the individual trees in the forest. A high lambda value causes
+training to favor small leaf weights. This behavior makes the prediction
 function smoother at the expense of potentially not being able to capture
 relevant relationships between the features and the {depvar}. A small lambda
-value results in large individual trees and slower training. By default, this 
+value results in large individual trees and slower training. By default, this
 value is calculated during hyperparameter optimization. It must be a nonnegative
 value.
 end::lambda[]
@@ -1151,13 +1191,13 @@ set.
 end::max-empty-searches[]
 
 tag::max-trees[]
-Advanced configuration option. Defines the maximum number of decision trees in 
-the forest. The maximum value is 2000. By default, this value is calculated 
+Advanced configuration option. Defines the maximum number of decision trees in
+the forest. The maximum value is 2000. By default, this value is calculated
 during hyperparameter optimization.
 end::max-trees[]
 
 tag::max-trees-trained-models[]
-The maximum number of decision trees in the forest. The maximum value is 2000. 
+The maximum number of decision trees in the forest. The maximum value is 2000.
 By default, this value is calculated during hyperparameter optimization.
 end::max-trees-trained-models[]
 
@@ -1222,7 +1262,7 @@ default value for jobs created in version 6.1 and later is `1024mb`. If the
 than `1024mb`, however, that value is used instead. The default value is
 relatively small to ensure that high resource usage is a conscious decision. If
 you have jobs that are expected to analyze high cardinality fields, you will
-likely need to use a higher value. 
+likely need to use a higher value.
 +
 If you specify a number instead of a string, the units are assumed to be MiB.
 Specifying a string is recommended for clarity. If you specify a byte size unit
@@ -1299,11 +1339,11 @@ Only the specified `terms` can be viewed when using the Single Metric Viewer.
 end::model-plot-config-terms[]
 
 tag::model-prune-window[]
-Advanced configuration option. 
-Affects the pruning of models that have not been updated for the given time 
-duration. The value must be set to a multiple of the `bucket_span`. If set too 
-low, important information may be removed from the model. Typically, set to 
-`30d` or longer. If not set, model pruning only occurs if the model memory 
+Advanced configuration option.
+Affects the pruning of models that have not been updated for the given time
+duration. The value must be set to a multiple of the `bucket_span`. If set too
+low, important information may be removed from the model. Typically, set to
+`30d` or longer. If not set, model pruning only occurs if the model memory
 status reaches the soft limit or the hard limit.
 end::model-prune-window[]
 
@@ -1391,10 +1431,10 @@ end::open-time[]
 
 tag::out-of-order-timestamp-count[]
 The number of input documents that have a timestamp chronologically
-preceding the start of the current anomaly detection bucket offset by 
-the latency window. This information is applicable only when you provide 
-data to the {anomaly-job} by using the <<ml-post-data,post data API>>. 
-These out of order documents are discarded, since jobs require time 
+preceding the start of the current anomaly detection bucket offset by
+the latency window. This information is applicable only when you provide
+data to the {anomaly-job} by using the <<ml-post-data,post data API>>.
+These out of order documents are discarded, since jobs require time
 series data to be in ascending chronological order.
 end::out-of-order-timestamp-count[]
 
@@ -1459,9 +1499,9 @@ number of {es} documents.
 end::processed-record-count[]
 
 tag::randomize-seed[]
-Defines the seed for the random generator that is used to pick training data. By 
-default, it is randomly generated. Set it to a specific value to use the same 
-training data each time you start a job (assuming other related parameters such 
+Defines the seed for the random generator that is used to pick training data. By
+default, it is randomly generated. Set it to a specific value to use the same
+training data each time you start a job (assuming other related parameters such
 as `source` and `analyzed_fields` are the same).
 end::randomize-seed[]
 

+ 28 - 21
x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/action/InferTrainedModelDeploymentAction.java

@@ -11,19 +11,19 @@ import org.elasticsearch.action.ActionRequestValidationException;
 import org.elasticsearch.action.ActionType;
 import org.elasticsearch.action.support.tasks.BaseTasksRequest;
 import org.elasticsearch.action.support.tasks.BaseTasksResponse;
-import org.elasticsearch.common.Strings;
 import org.elasticsearch.common.io.stream.StreamInput;
 import org.elasticsearch.common.io.stream.StreamOutput;
 import org.elasticsearch.common.io.stream.Writeable;
 import org.elasticsearch.common.xcontent.ObjectParser;
 import org.elasticsearch.common.xcontent.ParseField;
-import org.elasticsearch.common.xcontent.ToXContent;
 import org.elasticsearch.common.xcontent.ToXContentObject;
 import org.elasticsearch.common.xcontent.XContentBuilder;
 import org.elasticsearch.common.xcontent.XContentParser;
 import org.elasticsearch.core.TimeValue;
 import org.elasticsearch.tasks.Task;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.EmptyConfigUpdate;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfigUpdate;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
 
 import java.io.IOException;
@@ -31,6 +31,7 @@ import java.util.Collections;
 import java.util.List;
 import java.util.Map;
 import java.util.Objects;
+import java.util.Optional;
 
 import static org.elasticsearch.action.ValidateActions.addValidationError;
 
@@ -45,11 +46,12 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
         super(NAME, InferTrainedModelDeploymentAction.Response::new);
     }
 
-    public static class Request extends BaseTasksRequest<Request> implements ToXContentObject {
+    public static class Request extends BaseTasksRequest<Request> {
 
         public static final ParseField DEPLOYMENT_ID = new ParseField("deployment_id");
         public static final ParseField DOCS = new ParseField("docs");
         public static final ParseField TIMEOUT = new ParseField("timeout");
+        public static final ParseField INFERENCE_CONFIG = new ParseField("inference_config");
 
         public static final TimeValue DEFAULT_TIMEOUT = TimeValue.timeValueSeconds(10);
 
@@ -58,6 +60,11 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             PARSER.declareString(Request.Builder::setDeploymentId, DEPLOYMENT_ID);
             PARSER.declareObjectArray(Request.Builder::setDocs, (p, c) -> p.mapOrdered(), DOCS);
             PARSER.declareString(Request.Builder::setTimeout, TIMEOUT);
+            PARSER.declareNamedObject(
+                Request.Builder::setUpdate,
+                ((p, c, name) -> p.namedObject(InferenceConfigUpdate.class, name, c)),
+                INFERENCE_CONFIG
+            );
         }
 
         public static Request parseRequest(String deploymentId, XContentParser parser) {
@@ -70,16 +77,19 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
 
         private final String deploymentId;
         private final List<Map<String, Object>> docs;
+        private final InferenceConfigUpdate update;
 
-        public Request(String deploymentId, List<Map<String, Object>> docs) {
+        public Request(String deploymentId, InferenceConfigUpdate update, List<Map<String, Object>> docs) {
             this.deploymentId = ExceptionsHelper.requireNonNull(deploymentId, DEPLOYMENT_ID);
             this.docs = ExceptionsHelper.requireNonNull(Collections.unmodifiableList(docs), DOCS);
+            this.update = update;
         }
 
         public Request(StreamInput in) throws IOException {
             super(in);
             deploymentId = in.readString();
             docs = Collections.unmodifiableList(in.readList(StreamInput::readMap));
+            update = in.readOptionalNamedWriteable(InferenceConfigUpdate.class);
         }
 
         public String getDeploymentId() {
@@ -90,6 +100,10 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             return docs;
         }
 
+        public InferenceConfigUpdate getUpdate() {
+            return Optional.ofNullable(update).orElse(new EmptyConfigUpdate());
+        }
+
         @Override
         public TimeValue getTimeout() {
             TimeValue tv = super.getTimeout();
@@ -124,16 +138,7 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             super.writeTo(out);
             out.writeString(deploymentId);
             out.writeCollection(docs, StreamOutput::writeMap);
-        }
-
-        @Override
-        public XContentBuilder toXContent(XContentBuilder builder, ToXContent.Params params) throws IOException {
-            builder.startObject();
-            builder.field(DEPLOYMENT_ID.getPreferredName(), deploymentId);
-            builder.field(DOCS.getPreferredName(), docs);
-            builder.field(TIMEOUT.getPreferredName(), getTimeout().getStringRep());
-            builder.endObject();
-            return builder;
+            out.writeOptionalNamedWriteable(update);
         }
 
         @Override
@@ -148,17 +153,13 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             InferTrainedModelDeploymentAction.Request that = (InferTrainedModelDeploymentAction.Request) o;
             return Objects.equals(deploymentId, that.deploymentId)
                 && Objects.equals(docs, that.docs)
+                && Objects.equals(update, that.update)
                 && Objects.equals(getTimeout(), that.getTimeout());
         }
 
         @Override
         public int hashCode() {
-            return Objects.hash(deploymentId, docs, getTimeout());
-        }
-
-        @Override
-        public String toString() {
-            return Strings.toString(this);
+            return Objects.hash(deploymentId, update, docs, getTimeout());
         }
 
         public static class Builder {
@@ -166,6 +167,7 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
             private String deploymentId;
             private List<Map<String, Object>> docs;
             private TimeValue timeout;
+            private InferenceConfigUpdate update;
 
             private Builder() {}
 
@@ -184,12 +186,17 @@ public class InferTrainedModelDeploymentAction extends ActionType<InferTrainedMo
                 return this;
             }
 
+            public Builder setUpdate(InferenceConfigUpdate update) {
+                this.update = update;
+                return this;
+            }
+
             private Builder setTimeout(String timeout) {
                 return setTimeout(TimeValue.parseTimeValue(timeout, TIMEOUT.getPreferredName()));
             }
 
             public Request build() {
-                Request request = new Request(deploymentId, docs);
+                Request request = new Request(deploymentId, update, docs);
                 if (timeout != null) {
                     request.setTimeout(timeout);
                 }

+ 18 - 0
x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/MlInferenceNamedXContentProvider.java

@@ -52,6 +52,8 @@ import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextEmbeddingConfi
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.Tokenization;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TrainedModel;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TrainedModelLocation;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfigUpdate;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ensemble.Ensemble;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ensemble.Exponent;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ensemble.LenientlyParsedOutputAggregator;
@@ -184,11 +186,23 @@ public class MlInferenceNamedXContentProvider implements NamedXContentProvider {
             new ParseField(TextEmbeddingConfig.NAME), TextEmbeddingConfig::fromXContentLenient));
         namedXContent.add(new NamedXContentRegistry.Entry(StrictlyParsedInferenceConfig.class, new ParseField(TextEmbeddingConfig.NAME),
             TextEmbeddingConfig::fromXContentStrict));
+        namedXContent.add(new NamedXContentRegistry.Entry(LenientlyParsedInferenceConfig.class,
+            new ParseField(ZeroShotClassificationConfig.NAME), ZeroShotClassificationConfig::fromXContentLenient));
+        namedXContent.add(new NamedXContentRegistry.Entry(StrictlyParsedInferenceConfig.class,
+            new ParseField(ZeroShotClassificationConfig.NAME),
+            ZeroShotClassificationConfig::fromXContentStrict));
 
         namedXContent.add(new NamedXContentRegistry.Entry(InferenceConfigUpdate.class, ClassificationConfigUpdate.NAME,
             ClassificationConfigUpdate::fromXContentStrict));
         namedXContent.add(new NamedXContentRegistry.Entry(InferenceConfigUpdate.class, RegressionConfigUpdate.NAME,
             RegressionConfigUpdate::fromXContentStrict));
+        namedXContent.add(
+            new NamedXContentRegistry.Entry(
+                InferenceConfigUpdate.class,
+                new ParseField(ZeroShotClassificationConfigUpdate.NAME),
+                ZeroShotClassificationConfigUpdate::fromXContentStrict
+            )
+        );
 
         // Inference models
         namedXContent.add(new NamedXContentRegistry.Entry(InferenceModel.class, Ensemble.NAME, EnsembleInferenceModel::fromXContent));
@@ -288,6 +302,8 @@ public class MlInferenceNamedXContentProvider implements NamedXContentProvider {
             PassThroughConfig.NAME, PassThroughConfig::new));
         namedWriteables.add(new NamedWriteableRegistry.Entry(InferenceConfig.class,
             TextEmbeddingConfig.NAME, TextEmbeddingConfig::new));
+        namedWriteables.add(new NamedWriteableRegistry.Entry(InferenceConfig.class,
+            ZeroShotClassificationConfig.NAME, ZeroShotClassificationConfig::new));
 
         namedWriteables.add(new NamedWriteableRegistry.Entry(InferenceConfigUpdate.class,
             ClassificationConfigUpdate.NAME.getPreferredName(), ClassificationConfigUpdate::new));
@@ -297,6 +313,8 @@ public class MlInferenceNamedXContentProvider implements NamedXContentProvider {
             ResultsFieldUpdate.NAME, ResultsFieldUpdate::new));
         namedWriteables.add(new NamedWriteableRegistry.Entry(InferenceConfigUpdate.class,
             EmptyConfigUpdate.NAME, EmptyConfigUpdate::new));
+        namedWriteables.add(new NamedWriteableRegistry.Entry(InferenceConfigUpdate.class,
+            ZeroShotClassificationConfigUpdate.NAME, ZeroShotClassificationConfigUpdate::new));
 
         // Location
         namedWriteables.add(new NamedWriteableRegistry.Entry(TrainedModelLocation.class,

+ 21 - 0
x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/NlpConfigUpdate.java

@@ -0,0 +1,21 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.core.ml.inference.trainedmodel;
+
+import org.elasticsearch.common.xcontent.ParseField;
+
+public abstract class NlpConfigUpdate implements InferenceConfigUpdate {
+
+    static ParseField CLASSIFICATION_LABELS = new ParseField("classification_labels");
+
+    @Override
+    public InferenceConfig toConfig() {
+        throw new UnsupportedOperationException("cannot serialize to nodes before 7.8");
+    }
+
+}

+ 245 - 0
x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfig.java

@@ -0,0 +1,245 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.core.ml.inference.trainedmodel;
+
+import org.elasticsearch.Version;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.common.xcontent.ConstructingObjectParser;
+import org.elasticsearch.common.xcontent.ParseField;
+import org.elasticsearch.common.xcontent.XContentBuilder;
+import org.elasticsearch.common.xcontent.XContentParser;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.xpack.core.ml.inference.persistence.InferenceIndexConstants;
+import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
+import org.elasticsearch.xpack.core.ml.utils.NamedXContentObjectHelper;
+
+import java.io.IOException;
+import java.util.List;
+import java.util.Locale;
+import java.util.Objects;
+import java.util.Optional;
+import java.util.Set;
+import java.util.TreeSet;
+import java.util.stream.Collectors;
+
+/**
+ * This builds out a 0-shot classification task.
+ *
+ * The 0-shot methodology assumed is MNLI optimized task. For further info see: https://arxiv.org/abs/1909.00161
+ *
+ */
+public class ZeroShotClassificationConfig implements NlpConfig {
+
+    public static final String NAME = "zero_shot_classification";
+    public static final ParseField HYPOTHESIS_TEMPLATE = new ParseField("hypothesis_template");
+    public static final ParseField MULTI_LABEL = new ParseField("multi_label");
+    public static final ParseField LABELS = new ParseField("labels");
+
+    public static ZeroShotClassificationConfig fromXContentStrict(XContentParser parser) {
+        return STRICT_PARSER.apply(parser, null);
+    }
+
+    public static ZeroShotClassificationConfig fromXContentLenient(XContentParser parser) {
+        return LENIENT_PARSER.apply(parser, null);
+    }
+
+    private static final Set<String> REQUIRED_CLASSIFICATION_LABELS = new TreeSet<>(List.of("entailment", "neutral", "contradiction"));
+    private static final String DEFAULT_HYPOTHESIS_TEMPLATE = "This example is {}.";
+    private static final ConstructingObjectParser<ZeroShotClassificationConfig, Void> STRICT_PARSER = createParser(false);
+    private static final ConstructingObjectParser<ZeroShotClassificationConfig, Void> LENIENT_PARSER = createParser(true);
+
+    @SuppressWarnings({ "unchecked"})
+    private static ConstructingObjectParser<ZeroShotClassificationConfig, Void> createParser(boolean ignoreUnknownFields) {
+        ConstructingObjectParser<ZeroShotClassificationConfig, Void> parser = new ConstructingObjectParser<>(
+            NAME,
+            ignoreUnknownFields,
+            a -> new ZeroShotClassificationConfig(
+                (List<String>)a[0],
+                (VocabularyConfig) a[1],
+                (Tokenization) a[2],
+                (String) a[3],
+                (Boolean) a[4],
+                (List<String>) a[5]
+            )
+        );
+        parser.declareStringArray(ConstructingObjectParser.constructorArg(), CLASSIFICATION_LABELS);
+        parser.declareObject(
+            ConstructingObjectParser.optionalConstructorArg(),
+            (p, c) -> {
+                if (ignoreUnknownFields == false) {
+                    throw ExceptionsHelper.badRequestException(
+                        "illegal setting [{}] on inference model creation",
+                        VOCABULARY.getPreferredName()
+                    );
+                }
+                return VocabularyConfig.fromXContentLenient(p);
+            },
+            VOCABULARY
+        );
+        parser.declareNamedObject(
+            ConstructingObjectParser.optionalConstructorArg(), (p, c, n) -> p.namedObject(Tokenization.class, n, ignoreUnknownFields),
+                TOKENIZATION
+        );
+        parser.declareString(ConstructingObjectParser.optionalConstructorArg(), HYPOTHESIS_TEMPLATE);
+        parser.declareBoolean(ConstructingObjectParser.optionalConstructorArg(), MULTI_LABEL);
+        parser.declareStringArray(ConstructingObjectParser.optionalConstructorArg(), LABELS);
+        return parser;
+    }
+
+    private final VocabularyConfig vocabularyConfig;
+    private final Tokenization tokenization;
+    private final List<String> classificationLabels;
+    private final List<String> labels;
+    private final boolean isMultiLabel;
+    private final String hypothesisTemplate;
+
+    public ZeroShotClassificationConfig(
+        List<String> classificationLabels,
+        @Nullable VocabularyConfig vocabularyConfig,
+        @Nullable Tokenization tokenization,
+        @Nullable String hypothesisTemplate,
+        @Nullable Boolean isMultiLabel,
+        @Nullable List<String> labels
+    ) {
+        this.classificationLabels = ExceptionsHelper.requireNonNull(classificationLabels, CLASSIFICATION_LABELS);
+        if (this.classificationLabels.size() != 3) {
+            throw ExceptionsHelper.badRequestException(
+                "[{}] must contain exactly the three values {}",
+                CLASSIFICATION_LABELS.getPreferredName(),
+                REQUIRED_CLASSIFICATION_LABELS
+            );
+        }
+        List<String> badLabels = classificationLabels.stream()
+            .map(s -> s.toLowerCase(Locale.ROOT))
+            .filter(c -> REQUIRED_CLASSIFICATION_LABELS.contains(c) == false)
+            .collect(Collectors.toList());
+        if (badLabels.isEmpty() == false) {
+            throw ExceptionsHelper.badRequestException(
+                "[{}] must contain exactly the three values {}. Invalid labels {}",
+                CLASSIFICATION_LABELS.getPreferredName(),
+                REQUIRED_CLASSIFICATION_LABELS,
+                badLabels
+            );
+        }
+        this.vocabularyConfig = Optional.ofNullable(vocabularyConfig)
+            .orElse(new VocabularyConfig(InferenceIndexConstants.nativeDefinitionStore()));
+        this.tokenization = tokenization == null ? Tokenization.createDefault() : tokenization;
+        this.isMultiLabel = isMultiLabel != null && isMultiLabel;
+        this.hypothesisTemplate = Optional.ofNullable(hypothesisTemplate).orElse(DEFAULT_HYPOTHESIS_TEMPLATE);
+        this.labels = labels;
+        if (labels != null && labels.isEmpty()) {
+            throw ExceptionsHelper.badRequestException("[{}] must not be empty", LABELS.getPreferredName());
+        }
+    }
+
+    public ZeroShotClassificationConfig(StreamInput in) throws IOException {
+        vocabularyConfig = new VocabularyConfig(in);
+        tokenization = in.readNamedWriteable(Tokenization.class);
+        classificationLabels = in.readStringList();
+        isMultiLabel = in.readBoolean();
+        hypothesisTemplate = in.readString();
+        labels = in.readOptionalStringList();
+    }
+
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        vocabularyConfig.writeTo(out);
+        out.writeNamedWriteable(tokenization);
+        out.writeStringCollection(classificationLabels);
+        out.writeBoolean(isMultiLabel);
+        out.writeString(hypothesisTemplate);
+        out.writeOptionalStringCollection(labels);
+    }
+
+    @Override
+    public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+        builder.startObject();
+        builder.field(VOCABULARY.getPreferredName(), vocabularyConfig, params);
+        NamedXContentObjectHelper.writeNamedObject(builder, params, TOKENIZATION.getPreferredName(), tokenization);
+        builder.field(CLASSIFICATION_LABELS.getPreferredName(), classificationLabels);
+        builder.field(MULTI_LABEL.getPreferredName(), isMultiLabel);
+        builder.field(HYPOTHESIS_TEMPLATE.getPreferredName(), hypothesisTemplate);
+        if (labels != null) {
+            builder.field(LABELS.getPreferredName(), labels);
+        }
+        builder.endObject();
+        return builder;
+    }
+
+    @Override
+    public String getWriteableName() {
+        return NAME;
+    }
+
+    @Override
+    public boolean isTargetTypeSupported(TargetType targetType) {
+        return false;
+    }
+
+    @Override
+    public Version getMinimalSupportedVersion() {
+        return Version.V_8_0_0;
+    }
+
+    @Override
+    public String getName() {
+        return NAME;
+    }
+
+    @Override
+    public boolean equals(Object o) {
+        if (o == this) return true;
+        if (o == null || getClass() != o.getClass()) return false;
+
+        ZeroShotClassificationConfig that = (ZeroShotClassificationConfig) o;
+        return Objects.equals(vocabularyConfig, that.vocabularyConfig)
+            && Objects.equals(tokenization, that.tokenization)
+            && Objects.equals(isMultiLabel, that.isMultiLabel)
+            && Objects.equals(hypothesisTemplate, that.hypothesisTemplate)
+            && Objects.equals(labels, that.labels)
+            && Objects.equals(classificationLabels, that.classificationLabels);
+    }
+
+    @Override
+    public int hashCode() {
+        return Objects.hash(vocabularyConfig, tokenization, classificationLabels, hypothesisTemplate, isMultiLabel, labels);
+    }
+
+    @Override
+    public VocabularyConfig getVocabularyConfig() {
+        return vocabularyConfig;
+    }
+
+    @Override
+    public Tokenization getTokenization() {
+        return tokenization;
+    }
+
+    public List<String> getClassificationLabels() {
+        return classificationLabels;
+    }
+
+    public boolean isMultiLabel() {
+        return isMultiLabel;
+    }
+
+    public String getHypothesisTemplate() {
+        return hypothesisTemplate;
+    }
+
+    public List<String> getLabels() {
+        return Optional.ofNullable(labels).orElse(List.of());
+    }
+
+    @Override
+    public boolean isAllocateOnly() {
+        return true;
+    }
+
+}

+ 201 - 0
x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfigUpdate.java

@@ -0,0 +1,201 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.core.ml.inference.trainedmodel;
+
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.common.xcontent.ConstructingObjectParser;
+import org.elasticsearch.common.xcontent.XContentBuilder;
+import org.elasticsearch.common.xcontent.XContentParser;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
+import org.elasticsearch.xpack.core.ml.utils.NamedXContentObject;
+
+import java.io.IOException;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+import java.util.Objects;
+import java.util.Optional;
+
+import static org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfig.LABELS;
+import static org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfig.MULTI_LABEL;
+
+public class ZeroShotClassificationConfigUpdate extends NlpConfigUpdate implements NamedXContentObject {
+
+    public static final String NAME = "zero_shot_classification";
+
+    public static ZeroShotClassificationConfigUpdate fromXContentStrict(XContentParser parser) {
+        return STRICT_PARSER.apply(parser, null);
+    }
+
+    @SuppressWarnings({ "unchecked"})
+    public static ZeroShotClassificationConfigUpdate fromMap(Map<String, Object> map) {
+        Map<String, Object> options = new HashMap<>(map);
+        Boolean isMultiLabel = (Boolean)options.remove(MULTI_LABEL.getPreferredName());
+        List<String> labels = (List<String>)options.remove(LABELS.getPreferredName());
+        if (options.isEmpty() == false) {
+            throw ExceptionsHelper.badRequestException("Unrecognized fields {}.", map.keySet());
+        }
+        return new ZeroShotClassificationConfigUpdate(labels, isMultiLabel);
+    }
+
+    @SuppressWarnings({ "unchecked"})
+    private static final ConstructingObjectParser<ZeroShotClassificationConfigUpdate, Void> STRICT_PARSER = new ConstructingObjectParser<>(
+        NAME,
+        a -> new ZeroShotClassificationConfigUpdate((List<String>)a[0], (Boolean) a[1])
+    );
+
+    static {
+        STRICT_PARSER.declareStringArray(ConstructingObjectParser.optionalConstructorArg(), LABELS);
+        STRICT_PARSER.declareBoolean(ConstructingObjectParser.optionalConstructorArg(), MULTI_LABEL);
+    }
+
+    private final List<String> labels;
+    private final Boolean isMultiLabel;
+
+    public ZeroShotClassificationConfigUpdate(
+        @Nullable List<String> labels,
+        @Nullable Boolean isMultiLabel
+    ) {
+        this.labels = labels;
+        if (labels != null && labels.isEmpty()) {
+            throw ExceptionsHelper.badRequestException("[{}] must not be empty", LABELS.getPreferredName());
+        }
+        this.isMultiLabel = isMultiLabel;
+    }
+
+    public ZeroShotClassificationConfigUpdate(StreamInput in) throws IOException {
+        labels = in.readOptionalStringList();
+        isMultiLabel = in.readOptionalBoolean();
+    }
+
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        out.writeOptionalStringCollection(labels);
+        out.writeOptionalBoolean(isMultiLabel);
+    }
+
+    @Override
+    public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+        builder.startObject();
+        if (labels != null) {
+            builder.field(LABELS.getPreferredName(), labels);
+        }
+        if (isMultiLabel != null) {
+            builder.field(MULTI_LABEL.getPreferredName(), isMultiLabel);
+        }
+        builder.endObject();
+        return builder;
+    }
+
+    @Override
+    public String getWriteableName() {
+        return NAME;
+    }
+
+    @Override
+    public InferenceConfig apply(InferenceConfig originalConfig) {
+        if (originalConfig instanceof ZeroShotClassificationConfig == false) {
+            throw ExceptionsHelper.badRequestException(
+                "Inference config of type [{}] can not be updated with a inference request of type [{}]",
+                originalConfig.getName(),
+                getName());
+        }
+
+        ZeroShotClassificationConfig zeroShotConfig = (ZeroShotClassificationConfig)originalConfig;
+        if ((labels == null || labels.isEmpty()) && (zeroShotConfig.getLabels() == null || zeroShotConfig.getLabels().isEmpty())) {
+            throw ExceptionsHelper.badRequestException(
+                "stored configuration has no [{}] defined, supplied inference_config update must supply [{}]",
+                LABELS.getPreferredName(),
+                LABELS.getPreferredName()
+            );
+        }
+        if (isNoop(zeroShotConfig)) {
+            return originalConfig;
+        }
+        return new ZeroShotClassificationConfig(
+            zeroShotConfig.getClassificationLabels(),
+            zeroShotConfig.getVocabularyConfig(),
+            zeroShotConfig.getTokenization(),
+            zeroShotConfig.getHypothesisTemplate(),
+            Optional.ofNullable(isMultiLabel).orElse(zeroShotConfig.isMultiLabel()),
+            Optional.ofNullable(labels).orElse(zeroShotConfig.getLabels())
+        );
+    }
+
+    boolean isNoop(ZeroShotClassificationConfig originalConfig) {
+        return (labels == null || labels.equals(originalConfig.getClassificationLabels()))
+            && (isMultiLabel == null || isMultiLabel.equals(originalConfig.isMultiLabel()));
+    }
+
+    @Override
+    public boolean isSupported(InferenceConfig config) {
+        return config instanceof ZeroShotClassificationConfig;
+    }
+
+    @Override
+    public String getResultsField() {
+        return null;
+    }
+
+    @Override
+    public InferenceConfigUpdate.Builder<? extends InferenceConfigUpdate.Builder<?, ?>, ? extends InferenceConfigUpdate> newBuilder() {
+        return new Builder().setLabels(labels).setMultiLabel(isMultiLabel);
+    }
+
+    @Override
+    public String getName() {
+        return NAME;
+    }
+
+    @Override
+    public boolean equals(Object o) {
+        if (o == this) return true;
+        if (o == null || getClass() != o.getClass()) return false;
+
+        ZeroShotClassificationConfigUpdate that = (ZeroShotClassificationConfigUpdate) o;
+        return Objects.equals(isMultiLabel, that.isMultiLabel) && Objects.equals(labels, that.labels);
+    }
+
+    @Override
+    public int hashCode() {
+        return Objects.hash(labels, isMultiLabel);
+    }
+
+    public List<String> getLabels() {
+        return labels;
+    }
+
+    public static class Builder implements InferenceConfigUpdate.Builder<
+        ZeroShotClassificationConfigUpdate.Builder,
+        ZeroShotClassificationConfigUpdate
+        > {
+        private List<String> labels;
+        private Boolean isMultiLabel;
+
+        @Override
+        public ZeroShotClassificationConfigUpdate.Builder setResultsField(String resultsField) {
+            throw new IllegalArgumentException();
+        }
+
+        public Builder setLabels(List<String> labels) {
+            this.labels = labels;
+            return this;
+        }
+
+        public Builder setMultiLabel(Boolean multiLabel) {
+            isMultiLabel = multiLabel;
+            return this;
+        }
+
+        public ZeroShotClassificationConfigUpdate build() {
+            return new ZeroShotClassificationConfigUpdate(labels, isMultiLabel);
+        }
+    }
+}

+ 24 - 9
x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ml/action/InferTrainedModelDeploymentRequestsTests.java

@@ -7,19 +7,24 @@
 
 package org.elasticsearch.xpack.core.ml.action;
 
+import org.elasticsearch.common.io.stream.NamedWriteableRegistry;
 import org.elasticsearch.common.io.stream.Writeable;
-import org.elasticsearch.common.xcontent.XContentParser;
 import org.elasticsearch.core.Tuple;
-import org.elasticsearch.test.AbstractSerializingTestCase;
+import org.elasticsearch.test.AbstractWireSerializingTestCase;
+import org.elasticsearch.xpack.core.ml.inference.MlInferenceNamedXContentProvider;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.EmptyConfigUpdateTests;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfigUpdate;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfigUpdateTests;
 
-import java.io.IOException;
+import java.util.ArrayList;
 import java.util.List;
 import java.util.Map;
 
-public class InferTrainedModelDeploymentRequestsTests extends AbstractSerializingTestCase<InferTrainedModelDeploymentAction.Request> {
-    @Override
-    protected InferTrainedModelDeploymentAction.Request doParseInstance(XContentParser parser) throws IOException {
-        return InferTrainedModelDeploymentAction.Request.parseRequest(null, parser);
+public class InferTrainedModelDeploymentRequestsTests extends AbstractWireSerializingTestCase<InferTrainedModelDeploymentAction.Request> {
+
+
+    private static InferenceConfigUpdate randomInferenceConfigUpdate() {
+        return randomFrom(ZeroShotClassificationConfigUpdateTests.createRandom(), EmptyConfigUpdateTests.testInstance());
     }
 
     @Override
@@ -32,14 +37,24 @@ public class InferTrainedModelDeploymentRequestsTests extends AbstractSerializin
         List<Map<String, Object>> docs = randomList(5, () -> randomMap(1, 3,
             () -> Tuple.tuple(randomAlphaOfLength(7), randomAlphaOfLength(7))));
 
-        InferTrainedModelDeploymentAction.Request request =
-            new InferTrainedModelDeploymentAction.Request(randomAlphaOfLength(4), docs);
+        InferTrainedModelDeploymentAction.Request request = new InferTrainedModelDeploymentAction.Request(
+            randomAlphaOfLength(4),
+            randomBoolean() ? null : randomInferenceConfigUpdate(),
+            docs
+        );
         if (randomBoolean()) {
             request.setTimeout(randomTimeValue());
         }
         return request;
     }
 
+    @Override
+    protected NamedWriteableRegistry getNamedWriteableRegistry() {
+        List<NamedWriteableRegistry.Entry> entries = new ArrayList<>();
+        entries.addAll(new MlInferenceNamedXContentProvider().getNamedWriteables());
+        return new NamedWriteableRegistry(entries);
+    }
+
     public void testTimeoutNotNull() {
         assertNotNull(createTestInstance().getTimeout());
     }

+ 61 - 0
x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfigTests.java

@@ -0,0 +1,61 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.core.ml.inference.trainedmodel;
+
+import org.elasticsearch.Version;
+import org.elasticsearch.common.io.stream.Writeable;
+import org.elasticsearch.common.xcontent.XContentParser;
+import org.elasticsearch.xpack.core.ml.inference.InferenceConfigItemTestCase;
+
+import java.io.IOException;
+import java.util.List;
+import java.util.function.Predicate;
+
+public class ZeroShotClassificationConfigTests extends InferenceConfigItemTestCase<ZeroShotClassificationConfig> {
+
+    @Override
+    protected boolean supportsUnknownFields() {
+        return true;
+    }
+
+    @Override
+    protected Predicate<String> getRandomFieldsExcludeFilter() {
+        return field -> field.isEmpty() == false;
+    }
+
+    @Override
+    protected ZeroShotClassificationConfig doParseInstance(XContentParser parser) throws IOException {
+        return ZeroShotClassificationConfig.fromXContentLenient(parser);
+    }
+
+    @Override
+    protected Writeable.Reader<ZeroShotClassificationConfig> instanceReader() {
+        return ZeroShotClassificationConfig::new;
+    }
+
+    @Override
+    protected ZeroShotClassificationConfig createTestInstance() {
+        return createRandom();
+    }
+
+    @Override
+    protected ZeroShotClassificationConfig mutateInstanceForVersion(ZeroShotClassificationConfig instance, Version version) {
+        return instance;
+    }
+
+    public static ZeroShotClassificationConfig createRandom() {
+        return new ZeroShotClassificationConfig(
+            randomFrom(List.of("entailment", "neutral", "contradiction"), List.of("contradiction", "neutral", "entailment")),
+            randomBoolean() ? null : VocabularyConfigTests.createRandom(),
+            randomBoolean() ? null : BertTokenizationTests.createRandom(),
+            randomAlphaOfLength(10),
+            randomBoolean(),
+            randomBoolean() ? null : randomList(1, 5, () -> randomAlphaOfLength(10))
+        );
+    }
+}

+ 134 - 0
x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ml/inference/trainedmodel/ZeroShotClassificationConfigUpdateTests.java

@@ -0,0 +1,134 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.core.ml.inference.trainedmodel;
+
+import org.elasticsearch.ElasticsearchException;
+import org.elasticsearch.Version;
+import org.elasticsearch.common.io.stream.Writeable;
+import org.elasticsearch.common.xcontent.XContentParser;
+import org.elasticsearch.xpack.core.ml.inference.InferenceConfigItemTestCase;
+
+import java.io.IOException;
+import java.util.Collections;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+
+import static org.hamcrest.Matchers.containsString;
+import static org.hamcrest.Matchers.equalTo;
+
+public class ZeroShotClassificationConfigUpdateTests extends InferenceConfigItemTestCase<ZeroShotClassificationConfigUpdate> {
+
+    @Override
+    protected boolean supportsUnknownFields() {
+        return false;
+    }
+
+    @Override
+    protected ZeroShotClassificationConfigUpdate doParseInstance(XContentParser parser) throws IOException {
+        return ZeroShotClassificationConfigUpdate.fromXContentStrict(parser);
+    }
+
+    @Override
+    protected Writeable.Reader<ZeroShotClassificationConfigUpdate> instanceReader() {
+        return ZeroShotClassificationConfigUpdate::new;
+    }
+
+    @Override
+    protected ZeroShotClassificationConfigUpdate createTestInstance() {
+        return createRandom();
+    }
+
+    @Override
+    protected ZeroShotClassificationConfigUpdate mutateInstanceForVersion(ZeroShotClassificationConfigUpdate instance, Version version) {
+        return instance;
+    }
+
+    public void testFromMap() {
+        ZeroShotClassificationConfigUpdate expected = new ZeroShotClassificationConfigUpdate(List.of("foo", "bar"), false);
+        Map<String, Object> config = new HashMap<>(){{
+            put(ZeroShotClassificationConfig.LABELS.getPreferredName(), List.of("foo", "bar"));
+            put(ZeroShotClassificationConfig.MULTI_LABEL.getPreferredName(), false);
+        }};
+        assertThat(ZeroShotClassificationConfigUpdate.fromMap(config), equalTo(expected));
+    }
+
+    public void testFromMapWithUnknownField() {
+        ElasticsearchException ex = expectThrows(ElasticsearchException.class,
+            () -> ZeroShotClassificationConfigUpdate.fromMap(Collections.singletonMap("some_key", 1)));
+        assertThat(ex.getMessage(), equalTo("Unrecognized fields [some_key]."));
+    }
+
+    public void testApply() {
+        ZeroShotClassificationConfig originalConfig = new ZeroShotClassificationConfig(
+            randomFrom(List.of("entailment", "neutral", "contradiction"), List.of("contradiction", "neutral", "entailment")),
+            randomBoolean() ? null : VocabularyConfigTests.createRandom(),
+            randomBoolean() ? null : BertTokenizationTests.createRandom(),
+            randomAlphaOfLength(10),
+            randomBoolean(),
+            randomList(1, 5, () -> randomAlphaOfLength(10))
+        );
+
+        assertThat(originalConfig, equalTo(new ZeroShotClassificationConfigUpdate.Builder().build().apply(originalConfig)));
+
+        assertThat(
+            new ZeroShotClassificationConfig(
+                originalConfig.getClassificationLabels(),
+                originalConfig.getVocabularyConfig(),
+                originalConfig.getTokenization(),
+                originalConfig.getHypothesisTemplate(),
+                originalConfig.isMultiLabel(),
+                List.of("foo", "bar")
+            ),
+            equalTo(
+                new ZeroShotClassificationConfigUpdate.Builder()
+                    .setLabels(List.of("foo", "bar")).build()
+                    .apply(originalConfig)
+            )
+        );
+        assertThat(
+            new ZeroShotClassificationConfig(
+                originalConfig.getClassificationLabels(),
+                originalConfig.getVocabularyConfig(),
+                originalConfig.getTokenization(),
+                originalConfig.getHypothesisTemplate(),
+                true,
+                originalConfig.getLabels()
+            ),
+            equalTo(
+                new ZeroShotClassificationConfigUpdate.Builder()
+                    .setMultiLabel(true).build()
+                    .apply(originalConfig)
+            )
+        );
+    }
+
+    public void testApplyWithEmptyLabelsInConfigAndUpdate() {
+        ZeroShotClassificationConfig originalConfig = new ZeroShotClassificationConfig(
+            randomFrom(List.of("entailment", "neutral", "contradiction"), List.of("contradiction", "neutral", "entailment")),
+            randomBoolean() ? null : VocabularyConfigTests.createRandom(),
+            randomBoolean() ? null : BertTokenizationTests.createRandom(),
+            randomAlphaOfLength(10),
+            randomBoolean(),
+            null
+        );
+
+        Exception ex = expectThrows(Exception.class, () -> new ZeroShotClassificationConfigUpdate.Builder().build().apply(originalConfig));
+        assertThat(
+            ex.getMessage(),
+            containsString("stored configuration has no [labels] defined, supplied inference_config update must supply [labels]")
+        );
+    }
+
+    public static ZeroShotClassificationConfigUpdate createRandom() {
+        return new ZeroShotClassificationConfigUpdate(
+            randomBoolean() ? null : randomList(1,5, () -> randomAlphaOfLength(10)),
+            randomBoolean() ? null : randomBoolean()
+        );
+    }
+}

+ 4 - 1
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInferTrainedModelDeploymentAction.java

@@ -80,7 +80,10 @@ public class TransportInferTrainedModelDeploymentAction extends TransportTasksAc
     @Override
     protected void taskOperation(InferTrainedModelDeploymentAction.Request request, TrainedModelDeploymentTask task,
                                  ActionListener<InferTrainedModelDeploymentAction.Response> listener) {
-        task.infer(request.getDocs().get(0), request.getTimeout(),
+        task.infer(
+            request.getDocs().get(0),
+            request.getUpdate(),
+            request.getTimeout(),
             ActionListener.wrap(
                 pyTorchResult -> listener.onResponse(new InferTrainedModelDeploymentAction.Response(pyTorchResult)),
                 listener::onFailure)

+ 9 - 3
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportInternalInferModelAction.java

@@ -25,6 +25,7 @@ import org.elasticsearch.xpack.core.ml.action.InternalInferModelAction.Request;
 import org.elasticsearch.xpack.core.ml.action.InternalInferModelAction.Response;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.results.WarningInferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfigUpdate;
 import org.elasticsearch.xpack.ml.inference.allocation.TrainedModelAllocationMetadata;
 import org.elasticsearch.xpack.ml.inference.loadingservice.LocalModel;
 import org.elasticsearch.xpack.ml.inference.loadingservice.ModelLoadingService;
@@ -138,7 +139,7 @@ public class TransportInternalInferModelAction extends HandledTransportAction<Re
                 // Always fail immediately and return an error
                 ex -> true);
         request.getObjectsToInfer().forEach(stringObjectMap -> typedChainTaskExecutor.add(
-            chainedTask -> inferSingleDocAgainstAllocatedModel(request.getModelId(), stringObjectMap, chainedTask)));
+            chainedTask -> inferSingleDocAgainstAllocatedModel(request.getModelId(), request.getUpdate(), stringObjectMap, chainedTask)));
 
         typedChainTaskExecutor.execute(ActionListener.wrap(
             inferenceResults -> listener.onResponse(responseBuilder.setInferenceResults(inferenceResults)
@@ -148,11 +149,16 @@ public class TransportInternalInferModelAction extends HandledTransportAction<Re
         ));
     }
 
-    private void inferSingleDocAgainstAllocatedModel(String modelId, Map<String, Object> doc, ActionListener<InferenceResults> listener) {
+    private void inferSingleDocAgainstAllocatedModel(
+        String modelId,
+        InferenceConfigUpdate inferenceConfigUpdate,
+        Map<String, Object> doc,
+        ActionListener<InferenceResults> listener
+    ) {
         executeAsyncWithOrigin(client,
             ML_ORIGIN,
             InferTrainedModelDeploymentAction.INSTANCE,
-            new InferTrainedModelDeploymentAction.Request(modelId, Collections.singletonList(doc)),
+            new InferTrainedModelDeploymentAction.Request(modelId, inferenceConfigUpdate, Collections.singletonList(doc)),
             ActionListener.wrap(
                 r -> listener.onResponse(r.getResults()),
                 e -> listener.onResponse(new WarningInferenceResults(e.getMessage()))

+ 6 - 2
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/allocation/TrainedModelAllocationNodeService.java

@@ -33,6 +33,7 @@ import org.elasticsearch.xpack.core.ml.inference.allocation.RoutingState;
 import org.elasticsearch.xpack.core.ml.inference.allocation.RoutingStateAndReason;
 import org.elasticsearch.xpack.core.ml.inference.allocation.TrainedModelAllocation;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfig;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
 import org.elasticsearch.xpack.ml.MachineLearning;
 import org.elasticsearch.xpack.ml.inference.deployment.DeploymentManager;
@@ -227,9 +228,12 @@ public class TrainedModelAllocationNodeService implements ClusterStateListener {
         );
     }
 
-    public void infer(TrainedModelDeploymentTask task, Map<String, Object> doc, TimeValue timeout,
+    public void infer(TrainedModelDeploymentTask task,
+                      InferenceConfig config,
+                      Map<String, Object> doc,
+                      TimeValue timeout,
                       ActionListener<InferenceResults> listener) {
-        deploymentManager.infer(task, doc, timeout, listener);
+        deploymentManager.infer(task, config, doc, timeout, listener);
     }
 
     public Optional<ModelStats> modelStats(TrainedModelDeploymentTask task) {

+ 16 - 4
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/deployment/DeploymentManager.java

@@ -33,6 +33,7 @@ import org.elasticsearch.xpack.core.ml.inference.TrainedModelConfig;
 import org.elasticsearch.xpack.core.ml.inference.TrainedModelInput;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.IndexLocation;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TrainedModelLocation;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.VocabularyConfig;
@@ -131,6 +132,7 @@ public class DeploymentManager {
 
                 assert modelConfig.getInferenceConfig() instanceof NlpConfig;
                 NlpConfig nlpConfig = (NlpConfig) modelConfig.getInferenceConfig();
+                task.init(nlpConfig);
 
                 SearchRequest searchRequest = vocabSearchRequest(nlpConfig.getVocabularyConfig(), modelConfig.getModelId());
                 executeAsyncWithOrigin(client, ML_ORIGIN, SearchAction.INSTANCE, searchRequest, ActionListener.wrap(
@@ -203,7 +205,9 @@ public class DeploymentManager {
     }
 
     public void infer(TrainedModelDeploymentTask task,
-                      Map<String, Object> doc, TimeValue timeout,
+                      InferenceConfig config,
+                      Map<String, Object> doc,
+                      TimeValue timeout,
                       ActionListener<InferenceResults> listener) {
         if (task.isStopped()) {
             listener.onFailure(
@@ -240,12 +244,20 @@ public class DeploymentManager {
                     List<String> text = Collections.singletonList(NlpTask.extractInput(processContext.modelInput.get(), doc));
                     NlpTask.Processor processor = processContext.nlpTaskProcessor.get();
                     processor.validateInputs(text);
-                    NlpTask.Request request = processor.getRequestBuilder().buildRequest(text, requestId);
+                    assert config instanceof NlpConfig;
+                    NlpTask.Request request = processor.getRequestBuilder((NlpConfig) config).buildRequest(text, requestId);
                     logger.trace(() -> "Inference Request "+ request.processInput.utf8ToString());
                     PyTorchResultProcessor.PendingResult pendingResult = processContext.resultProcessor.registerRequest(requestId);
                     processContext.process.get().writeInferenceRequest(request.processInput);
-                    waitForResult(processContext, pendingResult, request.tokenization, requestId, timeout, processor.getResultProcessor(),
-                        listener);
+                    waitForResult(
+                        processContext,
+                        pendingResult,
+                        request.tokenization,
+                        requestId,
+                        timeout,
+                        processor.getResultProcessor((NlpConfig) config),
+                        listener
+                    );
                 } catch (IOException e) {
                     logger.error(new ParameterizedMessage("[{}] error writing to process", processContext.modelId), e);
                     onFailure(ExceptionsHelper.serverError("error writing to process", e));

+ 26 - 2
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/deployment/TrainedModelDeploymentTask.java

@@ -18,6 +18,8 @@ import org.elasticsearch.xpack.core.ml.MlTasks;
 import org.elasticsearch.xpack.core.ml.action.StartTrainedModelDeploymentAction;
 import org.elasticsearch.xpack.core.ml.action.StartTrainedModelDeploymentAction.TaskParams;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfigUpdate;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
 import org.elasticsearch.xpack.ml.inference.allocation.TrainedModelAllocationNodeService;
 
@@ -32,6 +34,7 @@ public class TrainedModelDeploymentTask extends CancellableTask implements Start
     private final TrainedModelAllocationNodeService trainedModelAllocationNodeService;
     private volatile boolean stopped;
     private final SetOnce<String> stoppedReason = new SetOnce<>();
+    private final SetOnce<InferenceConfig> inferenceConfig = new SetOnce<>();
 
     public TrainedModelDeploymentTask(
         long id,
@@ -50,6 +53,10 @@ public class TrainedModelDeploymentTask extends CancellableTask implements Start
         );
     }
 
+    void init(InferenceConfig inferenceConfig) {
+        this.inferenceConfig.set(inferenceConfig);
+    }
+
     public String getModelId() {
         return params.getModelId();
     }
@@ -85,8 +92,25 @@ public class TrainedModelDeploymentTask extends CancellableTask implements Start
         stop(reason);
     }
 
-    public void infer(Map<String, Object> doc, TimeValue timeout, ActionListener<InferenceResults> listener) {
-        trainedModelAllocationNodeService.infer(this, doc, timeout, listener);
+    public void infer(Map<String, Object> doc, InferenceConfigUpdate update, TimeValue timeout, ActionListener<InferenceResults> listener) {
+        if (inferenceConfig.get() == null) {
+            listener.onFailure(
+                ExceptionsHelper.badRequestException("[{}] inference not possible against uninitialized model", params.getModelId())
+            );
+            return;
+        }
+        if (update.isSupported(inferenceConfig.get()) == false) {
+            listener.onFailure(
+                ExceptionsHelper.badRequestException(
+                    "[{}] inference not possible. Task is configured with [{}] but received update of type [{}]",
+                    params.getModelId(),
+                    inferenceConfig.get().getName(),
+                    update.getName()
+                )
+            );
+            return;
+        }
+        trainedModelAllocationNodeService.infer(this, update.apply(inferenceConfig.get()), doc, timeout, listener);
     }
 
     public Optional<ModelStats> modelStats() {

+ 7 - 1
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ingest/InferenceProcessor.java

@@ -37,6 +37,8 @@ import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.InferenceConfigUpdate;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.RegressionConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.RegressionConfigUpdate;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfigUpdate;
 import org.elasticsearch.xpack.core.ml.job.messages.Messages;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
 import org.elasticsearch.xpack.ml.inference.loadingservice.LocalModel;
@@ -358,7 +360,11 @@ public class InferenceProcessor extends AbstractProcessor {
             } else if (configMap.containsKey(RegressionConfig.NAME.getPreferredName())) {
                 checkSupportedVersion(RegressionConfig.EMPTY_PARAMS);
                 return RegressionConfigUpdate.fromMap(valueMap);
-            } else {
+            } else if (configMap.containsKey(ZeroShotClassificationConfig.NAME)) {
+                checkSupportedVersion(new ZeroShotClassificationConfig(List.of("unused"), null, null, null, null, null));
+                return ZeroShotClassificationConfigUpdate.fromMap(valueMap);
+            }
+            else {
                 throw ExceptionsHelper.badRequestException("unrecognized inference configuration type {}. Supported types {}",
                     configMap.keySet(),
                     Arrays.asList(ClassificationConfig.NAME.getPreferredName(), RegressionConfig.NAME.getPreferredName()));

+ 13 - 1
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/BertRequestBuilder.java

@@ -15,6 +15,7 @@ import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.TokenizationResult;
 
 import java.io.IOException;
 import java.util.List;
+import java.util.stream.Collectors;
 
 public class BertRequestBuilder implements NlpTask.RequestBuilder {
 
@@ -37,7 +38,18 @@ public class BertRequestBuilder implements NlpTask.RequestBuilder {
                 " token in its vocabulary");
         }
 
-        TokenizationResult tokenization = tokenizer.tokenize(inputs);
+        TokenizationResult tokenization = tokenizer.buildTokenizationResult(
+            inputs.stream().map(tokenizer::tokenize).collect(Collectors.toList())
+        );
+        return buildRequest(tokenization, requestId);
+    }
+
+    @Override
+    public NlpTask.Request buildRequest(TokenizationResult tokenization, String requestId) throws IOException {
+        if (tokenizer.getPadToken().isEmpty()) {
+            throw new IllegalStateException("The input tokenizer does not have a " + BertTokenizer.PAD_TOKEN +
+                " token in its vocabulary");
+        }
         return new NlpTask.Request(tokenization, jsonRequest(tokenization, tokenizer.getPadToken().getAsInt(), requestId));
     }
 

+ 6 - 4
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/FillMaskProcessor.java

@@ -10,12 +10,14 @@ package org.elasticsearch.xpack.ml.inference.nlp;
 import org.elasticsearch.xpack.core.ml.inference.results.FillMaskResults;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.FillMaskConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.ml.inference.deployment.PyTorchResult;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.BertTokenizer;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.TokenizationResult;
 
 import java.util.ArrayList;
+import java.util.Arrays;
 import java.util.Collections;
 import java.util.List;
 
@@ -49,23 +51,23 @@ public class FillMaskProcessor implements NlpTask.Processor {
     }
 
     @Override
-    public NlpTask.RequestBuilder getRequestBuilder() {
+    public NlpTask.RequestBuilder getRequestBuilder(NlpConfig config) {
         return requestBuilder;
     }
 
     @Override
-    public NlpTask.ResultProcessor getResultProcessor() {
+    public NlpTask.ResultProcessor getResultProcessor(NlpConfig config) {
         return this::processResult;
     }
 
     InferenceResults processResult(TokenizationResult tokenization, PyTorchResult pyTorchResult) {
 
         if (tokenization.getTokenizations().isEmpty() ||
-            tokenization.getTokenizations().get(0).getTokens().isEmpty()) {
+            tokenization.getTokenizations().get(0).getTokens().length == 0) {
             return new FillMaskResults(Collections.emptyList());
         }
 
-        int maskTokenIndex = tokenization.getTokenizations().get(0).getTokens().indexOf(BertTokenizer.MASK_TOKEN);
+        int maskTokenIndex = Arrays.asList(tokenization.getTokenizations().get(0).getTokens()).indexOf(BertTokenizer.MASK_TOKEN);
         // TODO - process all results in the batch
         double[] normalizedScores = NlpHelpers.convertToProbabilitiesBySoftMax(pyTorchResult.getInferenceResult()[0][maskTokenIndex]);
 

+ 8 - 7
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessor.java

@@ -13,6 +13,7 @@ import org.elasticsearch.common.io.stream.Writeable;
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.results.NerResults;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NerConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.ml.inference.deployment.PyTorchResult;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.TokenizationResult;
@@ -124,12 +125,12 @@ public class NerProcessor implements NlpTask.Processor {
     }
 
     @Override
-    public NlpTask.RequestBuilder getRequestBuilder() {
+    public NlpTask.RequestBuilder getRequestBuilder(NlpConfig config) {
         return requestBuilder;
     }
 
     @Override
-    public NlpTask.ResultProcessor getResultProcessor() {
+    public NlpTask.ResultProcessor getResultProcessor(NlpConfig config) {
         return new NerResultProcessor(iobMap);
     }
 
@@ -143,7 +144,7 @@ public class NerProcessor implements NlpTask.Processor {
         @Override
         public InferenceResults processResult(TokenizationResult tokenization, PyTorchResult pyTorchResult) {
             if (tokenization.getTokenizations().isEmpty() ||
-                tokenization.getTokenizations().get(0).getTokens().isEmpty()) {
+                tokenization.getTokenizations().get(0).getTokens().length == 0) {
                 return new NerResults(Collections.emptyList());
             }
             // TODO - process all results in the batch
@@ -171,7 +172,7 @@ public class NerProcessor implements NlpTask.Processor {
                                            IobTag[] iobMap) {
             List<TaggedToken> taggedTokens = new ArrayList<>();
             int startTokenIndex = 0;
-            while (startTokenIndex < tokenization.getTokens().size()) {
+            while (startTokenIndex < tokenization.getTokens().length) {
                 int inputMapping = tokenization.getTokenMap()[startTokenIndex];
                 if (inputMapping < 0) {
                     // This token does not map to a token in the input (special tokens)
@@ -179,14 +180,14 @@ public class NerProcessor implements NlpTask.Processor {
                     continue;
                 }
                 int endTokenIndex = startTokenIndex;
-                StringBuilder word = new StringBuilder(tokenization.getTokens().get(startTokenIndex));
-                while (endTokenIndex < tokenization.getTokens().size() - 1
+                StringBuilder word = new StringBuilder(tokenization.getTokens()[startTokenIndex]);
+                while (endTokenIndex < tokenization.getTokens().length - 1
                     && tokenization.getTokenMap()[endTokenIndex + 1] == inputMapping) {
                     endTokenIndex++;
                     // TODO Here we try to get rid of the continuation hashes at the beginning of sub-tokens.
                     // It is probably more correct to implement detokenization on the tokenizer
                     // that does reverse lookup based on token IDs.
-                    String endTokenWord = tokenization.getTokens().get(endTokenIndex).substring(2);
+                    String endTokenWord = tokenization.getTokens()[endTokenIndex].substring(2);
                     word.append(endTokenWord);
                 }
                 double[] avgScores = Arrays.copyOf(scores[startTokenIndex], iobMap.length);

+ 4 - 6
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NlpTask.java

@@ -56,6 +56,8 @@ public class NlpTask {
 
         Request buildRequest(List<String> inputs, String requestId) throws IOException;
 
+        Request buildRequest(TokenizationResult tokenizationResult, String requestId) throws IOException;
+
         static void writePaddedTokens(String fieldName,
                                       TokenizationResult tokenization,
                                       int padToken,
@@ -97,10 +99,6 @@ public class NlpTask {
         InferenceResults processResult(TokenizationResult tokenization, PyTorchResult pyTorchResult);
     }
 
-    public interface ResultProcessorFactory {
-        ResultProcessor build(TokenizationResult tokenizationResult);
-    }
-
     public interface Processor {
         /**
          * Validate the task input string.
@@ -110,8 +108,8 @@ public class NlpTask {
          */
         void validateInputs(List<String> inputs);
 
-        RequestBuilder getRequestBuilder();
-        ResultProcessor getResultProcessor();
+        RequestBuilder getRequestBuilder(NlpConfig config);
+        ResultProcessor getResultProcessor(NlpConfig config);
     }
 
     public static String extractInput(TrainedModelInput input, Map<String, Object> doc) {

+ 3 - 2
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/PassThroughProcessor.java

@@ -9,6 +9,7 @@ package org.elasticsearch.xpack.ml.inference.nlp;
 
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.results.PyTorchPassThroughResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.PassThroughConfig;
 import org.elasticsearch.xpack.ml.inference.deployment.PyTorchResult;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
@@ -34,12 +35,12 @@ public class PassThroughProcessor implements NlpTask.Processor {
     }
 
     @Override
-    public NlpTask.RequestBuilder getRequestBuilder() {
+    public NlpTask.RequestBuilder getRequestBuilder(NlpConfig config) {
         return requestBuilder;
     }
 
     @Override
-    public NlpTask.ResultProcessor getResultProcessor() {
+    public NlpTask.ResultProcessor getResultProcessor(NlpConfig config) {
         return PassThroughProcessor::processResult;
     }
 

+ 7 - 0
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/TaskType.java

@@ -13,6 +13,7 @@ import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NerConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextClassificationConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextEmbeddingConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfig;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
 
 import java.util.Locale;
@@ -48,6 +49,12 @@ public enum TaskType {
         public NlpTask.Processor createProcessor(NlpTokenizer tokenizer, NlpConfig config) {
             return new TextEmbeddingProcessor(tokenizer, (TextEmbeddingConfig) config);
         }
+    },
+    ZERO_SHOT_CLASSIFICATION {
+        @Override
+        public NlpTask.Processor createProcessor(NlpTokenizer tokenizer, NlpConfig config) {
+            return new ZeroShotClassificationProcessor(tokenizer, (ZeroShotClassificationConfig) config);
+        }
     };
 
     public NlpTask.Processor createProcessor(NlpTokenizer tokenizer, NlpConfig config) {

+ 3 - 2
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/TextClassificationProcessor.java

@@ -13,6 +13,7 @@ import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.results.TextClassificationResults;
 import org.elasticsearch.xpack.core.ml.inference.results.TopClassEntry;
 import org.elasticsearch.xpack.core.ml.inference.results.WarningInferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextClassificationConfig;
 import org.elasticsearch.xpack.ml.inference.deployment.PyTorchResult;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
@@ -73,12 +74,12 @@ public class TextClassificationProcessor implements NlpTask.Processor {
     }
 
     @Override
-    public NlpTask.RequestBuilder getRequestBuilder() {
+    public NlpTask.RequestBuilder getRequestBuilder(NlpConfig config) {
         return requestBuilder;
     }
 
     @Override
-    public NlpTask.ResultProcessor getResultProcessor() {
+    public NlpTask.ResultProcessor getResultProcessor(NlpConfig config) {
         return this::processResult;
     }
 

+ 3 - 2
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/TextEmbeddingProcessor.java

@@ -9,6 +9,7 @@ package org.elasticsearch.xpack.ml.inference.nlp;
 
 import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
 import org.elasticsearch.xpack.core.ml.inference.results.TextEmbeddingResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextEmbeddingConfig;
 import org.elasticsearch.xpack.ml.inference.deployment.PyTorchResult;
 import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
@@ -33,12 +34,12 @@ public class TextEmbeddingProcessor implements NlpTask.Processor {
     }
 
     @Override
-    public NlpTask.RequestBuilder getRequestBuilder() {
+    public NlpTask.RequestBuilder getRequestBuilder(NlpConfig config) {
         return requestBuilder;
     }
 
     @Override
-    public NlpTask.ResultProcessor getResultProcessor() {
+    public NlpTask.ResultProcessor getResultProcessor(NlpConfig config) {
         return TextEmbeddingProcessor::processResult;
     }
 

+ 194 - 0
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/ZeroShotClassificationProcessor.java

@@ -0,0 +1,194 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.ml.inference.nlp;
+
+import org.elasticsearch.common.logging.LoggerMessageFormat;
+import org.elasticsearch.xpack.core.ml.inference.results.InferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.results.TextClassificationResults;
+import org.elasticsearch.xpack.core.ml.inference.results.TopClassEntry;
+import org.elasticsearch.xpack.core.ml.inference.results.WarningInferenceResults;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig;
+import org.elasticsearch.xpack.core.ml.inference.trainedmodel.ZeroShotClassificationConfig;
+import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
+import org.elasticsearch.xpack.ml.inference.deployment.PyTorchResult;
+import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.NlpTokenizer;
+import org.elasticsearch.xpack.ml.inference.nlp.tokenizers.TokenizationResult;
+
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.Comparator;
+import java.util.List;
+import java.util.Locale;
+import java.util.Optional;
+import java.util.stream.Collectors;
+import java.util.stream.IntStream;
+
+public class ZeroShotClassificationProcessor implements NlpTask.Processor {
+
+    private final NlpTokenizer tokenizer;
+    private final int entailmentPos;
+    private final int contraPos;
+    private final String[] labels;
+    private final String hypothesisTemplate;
+    private final boolean isMultiLabel;
+
+    ZeroShotClassificationProcessor(NlpTokenizer tokenizer, ZeroShotClassificationConfig config) {
+        this.tokenizer = tokenizer;
+        List<String> lowerCased = config.getClassificationLabels()
+            .stream()
+            .map(s -> s.toLowerCase(Locale.ROOT))
+            .collect(Collectors.toList());
+        this.entailmentPos = lowerCased.indexOf("entailment");
+        this.contraPos = lowerCased.indexOf("contradiction");
+        if (entailmentPos == -1 || contraPos == -1) {
+            throw ExceptionsHelper.badRequestException(
+                "zero_shot_classification requires [entailment] and [contradiction] in classification_labels"
+            );
+        }
+        this.labels = Optional.ofNullable(config.getLabels()).orElse(List.of()).toArray(String[]::new);
+        this.hypothesisTemplate = config.getHypothesisTemplate();
+        this.isMultiLabel = config.isMultiLabel();
+    }
+
+    @Override
+    public void validateInputs(List<String> inputs) {
+        // nothing to validate
+    }
+
+    @Override
+    public NlpTask.RequestBuilder getRequestBuilder(NlpConfig nlpConfig) {
+        final String[] labels;
+        if (nlpConfig instanceof ZeroShotClassificationConfig) {
+            ZeroShotClassificationConfig zeroShotConfig = (ZeroShotClassificationConfig) nlpConfig;
+            labels = zeroShotConfig.getLabels().toArray(new String[0]);
+        } else {
+            labels = this.labels;
+        }
+        if (labels == null || labels.length == 0) {
+            throw ExceptionsHelper.badRequestException("zero_shot_classification requires non-empty [labels]");
+        }
+        return new RequestBuilder(tokenizer, labels, hypothesisTemplate);
+    }
+
+    @Override
+    public NlpTask.ResultProcessor getResultProcessor(NlpConfig nlpConfig) {
+        final String[] labels;
+        final boolean isMultiLabel;
+        if (nlpConfig instanceof ZeroShotClassificationConfig) {
+            ZeroShotClassificationConfig zeroShotConfig = (ZeroShotClassificationConfig) nlpConfig;
+            labels = zeroShotConfig.getLabels().toArray(new String[0]);
+            isMultiLabel = zeroShotConfig.isMultiLabel();
+        } else {
+            labels = this.labels;
+            isMultiLabel = this.isMultiLabel;
+        }
+        return new ResultProcessor(entailmentPos, contraPos, labels, isMultiLabel);
+    }
+
+    static class RequestBuilder implements NlpTask.RequestBuilder {
+
+        private final NlpTokenizer tokenizer;
+        private final String[] labels;
+        private final String hypothesisTemplate;
+
+        RequestBuilder(NlpTokenizer tokenizer, String[] labels, String hypothesisTemplate) {
+            this.tokenizer = tokenizer;
+            this.labels = labels;
+            this.hypothesisTemplate = hypothesisTemplate;
+        }
+
+        @Override
+        public NlpTask.Request buildRequest(List<String> inputs, String requestId) throws IOException {
+            if (inputs.size() > 1) {
+                throw new IllegalArgumentException("Unable to do zero-shot classification on more than one text input at a time");
+            }
+            List<TokenizationResult.Tokenization> tokenizations = new ArrayList<>(labels.length);
+            for (String label : labels) {
+                tokenizations.add(tokenizer.tokenize(inputs.get(0), LoggerMessageFormat.format(null, hypothesisTemplate, label)));
+            }
+            TokenizationResult result = tokenizer.buildTokenizationResult(tokenizations);
+            return buildRequest(result, requestId);
+        }
+
+        @Override
+        public NlpTask.Request buildRequest(TokenizationResult tokenizationResult, String requestId) throws IOException {
+            return tokenizer.requestBuilder().buildRequest(tokenizationResult, requestId);
+        }
+    }
+
+    static class ResultProcessor implements NlpTask.ResultProcessor {
+        private final int entailmentPos;
+        private final int contraPos;
+        private final String[] labels;
+        private final boolean isMultiLabel;
+
+        ResultProcessor(int entailmentPos, int contraPos, String[] labels, boolean isMultiLabel) {
+            this.entailmentPos = entailmentPos;
+            this.contraPos = contraPos;
+            this.labels = labels;
+            this.isMultiLabel = isMultiLabel;
+        }
+
+        @Override
+        public InferenceResults processResult(TokenizationResult tokenization, PyTorchResult pyTorchResult) {
+            if (pyTorchResult.getInferenceResult().length < 1) {
+                return new WarningInferenceResults("Zero shot classification result has no data");
+            }
+            // TODO only the first entry in the batch result is verified and
+            // checked. Implement for all in batch
+            if (pyTorchResult.getInferenceResult()[0].length != labels.length) {
+                return new WarningInferenceResults(
+                    "Expected exactly [{}] values in zero shot classification result; got [{}]",
+                    labels.length,
+                    pyTorchResult.getInferenceResult()[0].length
+                );
+            }
+            final double[] normalizedScores;
+            if (isMultiLabel) {
+                normalizedScores = new double[pyTorchResult.getInferenceResult()[0].length];
+                int v = 0;
+                for (double[] vals : pyTorchResult.getInferenceResult()[0]) {
+                    if (vals.length != 3) {
+                        return new WarningInferenceResults(
+                            "Expected exactly [{}] values in inner zero shot classification result; got [{}]",
+                            3,
+                            vals.length
+                        );
+                    }
+                    // assume entailment is `0`, softmax between entailment and contradiction
+                    normalizedScores[v++] = NlpHelpers.convertToProbabilitiesBySoftMax(
+                        new double[]{vals[entailmentPos], vals[contraPos]}
+                    )[0];
+                }
+            } else {
+                double[] entailmentScores = new double[pyTorchResult.getInferenceResult()[0].length];
+                int v = 0;
+                for (double[] vals : pyTorchResult.getInferenceResult()[0]) {
+                    if (vals.length != 3) {
+                        return new WarningInferenceResults(
+                            "Expected exactly [{}] values in inner zero shot classification result; got [{}]",
+                            3,
+                            vals.length
+                        );
+                    }
+                    entailmentScores[v++] = vals[entailmentPos];
+                }
+                normalizedScores = NlpHelpers.convertToProbabilitiesBySoftMax(entailmentScores);
+            }
+
+            return new TextClassificationResults(
+                IntStream.range(0, normalizedScores.length)
+                    .mapToObj(i -> new TopClassEntry(labels[i], normalizedScores[i]))
+                    // Put the highest scoring class first
+                    .sorted(Comparator.comparing(TopClassEntry::getProbability).reversed())
+                    .limit(labels.length)
+                    .collect(Collectors.toList())
+            );
+        }
+    }
+}

+ 110 - 52
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/BertTokenizer.java

@@ -7,6 +7,7 @@
 package org.elasticsearch.xpack.ml.inference.nlp.tokenizers;
 
 import org.elasticsearch.common.util.set.Sets;
+import org.elasticsearch.core.Tuple;
 import org.elasticsearch.xpack.core.ml.inference.trainedmodel.Tokenization;
 import org.elasticsearch.xpack.core.ml.utils.ExceptionsHelper;
 import org.elasticsearch.xpack.ml.inference.nlp.BertRequestBuilder;
@@ -76,74 +77,63 @@ public class BertTokenizer implements NlpTokenizer {
         this.requestBuilder = requestBuilderFactory.apply(this);
     }
 
+    @Override
+    public OptionalInt getPadToken() {
+        Integer pad = vocab.get(PAD_TOKEN);
+        if (pad != null) {
+            return OptionalInt.of(pad);
+        } else {
+            return OptionalInt.empty();
+        }
+    }
+
+    @Override
+    public TokenizationResult buildTokenizationResult(List<TokenizationResult.Tokenization> tokenizations) {
+        TokenizationResult tokenizationResult = new TokenizationResult(originalVocab);
+        for (TokenizationResult.Tokenization tokenization : tokenizations) {
+            tokenizationResult.addTokenization(tokenization);
+        }
+        return tokenizationResult;
+    }
+
     /**
-     * Tokenize the list of inputs according to the basic tokenization
+     * Tokenize the input according to the basic tokenization
      * options then perform Word Piece tokenization with the given vocabulary.
      *
      * The result is the Word Piece tokens, a map of the Word Piece
      * token position to the position of the token in the source for
      * each input string grouped into a {@link Tokenization}.
      *
-     * @param text Text to tokenize
+     * @param seq Text to tokenize
      * @return A {@link Tokenization}
      */
     @Override
-    public TokenizationResult tokenize(List<String> text) {
-        TokenizationResult tokenization = new TokenizationResult(originalVocab);
-
-        for (String input: text) {
-            addTokenization(tokenization, input);
-        }
-        return tokenization;
-    }
-
-
-    private void addTokenization(TokenizationResult tokenization, String text) {
-        BasicTokenizer basicTokenizer = new BasicTokenizer(doLowerCase, doTokenizeCjKChars, doStripAccents, neverSplit);
-
-        List<String> delineatedTokens = basicTokenizer.tokenize(text);
-        List<WordPieceTokenizer.TokenAndId> wordPieceTokens = new ArrayList<>();
-        List<Integer> tokenPositionMap = new ArrayList<>();
-        if (withSpecialTokens) {
-            // insert the first token to simplify the loop counter logic later
-            tokenPositionMap.add(SPECIAL_TOKEN_POSITION);
-        }
-
-        for (int sourceIndex = 0; sourceIndex < delineatedTokens.size(); sourceIndex++) {
-            String token = delineatedTokens.get(sourceIndex);
-            if (neverSplit.contains(token)) {
-                wordPieceTokens.add(new WordPieceTokenizer.TokenAndId(token, vocab.getOrDefault(token, vocab.get(UNKNOWN_TOKEN))));
-                tokenPositionMap.add(sourceIndex);
-            } else {
-                List<WordPieceTokenizer.TokenAndId> tokens = wordPieceTokenizer.tokenize(token);
-                for (int tokenCount = 0; tokenCount < tokens.size(); tokenCount++) {
-                    tokenPositionMap.add(sourceIndex);
-                }
-                wordPieceTokens.addAll(tokens);
-            }
-        }
-
+    public TokenizationResult.Tokenization tokenize(String seq) {
+        var innerResult = innerTokenize(seq);
+        List<WordPieceTokenizer.TokenAndId> wordPieceTokens = innerResult.v1();
+        List<Integer> tokenPositionMap = innerResult.v2();
         int numTokens = withSpecialTokens ? wordPieceTokens.size() + 2 : wordPieceTokens.size();
-        List<String> tokens = new ArrayList<>(numTokens);
-        int [] tokenIds = new int[numTokens];
-        int [] tokenMap = new int[numTokens];
+        String[] tokens = new String[numTokens];
+        int[] tokenIds = new int[numTokens];
+        int[] tokenMap = new int[numTokens];
 
         if (withSpecialTokens) {
-            tokens.add(CLASS_TOKEN);
+            tokens[0] = CLASS_TOKEN;
             tokenIds[0] = vocab.get(CLASS_TOKEN);
             tokenMap[0] = SPECIAL_TOKEN_POSITION;
         }
 
         int i = withSpecialTokens ? 1 : 0;
+        final int decrementHandler = withSpecialTokens ? 1 : 0;
         for (WordPieceTokenizer.TokenAndId tokenAndId : wordPieceTokens) {
-            tokens.add(tokenAndId.getToken());
+            tokens[i] = tokenAndId.getToken();
             tokenIds[i] = tokenAndId.getId();
-            tokenMap[i] = tokenPositionMap.get(i);
+            tokenMap[i] = tokenPositionMap.get(i-decrementHandler);
             i++;
         }
 
         if (withSpecialTokens) {
-            tokens.add(SEPARATOR_TOKEN);
+            tokens[i] = SEPARATOR_TOKEN;
             tokenIds[i] = vocab.get(SEPARATOR_TOKEN);
             tokenMap[i] = SPECIAL_TOKEN_POSITION;
         }
@@ -155,18 +145,86 @@ public class BertTokenizer implements NlpTokenizer {
                 maxSequenceLength
             );
         }
-
-        tokenization.addTokenization(text, tokens, tokenIds, tokenMap);
+        return new TokenizationResult.Tokenization(seq, tokens, tokenIds, tokenMap);
     }
 
     @Override
-    public OptionalInt getPadToken() {
-        Integer pad = vocab.get(PAD_TOKEN);
-        if (pad != null) {
-            return OptionalInt.of(pad);
-        } else {
-            return OptionalInt.empty();
+    public TokenizationResult.Tokenization tokenize(String seq1, String seq2) {
+        var innerResult = innerTokenize(seq1);
+        List<WordPieceTokenizer.TokenAndId> wordPieceTokenSeq1s = innerResult.v1();
+        List<Integer> tokenPositionMapSeq1 = innerResult.v2();
+        innerResult = innerTokenize(seq2);
+        List<WordPieceTokenizer.TokenAndId> wordPieceTokenSeq2s = innerResult.v1();
+        List<Integer> tokenPositionMapSeq2 = innerResult.v2();
+        if (withSpecialTokens == false)  {
+            throw new IllegalArgumentException("Unable to do sequence pair tokenization without special tokens");
+        }
+        // [CLS] seq1 [SEP] seq2 [SEP]
+        int numTokens = wordPieceTokenSeq1s.size() + wordPieceTokenSeq2s.size() + 3;
+        String[] tokens = new String[numTokens];
+        int[] tokenIds = new int[numTokens];
+        int[] tokenMap = new int[numTokens];
+
+        tokens[0] = CLASS_TOKEN;
+        tokenIds[0] = vocab.get(CLASS_TOKEN);
+        tokenMap[0] = SPECIAL_TOKEN_POSITION;
+
+        int i = 1;
+        for (WordPieceTokenizer.TokenAndId tokenAndId : wordPieceTokenSeq1s) {
+            tokens[i] = tokenAndId.getToken();
+            tokenIds[i] = tokenAndId.getId();
+            tokenMap[i] = tokenPositionMapSeq1.get(i - 1);
+            i++;
+        }
+        tokens[i] = SEPARATOR_TOKEN;
+        tokenIds[i] = vocab.get(SEPARATOR_TOKEN);
+        tokenMap[i] = SPECIAL_TOKEN_POSITION;
+        ++i;
+
+        int j = 0;
+        for (WordPieceTokenizer.TokenAndId tokenAndId : wordPieceTokenSeq2s) {
+            tokens[i] = tokenAndId.getToken();
+            tokenIds[i] = tokenAndId.getId();
+            tokenMap[i] = tokenPositionMapSeq2.get(j);
+            i++;
+            j++;
+        }
+
+        tokens[i] = SEPARATOR_TOKEN;
+        tokenIds[i] = vocab.get(SEPARATOR_TOKEN);
+        tokenMap[i] = SPECIAL_TOKEN_POSITION;
+
+        // TODO handle seq1 truncation
+        if (tokenIds.length > maxSequenceLength) {
+            throw ExceptionsHelper.badRequestException(
+                "Input too large. The tokenized input length [{}] exceeds the maximum sequence length [{}]",
+                tokenIds.length,
+                maxSequenceLength
+            );
+        }
+        return new TokenizationResult.Tokenization(seq1 + seq2, tokens, tokenIds, tokenMap);
+    }
+
+    private Tuple<List<WordPieceTokenizer.TokenAndId>, List<Integer>> innerTokenize(String seq) {
+        BasicTokenizer basicTokenizer = new BasicTokenizer(doLowerCase, doTokenizeCjKChars, doStripAccents, neverSplit);
+        List<String> delineatedTokens = basicTokenizer.tokenize(seq);
+        List<WordPieceTokenizer.TokenAndId> wordPieceTokens = new ArrayList<>();
+        List<Integer> tokenPositionMap = new ArrayList<>();
+
+        for (int sourceIndex = 0; sourceIndex < delineatedTokens.size(); sourceIndex++) {
+            String token = delineatedTokens.get(sourceIndex);
+            if (neverSplit.contains(token)) {
+                wordPieceTokens.add(new WordPieceTokenizer.TokenAndId(token, vocab.getOrDefault(token, vocab.get(UNKNOWN_TOKEN))));
+                tokenPositionMap.add(sourceIndex);
+            } else {
+                List<WordPieceTokenizer.TokenAndId> tokens = wordPieceTokenizer.tokenize(token);
+                for (int tokenCount = 0; tokenCount < tokens.size(); tokenCount++) {
+                    tokenPositionMap.add(sourceIndex);
+                }
+                wordPieceTokens.addAll(tokens);
+            }
         }
+        return Tuple.tuple(wordPieceTokens, tokenPositionMap);
     }
 
     @Override

+ 5 - 1
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/NlpTokenizer.java

@@ -22,7 +22,11 @@ import static org.elasticsearch.xpack.core.ml.inference.trainedmodel.NlpConfig.V
 
 public interface NlpTokenizer {
 
-    TokenizationResult tokenize(List<String> text);
+    TokenizationResult buildTokenizationResult(List<TokenizationResult.Tokenization> tokenizations);
+
+    TokenizationResult.Tokenization tokenize(String seq);
+
+    TokenizationResult.Tokenization tokenize(String seq1, String seq2);
 
     NlpTask.RequestBuilder requestBuilder();
 

+ 13 - 8
x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/TokenizationResult.java

@@ -29,26 +29,31 @@ public class TokenizationResult {
         return tokenizations;
     }
 
-    public void addTokenization(String input, List<String> tokens, int[] tokenIds, int[] tokenMap) {
+    public void addTokenization(String input, String[] tokens, int[] tokenIds, int[] tokenMap) {
         maxLength = Math.max(maxLength, tokenIds.length);
         tokenizations.add(new Tokenization(input, tokens, tokenIds, tokenMap));
     }
 
+    public void addTokenization(Tokenization tokenization) {
+        maxLength = Math.max(maxLength, tokenization.tokenIds.length);
+        tokenizations.add(tokenization);
+    }
+
     public int getLongestSequenceLength() {
         return maxLength;
     }
 
     public static class Tokenization {
 
-        String input;
-        private final List<String> tokens;
+        private final String inputSeqs;
+        private final String[] tokens;
         private final int[] tokenIds;
         private final int[] tokenMap;
 
-        public Tokenization(String input, List<String> tokens, int[] tokenIds, int[] tokenMap) {
-            assert tokens.size() == tokenIds.length;
+        public Tokenization(String input, String[] tokens, int[] tokenIds, int[] tokenMap) {
+            assert tokens.length == tokenIds.length;
             assert tokenIds.length == tokenMap.length;
-            this.input = input;
+            this.inputSeqs = input;
             this.tokens = tokens;
             this.tokenIds = tokenIds;
             this.tokenMap = tokenMap;
@@ -59,7 +64,7 @@ public class TokenizationResult {
          *
          * @return A list of tokens
          */
-        public List<String> getTokens() {
+        public String[] getTokens() {
             return tokens;
         }
 
@@ -84,7 +89,7 @@ public class TokenizationResult {
         }
 
         public String getInput() {
-            return input;
+            return inputSeqs;
         }
     }
 }

+ 2 - 2
x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/FillMaskProcessorTests.java

@@ -41,7 +41,7 @@ public class FillMaskProcessorTests extends ESTestCase {
         String input = "The capital of " + BertTokenizer.MASK_TOKEN + " is Paris";
 
         List<String> vocab = Arrays.asList("The", "capital", "of", BertTokenizer.MASK_TOKEN, "is", "Paris", "France");
-        List<String> tokens = Arrays.asList(input.split(" "));
+        String[] tokens = input.split(" ");
         int[] tokenMap = new int[] {0, 1, 2, 3, 4, 5};
         int[] tokenIds = new int[] {0, 1, 2, 3, 4, 5};
 
@@ -68,7 +68,7 @@ public class FillMaskProcessorTests extends ESTestCase {
 
     public void testProcessResults_GivenMissingTokens() {
         TokenizationResult tokenization = new TokenizationResult(Collections.emptyList());
-        tokenization.addTokenization("", Collections.emptyList(), new int[] {}, new int[] {});
+        tokenization.addTokenization("", new String[]{}, new int[] {}, new int[] {});
 
         FillMaskConfig config = new FillMaskConfig(new VocabularyConfig("test-index"), null);
         FillMaskProcessor processor = new FillMaskProcessor(mock(BertTokenizer.class), config);

+ 1 - 1
x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessorTests.java

@@ -222,6 +222,6 @@ public class NerProcessorTests extends ESTestCase {
             vocab,
             new BertTokenization(true, false, null)
         ).setDoLowerCase(true).setWithSpecialTokens(false).build();
-        return tokenizer.tokenize(List.of(input));
+        return tokenizer.buildTokenizationResult(List.of(tokenizer.tokenize(input)));
     }
 }

+ 1 - 1
x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/TextClassificationProcessorTests.java

@@ -65,7 +65,7 @@ public class TextClassificationProcessorTests extends ESTestCase {
         TextClassificationConfig config = new TextClassificationConfig(new VocabularyConfig("test-index"), null, null, null);
         TextClassificationProcessor processor = new TextClassificationProcessor(tokenizer, config);
 
-        NlpTask.Request request = processor.getRequestBuilder().buildRequest(List.of("Elasticsearch fun"), "request1");
+        NlpTask.Request request = processor.getRequestBuilder(config).buildRequest(List.of("Elasticsearch fun"), "request1");
 
         Map<String, Object> jsonDocAsMap = XContentHelper.convertToMap(request.processInput, true, XContentType.JSON).v2();
 

+ 78 - 34
x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/inference/nlp/tokenizers/BertTokenizerTests.java

@@ -15,7 +15,7 @@ import java.util.Arrays;
 import java.util.Collections;
 import java.util.List;
 
-import static org.hamcrest.Matchers.contains;
+import static org.hamcrest.Matchers.arrayContaining;
 import static org.hamcrest.Matchers.hasSize;
 
 public class BertTokenizerTests extends ESTestCase {
@@ -26,9 +26,8 @@ public class BertTokenizerTests extends ESTestCase {
             new BertTokenization(null, false, null)
         ).build();
 
-        TokenizationResult tr = tokenizer.tokenize(List.of("Elasticsearch fun"));
-        TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-        assertThat(tokenization.getTokens(), contains("Elastic", "##search", "fun"));
+        TokenizationResult.Tokenization tokenization = tokenizer.tokenize("Elasticsearch fun");
+        assertThat(tokenization.getTokens(), arrayContaining("Elastic", "##search", "fun"));
         assertArrayEquals(new int[] {0, 1, 2}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0, 1}, tokenization.getTokenMap());
     }
@@ -39,9 +38,8 @@ public class BertTokenizerTests extends ESTestCase {
             Tokenization.createDefault()
         ).build();
 
-        TokenizationResult tr = tokenizer.tokenize(List.of("elasticsearch fun"));
-        TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-        assertThat(tokenization.getTokens(), contains("[CLS]", "elastic", "##search", "fun", "[SEP]"));
+        TokenizationResult.Tokenization tokenization = tokenizer.tokenize("elasticsearch fun");
+        assertThat(tokenization.getTokens(), arrayContaining("[CLS]", "elastic", "##search", "fun", "[SEP]"));
         assertArrayEquals(new int[] {3, 0, 1, 2, 4}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {-1, 0, 0, 1, -1}, tokenization.getTokenMap());
     }
@@ -56,9 +54,8 @@ public class BertTokenizerTests extends ESTestCase {
          .setWithSpecialTokens(false)
          .build();
 
-        TokenizationResult tr = tokenizer.tokenize(List.of("Elasticsearch " + specialToken + " fun"));
-        TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-        assertThat(tokenization.getTokens(), contains("Elastic", "##search", specialToken, "fun"));
+        TokenizationResult.Tokenization tokenization = tokenizer.tokenize("Elasticsearch " + specialToken + " fun");
+        assertThat(tokenization.getTokens(), arrayContaining("Elastic", "##search", specialToken, "fun"));
         assertArrayEquals(new int[] {0, 1, 3, 2}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0, 1, 2}, tokenization.getTokenMap());
     }
@@ -72,15 +69,13 @@ public class BertTokenizerTests extends ESTestCase {
              .setWithSpecialTokens(false)
              .build();
 
-            TokenizationResult tr = tokenizer.tokenize(List.of("Elasticsearch fun"));
-            TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-            assertThat(tokenization.getTokens(), contains(BertTokenizer.UNKNOWN_TOKEN, "fun"));
+            TokenizationResult.Tokenization tokenization = tokenizer.tokenize("Elasticsearch fun");
+            assertThat(tokenization.getTokens(), arrayContaining(BertTokenizer.UNKNOWN_TOKEN, "fun"));
             assertArrayEquals(new int[] {3, 2}, tokenization.getTokenIds());
             assertArrayEquals(new int[] {0, 1}, tokenization.getTokenMap());
 
-            tr = tokenizer.tokenize(List.of("elasticsearch fun"));
-            tokenization = tr.getTokenizations().get(0);
-            assertThat(tokenization.getTokens(), contains("elastic", "##search", "fun"));
+            tokenization = tokenizer.tokenize("elasticsearch fun");
+            assertThat(tokenization.getTokens(), arrayContaining("elastic", "##search", "fun"));
         }
 
         {
@@ -89,9 +84,8 @@ public class BertTokenizerTests extends ESTestCase {
                 .setWithSpecialTokens(false)
                 .build();
 
-            TokenizationResult tr = tokenizer.tokenize(List.of("Elasticsearch fun"));
-            TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-            assertThat(tokenization.getTokens(), contains("elastic", "##search", "fun"));
+            TokenizationResult.Tokenization tokenization = tokenizer.tokenize("Elasticsearch fun");
+            assertThat(tokenization.getTokens(), arrayContaining("elastic", "##search", "fun"));
         }
     }
 
@@ -101,15 +95,13 @@ public class BertTokenizerTests extends ESTestCase {
             Tokenization.createDefault()
         ).setWithSpecialTokens(false).build();
 
-        TokenizationResult tr = tokenizer.tokenize(List.of("Elasticsearch, fun."));
-        TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-        assertThat(tokenization.getTokens(), contains("Elastic", "##search", ",", "fun", "."));
+        TokenizationResult.Tokenization tokenization = tokenizer.tokenize("Elasticsearch, fun.");
+        assertThat(tokenization.getTokens(), arrayContaining("Elastic", "##search", ",", "fun", "."));
         assertArrayEquals(new int[] {0, 1, 4, 2, 3}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0, 1, 2, 3}, tokenization.getTokenMap());
 
-        tr = tokenizer.tokenize(List.of("Elasticsearch, fun [MASK]."));
-        tokenization = tr.getTokenizations().get(0);
-        assertThat(tokenization.getTokens(), contains("Elastic", "##search", ",", "fun", "[MASK]", "."));
+        tokenization = tokenizer.tokenize("Elasticsearch, fun [MASK].");
+        assertThat(tokenization.getTokens(), arrayContaining("Elastic", "##search", ",", "fun", "[MASK]", "."));
         assertArrayEquals(new int[] {0, 1, 4, 2, 5, 3}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0, 1, 2, 3, 4}, tokenization.getTokenMap());
     }
@@ -124,31 +116,83 @@ public class BertTokenizerTests extends ESTestCase {
             new BertTokenization(null, false, null)
         ).build();
 
-        TokenizationResult tr = tokenizer.tokenize(List.of("Elasticsearch",
-            "my little red car",
-            "Godzilla day",
-            "Godzilla Pancake red car day"
-            ));
+        TokenizationResult tr = tokenizer.buildTokenizationResult(
+            List.of(
+                tokenizer.tokenize("Elasticsearch"),
+                tokenizer.tokenize("my little red car"),
+                tokenizer.tokenize("Godzilla day"),
+                tokenizer.tokenize("Godzilla Pancake red car day")
+            )
+        );
         assertThat(tr.getTokenizations(), hasSize(4));
 
         TokenizationResult.Tokenization tokenization = tr.getTokenizations().get(0);
-        assertThat(tokenization.getTokens(), contains("Elastic", "##search"));
+        assertThat(tokenization.getTokens(), arrayContaining("Elastic", "##search"));
         assertArrayEquals(new int[] {0, 1}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0}, tokenization.getTokenMap());
 
         tokenization = tr.getTokenizations().get(1);
-        assertThat(tokenization.getTokens(), contains("my", "little", "red", "car"));
+        assertThat(tokenization.getTokens(), arrayContaining("my", "little", "red", "car"));
         assertArrayEquals(new int[] {5, 6, 7, 8}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 1, 2, 3}, tokenization.getTokenMap());
 
         tokenization = tr.getTokenizations().get(2);
-        assertThat(tokenization.getTokens(), contains("God", "##zilla", "day"));
+        assertThat(tokenization.getTokens(), arrayContaining("God", "##zilla", "day"));
         assertArrayEquals(new int[] {9, 10, 4}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0, 1}, tokenization.getTokenMap());
 
         tokenization = tr.getTokenizations().get(3);
-        assertThat(tokenization.getTokens(), contains("God", "##zilla", "Pancake", "red", "car", "day"));
+        assertThat(tokenization.getTokens(), arrayContaining("God", "##zilla", "Pancake", "red", "car", "day"));
         assertArrayEquals(new int[] {9, 10, 3, 7, 8, 4}, tokenization.getTokenIds());
         assertArrayEquals(new int[] {0, 0, 1, 2, 3, 4}, tokenization.getTokenMap());
     }
+
+    public void testMultiSeqTokenization() {
+        List<String> vocab = List.of(
+            "Elastic",
+            "##search",
+            "is",
+            "fun",
+            "my",
+            "little",
+            "red",
+            "car",
+            "God",
+            "##zilla",
+            BertTokenizer.CLASS_TOKEN,
+            BertTokenizer.SEPARATOR_TOKEN
+        );
+        BertTokenizer tokenizer = BertTokenizer.builder(vocab, Tokenization.createDefault())
+            .setDoLowerCase(false)
+            .setWithSpecialTokens(true)
+            .build();
+        TokenizationResult.Tokenization tokenization = tokenizer.tokenize("Elasticsearch is fun", "Godzilla my little red car");
+        assertThat(
+            tokenization.getTokens(),
+            arrayContaining(
+                BertTokenizer.CLASS_TOKEN,
+                "Elastic",
+                "##search",
+                "is",
+                "fun",
+                BertTokenizer.SEPARATOR_TOKEN,
+                "God",
+                "##zilla",
+                "my",
+                "little",
+                "red",
+                "car",
+                BertTokenizer.SEPARATOR_TOKEN
+            )
+        );
+        assertArrayEquals(new int[] { 10, 0, 1, 2, 3, 11, 8, 9, 4, 5, 6, 7, 11 }, tokenization.getTokenIds());
+    }
+
+    public void testMultiSeqRequiresSpecialTokens() {
+        BertTokenizer tokenizer = BertTokenizer.builder(List.of("foo"), Tokenization.createDefault())
+            .setDoLowerCase(false)
+            .setWithSpecialTokens(false)
+            .build();
+        expectThrows(Exception.class, () -> tokenizer.tokenize("foo", "foo"));
+    }
 }