From 2a5afca1ba42548dbe4d84b61a31946b3fe586b2 Mon Sep 17 00:00:00 2001 From: YeonghyeonKo <46114393+YeonghyeonKO@users.noreply.github.com> Date: Tue, 24 Sep 2024 00:53:38 +0900 Subject: [PATCH 01/28] fix typos of docs/plugins (#113348) --- docs/plugins/analysis-icu.asciidoc | 4 +- docs/plugins/analysis-kuromoji.asciidoc | 4 +- docs/plugins/analysis-nori.asciidoc | 2 +- .../creating-stable-plugins.asciidoc | 50 +++++++++---------- docs/plugins/discovery-azure-classic.asciidoc | 2 +- docs/plugins/discovery-gce.asciidoc | 2 +- docs/plugins/integrations.asciidoc | 4 +- docs/plugins/mapper-annotated-text.asciidoc | 2 +- docs/plugins/store-smb.asciidoc | 4 +- 9 files changed, 37 insertions(+), 37 deletions(-) diff --git a/docs/plugins/analysis-icu.asciidoc b/docs/plugins/analysis-icu.asciidoc index f6ca6ceae7ea4..da7efd2843f50 100644 --- a/docs/plugins/analysis-icu.asciidoc +++ b/docs/plugins/analysis-icu.asciidoc @@ -380,7 +380,7 @@ GET /my-index-000001/_search <3> -------------------------- -<1> The `name` field uses the `standard` analyzer, and so support full text queries. +<1> The `name` field uses the `standard` analyzer, and so supports full text queries. <2> The `name.sort` field is an `icu_collation_keyword` field that will preserve the name as a single token doc values, and applies the German ``phonebook'' order. <3> An example query which searches the `name` field and sorts on the `name.sort` field. @@ -467,7 +467,7 @@ differences. `case_first`:: Possible values: `lower` or `upper`. Useful to control which case is sorted -first when case is not ignored for strength `tertiary`. The default depends on +first when the case is not ignored for strength `tertiary`. The default depends on the collation. `numeric`:: diff --git a/docs/plugins/analysis-kuromoji.asciidoc b/docs/plugins/analysis-kuromoji.asciidoc index e8380ce0aca17..0a167bf3f0240 100644 --- a/docs/plugins/analysis-kuromoji.asciidoc +++ b/docs/plugins/analysis-kuromoji.asciidoc @@ -86,7 +86,7 @@ The `kuromoji_iteration_mark` normalizes Japanese horizontal iteration marks `normalize_kanji`:: - Indicates whether kanji iteration marks should be normalize. Defaults to `true`. + Indicates whether kanji iteration marks should be normalized. Defaults to `true`. `normalize_kana`:: @@ -194,7 +194,7 @@ PUT kuromoji_sample + -- Additional expert user parameters `nbest_cost` and `nbest_examples` can be used -to include additional tokens that most likely according to the statistical model. +to include additional tokens that are most likely according to the statistical model. If both parameters are used, the largest number of both is applied. `nbest_cost`:: diff --git a/docs/plugins/analysis-nori.asciidoc b/docs/plugins/analysis-nori.asciidoc index e7855f94758e1..02980a4ed8a8c 100644 --- a/docs/plugins/analysis-nori.asciidoc +++ b/docs/plugins/analysis-nori.asciidoc @@ -452,7 +452,7 @@ Which responds with: The `nori_number` token filter normalizes Korean numbers to regular Arabic decimal numbers in half-width characters. -Korean numbers are often written using a combination of Hangul and Arabic numbers with various kinds punctuation. +Korean numbers are often written using a combination of Hangul and Arabic numbers with various kinds of punctuation. For example, 3.2천 means 3200. This filter does this kind of normalization and allows a search for 3200 to match 3.2천 in text, but can also be used to make range facets based on the normalized numbers and so on. 
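As a rough sketch of the setup the `nori_number` paragraph above describes (the index, analyzer, and tokenizer names here are illustrative and not part of the patch), the filter needs to see the decimal point, so `discard_punctuation` is disabled on the tokenizer:

[source,console]
--------------------------------------------------
PUT nori_number_sample
{
  "settings": {
    "analysis": {
      "analyzer": {
        "my_analyzer": {
          "tokenizer": "punctuation_preserving_tokenizer",
          "filter": [ "nori_number" ]
        }
      },
      "tokenizer": {
        "punctuation_preserving_tokenizer": {
          "type": "nori_tokenizer",
          "discard_punctuation": "false"
        }
      }
    }
  }
}

GET nori_number_sample/_analyze
{
  "analyzer": "my_analyzer",
  "text": "3.2천"
}
--------------------------------------------------

Analyzing `3.2천` with this analyzer should produce the single token `3200`, which is the normalization the paragraph describes.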
diff --git a/docs/plugins/development/creating-stable-plugins.asciidoc b/docs/plugins/development/creating-stable-plugins.asciidoc index c9a8a1f6c7e2a..9f98774b5a761 100644 --- a/docs/plugins/development/creating-stable-plugins.asciidoc +++ b/docs/plugins/development/creating-stable-plugins.asciidoc @@ -1,8 +1,8 @@ [[creating-stable-plugins]] === Creating text analysis plugins with the stable plugin API -Text analysis plugins provide {es} with custom {ref}/analysis.html[Lucene -analyzers, token filters, character filters, and tokenizers]. +Text analysis plugins provide {es} with custom {ref}/analysis.html[Lucene +analyzers, token filters, character filters, and tokenizers]. [discrete] ==== The stable plugin API @@ -10,7 +10,7 @@ analyzers, token filters, character filters, and tokenizers]. Text analysis plugins can be developed against the stable plugin API. This API consists of the following dependencies: -* `plugin-api` - an API used by plugin developers to implement custom {es} +* `plugin-api` - an API used by plugin developers to implement custom {es} plugins. * `plugin-analysis-api` - an API used by plugin developers to implement analysis plugins and integrate them into {es}. @@ -18,7 +18,7 @@ plugins and integrate them into {es}. core Lucene analysis interfaces like `Tokenizer`, `Analyzer`, and `TokenStream`. For new versions of {es} within the same major version, plugins built against -this API do not need to be recompiled. Future versions of the API will be +this API does not need to be recompiled. Future versions of the API will be backwards compatible and plugins are binary compatible with future versions of {es}. In other words, once you have a working artifact, you can re-use it when you upgrade {es} to a new bugfix or minor version. @@ -48,9 +48,9 @@ require code changes. Stable plugins are ZIP files composed of JAR files and two metadata files: -* `stable-plugin-descriptor.properties` - a Java properties file that describes +* `stable-plugin-descriptor.properties` - a Java properties file that describes the plugin. Refer to <>. -* `named_components.json` - a JSON file mapping interfaces to key-value pairs +* `named_components.json` - a JSON file mapping interfaces to key-value pairs of component names and implementation classes. Note that only JAR files at the root of the plugin are added to the classpath @@ -65,7 +65,7 @@ you use this plugin. However, you don't need Gradle to create plugins. The {es} Github repository contains {es-repo}tree/main/plugins/examples/stable-analysis[an example analysis plugin]. -The example `build.gradle` build script provides a good starting point for +The example `build.gradle` build script provides a good starting point for developing your own plugin. [discrete] @@ -77,29 +77,29 @@ Plugins are written in Java, so you need to install a Java Development Kit [discrete] ===== Step by step -. Create a directory for your project. +. Create a directory for your project. . Copy the example `build.gradle` build script to your project directory. Note that this build script uses the `elasticsearch.stable-esplugin` gradle plugin to build your plugin. . Edit the `build.gradle` build script: -** Add a definition for the `pluginApiVersion` and matching `luceneVersion` -variables to the top of the file. You can find these versions in the -`build-tools-internal/version.properties` file in the {es-repo}[Elasticsearch +** Add a definition for the `pluginApiVersion` and matching `luceneVersion` +variables to the top of the file. 
You can find these versions in the +`build-tools-internal/version.properties` file in the {es-repo}[Elasticsearch Github repository]. -** Edit the `name` and `description` in the `esplugin` section of the build -script. This will create the plugin descriptor file. If you're not using the -`elasticsearch.stable-esplugin` gradle plugin, refer to +** Edit the `name` and `description` in the `esplugin` section of the build +script. This will create the plugin descriptor file. If you're not using the +`elasticsearch.stable-esplugin` gradle plugin, refer to <> to create the file manually. ** Add module information. -** Ensure you have declared the following compile-time dependencies. These -dependencies are compile-time only because {es} will provide these libraries at +** Ensure you have declared the following compile-time dependencies. These +dependencies are compile-time only because {es} will provide these libraries at runtime. *** `org.elasticsearch.plugin:elasticsearch-plugin-api` *** `org.elasticsearch.plugin:elasticsearch-plugin-analysis-api` *** `org.apache.lucene:lucene-analysis-common` -** For unit testing, ensure these dependencies have also been added to the +** For unit testing, ensure these dependencies have also been added to the `build.gradle` script as `testImplementation` dependencies. -. Implement an interface from the analysis plugin API, annotating it with +. Implement an interface from the analysis plugin API, annotating it with `NamedComponent`. Refer to <> for an example. . You should now be able to assemble a plugin ZIP file by running: + @@ -107,22 +107,22 @@ runtime. ---- gradle bundlePlugin ---- -The resulting plugin ZIP file is written to the `build/distributions` +The resulting plugin ZIP file is written to the `build/distributions` directory. [discrete] ===== YAML REST tests -The Gradle `elasticsearch.yaml-rest-test` plugin enables testing of your -plugin using the {es-repo}blob/main/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/README.asciidoc[{es} yamlRestTest framework]. +The Gradle `elasticsearch.yaml-rest-test` plugin enables testing of your +plugin using the {es-repo}blob/main/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/README.asciidoc[{es} yamlRestTest framework]. These tests use a YAML-formatted domain language to issue REST requests against -an internal {es} cluster that has your plugin installed, and to check the -results of those requests. The structure of a YAML REST test directory is as +an internal {es} cluster that has your plugin installed, and to check the +results of those requests. The structure of a YAML REST test directory is as follows: -* A test suite class, defined under `src/yamlRestTest/java`. This class should +* A test suite class, defined under `src/yamlRestTest/java`. This class should extend `ESClientYamlSuiteTestCase`. -* The YAML tests themselves should be defined under +* The YAML tests themselves should be defined under `src/yamlRestTest/resources/test/`. [[plugin-descriptor-file-stable]] diff --git a/docs/plugins/discovery-azure-classic.asciidoc b/docs/plugins/discovery-azure-classic.asciidoc index aa710a2fe7ef9..b8d37f024172c 100644 --- a/docs/plugins/discovery-azure-classic.asciidoc +++ b/docs/plugins/discovery-azure-classic.asciidoc @@ -148,7 +148,7 @@ Before starting, you need to have: -- You should follow http://azure.microsoft.com/en-us/documentation/articles/linux-use-ssh-key/[this guide] to learn -how to create or use existing SSH keys. If you have already did it, you can skip the following. 
+how to create or use existing SSH keys. If you have already done it, you can skip the following. Here is a description on how to generate SSH keys using `openssl`: diff --git a/docs/plugins/discovery-gce.asciidoc b/docs/plugins/discovery-gce.asciidoc index 2e8cff21208e0..0a2629b7f094b 100644 --- a/docs/plugins/discovery-gce.asciidoc +++ b/docs/plugins/discovery-gce.asciidoc @@ -478,7 +478,7 @@ discovery: seed_providers: gce -------------------------------------------------- -Replaces `project_id` and `zone` with your settings. +Replace `project_id` and `zone` with your settings. To run test: diff --git a/docs/plugins/integrations.asciidoc b/docs/plugins/integrations.asciidoc index 71f237692ad35..aff4aed0becd2 100644 --- a/docs/plugins/integrations.asciidoc +++ b/docs/plugins/integrations.asciidoc @@ -91,7 +91,7 @@ Integrations are not plugins, but are external tools or modules that make it eas Elasticsearch Grails plugin. * https://hibernate.org/search/[Hibernate Search] - Integration with Hibernate ORM, from the Hibernate team. Automatic synchronization of write operations, yet exposes full Elasticsearch capabilities for queries. Can return either Elasticsearch native or re-map queries back into managed entities loaded within transaction from the reference database. + Integration with Hibernate ORM, from the Hibernate team. Automatic synchronization of write operations, yet exposes full Elasticsearch capabilities for queries. Can return either Elasticsearch native or re-map queries back into managed entities loaded within transactions from the reference database. * https://github.com/spring-projects/spring-data-elasticsearch[Spring Data Elasticsearch]: Spring Data implementation for Elasticsearch @@ -104,7 +104,7 @@ Integrations are not plugins, but are external tools or modules that make it eas * https://pulsar.apache.org/docs/en/io-elasticsearch[Apache Pulsar]: The Elasticsearch Sink Connector is used to pull messages from Pulsar topics - and persist the messages to a index. + and persist the messages to an index. * https://micronaut-projects.github.io/micronaut-elasticsearch/latest/guide/index.html[Micronaut Elasticsearch Integration]: Integration of Micronaut with Elasticsearch diff --git a/docs/plugins/mapper-annotated-text.asciidoc b/docs/plugins/mapper-annotated-text.asciidoc index afe8ba41da9b8..e4141e98a2285 100644 --- a/docs/plugins/mapper-annotated-text.asciidoc +++ b/docs/plugins/mapper-annotated-text.asciidoc @@ -143,7 +143,7 @@ broader positional queries e.g. finding mentions of a `Guitarist` near to `strat WARNING: Any use of `=` signs in annotation values eg `[Prince](person=Prince)` will cause the document to be rejected with a parse failure. In future we hope to have a use for -the equals signs so wil actively reject documents that contain this today. +the equals signs so will actively reject documents that contain this today. [[annotated-text-synthetic-source]] ===== Synthetic `_source` diff --git a/docs/plugins/store-smb.asciidoc b/docs/plugins/store-smb.asciidoc index 8557ef868010f..da803b4f42022 100644 --- a/docs/plugins/store-smb.asciidoc +++ b/docs/plugins/store-smb.asciidoc @@ -10,7 +10,7 @@ include::install_remove.asciidoc[] ==== Working around a bug in Windows SMB and Java on windows When using a shared file system based on the SMB protocol (like Azure File Service) to store indices, the way Lucene -open index segment files is with a write only flag. 
This is the _correct_ way to open the files, as they will only be +opens index segment files is with a write only flag. This is the _correct_ way to open the files, as they will only be used for writes and allows different FS implementations to optimize for it. Sadly, in windows with SMB, this disables the cache manager, causing writes to be slow. This has been described in https://issues.apache.org/jira/browse/LUCENE-6176[LUCENE-6176], but it affects each and every Java program out there!. @@ -44,7 +44,7 @@ This can be configured for all indices by adding this to the `elasticsearch.yml` index.store.type: smb_nio_fs ---- -Note that setting will be applied for newly created indices. +Note that settings will be applied for newly created indices. It can also be set on a per-index basis at index creation time: From cc37be136a3c0a4b4e74ea2c13b12bdd67a7117d Mon Sep 17 00:00:00 2001 From: David Turner Date: Mon, 23 Sep 2024 17:01:48 +0100 Subject: [PATCH 02/28] Make `UpdateSettingsClusterStateUpdateRequest` a record (#113353) No need to extend `IndicesClusterStateUpdateRequest`, this thing can be completely immutable. --- .../MetadataUpdateSettingsServiceIT.java | 133 ++++++++++-------- .../put/TransportUpdateSettingsAction.java | 31 ++-- ...dateSettingsClusterStateUpdateRequest.java | 86 +++++------ .../MetadataUpdateSettingsService.java | 4 +- .../upgrades/SystemIndexMigrator.java | 16 ++- ...TransportUpdateSecuritySettingsAction.java | 16 ++- .../TransportUpdateWatcherSettingsAction.java | 12 +- 7 files changed, 166 insertions(+), 132 deletions(-) diff --git a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java index b3b7957801cd7..c1e68040e075b 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java @@ -28,6 +28,7 @@ import java.util.List; import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicReference; +import java.util.function.Function; import static org.hamcrest.Matchers.equalTo; @@ -42,45 +43,58 @@ public void testThatNonDynamicSettingChangesTakeEffect() throws Exception { MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance( MetadataUpdateSettingsService.class ); - UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO); - List indices = new ArrayList<>(); + List indicesList = new ArrayList<>(); for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) { for (IndexService indexService : indicesService) { - indices.add(indexService.index()); + indicesList.add(indexService.index()); } } - request.indices(indices.toArray(Index.EMPTY_ARRAY)); - request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build()); + final var indices = indicesList.toArray(Index.EMPTY_ARRAY); + + final Function requestFactory = + onStaticSetting -> new UpdateSettingsClusterStateUpdateRequest( + TEST_REQUEST_TIMEOUT, + TimeValue.ZERO, + Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build(), + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + onStaticSetting, + indices + ); // First make 
sure it fails if reopenShards is not set on the request: AtomicBoolean expectedFailureOccurred = new AtomicBoolean(false); - metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - fail("Should have failed updating a non-dynamic setting without reopenShards set to true"); - } + metadataUpdateSettingsService.updateSettings( + requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + fail("Should have failed updating a non-dynamic setting without reopenShards set to true"); + } - @Override - public void onFailure(Exception e) { - expectedFailureOccurred.set(true); + @Override + public void onFailure(Exception e) { + expectedFailureOccurred.set(true); + } } - }); + ); assertBusy(() -> assertThat(expectedFailureOccurred.get(), equalTo(true))); // Now we set reopenShards and expect it to work: - request.reopenShards(true); AtomicBoolean success = new AtomicBoolean(false); - metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings( + requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); + @Override + public void onFailure(Exception e) { + fail(e); + } } - }); + ); assertBusy(() -> assertThat(success.get(), equalTo(true))); // Now we look into the IndexShard objects to make sure that the code was actually updated (vs just the setting): @@ -110,16 +124,23 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens() th MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance( MetadataUpdateSettingsService.class ); - UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO); - List indices = new ArrayList<>(); + List indicesList = new ArrayList<>(); for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) { for (IndexService indexService : indicesService) { - indices.add(indexService.index()); + indicesList.add(indexService.index()); } } - request.indices(indices.toArray(Index.EMPTY_ARRAY)); - request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build()); - request.reopenShards(true); + final var indices = indicesList.toArray(Index.EMPTY_ARRAY); + + final Function requestFactory = + settings -> new UpdateSettingsClusterStateUpdateRequest( + TEST_REQUEST_TIMEOUT, + TimeValue.ZERO, + settings.build(), + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES, + indices + ); ClusterService clusterService = internalCluster().getInstance(ClusterService.class); AtomicBoolean shardsUnassigned = new AtomicBoolean(false); @@ -142,47 +163,49 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens() th AtomicBoolean success = new AtomicBoolean(false); // Make the first request, just to set things up: - 
metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings( + requestFactory.apply(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData")), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); + @Override + public void onFailure(Exception e) { + fail(e); + } } - }); + ); assertBusy(() -> assertThat(success.get(), equalTo(true))); assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true))); assertThat(shardsUnassigned.get(), equalTo(true)); assertBusy(() -> assertThat(hasUnassignedShards(clusterService.state(), indexName), equalTo(false))); - // Same request, except now we'll also set the dynamic "index.max_result_window" setting: - request.settings( - Settings.builder() - .put("index.codec", "FastDecompressionCompressingStoredFieldsData") - .put("index.max_result_window", "1500") - .build() - ); success.set(false); expectedSettingsChangeInClusterState.set(false); shardsUnassigned.set(false); expectedSetting.set("index.max_result_window"); expectedSettingValue.set("1500"); // Making this request ought to add this new setting but not unassign the shards: - metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings( + // Same request, except now we'll also set the dynamic "index.max_result_window" setting: + requestFactory.apply( + Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").put("index.max_result_window", "1500") + ), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); + @Override + public void onFailure(Exception e) { + fail(e); + } } - }); + ); assertBusy(() -> assertThat(success.get(), equalTo(true))); assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true))); diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java index 1d7c264065d6f..1e7f32641b86f 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java @@ -124,19 +124,24 @@ protected void masterOperation( return; } - UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices( - concreteIndices - ) - .settings(requestSettings) - .setPreserveExisting(request.isPreserveExisting()) - .reopenShards(request.reopen()) - .ackTimeout(request.ackTimeout()) - .masterNodeTimeout(request.masterNodeTimeout()); - - updateSettingsService.updateSettings(clusterStateUpdateRequest, listener.delegateResponse((l, e) -> { - logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e); - l.onFailure(e); - })); + updateSettingsService.updateSettings( + new 
UpdateSettingsClusterStateUpdateRequest( + request.masterNodeTimeout(), + request.ackTimeout(), + requestSettings, + request.isPreserveExisting() + ? UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE + : UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + request.reopen() + ? UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES + : UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + concreteIndices + ), + listener.delegateResponse((l, e) -> { + logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e); + l.onFailure(e); + }) + ); } /** diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java index 42a904c704bf3..fe8573da5fb68 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java @@ -9,70 +9,60 @@ package org.elasticsearch.action.admin.indices.settings.put; -import org.elasticsearch.cluster.ack.IndicesClusterStateUpdateRequest; import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.index.Index; -import java.util.Arrays; +import java.util.Objects; /** * Cluster state update request that allows to update settings for some indices */ -public class UpdateSettingsClusterStateUpdateRequest extends IndicesClusterStateUpdateRequest { - - private Settings settings; - - private boolean preserveExisting = false; - - private boolean reopenShards = false; - - /** - * Returns true iff the settings update should only add but not update settings. If the setting already exists - * it should not be overwritten by this update. The default is false - */ - public boolean isPreserveExisting() { - return preserveExisting; - } +public record UpdateSettingsClusterStateUpdateRequest( + TimeValue masterNodeTimeout, + TimeValue ackTimeout, + Settings settings, + OnExisting onExisting, + OnStaticSetting onStaticSetting, + Index... indices +) { /** - * Returns true if non-dynamic setting updates should go through, by automatically unassigning shards in the same cluster - * state change as the setting update. The shards will be automatically reassigned after the cluster state update is made. The - * default is false. + * Specifies the behaviour of an update-settings action on existing settings. */ - public boolean reopenShards() { - return reopenShards; - } + public enum OnExisting { + /** + * Update all the specified settings, overwriting any settings which already exist. This is the API default. + */ + OVERWRITE, - public UpdateSettingsClusterStateUpdateRequest reopenShards(boolean reopenShards) { - this.reopenShards = reopenShards; - return this; + /** + * Only add new settings, preserving the values of any settings which are already set and ignoring the new values specified in the + * request. + */ + PRESERVE } /** - * Iff set to true this settings update will only add settings not already set on an index. Existing settings remain - * unchanged. + * Specifies the behaviour of an update-settings action which is trying to adjust a non-dynamic setting. 
*/ - public UpdateSettingsClusterStateUpdateRequest setPreserveExisting(boolean preserveExisting) { - this.preserveExisting = preserveExisting; - return this; - } + public enum OnStaticSetting { + /** + * Reject attempts to update non-dynamic settings on open indices. This is the API default. + */ + REJECT, - /** - * Returns the {@link Settings} to update - */ - public Settings settings() { - return settings; - } - - /** - * Sets the {@link Settings} to update - */ - public UpdateSettingsClusterStateUpdateRequest settings(Settings settings) { - this.settings = settings; - return this; + /** + * Automatically close and reopen the shards of any open indices when updating a non-dynamic setting, forcing the shard to + * reinitialize from scratch. + */ + REOPEN_INDICES } - @Override - public String toString() { - return Arrays.toString(indices()) + settings; + public UpdateSettingsClusterStateUpdateRequest { + Objects.requireNonNull(masterNodeTimeout); + Objects.requireNonNull(ackTimeout); + Objects.requireNonNull(settings); + Objects.requireNonNull(indices); } } diff --git a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java index cee3b4c0bdac1..4fcbd4165423b 100644 --- a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java +++ b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java @@ -176,7 +176,7 @@ ClusterState execute(ClusterState currentState) { } final Settings closedSettings = settingsForClosedIndices.build(); final Settings openSettings = settingsForOpenIndices.build(); - final boolean preserveExisting = request.isPreserveExisting(); + final boolean preserveExisting = request.onExisting() == UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE; RoutingTable.Builder routingTableBuilder = null; Metadata.Builder metadataBuilder = Metadata.builder(currentState.metadata()); @@ -199,7 +199,7 @@ ClusterState execute(ClusterState currentState) { } if (skippedSettings.isEmpty() == false && openIndices.isEmpty() == false) { - if (request.reopenShards()) { + if (request.onStaticSetting() == UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES) { // We have non-dynamic settings and open indices. We will unassign all of the shards in these indices so that the new // changed settings are applied when the shards are re-assigned. 
routingTableBuilder = RoutingTable.builder( diff --git a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java index 94b856f7a22fb..a131f63cb75f3 100644 --- a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java +++ b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java @@ -19,6 +19,7 @@ import org.elasticsearch.action.admin.indices.settings.put.UpdateSettingsClusterStateUpdateRequest; import org.elasticsearch.action.support.ActiveShardCount; import org.elasticsearch.action.support.master.AcknowledgedResponse; +import org.elasticsearch.action.support.master.MasterNodeRequest; import org.elasticsearch.action.support.master.ShardsAcknowledgedResponse; import org.elasticsearch.client.internal.Client; import org.elasticsearch.client.internal.ParentTaskAssigningClient; @@ -537,11 +538,18 @@ private CheckedBiConsumer, AcknowledgedResp */ private void setWriteBlock(Index index, boolean readOnlyValue, ActionListener listener) { final Settings readOnlySettings = Settings.builder().put(IndexMetadata.INDEX_BLOCKS_WRITE_SETTING.getKey(), readOnlyValue).build(); - UpdateSettingsClusterStateUpdateRequest updateSettingsRequest = new UpdateSettingsClusterStateUpdateRequest().indices( - new Index[] { index } - ).settings(readOnlySettings).setPreserveExisting(false).ackTimeout(TimeValue.ZERO); - metadataUpdateSettingsService.updateSettings(updateSettingsRequest, listener); + metadataUpdateSettingsService.updateSettings( + new UpdateSettingsClusterStateUpdateRequest( + MasterNodeRequest.INFINITE_MASTER_NODE_TIMEOUT, + TimeValue.ZERO, + readOnlySettings, + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + index + ), + listener + ); } private void reindex(SystemIndexMigrationInfo migrationInfo, ActionListener listener) { diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java index 49f8846c36e1f..b924fe0d983bb 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java @@ -119,8 +119,8 @@ protected void masterOperation( private Optional createUpdateSettingsRequest( String indexName, Settings settingsToUpdate, - TimeValue timeout, - TimeValue masterTimeout, + TimeValue ackTimeout, + TimeValue masterNodeTimeout, ClusterState state ) { if (settingsToUpdate.isEmpty()) { @@ -136,10 +136,14 @@ private Optional createUpdateSettingsRe } return Optional.of( - new UpdateSettingsClusterStateUpdateRequest().indices(new Index[] { writeIndex }) - .settings(settingsToUpdate) - .ackTimeout(timeout) - .masterNodeTimeout(masterTimeout) + new UpdateSettingsClusterStateUpdateRequest( + masterNodeTimeout, + ackTimeout, + settingsToUpdate, + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + writeIndex + ) ); } diff --git a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java 
b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java index 378ee642cf105..0407c2db63ac6 100644 --- a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java +++ b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java @@ -24,7 +24,6 @@ import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.concurrent.EsExecutors; -import org.elasticsearch.index.Index; import org.elasticsearch.injection.guice.Inject; import org.elasticsearch.logging.LogManager; import org.elasticsearch.logging.Logger; @@ -91,9 +90,14 @@ protected void masterOperation( return; } final Settings newSettings = Settings.builder().loadFromMap(request.settings()).build(); - final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices( - new Index[] { watcherIndexMd.getIndex() } - ).settings(newSettings).ackTimeout(request.ackTimeout()).masterNodeTimeout(request.masterNodeTimeout()); + final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest( + request.masterNodeTimeout(), + request.ackTimeout(), + newSettings, + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + watcherIndexMd.getIndex() + ); updateSettingsService.updateSettings(clusterStateUpdateRequest, new ActionListener<>() { @Override From 208a1fe5714c0e49549de7aaed7a9a847e7b4a15 Mon Sep 17 00:00:00 2001 From: Salvatore Campagna <93581129+salvatore-campagna@users.noreply.github.com> Date: Mon, 23 Sep 2024 18:05:02 +0200 Subject: [PATCH 03/28] Introduce an `ignore_above` index-level setting (#113121) Here we introduce a new index-level setting, `ignore_above`, similar to what we have for `ignore_malformed`. The setting will apply to all `keyword`, `wildcard` and `flattened` fields. Each field mapping will still be allowed to override the index-level setting using a mapping-level `ignore_above` value. 
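As a hedged sketch of what this commit gives users (index and field names are illustrative), the index-level setting checks each element of an array individually, so only over-long elements are skipped while `_source` keeps everything:

[source,console]
--------------------------------------------------
PUT my-index-000003
{
  "settings": {
    "index.mapping.ignore_above": 10
  },
  "mappings": {
    "properties": {
      "tags": { "type": "keyword" }
    }
  }
}

PUT my-index-000003/_doc/1
{
  "tags": [ "short", "a value that is far too long" ]
}
--------------------------------------------------

Only `short` is indexed; the longer element is ignored during indexing, but both elements remain retrievable from `_source`.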
--- .../mapping/params/ignore-above.asciidoc | 30 +++ .../search/530_ignore_above_stored_source.yml | 214 ++++++++++++++++++ .../540_ignore_above_synthetic_source.yml | 179 +++++++++++++++ .../test/search/550_ignore_above_invalid.yml | 63 ++++++ .../common/settings/IndexScopedSettings.java | 1 + .../elasticsearch/index/IndexSettings.java | 26 +++ .../index/mapper/KeywordFieldMapper.java | 53 +++-- .../index/mapper/MapperFeatures.java | 2 + .../flattened/FlattenedFieldMapper.java | 49 ++-- .../index/mapper/KeywordFieldTypeTests.java | 1 + .../index/mapper/MultiFieldsTests.java | 1 + .../20_ignore_above_stored_source.yml | 56 +++++ .../30_ignore_above_synthetic_source.yml | 58 +++++ .../wildcard/mapper/WildcardFieldMapper.java | 68 +++--- .../test/CoreTestTranslater.java | 24 +- 15 files changed, 762 insertions(+), 63 deletions(-) create mode 100644 rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/530_ignore_above_stored_source.yml create mode 100644 rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/540_ignore_above_synthetic_source.yml create mode 100644 rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/550_ignore_above_invalid.yml create mode 100644 x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/20_ignore_above_stored_source.yml create mode 100644 x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/30_ignore_above_synthetic_source.yml diff --git a/docs/reference/mapping/params/ignore-above.asciidoc b/docs/reference/mapping/params/ignore-above.asciidoc index 7d04bc82dcbb3..526f2d6205961 100644 --- a/docs/reference/mapping/params/ignore-above.asciidoc +++ b/docs/reference/mapping/params/ignore-above.asciidoc @@ -57,3 +57,33 @@ NOTE: The value for `ignore_above` is the _character count_, but Lucene counts bytes. If you use UTF-8 text with many non-ASCII characters, you may want to set the limit to `32766 / 4 = 8191` since UTF-8 characters may occupy at most 4 bytes. + +[[index-mapping-ignore-above]] +=== `index.mapping.ignore_above` + +The `ignore_above` setting, typically used at the field level, can also be applied at the index level using +`index.mapping.ignore_above`. This setting lets you define a maximum string length for all applicable fields across +the index, including `keyword`, `wildcard`, and keyword values in `flattened` fields. Any values that exceed this +limit will be ignored during indexing and won’t be stored. + +This index-wide setting ensures a consistent approach to managing excessively long values. It works the same as the +field-level setting—if a string’s length goes over the specified limit, that string won’t be indexed or stored. +When dealing with arrays, each element is evaluated separately, and only the elements that exceed the limit are ignored. + +[source,console] +-------------------------------------------------- +PUT my-index-000001 +{ + "settings": { + "index.mapping.ignore_above": 256 + } +} +-------------------------------------------------- + +In this example, all applicable fields in `my-index-000001` will ignore any strings longer than 256 characters. + +TIP: You can override this index-wide setting for specific fields by specifying a custom `ignore_above` value in the +field mapping. + +NOTE: Just like the field-level `ignore_above`, this setting only affects indexing and storage. The original values +are still available in the `_source` field if `_source` is enabled, which is the default behavior in Elasticsearch. 
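The TIP above can be made concrete with a hypothetical index (names are illustrative) in which a single field opts out of the index-wide limit:

[source,console]
--------------------------------------------------
PUT my-index-000002
{
  "settings": {
    "index.mapping.ignore_above": 256
  },
  "mappings": {
    "properties": {
      "message": {
        "type": "keyword",
        "ignore_above": 1024
      }
    }
  }
}
--------------------------------------------------

Here `message` accepts values up to 1024 characters, while every other applicable field in the index keeps the 256-character limit from the index setting.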
diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/530_ignore_above_stored_source.yml b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/530_ignore_above_stored_source.yml new file mode 100644 index 0000000000000..1730a49f743d9 --- /dev/null +++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/530_ignore_above_stored_source.yml @@ -0,0 +1,214 @@ +--- +ignore_above mapping level setting: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + properties: + keyword: + type: keyword + flattened: + type: flattened + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": "foo bar", "flattened": { "value": "the quick brown fox" } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: {} + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: "foo bar" } + - match: { hits.hits.0._source.flattened.value: "the quick brown fox" } + - match: { hits.hits.0.fields.keyword.0: "foo bar" } + - match: { hits.hits.0.fields.flattened: null } + +--- +ignore_above mapping level setting on arrays: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + properties: + keyword: + type: keyword + flattened: + type: flattened + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": ["foo bar", "the quick brown fox"], "flattened": { "value": ["the quick brown fox", "jumps over"] } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: {} + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: ["foo bar", "the quick brown fox"] } + - match: { hits.hits.0._source.flattened.value: ["the quick brown fox", "jumps over"] } + - match: { hits.hits.0.fields.keyword.0: "foo bar" } + - match: { hits.hits.0.fields.flattened.0.value: "jumps over" } + +--- +ignore_above mapping overrides setting: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + properties: + keyword: + type: keyword + ignore_above: 100 + flattened: + type: flattened + ignore_above: 100 + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": "foo bar baz foo bar baz", "flattened": { "value": "the quick brown fox" } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: { } + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: "foo bar baz foo bar baz" } + - match: { hits.hits.0._source.flattened.value: "the quick brown fox" } + - match: { hits.hits.0.fields.keyword.0: "foo bar baz foo bar baz" } + - match: { hits.hits.0.fields.flattened.0.value: "the quick brown fox" } + +--- +ignore_above mapping overrides setting on arrays: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + properties: + keyword: + type: keyword + 
ignore_above: 100 + flattened: + type: flattened + ignore_above: 100 + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": ["foo bar baz foo bar baz", "the quick brown fox jumps over"], "flattened": { "value": ["the quick brown fox", "jumps over the lazy dog"] } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: { } + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: ["foo bar baz foo bar baz", "the quick brown fox jumps over"] } + - match: { hits.hits.0._source.flattened.value: ["the quick brown fox", "jumps over the lazy dog"] } + - match: { hits.hits.0.fields.keyword: ["foo bar baz foo bar baz", "the quick brown fox jumps over"] } + - match: { hits.hits.0.fields.flattened.0.value: ["the quick brown fox", "jumps over the lazy dog"] } + +--- +date ignore_above index level setting: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + properties: + keyword: + type: keyword + date: + type: date + format: "yyyy-MM-dd'T'HH:mm:ss" + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": ["2023-09-17T15:30:00", "2023-09-17T15:31:00"], "date": ["2023-09-17T15:30:00", "2023-09-17T15:31:00"] } + + - do: + search: + body: + fields: + - keyword + - date + query: + match_all: {} + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: ["2023-09-17T15:30:00", "2023-09-17T15:31:00"] } + - match: { hits.hits.0._source.date: ["2023-09-17T15:30:00", "2023-09-17T15:31:00"] } + - match: { hits.hits.0.fields.keyword: null } + - match: { hits.hits.0.fields.date: ["2023-09-17T15:30:00","2023-09-17T15:31:00"] } diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/540_ignore_above_synthetic_source.yml b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/540_ignore_above_synthetic_source.yml new file mode 100644 index 0000000000000..defdc8467bf8d --- /dev/null +++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/540_ignore_above_synthetic_source.yml @@ -0,0 +1,179 @@ +--- +ignore_above mapping level setting: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + _source: + mode: synthetic + properties: + keyword: + type: keyword + flattened: + type: flattened + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": "foo bar", "flattened": { "value": "the quick brown fox" } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: {} + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: "foo bar" } + - match: { hits.hits.0._source.flattened.value: "the quick brown fox" } + - match: { hits.hits.0.fields.keyword.0: "foo bar" } + +--- +ignore_above mapping level setting on arrays: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + _source: + mode: synthetic + properties: + keyword: + type: keyword + flattened: + type: flattened + + - do: + index: + index: test + refresh: true + id: "1" + body: { 
"keyword": ["foo bar", "the quick brown fox"], "flattened": { "value": ["the quick brown fox", "jumps over"] } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: {} + + - length: { hits.hits: 1 } + #TODO: synthetic source field reconstruction bug (TBD: add link to the issue here) + #- match: { hits.hits.0._source.keyword: ["foo bar", "the quick brown fox"] } + - match: { hits.hits.0._source.flattened.value: ["the quick brown fox", "jumps over"] } + - match: { hits.hits.0.fields.keyword.0: "foo bar" } + - match: { hits.hits.0.fields.flattened.0.value: "jumps over" } + +--- +ignore_above mapping overrides setting: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + _source: + mode: synthetic + properties: + keyword: + type: keyword + ignore_above: 100 + flattened: + type: flattened + ignore_above: 100 + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": "foo bar baz foo bar baz", "flattened": { "value": "the quick brown fox" } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: { } + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: "foo bar baz foo bar baz" } + - match: { hits.hits.0._source.flattened.value: "the quick brown fox" } + - match: { hits.hits.0.fields.keyword.0: "foo bar baz foo bar baz" } + - match: { hits.hits.0.fields.flattened.0.value: "the quick brown fox" } + +--- +ignore_above mapping overrides setting on arrays: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + _source: + mode: synthetic + properties: + keyword: + type: keyword + ignore_above: 100 + flattened: + type: flattened + ignore_above: 100 + + - do: + index: + index: test + refresh: true + id: "1" + body: { "keyword": ["foo bar baz foo bar baz", "the quick brown fox jumps over"], "flattened": { "value": ["the quick brown fox", "jumps over the lazy dog"] } } + + - do: + search: + body: + fields: + - keyword + - flattened + query: + match_all: { } + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.keyword: ["foo bar baz foo bar baz", "the quick brown fox jumps over"] } + - match: { hits.hits.0._source.flattened.value: ["jumps over the lazy dog", "the quick brown fox"] } + - match: { hits.hits.0.fields.keyword: ["foo bar baz foo bar baz", "the quick brown fox jumps over"] } + - match: { hits.hits.0.fields.flattened.0.value: ["jumps over the lazy dog", "the quick brown fox"] } diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/550_ignore_above_invalid.yml b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/550_ignore_above_invalid.yml new file mode 100644 index 0000000000000..3c29845871fe7 --- /dev/null +++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/search/550_ignore_above_invalid.yml @@ -0,0 +1,63 @@ +--- +ignore_above index setting negative value: + - do: + catch: bad_request + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: -1 + mappings: + properties: + keyword: + type: keyword + +--- +keyword ignore_above mapping setting negative value: + - requires: + cluster_features: [ 
"mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + catch: bad_request + indices.create: + index: test + body: + mappings: + properties: + keyword: + ignore_above: -2 + type: keyword + +--- +flattened ignore_above mapping setting negative value: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + catch: bad_request + indices.create: + index: test + body: + mappings: + properties: + flattened: + ignore_above: -2 + type: flattened + +--- +wildcard ignore_above mapping setting negative value: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + catch: bad_request + indices.create: + index: test + body: + mappings: + properties: + wildcard: + ignore_above: -2 + type: wildcard diff --git a/server/src/main/java/org/elasticsearch/common/settings/IndexScopedSettings.java b/server/src/main/java/org/elasticsearch/common/settings/IndexScopedSettings.java index 69abb59689c00..ad3d7d7f1c2ec 100644 --- a/server/src/main/java/org/elasticsearch/common/settings/IndexScopedSettings.java +++ b/server/src/main/java/org/elasticsearch/common/settings/IndexScopedSettings.java @@ -151,6 +151,7 @@ public final class IndexScopedSettings extends AbstractScopedSettings { IndexSettings.INDEX_SEARCH_IDLE_AFTER, IndexSettings.INDEX_SEARCH_THROTTLED, IndexFieldDataService.INDEX_FIELDDATA_CACHE_KEY, + IndexSettings.IGNORE_ABOVE_SETTING, FieldMapper.IGNORE_MALFORMED_SETTING, FieldMapper.COERCE_SETTING, Store.INDEX_STORE_STATS_REFRESH_INTERVAL_SETTING, diff --git a/server/src/main/java/org/elasticsearch/index/IndexSettings.java b/server/src/main/java/org/elasticsearch/index/IndexSettings.java index 92abdb39acf56..f6ad5e22b9ed7 100644 --- a/server/src/main/java/org/elasticsearch/index/IndexSettings.java +++ b/server/src/main/java/org/elasticsearch/index/IndexSettings.java @@ -25,6 +25,7 @@ import org.elasticsearch.common.unit.ByteSizeUnit; import org.elasticsearch.common.unit.ByteSizeValue; import org.elasticsearch.core.TimeValue; +import org.elasticsearch.features.NodeFeature; import org.elasticsearch.index.mapper.IgnoredSourceFieldMapper; import org.elasticsearch.index.mapper.Mapper; import org.elasticsearch.index.translog.Translog; @@ -697,6 +698,31 @@ public Iterator> settings() { Property.IndexSettingDeprecatedInV7AndRemovedInV8 ); + /** + * The `index.mapping.ignore_above` setting defines the maximum length for the content of a field that will be indexed + * or stored. If the length of the field’s content exceeds this limit, the field value will be ignored during indexing. + * This setting is useful for `keyword`, `flattened`, and `wildcard` fields where very large values are undesirable. + * It allows users to manage the size of indexed data by skipping fields with excessively long content. As an index-level + * setting, it applies to all `keyword` and `wildcard` fields, as well as to keyword values within `flattened` fields. + * When it comes to arrays, the `ignore_above` setting applies individually to each element of the array. If any element's + * length exceeds the specified limit, only that element will be ignored during indexing, while the rest of the array will + * still be processed. This behavior is consistent with the field-level `ignore_above` setting. + * This setting can be overridden at the field level by specifying a custom `ignore_above` value in the field mapping. + *

+     * Example usage:
+     * <pre>
+     * "index.mapping.ignore_above": 256
+     * </pre>
+ */ + public static final Setting IGNORE_ABOVE_SETTING = Setting.intSetting( + "index.mapping.ignore_above", + Integer.MAX_VALUE, + 0, + Property.IndexScope, + Property.ServerlessPublic + ); + public static final NodeFeature IGNORE_ABOVE_INDEX_LEVEL_SETTING = new NodeFeature("mapper.ignore_above_index_level_setting"); + private final Index index; private final IndexVersion version; private final Logger logger; diff --git a/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java b/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java index 2da8d32773733..46b1dbdce4c4b 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java @@ -79,6 +79,7 @@ import static org.apache.lucene.index.IndexWriter.MAX_TERM_LENGTH; import static org.elasticsearch.core.Strings.format; +import static org.elasticsearch.index.IndexSettings.IGNORE_ABOVE_SETTING; /** * A field mapper for keywords. This mapper accepts strings and indexes them as-is. @@ -110,8 +111,6 @@ public static class Defaults { Lucene.KEYWORD_ANALYZER, Lucene.KEYWORD_ANALYZER ); - - public static final int IGNORE_ABOVE = Integer.MAX_VALUE; } public static class KeywordField extends Field { @@ -158,12 +157,8 @@ public static final class Builder extends FieldMapper.DimensionBuilder { m -> toType(m).fieldType().eagerGlobalOrdinals(), false ); - private final Parameter ignoreAbove = Parameter.intParam( - "ignore_above", - true, - m -> toType(m).fieldType().ignoreAbove(), - Defaults.IGNORE_ABOVE - ); + private final Parameter ignoreAbove; + private final int ignoreAboveDefault; private final Parameter indexOptions = TextParams.keywordIndexOptions(m -> toType(m).indexOptions); private final Parameter hasNorms = TextParams.norms(false, m -> toType(m).fieldType.omitNorms() == false); @@ -193,7 +188,23 @@ public static final class Builder extends FieldMapper.DimensionBuilder { private final ScriptCompiler scriptCompiler; private final IndexVersion indexCreatedVersion; - public Builder(String name, IndexAnalyzers indexAnalyzers, ScriptCompiler scriptCompiler, IndexVersion indexCreatedVersion) { + public Builder(final String name, final MappingParserContext mappingParserContext) { + this( + name, + mappingParserContext.getIndexAnalyzers(), + mappingParserContext.scriptCompiler(), + IGNORE_ABOVE_SETTING.get(mappingParserContext.getSettings()), + mappingParserContext.getIndexSettings().getIndexVersionCreated() + ); + } + + Builder( + String name, + IndexAnalyzers indexAnalyzers, + ScriptCompiler scriptCompiler, + int ignoreAboveDefault, + IndexVersion indexCreatedVersion + ) { super(name); this.indexAnalyzers = indexAnalyzers; this.scriptCompiler = Objects.requireNonNull(scriptCompiler); @@ -220,10 +231,17 @@ public Builder(String name, IndexAnalyzers indexAnalyzers, ScriptCompiler script ); } }).precludesParameters(normalizer); + this.ignoreAboveDefault = ignoreAboveDefault; + this.ignoreAbove = Parameter.intParam("ignore_above", true, m -> toType(m).fieldType().ignoreAbove(), ignoreAboveDefault) + .addValidator(v -> { + if (v < 0) { + throw new IllegalArgumentException("[ignore_above] must be positive, got [" + v + "]"); + } + }); } public Builder(String name, IndexVersion indexCreatedVersion) { - this(name, null, ScriptCompiler.NONE, indexCreatedVersion); + this(name, null, ScriptCompiler.NONE, Integer.MAX_VALUE, indexCreatedVersion); } public Builder ignoreAbove(int ignoreAbove) { @@ -370,10 +388,7 @@ 
public KeywordFieldMapper build(MapperBuilderContext context) { private static final IndexVersion MINIMUM_COMPATIBILITY_VERSION = IndexVersion.fromId(5000099); - public static final TypeParser PARSER = new TypeParser( - (n, c) -> new Builder(n, c.getIndexAnalyzers(), c.scriptCompiler(), c.indexVersionCreated()), - MINIMUM_COMPATIBILITY_VERSION - ); + public static final TypeParser PARSER = new TypeParser(Builder::new, MINIMUM_COMPATIBILITY_VERSION); public static final class KeywordFieldType extends StringFieldType { @@ -865,6 +880,8 @@ public boolean hasNormalizer() { private final boolean isSyntheticSource; private final IndexAnalyzers indexAnalyzers; + private final int ignoreAboveDefault; + private final int ignoreAbove; private KeywordFieldMapper( String simpleName, @@ -887,6 +904,8 @@ private KeywordFieldMapper( this.scriptCompiler = builder.scriptCompiler; this.indexCreatedVersion = builder.indexCreatedVersion; this.isSyntheticSource = isSyntheticSource; + this.ignoreAboveDefault = builder.ignoreAboveDefault; + this.ignoreAbove = builder.ignoreAbove.getValue(); } @Override @@ -1004,7 +1023,9 @@ public Map indexAnalyzers() { @Override public FieldMapper.Builder getMergeBuilder() { - return new Builder(leafName(), indexAnalyzers, scriptCompiler, indexCreatedVersion).dimension(fieldType().isDimension()).init(this); + return new Builder(leafName(), indexAnalyzers, scriptCompiler, ignoreAboveDefault, indexCreatedVersion).dimension( + fieldType().isDimension() + ).init(this); } @Override @@ -1072,7 +1093,7 @@ protected BytesRef preserve(BytesRef value) { }); } - if (fieldType().ignoreAbove != Defaults.IGNORE_ABOVE) { + if (fieldType().ignoreAbove != ignoreAboveDefault) { layers.add(new CompositeSyntheticFieldLoader.StoredFieldLayer(originalName()) { @Override protected void writeValue(Object value, XContentBuilder b) throws IOException { diff --git a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java index d18c3283ef909..d2ca7a24a78fd 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java @@ -11,6 +11,7 @@ import org.elasticsearch.features.FeatureSpecification; import org.elasticsearch.features.NodeFeature; +import org.elasticsearch.index.IndexSettings; import org.elasticsearch.index.mapper.flattened.FlattenedFieldMapper; import org.elasticsearch.index.mapper.vectors.DenseVectorFieldMapper; @@ -41,6 +42,7 @@ public Set getFeatures() { SourceFieldMapper.SYNTHETIC_SOURCE_WITH_COPY_TO_AND_DOC_VALUES_FALSE_SUPPORT, SourceFieldMapper.SYNTHETIC_SOURCE_COPY_TO_FIX, FlattenedFieldMapper.IGNORE_ABOVE_SUPPORT, + IndexSettings.IGNORE_ABOVE_INDEX_LEVEL_SETTING, SourceFieldMapper.SYNTHETIC_SOURCE_COPY_TO_INSIDE_OBJECTS_FIX ); } diff --git a/server/src/main/java/org/elasticsearch/index/mapper/flattened/FlattenedFieldMapper.java b/server/src/main/java/org/elasticsearch/index/mapper/flattened/FlattenedFieldMapper.java index 43890abf25aa7..2c504262c35ad 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/flattened/FlattenedFieldMapper.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/flattened/FlattenedFieldMapper.java @@ -82,6 +82,8 @@ import java.util.Set; import java.util.function.Function; +import static org.elasticsearch.index.IndexSettings.IGNORE_ABOVE_SETTING; + /** * A field mapper that accepts a JSON object and flattens it into a single field. 
This data type * can be a useful alternative to an 'object' mapping when the object has a large, unknown set @@ -123,6 +125,9 @@ private static Builder builder(Mapper in) { return ((FlattenedFieldMapper) in).builder; } + private final int ignoreAboveDefault; + private final int ignoreAbove; + public static class Builder extends FieldMapper.Builder { final Parameter depthLimit = Parameter.intParam( @@ -148,12 +153,8 @@ public static class Builder extends FieldMapper.Builder { m -> builder(m).eagerGlobalOrdinals.get(), false ); - private final Parameter ignoreAbove = Parameter.intParam( - "ignore_above", - true, - m -> builder(m).ignoreAbove.get(), - Integer.MAX_VALUE - ); + private final int ignoreAboveDefault; + private final Parameter ignoreAbove; private final Parameter indexOptions = TextParams.keywordIndexOptions(m -> builder(m).indexOptions.get()); private final Parameter similarity = TextParams.similarity(m -> builder(m).similarity.get()); @@ -176,7 +177,7 @@ public static class Builder extends FieldMapper.Builder { + "] are true" ); } - }).precludesParameters(ignoreAbove); + }); private final Parameter> meta = Parameter.metaParam(); @@ -184,8 +185,20 @@ public static FieldMapper.Parameter> dimensionsParam(Function builder(m).ignoreAbove.get(), ignoreAboveDefault) + .addValidator(v -> { + if (v < 0) { + throw new IllegalArgumentException("[ignore_above] must be positive, got [" + v + "]"); + } + }); + this.dimensions.precludesParameters(ignoreAbove); } @Override @@ -223,11 +236,11 @@ public FlattenedFieldMapper build(MapperBuilderContext context) { dimensions.get(), ignoreAbove.getValue() ); - return new FlattenedFieldMapper(leafName(), ft, builderParams(this, context), this); + return new FlattenedFieldMapper(leafName(), ft, builderParams(this, context), ignoreAboveDefault, this); } } - public static final TypeParser PARSER = new TypeParser((n, c) -> new Builder(n)); + public static final TypeParser PARSER = new TypeParser((n, c) -> new Builder(n, IGNORE_ABOVE_SETTING.get(c.getSettings()))); /** * A field type that represents the values under a particular JSON key, used @@ -808,9 +821,17 @@ public void validateMatchedRoutingPath(final String routingPath) { private final FlattenedFieldParser fieldParser; private final Builder builder; - private FlattenedFieldMapper(String leafName, MappedFieldType mappedFieldType, BuilderParams builderParams, Builder builder) { + private FlattenedFieldMapper( + String leafName, + MappedFieldType mappedFieldType, + BuilderParams builderParams, + int ignoreAboveDefault, + Builder builder + ) { super(leafName, mappedFieldType, builderParams); + this.ignoreAboveDefault = ignoreAboveDefault; this.builder = builder; + this.ignoreAbove = builder.ignoreAbove.get(); this.fieldParser = new FlattenedFieldParser( mappedFieldType.name(), mappedFieldType.name() + KEYED_FIELD_SUFFIX, @@ -835,8 +856,8 @@ int depthLimit() { return builder.depthLimit.get(); } - int ignoreAbove() { - return builder.ignoreAbove.get(); + public int ignoreAbove() { + return ignoreAbove; } @Override @@ -876,7 +897,7 @@ protected void parseCreateField(DocumentParserContext context) throws IOExceptio @Override public FieldMapper.Builder getMergeBuilder() { - return new Builder(leafName()).init(this); + return new Builder(leafName(), ignoreAboveDefault).init(this); } @Override diff --git a/server/src/test/java/org/elasticsearch/index/mapper/KeywordFieldTypeTests.java b/server/src/test/java/org/elasticsearch/index/mapper/KeywordFieldTypeTests.java index 7e5cc5045c100..b4c7ea0ed9508 100644 --- 
a/server/src/test/java/org/elasticsearch/index/mapper/KeywordFieldTypeTests.java +++ b/server/src/test/java/org/elasticsearch/index/mapper/KeywordFieldTypeTests.java @@ -243,6 +243,7 @@ public void testFetchSourceValue() throws IOException { "field", createIndexAnalyzers(), ScriptCompiler.NONE, + Integer.MAX_VALUE, IndexVersion.current() ).normalizer("lowercase").build(MapperBuilderContext.root(false, false)).fieldType(); assertEquals(List.of("value"), fetchSourceValue(normalizerMapper, "VALUE")); diff --git a/server/src/test/java/org/elasticsearch/index/mapper/MultiFieldsTests.java b/server/src/test/java/org/elasticsearch/index/mapper/MultiFieldsTests.java index 06c3125648309..fd024c5d23e28 100644 --- a/server/src/test/java/org/elasticsearch/index/mapper/MultiFieldsTests.java +++ b/server/src/test/java/org/elasticsearch/index/mapper/MultiFieldsTests.java @@ -63,6 +63,7 @@ private KeywordFieldMapper.Builder getKeywordFieldMapperBuilder(boolean isStored "field", IndexAnalyzers.of(Map.of(), Map.of("normalizer", Lucene.STANDARD_ANALYZER), Map.of()), ScriptCompiler.NONE, + Integer.MAX_VALUE, IndexVersion.current() ); if (isStored) { diff --git a/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/20_ignore_above_stored_source.yml b/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/20_ignore_above_stored_source.yml new file mode 100644 index 0000000000000..252bafbdbe15a --- /dev/null +++ b/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/20_ignore_above_stored_source.yml @@ -0,0 +1,56 @@ +--- +wildcard field type ignore_above: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + properties: + a_wildcard: + type: wildcard + b_wildcard: + type: wildcard + ignore_above: 20 + c_wildcard: + type: wildcard + d_wildcard: + type: wildcard + ignore_above: 5 + + + + - do: + index: + index: test + refresh: true + id: "1" + body: { "a_wildcard": "foo bar", "b_wildcard": "the quick brown", "c_wildcard": ["foo", "bar", "jumps over the lazy dog"], "d_wildcard": ["foo", "bar", "the quick"]} + + - do: + search: + body: + fields: + - a_wildcard + - b_wildcard + - c_wildcard + - d_wildcard + query: + match_all: {} + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.a_wildcard: "foo bar" } + - match: { hits.hits.0._source.b_wildcard: "the quick brown" } + - match: { hits.hits.0._source.c_wildcard: ["foo", "bar", "jumps over the lazy dog"] } + - match: { hits.hits.0._source.d_wildcard: ["foo", "bar", "the quick"] } + - match: { hits.hits.0.fields.a_wildcard.0: "foo bar" } + - match: { hits.hits.0.fields.b_wildcard.0: "the quick brown" } + - match: { hits.hits.0.fields.c_wildcard: ["foo", "bar"] } + - match: { hits.hits.0.fields.d_wildcard: ["foo", "bar"] } + diff --git a/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/30_ignore_above_synthetic_source.yml b/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/30_ignore_above_synthetic_source.yml new file mode 100644 index 0000000000000..f5c9f3d92369a --- /dev/null +++ b/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/wildcard/30_ignore_above_synthetic_source.yml @@ -0,0 +1,58 @@ +--- +wildcard field type ignore_above: + - requires: + cluster_features: [ "mapper.ignore_above_index_level_setting" ] + reason: introduce ignore_above index level setting + - do: + 
indices.create: + index: test + body: + settings: + index: + mapping: + ignore_above: 10 + mappings: + _source: + mode: synthetic + properties: + a_wildcard: + type: wildcard + b_wildcard: + type: wildcard + ignore_above: 20 + c_wildcard: + type: wildcard + d_wildcard: + type: wildcard + ignore_above: 5 + + + + - do: + index: + index: test + refresh: true + id: "1" + body: { "a_wildcard": "foo bar", "b_wildcard": "the quick brown", "c_wildcard": ["foo", "bar", "jumps over the lazy dog"], "d_wildcard": ["foo", "bar", "the quick"]} + + - do: + search: + body: + fields: + - a_wildcard + - b_wildcard + - c_wildcard + - d_wildcard + query: + match_all: {} + + - length: { hits.hits: 1 } + - match: { hits.hits.0._source.a_wildcard: "foo bar" } + - match: { hits.hits.0._source.b_wildcard: "the quick brown" } + - match: { hits.hits.0._source.c_wildcard: ["bar", "foo"] } + - match: { hits.hits.0._source.d_wildcard: ["bar", "foo", "the quick"] } + - match: { hits.hits.0.fields.a_wildcard.0: "foo bar" } + - match: { hits.hits.0.fields.b_wildcard.0: "the quick brown" } + - match: { hits.hits.0.fields.c_wildcard: ["bar", "foo"] } + - match: { hits.hits.0.fields.d_wildcard: ["bar", "foo"] } + diff --git a/x-pack/plugin/wildcard/src/main/java/org/elasticsearch/xpack/wildcard/mapper/WildcardFieldMapper.java b/x-pack/plugin/wildcard/src/main/java/org/elasticsearch/xpack/wildcard/mapper/WildcardFieldMapper.java index 8e4f56e299587..1e97e64371586 100644 --- a/x-pack/plugin/wildcard/src/main/java/org/elasticsearch/xpack/wildcard/mapper/WildcardFieldMapper.java +++ b/x-pack/plugin/wildcard/src/main/java/org/elasticsearch/xpack/wildcard/mapper/WildcardFieldMapper.java @@ -87,6 +87,8 @@ import java.util.Map; import java.util.Set; +import static org.elasticsearch.index.IndexSettings.IGNORE_ABOVE_SETTING; + /** * A {@link FieldMapper} for indexing fields with ngrams for efficient wildcard matching */ @@ -191,7 +193,6 @@ public static class Defaults { Lucene.KEYWORD_ANALYZER, Lucene.KEYWORD_ANALYZER ); - public static final int IGNORE_ABOVE = Integer.MAX_VALUE; } private static WildcardFieldMapper toType(FieldMapper in) { @@ -200,21 +201,28 @@ private static WildcardFieldMapper toType(FieldMapper in) { public static class Builder extends FieldMapper.Builder { - final Parameter ignoreAbove = Parameter.intParam("ignore_above", true, m -> toType(m).ignoreAbove, Defaults.IGNORE_ABOVE) - .addValidator(v -> { - if (v < 0) { - throw new IllegalArgumentException("[ignore_above] must be positive, got [" + v + "]"); - } - }); + final Parameter ignoreAbove; final Parameter nullValue = Parameter.stringParam("null_value", false, m -> toType(m).nullValue, null).acceptsNull(); final Parameter> meta = Parameter.metaParam(); final IndexVersion indexVersionCreated; - public Builder(String name, IndexVersion indexVersionCreated) { + final int ignoreAboveDefault; + + public Builder(final String name, IndexVersion indexVersionCreated) { + this(name, Integer.MAX_VALUE, indexVersionCreated); + } + + private Builder(String name, int ignoreAboveDefault, IndexVersion indexVersionCreated) { super(name); this.indexVersionCreated = indexVersionCreated; + this.ignoreAboveDefault = ignoreAboveDefault; + this.ignoreAbove = Parameter.intParam("ignore_above", true, m -> toType(m).ignoreAbove, ignoreAboveDefault).addValidator(v -> { + if (v < 0) { + throw new IllegalArgumentException("[ignore_above] must be positive, got [" + v + "]"); + } + }); } @Override @@ -236,23 +244,18 @@ Builder nullValue(String nullValue) { public WildcardFieldMapper 
build(MapperBuilderContext context) { return new WildcardFieldMapper( leafName(), - new WildcardFieldType( - context.buildFullName(leafName()), - nullValue.get(), - ignoreAbove.get(), - indexVersionCreated, - meta.get() - ), - ignoreAbove.get(), + new WildcardFieldType(context.buildFullName(leafName()), indexVersionCreated, meta.get(), this), context.isSourceSynthetic(), builderParams(this, context), - nullValue.get(), - indexVersionCreated + indexVersionCreated, + this ); } } - public static TypeParser PARSER = new TypeParser((n, c) -> new Builder(n, c.indexVersionCreated())); + public static TypeParser PARSER = new TypeParser( + (n, c) -> new Builder(n, IGNORE_ABOVE_SETTING.get(c.getSettings()), c.indexVersionCreated()) + ); public static final char TOKEN_START_OR_END_CHAR = 0; public static final String TOKEN_START_STRING = Character.toString(TOKEN_START_OR_END_CHAR); @@ -263,18 +266,18 @@ public static final class WildcardFieldType extends MappedFieldType { static Analyzer lowercaseNormalizer = new LowercaseNormalizer(); private final String nullValue; - private final int ignoreAbove; private final NamedAnalyzer analyzer; + private final int ignoreAbove; - private WildcardFieldType(String name, String nullValue, int ignoreAbove, IndexVersion version, Map meta) { + private WildcardFieldType(String name, IndexVersion version, Map meta, Builder builder) { super(name, true, false, true, Defaults.TEXT_SEARCH_INFO, meta); if (version.onOrAfter(IndexVersions.V_7_10_0)) { this.analyzer = WILDCARD_ANALYZER_7_10; } else { this.analyzer = WILDCARD_ANALYZER_7_9; } - this.nullValue = nullValue; - this.ignoreAbove = ignoreAbove; + this.nullValue = builder.nullValue.getValue(); + this.ignoreAbove = builder.ignoreAbove.getValue(); } @Override @@ -889,26 +892,27 @@ protected String parseSourceValue(Object value) { NGRAM_FIELD_TYPE = freezeAndDeduplicateFieldType(ft); assert NGRAM_FIELD_TYPE.indexOptions() == IndexOptions.DOCS; } - - private final int ignoreAbove; private final String nullValue; private final IndexVersion indexVersionCreated; + + private final int ignoreAbove; + private final int ignoreAboveDefault; private final boolean storeIgnored; private WildcardFieldMapper( String simpleName, WildcardFieldType mappedFieldType, - int ignoreAbove, boolean storeIgnored, BuilderParams builderParams, - String nullValue, - IndexVersion indexVersionCreated + IndexVersion indexVersionCreated, + Builder builder ) { super(simpleName, mappedFieldType, builderParams); - this.nullValue = nullValue; - this.ignoreAbove = ignoreAbove; + this.nullValue = builder.nullValue.getValue(); this.storeIgnored = storeIgnored; this.indexVersionCreated = indexVersionCreated; + this.ignoreAbove = builder.ignoreAbove.getValue(); + this.ignoreAboveDefault = builder.ignoreAboveDefault; } @Override @@ -983,14 +987,14 @@ protected String contentType() { @Override public FieldMapper.Builder getMergeBuilder() { - return new Builder(leafName(), indexVersionCreated).init(this); + return new Builder(leafName(), ignoreAboveDefault, indexVersionCreated).init(this); } @Override protected SyntheticSourceSupport syntheticSourceSupport() { var layers = new ArrayList(); layers.add(new WildcardSyntheticFieldLoader()); - if (ignoreAbove != Defaults.IGNORE_ABOVE) { + if (ignoreAbove != ignoreAboveDefault) { layers.add(new CompositeSyntheticFieldLoader.StoredFieldLayer(originalName()) { @Override protected void writeValue(Object value, XContentBuilder b) throws IOException { diff --git 
a/x-pack/qa/runtime-fields/src/main/java/org/elasticsearch/xpack/runtimefields/test/CoreTestTranslater.java b/x-pack/qa/runtime-fields/src/main/java/org/elasticsearch/xpack/runtimefields/test/CoreTestTranslater.java index 2bea4bb247d8f..d34303ea803d6 100644 --- a/x-pack/qa/runtime-fields/src/main/java/org/elasticsearch/xpack/runtimefields/test/CoreTestTranslater.java +++ b/x-pack/qa/runtime-fields/src/main/java/org/elasticsearch/xpack/runtimefields/test/CoreTestTranslater.java @@ -222,10 +222,32 @@ public boolean modifySections(List executables) { */ protected abstract boolean modifySearch(ApiCallSection search); + private static Object getSetting(final Object map, final String... keys) { + Map current = (Map) map; + for (final String key : keys) { + if (current != null) { + current = (Map) current.get(key); + } else { + return null; + } + } + return current; + } + private boolean modifyCreateIndex(ApiCallSection createIndex) { String index = createIndex.getParams().get("index"); for (Map body : createIndex.getBodies()) { - Object settings = body.get("settings"); + final Object settings = body.get("settings"); + final Object indexMapping = getSetting(settings, "index", "mapping"); + if (indexMapping instanceof Map m) { + final Object ignoreAbove = m.get("ignore_above"); + if (ignoreAbove instanceof Integer ignoreAboveValue) { + if (ignoreAboveValue >= 0) { + // Scripts don't support ignore_above so we skip those fields + continue; + } + } + } if (settings instanceof Map && ((Map) settings).containsKey("sort.field")) { /* * You can't sort the index on a runtime field From 89af9e5a4560f15bd24a1e9ddc69dc6df6f92cc3 Mon Sep 17 00:00:00 2001 From: David Turner Date: Mon, 23 Sep 2024 17:11:37 +0100 Subject: [PATCH 04/28] Revert "Make `UpdateSettingsClusterStateUpdateRequest` a record (#113353)" This reverts commit cc37be136a3c0a4b4e74ea2c13b12bdd67a7117d. 
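For reference, this revert swaps the construction style of the request: the record takes every field up front through its canonical constructor, while the restored class is built through fluent setters. A minimal sketch of the two shapes, as they appear in the hunks below (assumes `settings`, `index`, and the timeout values are in scope; each half only compiles against its own side of the revert):

// Record style being reverted: all parameters fixed at construction time.
new UpdateSettingsClusterStateUpdateRequest(
    masterNodeTimeout,
    ackTimeout,
    settings,
    UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
    UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT,
    index
);

// Mutable style restored by this revert: fluent setters and boolean flags.
new UpdateSettingsClusterStateUpdateRequest().indices(new Index[] { index })
    .settings(settings)
    .setPreserveExisting(false)
    .reopenShards(false)
    .ackTimeout(ackTimeout)
    .masterNodeTimeout(masterNodeTimeout);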
--- .../MetadataUpdateSettingsServiceIT.java | 133 ++++++++---------- .../put/TransportUpdateSettingsAction.java | 31 ++-- ...dateSettingsClusterStateUpdateRequest.java | 86 ++++++----- .../MetadataUpdateSettingsService.java | 4 +- .../upgrades/SystemIndexMigrator.java | 16 +-- ...TransportUpdateSecuritySettingsAction.java | 16 +-- .../TransportUpdateWatcherSettingsAction.java | 12 +- 7 files changed, 132 insertions(+), 166 deletions(-) diff --git a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java index c1e68040e075b..b3b7957801cd7 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java @@ -28,7 +28,6 @@ import java.util.List; import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicReference; -import java.util.function.Function; import static org.hamcrest.Matchers.equalTo; @@ -43,58 +42,45 @@ public void testThatNonDynamicSettingChangesTakeEffect() throws Exception { MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance( MetadataUpdateSettingsService.class ); - List indicesList = new ArrayList<>(); + UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO); + List indices = new ArrayList<>(); for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) { for (IndexService indexService : indicesService) { - indicesList.add(indexService.index()); + indices.add(indexService.index()); } } - final var indices = indicesList.toArray(Index.EMPTY_ARRAY); - - final Function requestFactory = - onStaticSetting -> new UpdateSettingsClusterStateUpdateRequest( - TEST_REQUEST_TIMEOUT, - TimeValue.ZERO, - Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build(), - UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, - onStaticSetting, - indices - ); + request.indices(indices.toArray(Index.EMPTY_ARRAY)); + request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build()); // First make sure it fails if reopenShards is not set on the request: AtomicBoolean expectedFailureOccurred = new AtomicBoolean(false); - metadataUpdateSettingsService.updateSettings( - requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT), - new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - fail("Should have failed updating a non-dynamic setting without reopenShards set to true"); - } + metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + fail("Should have failed updating a non-dynamic setting without reopenShards set to true"); + } - @Override - public void onFailure(Exception e) { - expectedFailureOccurred.set(true); - } + @Override + public void onFailure(Exception e) { + expectedFailureOccurred.set(true); } - ); + }); assertBusy(() -> assertThat(expectedFailureOccurred.get(), equalTo(true))); // Now we set reopenShards and expect it to work: + request.reopenShards(true); AtomicBoolean success = new AtomicBoolean(false); - 
metadataUpdateSettingsService.updateSettings( - requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES), - new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); - } + @Override + public void onFailure(Exception e) { + fail(e); } - ); + }); assertBusy(() -> assertThat(success.get(), equalTo(true))); // Now we look into the IndexShard objects to make sure that the code was actually updated (vs just the setting): @@ -124,23 +110,16 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens() th MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance( MetadataUpdateSettingsService.class ); - List indicesList = new ArrayList<>(); + UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO); + List indices = new ArrayList<>(); for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) { for (IndexService indexService : indicesService) { - indicesList.add(indexService.index()); + indices.add(indexService.index()); } } - final var indices = indicesList.toArray(Index.EMPTY_ARRAY); - - final Function requestFactory = - settings -> new UpdateSettingsClusterStateUpdateRequest( - TEST_REQUEST_TIMEOUT, - TimeValue.ZERO, - settings.build(), - UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, - UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES, - indices - ); + request.indices(indices.toArray(Index.EMPTY_ARRAY)); + request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build()); + request.reopenShards(true); ClusterService clusterService = internalCluster().getInstance(ClusterService.class); AtomicBoolean shardsUnassigned = new AtomicBoolean(false); @@ -163,49 +142,47 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens() th AtomicBoolean success = new AtomicBoolean(false); // Make the first request, just to set things up: - metadataUpdateSettingsService.updateSettings( - requestFactory.apply(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData")), - new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); - } + @Override + public void onFailure(Exception e) { + fail(e); } - ); + }); assertBusy(() -> assertThat(success.get(), equalTo(true))); assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true))); assertThat(shardsUnassigned.get(), equalTo(true)); assertBusy(() -> assertThat(hasUnassignedShards(clusterService.state(), indexName), equalTo(false))); + // Same request, except now we'll also set the dynamic "index.max_result_window" setting: + request.settings( + Settings.builder() + .put("index.codec", "FastDecompressionCompressingStoredFieldsData") + .put("index.max_result_window", "1500") + 
.build() + ); success.set(false); expectedSettingsChangeInClusterState.set(false); shardsUnassigned.set(false); expectedSetting.set("index.max_result_window"); expectedSettingValue.set("1500"); // Making this request ought to add this new setting but not unassign the shards: - metadataUpdateSettingsService.updateSettings( - // Same request, except now we'll also set the dynamic "index.max_result_window" setting: - requestFactory.apply( - Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").put("index.max_result_window", "1500") - ), - new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); - } + @Override + public void onFailure(Exception e) { + fail(e); } - ); + }); assertBusy(() -> assertThat(success.get(), equalTo(true))); assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true))); diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java index 1e7f32641b86f..1d7c264065d6f 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java @@ -124,24 +124,19 @@ protected void masterOperation( return; } - updateSettingsService.updateSettings( - new UpdateSettingsClusterStateUpdateRequest( - request.masterNodeTimeout(), - request.ackTimeout(), - requestSettings, - request.isPreserveExisting() - ? UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE - : UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, - request.reopen() - ? 
UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES - : UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, - concreteIndices - ), - listener.delegateResponse((l, e) -> { - logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e); - l.onFailure(e); - }) - ); + UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices( + concreteIndices + ) + .settings(requestSettings) + .setPreserveExisting(request.isPreserveExisting()) + .reopenShards(request.reopen()) + .ackTimeout(request.ackTimeout()) + .masterNodeTimeout(request.masterNodeTimeout()); + + updateSettingsService.updateSettings(clusterStateUpdateRequest, listener.delegateResponse((l, e) -> { + logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e); + l.onFailure(e); + })); } /** diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java index fe8573da5fb68..42a904c704bf3 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java @@ -9,60 +9,70 @@ package org.elasticsearch.action.admin.indices.settings.put; +import org.elasticsearch.cluster.ack.IndicesClusterStateUpdateRequest; import org.elasticsearch.common.settings.Settings; -import org.elasticsearch.core.TimeValue; -import org.elasticsearch.index.Index; -import java.util.Objects; +import java.util.Arrays; /** * Cluster state update request that allows to update settings for some indices */ -public record UpdateSettingsClusterStateUpdateRequest( - TimeValue masterNodeTimeout, - TimeValue ackTimeout, - Settings settings, - OnExisting onExisting, - OnStaticSetting onStaticSetting, - Index... indices -) { +public class UpdateSettingsClusterStateUpdateRequest extends IndicesClusterStateUpdateRequest { + + private Settings settings; + + private boolean preserveExisting = false; + + private boolean reopenShards = false; + + /** + * Returns true iff the settings update should only add but not update settings. If the setting already exists + * it should not be overwritten by this update. The default is false + */ + public boolean isPreserveExisting() { + return preserveExisting; + } /** - * Specifies the behaviour of an update-settings action on existing settings. + * Returns true if non-dynamic setting updates should go through, by automatically unassigning shards in the same cluster + * state change as the setting update. The shards will be automatically reassigned after the cluster state update is made. The + * default is false. */ - public enum OnExisting { - /** - * Update all the specified settings, overwriting any settings which already exist. This is the API default. - */ - OVERWRITE, + public boolean reopenShards() { + return reopenShards; + } - /** - * Only add new settings, preserving the values of any settings which are already set and ignoring the new values specified in the - * request. 
- */ - PRESERVE + public UpdateSettingsClusterStateUpdateRequest reopenShards(boolean reopenShards) { + this.reopenShards = reopenShards; + return this; } /** - * Specifies the behaviour of an update-settings action which is trying to adjust a non-dynamic setting. + * Iff set to true this settings update will only add settings not already set on an index. Existing settings remain + * unchanged. */ - public enum OnStaticSetting { - /** - * Reject attempts to update non-dynamic settings on open indices. This is the API default. - */ - REJECT, + public UpdateSettingsClusterStateUpdateRequest setPreserveExisting(boolean preserveExisting) { + this.preserveExisting = preserveExisting; + return this; + } - /** - * Automatically close and reopen the shards of any open indices when updating a non-dynamic setting, forcing the shard to - * reinitialize from scratch. - */ - REOPEN_INDICES + /** + * Returns the {@link Settings} to update + */ + public Settings settings() { + return settings; + } + + /** + * Sets the {@link Settings} to update + */ + public UpdateSettingsClusterStateUpdateRequest settings(Settings settings) { + this.settings = settings; + return this; } - public UpdateSettingsClusterStateUpdateRequest { - Objects.requireNonNull(masterNodeTimeout); - Objects.requireNonNull(ackTimeout); - Objects.requireNonNull(settings); - Objects.requireNonNull(indices); + @Override + public String toString() { + return Arrays.toString(indices()) + settings; } } diff --git a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java index 4fcbd4165423b..cee3b4c0bdac1 100644 --- a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java +++ b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java @@ -176,7 +176,7 @@ ClusterState execute(ClusterState currentState) { } final Settings closedSettings = settingsForClosedIndices.build(); final Settings openSettings = settingsForOpenIndices.build(); - final boolean preserveExisting = request.onExisting() == UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE; + final boolean preserveExisting = request.isPreserveExisting(); RoutingTable.Builder routingTableBuilder = null; Metadata.Builder metadataBuilder = Metadata.builder(currentState.metadata()); @@ -199,7 +199,7 @@ ClusterState execute(ClusterState currentState) { } if (skippedSettings.isEmpty() == false && openIndices.isEmpty() == false) { - if (request.onStaticSetting() == UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES) { + if (request.reopenShards()) { // We have non-dynamic settings and open indices. We will unassign all of the shards in these indices so that the new // changed settings are applied when the shards are re-assigned. 
routingTableBuilder = RoutingTable.builder( diff --git a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java index a131f63cb75f3..94b856f7a22fb 100644 --- a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java +++ b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java @@ -19,7 +19,6 @@ import org.elasticsearch.action.admin.indices.settings.put.UpdateSettingsClusterStateUpdateRequest; import org.elasticsearch.action.support.ActiveShardCount; import org.elasticsearch.action.support.master.AcknowledgedResponse; -import org.elasticsearch.action.support.master.MasterNodeRequest; import org.elasticsearch.action.support.master.ShardsAcknowledgedResponse; import org.elasticsearch.client.internal.Client; import org.elasticsearch.client.internal.ParentTaskAssigningClient; @@ -538,18 +537,11 @@ private CheckedBiConsumer, AcknowledgedResp */ private void setWriteBlock(Index index, boolean readOnlyValue, ActionListener listener) { final Settings readOnlySettings = Settings.builder().put(IndexMetadata.INDEX_BLOCKS_WRITE_SETTING.getKey(), readOnlyValue).build(); + UpdateSettingsClusterStateUpdateRequest updateSettingsRequest = new UpdateSettingsClusterStateUpdateRequest().indices( + new Index[] { index } + ).settings(readOnlySettings).setPreserveExisting(false).ackTimeout(TimeValue.ZERO); - metadataUpdateSettingsService.updateSettings( - new UpdateSettingsClusterStateUpdateRequest( - MasterNodeRequest.INFINITE_MASTER_NODE_TIMEOUT, - TimeValue.ZERO, - readOnlySettings, - UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, - UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, - index - ), - listener - ); + metadataUpdateSettingsService.updateSettings(updateSettingsRequest, listener); } private void reindex(SystemIndexMigrationInfo migrationInfo, ActionListener listener) { diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java index b924fe0d983bb..49f8846c36e1f 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java @@ -119,8 +119,8 @@ protected void masterOperation( private Optional createUpdateSettingsRequest( String indexName, Settings settingsToUpdate, - TimeValue ackTimeout, - TimeValue masterNodeTimeout, + TimeValue timeout, + TimeValue masterTimeout, ClusterState state ) { if (settingsToUpdate.isEmpty()) { @@ -136,14 +136,10 @@ private Optional createUpdateSettingsRe } return Optional.of( - new UpdateSettingsClusterStateUpdateRequest( - masterNodeTimeout, - ackTimeout, - settingsToUpdate, - UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, - UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, - writeIndex - ) + new UpdateSettingsClusterStateUpdateRequest().indices(new Index[] { writeIndex }) + .settings(settingsToUpdate) + .ackTimeout(timeout) + .masterNodeTimeout(masterTimeout) ); } diff --git a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java 
b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java index 0407c2db63ac6..378ee642cf105 100644 --- a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java +++ b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java @@ -24,6 +24,7 @@ import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.concurrent.EsExecutors; +import org.elasticsearch.index.Index; import org.elasticsearch.injection.guice.Inject; import org.elasticsearch.logging.LogManager; import org.elasticsearch.logging.Logger; @@ -90,14 +91,9 @@ protected void masterOperation( return; } final Settings newSettings = Settings.builder().loadFromMap(request.settings()).build(); - final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest( - request.masterNodeTimeout(), - request.ackTimeout(), - newSettings, - UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, - UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, - watcherIndexMd.getIndex() - ); + final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices( + new Index[] { watcherIndexMd.getIndex() } + ).settings(newSettings).ackTimeout(request.ackTimeout()).masterNodeTimeout(request.masterNodeTimeout()); updateSettingsService.updateSettings(clusterStateUpdateRequest, new ActionListener<>() { @Override From 0a546611436b16f66b60d6bb26c880a7a4474b99 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Iv=C3=A1n=20Cea=20Fontenla?= Date: Mon, 23 Sep 2024 18:23:14 +0200 Subject: [PATCH 05/28] Remove Analytical engine CODEOWNERS (#113178) Reverts https://github.com/elastic/elasticsearch/pull/112465 After a week and a half trying the team CODEOWNERS, there are some problems with not being able to (easily?) identify the direct, personal review requests from team requests in notifications. Unless it's solved, and given that these CODEOWNERS are more like an "auto-documentation" tool right now, we are better reverting it. --- .github/CODEOWNERS | 4 ---- 1 file changed, 4 deletions(-) diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS index f0d9068820029..5b98444c044d2 100644 --- a/.github/CODEOWNERS +++ b/.github/CODEOWNERS @@ -70,7 +70,3 @@ server/src/main/java/org/elasticsearch/threadpool @elastic/es-core-infra # Security x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/authz/privilege @elastic/es-security x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStore.java @elastic/es-security - -# Analytical engine -x-pack/plugin/esql @elastic/es-analytical-engine -x-pack/plugin/esql-core @elastic/es-analytical-engine From 58021c340567d0461a39a7a74e765052ac3d4465 Mon Sep 17 00:00:00 2001 From: Nik Everett Date: Mon, 23 Sep 2024 13:00:18 -0400 Subject: [PATCH 06/28] ESQL: TOP support for strings (#113183) Adds support to the `TOP` aggregation for `keyword` and `text` field types. 
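In ES|QL terms this enables queries such as `STATS top_names = TOP(first_name, 3, "asc")` over a `keyword` field. Under the hood the support is carried by the new generated `BytesRef` aggregator classes added below; a minimal sketch of how the new supplier is constructed (the channel, limit, and order values here are illustrative, not taken from this patch):

import java.util.List;

import org.elasticsearch.compute.aggregation.AggregatorFunctionSupplier;
import org.elasticsearch.compute.aggregation.TopBytesRefAggregatorFunctionSupplier;

class TopStringsSketch {
    // Top 3 values in ascending order, reading input from channel 0.
    static AggregatorFunctionSupplier topOfKeyword() {
        return new TopBytesRefAggregatorFunctionSupplier(List.of(0), 3, true);
    }
}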
Closes #109849 --- docs/changelog/113183.yaml | 6 + .../esql/functions/kibana/definition/top.json | 48 +++ .../esql/functions/types/top.asciidoc | 2 + x-pack/plugin/esql/compute/build.gradle | 5 + .../aggregation/TopBytesRefAggregator.java | 146 +++++++ .../TopBytesRefAggregatorFunction.java | 174 ++++++++ ...TopBytesRefAggregatorFunctionSupplier.java | 45 ++ ...TopBytesRefGroupingAggregatorFunction.java | 221 ++++++++++ .../aggregation/X-TopAggregator.java.st | 15 +- .../compute/data/sort/BucketedSortCommon.java | 68 +++ .../data/sort/BytesRefBucketedSort.java | 386 ++++++++++++++++++ .../compute/data/sort/IpBucketedSort.java | 82 ++-- ...actTopBytesRefAggregatorFunctionTests.java | 37 ++ ...tesRefGroupingAggregatorFunctionTests.java | 49 +++ .../TopBytesRefAggregatorFunctionTests.java | 29 ++ ...tesRefGroupingAggregatorFunctionTests.java | 35 ++ .../TopIpAggregatorFunctionTests.java | 25 +- .../TopIpGroupingAggregatorFunctionTests.java | 43 +- .../data/sort/BytesRefBucketedSortTests.java | 79 ++++ .../esql/qa/mixed/MixedClusterEsqlSpecIT.java | 4 + .../xpack/esql/ccq/MultiClusterSpecIT.java | 4 + .../src/main/resources/meta.csv-spec | 30 +- .../src/main/resources/stats_top.csv-spec | 74 ++++ .../xpack/esql/action/EsqlCapabilities.java | 12 + .../expression/function/aggregate/Top.java | 10 +- .../xpack/esql/planner/AggregateMapper.java | 2 +- .../function/aggregate/TopTests.java | 4 +- 27 files changed, 1507 insertions(+), 128 deletions(-) create mode 100644 docs/changelog/113183.yaml create mode 100644 x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/aggregation/TopBytesRefAggregator.java create mode 100644 x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunction.java create mode 100644 x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionSupplier.java create mode 100644 x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunction.java create mode 100644 x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BucketedSortCommon.java create mode 100644 x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSort.java create mode 100644 x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefAggregatorFunctionTests.java create mode 100644 x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefGroupingAggregatorFunctionTests.java create mode 100644 x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionTests.java create mode 100644 x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunctionTests.java create mode 100644 x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSortTests.java diff --git a/docs/changelog/113183.yaml b/docs/changelog/113183.yaml new file mode 100644 index 0000000000000..f30ce9831adb3 --- /dev/null +++ b/docs/changelog/113183.yaml @@ -0,0 +1,6 @@ +pr: 113183 +summary: "ESQL: TOP support for strings" +area: ES|QL +type: feature +issues: + - 109849 diff --git a/docs/reference/esql/functions/kibana/definition/top.json b/docs/reference/esql/functions/kibana/definition/top.json index 2e8e51e726588..62184326994fe 100644 --- a/docs/reference/esql/functions/kibana/definition/top.json 
+++ b/docs/reference/esql/functions/kibana/definition/top.json @@ -124,6 +124,30 @@ "variadic" : false, "returnType" : "ip" }, + { + "params" : [ + { + "name" : "field", + "type" : "keyword", + "optional" : false, + "description" : "The field to collect the top values for." + }, + { + "name" : "limit", + "type" : "integer", + "optional" : false, + "description" : "The maximum number of values to collect." + }, + { + "name" : "order", + "type" : "keyword", + "optional" : false, + "description" : "The order to calculate the top values. Either `asc` or `desc`." + } + ], + "variadic" : false, + "returnType" : "keyword" + }, { "params" : [ { @@ -147,6 +171,30 @@ ], "variadic" : false, "returnType" : "long" + }, + { + "params" : [ + { + "name" : "field", + "type" : "text", + "optional" : false, + "description" : "The field to collect the top values for." + }, + { + "name" : "limit", + "type" : "integer", + "optional" : false, + "description" : "The maximum number of values to collect." + }, + { + "name" : "order", + "type" : "keyword", + "optional" : false, + "description" : "The order to calculate the top values. Either `asc` or `desc`." + } + ], + "variadic" : false, + "returnType" : "text" } ], "examples" : [ diff --git a/docs/reference/esql/functions/types/top.asciidoc b/docs/reference/esql/functions/types/top.asciidoc index 0eb329c10b9ed..25d7962a27252 100644 --- a/docs/reference/esql/functions/types/top.asciidoc +++ b/docs/reference/esql/functions/types/top.asciidoc @@ -10,5 +10,7 @@ date | integer | keyword | date double | integer | keyword | double integer | integer | keyword | integer ip | integer | keyword | ip +keyword | integer | keyword | keyword long | integer | keyword | long +text | integer | keyword | text |=== diff --git a/x-pack/plugin/esql/compute/build.gradle b/x-pack/plugin/esql/compute/build.gradle index 81d1a6f5360ca..49e819b7cdc88 100644 --- a/x-pack/plugin/esql/compute/build.gradle +++ b/x-pack/plugin/esql/compute/build.gradle @@ -635,6 +635,11 @@ tasks.named('stringTemplates').configure { it.inputFile = topAggregatorInputFile it.outputFile = "org/elasticsearch/compute/aggregation/TopBooleanAggregator.java" } + template { + it.properties = bytesRefProperties + it.inputFile = topAggregatorInputFile + it.outputFile = "org/elasticsearch/compute/aggregation/TopBytesRefAggregator.java" + } template { it.properties = ipProperties it.inputFile = topAggregatorInputFile diff --git a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/aggregation/TopBytesRefAggregator.java b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/aggregation/TopBytesRefAggregator.java new file mode 100644 index 0000000000000..c9b0e679b3e64 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/aggregation/TopBytesRefAggregator.java @@ -0,0 +1,146 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.compute.aggregation; + +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.common.breaker.CircuitBreaker; +import org.elasticsearch.common.util.BigArrays; +import org.elasticsearch.compute.ann.Aggregator; +import org.elasticsearch.compute.ann.GroupingAggregator; +import org.elasticsearch.compute.ann.IntermediateState; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BlockFactory; +import org.elasticsearch.compute.data.BytesRefBlock; +import org.elasticsearch.compute.data.IntVector; +import org.elasticsearch.compute.data.sort.BytesRefBucketedSort; +import org.elasticsearch.compute.operator.DriverContext; +import org.elasticsearch.core.Releasable; +import org.elasticsearch.core.Releasables; +import org.elasticsearch.search.sort.SortOrder; + +/** + * Aggregates the top N field values for BytesRef. + *
<p>
+ * This class is generated. Edit `X-TopAggregator.java.st` to edit this file. + *
</p>
+ */ +@Aggregator({ @IntermediateState(name = "top", type = "BYTES_REF_BLOCK") }) +@GroupingAggregator +class TopBytesRefAggregator { + public static SingleState initSingle(BigArrays bigArrays, int limit, boolean ascending) { + return new SingleState(bigArrays, limit, ascending); + } + + public static void combine(SingleState state, BytesRef v) { + state.add(v); + } + + public static void combineIntermediate(SingleState state, BytesRefBlock values) { + int start = values.getFirstValueIndex(0); + int end = start + values.getValueCount(0); + var scratch = new BytesRef(); + for (int i = start; i < end; i++) { + combine(state, values.getBytesRef(i, scratch)); + } + } + + public static Block evaluateFinal(SingleState state, DriverContext driverContext) { + return state.toBlock(driverContext.blockFactory()); + } + + public static GroupingState initGrouping(BigArrays bigArrays, int limit, boolean ascending) { + return new GroupingState(bigArrays, limit, ascending); + } + + public static void combine(GroupingState state, int groupId, BytesRef v) { + state.add(groupId, v); + } + + public static void combineIntermediate(GroupingState state, int groupId, BytesRefBlock values, int valuesPosition) { + int start = values.getFirstValueIndex(valuesPosition); + int end = start + values.getValueCount(valuesPosition); + var scratch = new BytesRef(); + for (int i = start; i < end; i++) { + combine(state, groupId, values.getBytesRef(i, scratch)); + } + } + + public static void combineStates(GroupingState current, int groupId, GroupingState state, int statePosition) { + current.merge(groupId, state, statePosition); + } + + public static Block evaluateFinal(GroupingState state, IntVector selected, DriverContext driverContext) { + return state.toBlock(driverContext.blockFactory(), selected); + } + + public static class GroupingState implements Releasable { + private final BytesRefBucketedSort sort; + + private GroupingState(BigArrays bigArrays, int limit, boolean ascending) { + // TODO pass the breaker in from the DriverContext + CircuitBreaker breaker = bigArrays.breakerService().getBreaker(CircuitBreaker.REQUEST); + this.sort = new BytesRefBucketedSort(breaker, "top", bigArrays, ascending ? 
SortOrder.ASC : SortOrder.DESC, limit); + } + + public void add(int groupId, BytesRef value) { + sort.collect(value, groupId); + } + + public void merge(int groupId, GroupingState other, int otherGroupId) { + sort.merge(groupId, other.sort, otherGroupId); + } + + void toIntermediate(Block[] blocks, int offset, IntVector selected, DriverContext driverContext) { + blocks[offset] = toBlock(driverContext.blockFactory(), selected); + } + + Block toBlock(BlockFactory blockFactory, IntVector selected) { + return sort.toBlock(blockFactory, selected); + } + + void enableGroupIdTracking(SeenGroupIds seen) { + // we figure out seen values from nulls on the values block + } + + @Override + public void close() { + Releasables.closeExpectNoException(sort); + } + } + + public static class SingleState implements Releasable { + private final GroupingState internalState; + + private SingleState(BigArrays bigArrays, int limit, boolean ascending) { + this.internalState = new GroupingState(bigArrays, limit, ascending); + } + + public void add(BytesRef value) { + internalState.add(0, value); + } + + public void merge(GroupingState other) { + internalState.merge(0, other, 0); + } + + void toIntermediate(Block[] blocks, int offset, DriverContext driverContext) { + blocks[offset] = toBlock(driverContext.blockFactory()); + } + + Block toBlock(BlockFactory blockFactory) { + try (var intValues = blockFactory.newConstantIntVector(0, 1)) { + return internalState.toBlock(blockFactory, intValues); + } + } + + @Override + public void close() { + Releasables.closeExpectNoException(internalState); + } + } +} diff --git a/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunction.java b/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunction.java new file mode 100644 index 0000000000000..17b3d84ab0028 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunction.java @@ -0,0 +1,174 @@ +// Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one +// or more contributor license agreements. Licensed under the Elastic License +// 2.0; you may not use this file except in compliance with the Elastic License +// 2.0. +package org.elasticsearch.compute.aggregation; + +import java.lang.Integer; +import java.lang.Override; +import java.lang.String; +import java.lang.StringBuilder; +import java.util.List; +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BooleanVector; +import org.elasticsearch.compute.data.BytesRefBlock; +import org.elasticsearch.compute.data.BytesRefVector; +import org.elasticsearch.compute.data.ElementType; +import org.elasticsearch.compute.data.Page; +import org.elasticsearch.compute.operator.DriverContext; + +/** + * {@link AggregatorFunction} implementation for {@link TopBytesRefAggregator}. + * This class is generated. Do not edit it. 
+ */ +public final class TopBytesRefAggregatorFunction implements AggregatorFunction { + private static final List INTERMEDIATE_STATE_DESC = List.of( + new IntermediateStateDesc("top", ElementType.BYTES_REF) ); + + private final DriverContext driverContext; + + private final TopBytesRefAggregator.SingleState state; + + private final List channels; + + private final int limit; + + private final boolean ascending; + + public TopBytesRefAggregatorFunction(DriverContext driverContext, List channels, + TopBytesRefAggregator.SingleState state, int limit, boolean ascending) { + this.driverContext = driverContext; + this.channels = channels; + this.state = state; + this.limit = limit; + this.ascending = ascending; + } + + public static TopBytesRefAggregatorFunction create(DriverContext driverContext, + List channels, int limit, boolean ascending) { + return new TopBytesRefAggregatorFunction(driverContext, channels, TopBytesRefAggregator.initSingle(driverContext.bigArrays(), limit, ascending), limit, ascending); + } + + public static List intermediateStateDesc() { + return INTERMEDIATE_STATE_DESC; + } + + @Override + public int intermediateBlockCount() { + return INTERMEDIATE_STATE_DESC.size(); + } + + @Override + public void addRawInput(Page page, BooleanVector mask) { + if (mask.isConstant()) { + if (mask.getBoolean(0) == false) { + // Entire page masked away + return; + } + // No masking + BytesRefBlock block = page.getBlock(channels.get(0)); + BytesRefVector vector = block.asVector(); + if (vector != null) { + addRawVector(vector); + } else { + addRawBlock(block); + } + return; + } + // Some positions masked away, others kept + BytesRefBlock block = page.getBlock(channels.get(0)); + BytesRefVector vector = block.asVector(); + if (vector != null) { + addRawVector(vector, mask); + } else { + addRawBlock(block, mask); + } + } + + private void addRawVector(BytesRefVector vector) { + BytesRef scratch = new BytesRef(); + for (int i = 0; i < vector.getPositionCount(); i++) { + TopBytesRefAggregator.combine(state, vector.getBytesRef(i, scratch)); + } + } + + private void addRawVector(BytesRefVector vector, BooleanVector mask) { + BytesRef scratch = new BytesRef(); + for (int i = 0; i < vector.getPositionCount(); i++) { + if (mask.getBoolean(i) == false) { + continue; + } + TopBytesRefAggregator.combine(state, vector.getBytesRef(i, scratch)); + } + } + + private void addRawBlock(BytesRefBlock block) { + BytesRef scratch = new BytesRef(); + for (int p = 0; p < block.getPositionCount(); p++) { + if (block.isNull(p)) { + continue; + } + int start = block.getFirstValueIndex(p); + int end = start + block.getValueCount(p); + for (int i = start; i < end; i++) { + TopBytesRefAggregator.combine(state, block.getBytesRef(i, scratch)); + } + } + } + + private void addRawBlock(BytesRefBlock block, BooleanVector mask) { + BytesRef scratch = new BytesRef(); + for (int p = 0; p < block.getPositionCount(); p++) { + if (mask.getBoolean(p) == false) { + continue; + } + if (block.isNull(p)) { + continue; + } + int start = block.getFirstValueIndex(p); + int end = start + block.getValueCount(p); + for (int i = start; i < end; i++) { + TopBytesRefAggregator.combine(state, block.getBytesRef(i, scratch)); + } + } + } + + @Override + public void addIntermediateInput(Page page) { + assert channels.size() == intermediateBlockCount(); + assert page.getBlockCount() >= channels.get(0) + intermediateStateDesc().size(); + Block topUncast = page.getBlock(channels.get(0)); + if (topUncast.areAllValuesNull()) { + return; + } + 
BytesRefBlock top = (BytesRefBlock) topUncast; + assert top.getPositionCount() == 1; + BytesRef scratch = new BytesRef(); + TopBytesRefAggregator.combineIntermediate(state, top); + } + + @Override + public void evaluateIntermediate(Block[] blocks, int offset, DriverContext driverContext) { + state.toIntermediate(blocks, offset, driverContext); + } + + @Override + public void evaluateFinal(Block[] blocks, int offset, DriverContext driverContext) { + blocks[offset] = TopBytesRefAggregator.evaluateFinal(state, driverContext); + } + + @Override + public String toString() { + StringBuilder sb = new StringBuilder(); + sb.append(getClass().getSimpleName()).append("["); + sb.append("channels=").append(channels); + sb.append("]"); + return sb.toString(); + } + + @Override + public void close() { + state.close(); + } +} diff --git a/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionSupplier.java b/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionSupplier.java new file mode 100644 index 0000000000000..8c77d2116bf69 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionSupplier.java @@ -0,0 +1,45 @@ +// Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one +// or more contributor license agreements. Licensed under the Elastic License +// 2.0; you may not use this file except in compliance with the Elastic License +// 2.0. +package org.elasticsearch.compute.aggregation; + +import java.lang.Integer; +import java.lang.Override; +import java.lang.String; +import java.util.List; +import org.elasticsearch.compute.operator.DriverContext; + +/** + * {@link AggregatorFunctionSupplier} implementation for {@link TopBytesRefAggregator}. + * This class is generated. Do not edit it. + */ +public final class TopBytesRefAggregatorFunctionSupplier implements AggregatorFunctionSupplier { + private final List channels; + + private final int limit; + + private final boolean ascending; + + public TopBytesRefAggregatorFunctionSupplier(List channels, int limit, + boolean ascending) { + this.channels = channels; + this.limit = limit; + this.ascending = ascending; + } + + @Override + public TopBytesRefAggregatorFunction aggregator(DriverContext driverContext) { + return TopBytesRefAggregatorFunction.create(driverContext, channels, limit, ascending); + } + + @Override + public TopBytesRefGroupingAggregatorFunction groupingAggregator(DriverContext driverContext) { + return TopBytesRefGroupingAggregatorFunction.create(channels, driverContext, limit, ascending); + } + + @Override + public String describe() { + return "top of bytes"; + } +} diff --git a/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunction.java b/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunction.java new file mode 100644 index 0000000000000..aa2d6094c8c3f --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/generated/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunction.java @@ -0,0 +1,221 @@ +// Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one +// or more contributor license agreements. Licensed under the Elastic License +// 2.0; you may not use this file except in compliance with the Elastic License +// 2.0. 
+package org.elasticsearch.compute.aggregation; + +import java.lang.Integer; +import java.lang.Override; +import java.lang.String; +import java.lang.StringBuilder; +import java.util.List; +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BytesRefBlock; +import org.elasticsearch.compute.data.BytesRefVector; +import org.elasticsearch.compute.data.ElementType; +import org.elasticsearch.compute.data.IntBlock; +import org.elasticsearch.compute.data.IntVector; +import org.elasticsearch.compute.data.Page; +import org.elasticsearch.compute.operator.DriverContext; + +/** + * {@link GroupingAggregatorFunction} implementation for {@link TopBytesRefAggregator}. + * This class is generated. Do not edit it. + */ +public final class TopBytesRefGroupingAggregatorFunction implements GroupingAggregatorFunction { + private static final List INTERMEDIATE_STATE_DESC = List.of( + new IntermediateStateDesc("top", ElementType.BYTES_REF) ); + + private final TopBytesRefAggregator.GroupingState state; + + private final List channels; + + private final DriverContext driverContext; + + private final int limit; + + private final boolean ascending; + + public TopBytesRefGroupingAggregatorFunction(List channels, + TopBytesRefAggregator.GroupingState state, DriverContext driverContext, int limit, + boolean ascending) { + this.channels = channels; + this.state = state; + this.driverContext = driverContext; + this.limit = limit; + this.ascending = ascending; + } + + public static TopBytesRefGroupingAggregatorFunction create(List channels, + DriverContext driverContext, int limit, boolean ascending) { + return new TopBytesRefGroupingAggregatorFunction(channels, TopBytesRefAggregator.initGrouping(driverContext.bigArrays(), limit, ascending), driverContext, limit, ascending); + } + + public static List intermediateStateDesc() { + return INTERMEDIATE_STATE_DESC; + } + + @Override + public int intermediateBlockCount() { + return INTERMEDIATE_STATE_DESC.size(); + } + + @Override + public GroupingAggregatorFunction.AddInput prepareProcessPage(SeenGroupIds seenGroupIds, + Page page) { + BytesRefBlock valuesBlock = page.getBlock(channels.get(0)); + BytesRefVector valuesVector = valuesBlock.asVector(); + if (valuesVector == null) { + if (valuesBlock.mayHaveNulls()) { + state.enableGroupIdTracking(seenGroupIds); + } + return new GroupingAggregatorFunction.AddInput() { + @Override + public void add(int positionOffset, IntBlock groupIds) { + addRawInput(positionOffset, groupIds, valuesBlock); + } + + @Override + public void add(int positionOffset, IntVector groupIds) { + addRawInput(positionOffset, groupIds, valuesBlock); + } + + @Override + public void close() { + } + }; + } + return new GroupingAggregatorFunction.AddInput() { + @Override + public void add(int positionOffset, IntBlock groupIds) { + addRawInput(positionOffset, groupIds, valuesVector); + } + + @Override + public void add(int positionOffset, IntVector groupIds) { + addRawInput(positionOffset, groupIds, valuesVector); + } + + @Override + public void close() { + } + }; + } + + private void addRawInput(int positionOffset, IntVector groups, BytesRefBlock values) { + BytesRef scratch = new BytesRef(); + for (int groupPosition = 0; groupPosition < groups.getPositionCount(); groupPosition++) { + int groupId = groups.getInt(groupPosition); + if (values.isNull(groupPosition + positionOffset)) { + continue; + } + int valuesStart = values.getFirstValueIndex(groupPosition + positionOffset); + int valuesEnd = 
valuesStart + values.getValueCount(groupPosition + positionOffset); + for (int v = valuesStart; v < valuesEnd; v++) { + TopBytesRefAggregator.combine(state, groupId, values.getBytesRef(v, scratch)); + } + } + } + + private void addRawInput(int positionOffset, IntVector groups, BytesRefVector values) { + BytesRef scratch = new BytesRef(); + for (int groupPosition = 0; groupPosition < groups.getPositionCount(); groupPosition++) { + int groupId = groups.getInt(groupPosition); + TopBytesRefAggregator.combine(state, groupId, values.getBytesRef(groupPosition + positionOffset, scratch)); + } + } + + private void addRawInput(int positionOffset, IntBlock groups, BytesRefBlock values) { + BytesRef scratch = new BytesRef(); + for (int groupPosition = 0; groupPosition < groups.getPositionCount(); groupPosition++) { + if (groups.isNull(groupPosition)) { + continue; + } + int groupStart = groups.getFirstValueIndex(groupPosition); + int groupEnd = groupStart + groups.getValueCount(groupPosition); + for (int g = groupStart; g < groupEnd; g++) { + int groupId = groups.getInt(g); + if (values.isNull(groupPosition + positionOffset)) { + continue; + } + int valuesStart = values.getFirstValueIndex(groupPosition + positionOffset); + int valuesEnd = valuesStart + values.getValueCount(groupPosition + positionOffset); + for (int v = valuesStart; v < valuesEnd; v++) { + TopBytesRefAggregator.combine(state, groupId, values.getBytesRef(v, scratch)); + } + } + } + } + + private void addRawInput(int positionOffset, IntBlock groups, BytesRefVector values) { + BytesRef scratch = new BytesRef(); + for (int groupPosition = 0; groupPosition < groups.getPositionCount(); groupPosition++) { + if (groups.isNull(groupPosition)) { + continue; + } + int groupStart = groups.getFirstValueIndex(groupPosition); + int groupEnd = groupStart + groups.getValueCount(groupPosition); + for (int g = groupStart; g < groupEnd; g++) { + int groupId = groups.getInt(g); + TopBytesRefAggregator.combine(state, groupId, values.getBytesRef(groupPosition + positionOffset, scratch)); + } + } + } + + @Override + public void selectedMayContainUnseenGroups(SeenGroupIds seenGroupIds) { + state.enableGroupIdTracking(seenGroupIds); + } + + @Override + public void addIntermediateInput(int positionOffset, IntVector groups, Page page) { + state.enableGroupIdTracking(new SeenGroupIds.Empty()); + assert channels.size() == intermediateBlockCount(); + Block topUncast = page.getBlock(channels.get(0)); + if (topUncast.areAllValuesNull()) { + return; + } + BytesRefBlock top = (BytesRefBlock) topUncast; + BytesRef scratch = new BytesRef(); + for (int groupPosition = 0; groupPosition < groups.getPositionCount(); groupPosition++) { + int groupId = groups.getInt(groupPosition); + TopBytesRefAggregator.combineIntermediate(state, groupId, top, groupPosition + positionOffset); + } + } + + @Override + public void addIntermediateRowInput(int groupId, GroupingAggregatorFunction input, int position) { + if (input.getClass() != getClass()) { + throw new IllegalArgumentException("expected " + getClass() + "; got " + input.getClass()); + } + TopBytesRefAggregator.GroupingState inState = ((TopBytesRefGroupingAggregatorFunction) input).state; + state.enableGroupIdTracking(new SeenGroupIds.Empty()); + TopBytesRefAggregator.combineStates(state, groupId, inState, position); + } + + @Override + public void evaluateIntermediate(Block[] blocks, int offset, IntVector selected) { + state.toIntermediate(blocks, offset, selected, driverContext); + } + + @Override + public void 
evaluateFinal(Block[] blocks, int offset, IntVector selected, + DriverContext driverContext) { + blocks[offset] = TopBytesRefAggregator.evaluateFinal(state, selected, driverContext); + } + + @Override + public String toString() { + StringBuilder sb = new StringBuilder(); + sb.append(getClass().getSimpleName()).append("["); + sb.append("channels=").append(channels); + sb.append("]"); + return sb.toString(); + } + + @Override + public void close() { + state.close(); + } +} diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/aggregation/X-TopAggregator.java.st b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/aggregation/X-TopAggregator.java.st index b97d26ee6147d..18d573eea4a4c 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/aggregation/X-TopAggregator.java.st +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/aggregation/X-TopAggregator.java.st @@ -7,9 +7,12 @@ package org.elasticsearch.compute.aggregation; -$if(Ip)$ +$if(BytesRef || Ip)$ import org.apache.lucene.util.BytesRef; $endif$ +$if(BytesRef)$ +import org.elasticsearch.common.breaker.CircuitBreaker; +$endif$ import org.elasticsearch.common.util.BigArrays; import org.elasticsearch.compute.ann.Aggregator; import org.elasticsearch.compute.ann.GroupingAggregator; @@ -49,7 +52,7 @@ class Top$Name$Aggregator { public static void combineIntermediate(SingleState state, $Type$Block values) { int start = values.getFirstValueIndex(0); int end = start + values.getValueCount(0); -$if(Ip)$ +$if(BytesRef || Ip)$ var scratch = new BytesRef(); for (int i = start; i < end; i++) { combine(state, values.get$Type$(i, scratch)); @@ -76,7 +79,7 @@ $endif$ public static void combineIntermediate(GroupingState state, int groupId, $Type$Block values, int valuesPosition) { int start = values.getFirstValueIndex(valuesPosition); int end = start + values.getValueCount(valuesPosition); -$if(Ip)$ +$if(BytesRef || Ip)$ var scratch = new BytesRef(); for (int i = start; i < end; i++) { combine(state, groupId, values.get$Type$(i, scratch)); @@ -100,7 +103,13 @@ $endif$ private final $Name$BucketedSort sort; private GroupingState(BigArrays bigArrays, int limit, boolean ascending) { +$if(BytesRef)$ + // TODO pass the breaker in from the DriverContext + CircuitBreaker breaker = bigArrays.breakerService().getBreaker(CircuitBreaker.REQUEST); + this.sort = new BytesRefBucketedSort(breaker, "top", bigArrays, ascending ? SortOrder.ASC : SortOrder.DESC, limit); +$else$ this.sort = new $Name$BucketedSort(bigArrays, ascending ? SortOrder.ASC : SortOrder.DESC, limit); +$endif$ } public void add(int groupId, $type$ value) { diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BucketedSortCommon.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BucketedSortCommon.java new file mode 100644 index 0000000000000..58306f2140a82 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BucketedSortCommon.java @@ -0,0 +1,68 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.compute.data.sort; + +import org.elasticsearch.common.util.BigArrays; +import org.elasticsearch.common.util.BitArray; +import org.elasticsearch.core.Releasable; +import org.elasticsearch.search.sort.SortOrder; + +/** + * Components common to BucketedSort implementations. + */ +class BucketedSortCommon implements Releasable { + final BigArrays bigArrays; + final SortOrder order; + final int bucketSize; + + /** + * {@code true} if the bucket is in heap mode, {@code false} if + * it is still gathering. + */ + private final BitArray heapMode; + + BucketedSortCommon(BigArrays bigArrays, SortOrder order, int bucketSize) { + this.bigArrays = bigArrays; + this.order = order; + this.bucketSize = bucketSize; + this.heapMode = new BitArray(0, bigArrays); + } + + /** + * The first index in a bucket. Note that this might not be used. + * See {@link } + */ + long rootIndex(int bucket) { + return (long) bucket * bucketSize; + } + + /** + * The last index in a bucket. + */ + long endIndex(long rootIndex) { + return rootIndex + bucketSize; + } + + boolean inHeapMode(int bucket) { + return heapMode.get(bucket); + } + + void enableHeapMode(int bucket) { + heapMode.set(bucket); + } + + void assertValidNextOffset(int next) { + assert 0 <= next && next < bucketSize + : "Expected next to be in the range of valid buckets [0 <= " + next + " < " + bucketSize + "]"; + } + + @Override + public void close() { + heapMode.close(); + } +} diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSort.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSort.java new file mode 100644 index 0000000000000..9198de53b1e04 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSort.java @@ -0,0 +1,386 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.compute.data.sort; + +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.common.breaker.CircuitBreaker; +import org.elasticsearch.common.util.BigArrays; +import org.elasticsearch.common.util.ByteUtils; +import org.elasticsearch.common.util.ObjectArray; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BlockFactory; +import org.elasticsearch.compute.data.IntVector; +import org.elasticsearch.compute.operator.BreakingBytesRefBuilder; +import org.elasticsearch.core.Assertions; +import org.elasticsearch.core.Releasable; +import org.elasticsearch.core.Releasables; +import org.elasticsearch.search.sort.BucketedSort; +import org.elasticsearch.search.sort.SortOrder; + +import java.util.Arrays; +import java.util.stream.IntStream; +import java.util.stream.LongStream; + +/** + * Aggregates the top N variable length {@link BytesRef} values per bucket. + * See {@link BucketedSort} for more information. + */ +public class BytesRefBucketedSort implements Releasable { + private final BucketedSortCommon common; + private final CircuitBreaker breaker; + private final String label; + + /** + * An array containing all the values on all buckets. The structure is as follows: + *
+ * <p>
+ * For each bucket, there are {@link BucketedSortCommon#bucketSize} elements, based
+ * on the bucket id (0, 1, 2...). Then, for each bucket, it can be in 2 states:
+ * </p>
+ * <ul>
+ *     <li>
+ *         Gather mode: All buckets start in gather mode, and remain here while they have
+ *         less than bucketSize elements. In gather mode, the elements are stored in the
+ *         array from the highest index to the lowest index. The lowest index contains
+ *         the offset to the next slot to be filled.
+ *         <p>
+ *             This allows us to insert elements in O(1) time.
+ *         </p>
+ *         <p>
+ *             When the bucketSize-th element is collected, the bucket transitions to heap
+ *             mode, by heapifying its contents.
+ *         </p>
+ *     </li>
+ *     <li>
+ *         Heap mode: The bucket slots are organized as a min heap structure.
+ *         <p>
+ *             The root of the heap is the minimum value in the bucket,
+ *             which allows us to quickly discard new values that are not in the top N.
+ *         </p>
+ *     </li>
+ * </ul>
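+ * <p>
+ * A worked illustration (added for clarity; the concrete slot contents are an
+ * assumption based on the description above): with {@code bucketSize = 3}, an
+ * empty bucket starts as {@code [offset=2 | _ | _]}. Collecting {@code "b"}
+ * yields {@code [offset=1 | _ | "b"]}, then {@code "a"} yields
+ * {@code [offset=0 | "a" | "b"]}. The third value overwrites the offset slot
+ * itself, and the bucket is heapified.
+ * </p>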
+ */ + private ObjectArray values; + + public BytesRefBucketedSort(CircuitBreaker breaker, String label, BigArrays bigArrays, SortOrder order, int bucketSize) { + this.breaker = breaker; + this.label = label; + common = new BucketedSortCommon(bigArrays, order, bucketSize); + boolean success = false; + try { + values = bigArrays.newObjectArray(0); + success = true; + } finally { + if (success == false) { + close(); + } + } + } + + private void checkInvariant(int bucket) { + if (Assertions.ENABLED == false) { + return; + } + long rootIndex = common.rootIndex(bucket); + long requiredSize = common.endIndex(rootIndex); + if (values.size() < requiredSize) { + throw new AssertionError("values too short " + values.size() + " < " + requiredSize); + } + if (values.get(rootIndex) == null) { + throw new AssertionError("new gather offset can't be null"); + } + if (common.inHeapMode(bucket) == false) { + common.assertValidNextOffset(getNextGatherOffset(rootIndex)); + } else { + for (long l = rootIndex; l < common.endIndex(rootIndex); l++) { + if (values.get(rootIndex) == null) { + throw new AssertionError("values missing in heap mode"); + } + } + } + } + + /** + * Collects a {@code value} into a {@code bucket}. + *
+ * <p>
+ * It may or may not be inserted in the heap, depending on if it is better than the current root.
+ * </p>
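+ * <p>
+ * Worked example (illustrative, not from the original comment): for a
+ * {@link SortOrder#DESC} top-3 whose heap holds {@code [5 | 9 | 7]} (the root
+ * {@code 5} is the minimum kept value), collecting {@code 8} beats the root,
+ * so it replaces {@code 5} and {@code downHeap} leaves {@code [7 | 9 | 8]};
+ * collecting {@code 3} is simply discarded.
+ * </p>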
+ */ + public void collect(BytesRef value, int bucket) { + long rootIndex = common.rootIndex(bucket); + if (common.inHeapMode(bucket)) { + if (betterThan(value, values.get(rootIndex).bytesRefView())) { + clearedBytesAt(rootIndex).append(value); + downHeap(rootIndex, 0); + } + checkInvariant(bucket); + return; + } + // Gathering mode + long requiredSize = common.endIndex(rootIndex); + if (values.size() < requiredSize) { + grow(requiredSize); + } + int next = getNextGatherOffset(rootIndex); + common.assertValidNextOffset(next); + long index = next + rootIndex; + clearedBytesAt(index).append(value); + if (next == 0) { + common.enableHeapMode(bucket); + heapify(rootIndex); + } else { + ByteUtils.writeIntLE(next - 1, values.get(rootIndex).bytes(), 0); + } + checkInvariant(bucket); + } + + /** + * Merge the values from {@code other}'s {@code otherGroupId} into {@code groupId}. + */ + public void merge(int bucket, BytesRefBucketedSort other, int otherBucket) { + long otherRootIndex = other.common.rootIndex(otherBucket); + if (otherRootIndex >= other.values.size()) { + // The value was never collected. + return; + } + other.checkInvariant(bucket); + long otherStart = other.startIndex(otherBucket, otherRootIndex); + long otherEnd = other.common.endIndex(otherRootIndex); + // TODO: This can be improved for heapified buckets by making use of the heap structures + for (long i = otherStart; i < otherEnd; i++) { + collect(other.values.get(i).bytesRefView(), bucket); + } + } + + /** + * Creates a block with the values from the {@code selected} groups. + */ + public Block toBlock(BlockFactory blockFactory, IntVector selected) { + // Check if the selected groups are all empty, to avoid allocating extra memory + if (IntStream.range(0, selected.getPositionCount()).map(selected::getInt).noneMatch(bucket -> { + long rootIndex = common.rootIndex(bucket); + if (rootIndex >= values.size()) { + // Never collected + return false; + } + long start = startIndex(bucket, rootIndex); + long end = common.endIndex(rootIndex); + long size = end - start; + return size > 0; + })) { + return blockFactory.newConstantNullBlock(selected.getPositionCount()); + } + + // Used to sort the values in the bucket. 
+ BytesRef[] bucketValues = new BytesRef[common.bucketSize]; + + try (var builder = blockFactory.newBytesRefBlockBuilder(selected.getPositionCount())) { + for (int s = 0; s < selected.getPositionCount(); s++) { + int bucket = selected.getInt(s); + long rootIndex = common.rootIndex(bucket); + if (rootIndex >= values.size()) { + // Never collected + builder.appendNull(); + continue; + } + + long start = startIndex(bucket, rootIndex); + long end = common.endIndex(rootIndex); + long size = end - start; + + if (size == 0) { + builder.appendNull(); + continue; + } + + if (size == 1) { + try (BreakingBytesRefBuilder bytes = values.get(start)) { + builder.appendBytesRef(bytes.bytesRefView()); + } + values.set(start, null); + continue; + } + + for (int i = 0; i < size; i++) { + try (BreakingBytesRefBuilder bytes = values.get(start + i)) { + bucketValues[i] = bytes.bytesRefView(); + } + values.set(start + i, null); + } + + // TODO: Make use of heap structures to faster iterate in order instead of copying and sorting + Arrays.sort(bucketValues, 0, (int) size); + + builder.beginPositionEntry(); + if (common.order == SortOrder.ASC) { + for (int i = 0; i < size; i++) { + builder.appendBytesRef(bucketValues[i]); + } + } else { + for (int i = (int) size - 1; i >= 0; i--) { + builder.appendBytesRef(bucketValues[i]); + } + } + builder.endPositionEntry(); + } + return builder.build(); + } + } + + private long startIndex(int bucket, long rootIndex) { + if (common.inHeapMode(bucket)) { + return rootIndex; + } + return rootIndex + getNextGatherOffset(rootIndex) + 1; + } + + /** + * Get the next index that should be "gathered" for a bucket rooted + * at {@code rootIndex}. + *
+ * <p>
+ * Using the first 4 bytes of the element to store the next gather offset.
+ * </p>
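+ * <p>
+ * Sketch (restating the surrounding code, added for clarity): while gathering,
+ * the builder at {@code rootIndex} holds exactly {@code Integer.BYTES} bytes,
+ * so the offset round-trips through
+ * {@code ByteUtils.writeIntLE(next - 1, values.get(rootIndex).bytes(), 0)}
+ * and {@code ByteUtils.readIntLE(values.get(rootIndex).bytes(), 0)}.
+ * </p>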
+ */ + private int getNextGatherOffset(long rootIndex) { + BreakingBytesRefBuilder bytes = values.get(rootIndex); + assert bytes.length() == Integer.BYTES; + return ByteUtils.readIntLE(bytes.bytes(), 0); + } + + /** + * {@code true} if the entry at index {@code lhs} is "better" than + * the entry at {@code rhs}. "Better" in this means "lower" for + * {@link SortOrder#ASC} and "higher" for {@link SortOrder#DESC}. + */ + private boolean betterThan(BytesRef lhs, BytesRef rhs) { + return common.order.reverseMul() * lhs.compareTo(rhs) < 0; + } + + /** + * Swap the data at two indices. + */ + private void swap(long lhs, long rhs) { + BreakingBytesRefBuilder tmp = values.get(lhs); + values.set(lhs, values.get(rhs)); + values.set(rhs, tmp); + } + + /** + * Allocate storage for more buckets and store the "next gather offset" + * for those new buckets. + */ + private void grow(long requiredSize) { + long oldMax = values.size(); + values = common.bigArrays.grow(values, requiredSize); + // Set the next gather offsets for all newly allocated buckets. + fillGatherOffsets(oldMax - (oldMax % common.bucketSize)); + } + + /** + * Maintain the "next gather offsets" for newly allocated buckets. + */ + private void fillGatherOffsets(long startingAt) { + assert startingAt % common.bucketSize == 0; + int nextOffset = common.bucketSize - 1; + for (long bucketRoot = startingAt; bucketRoot < values.size(); bucketRoot += common.bucketSize) { + BreakingBytesRefBuilder bytes = values.get(bucketRoot); + if (bytes != null) { + continue; + } + bytes = new BreakingBytesRefBuilder(breaker, label); + values.set(bucketRoot, bytes); + bytes.grow(Integer.BYTES); + bytes.setLength(Integer.BYTES); + ByteUtils.writeIntLE(nextOffset, bytes.bytes(), 0); + } + } + + /** + * Heapify a bucket whose entries are in random order. + *
+ * <p>
+ * This works by validating the heap property on each node, iterating
+ * "upwards", pushing any out of order parents "down". Check out the
+ * <a href="https://en.wikipedia.org/wiki/Binary_heap">wikipedia</a>
+ * entry on binary heaps for more about this.
+ * </p>
+ * <p>
+ * While this *looks* like it could easily be {@code O(n * log n)}, it is
+ * a fairly well studied algorithm attributed to Floyd. There's
+ * been a bunch of work that puts this at {@code O(n)}, close to 1.88n worst
+ * case.
+ * </p>
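+ * <p>
+ * Worked example (illustrative, not from the original comment): with
+ * {@code bucketSize = 3} and {@link SortOrder#DESC}, freshly gathered contents
+ * {@code [9 | 4 | 7]} heapify into {@code [4 | 9 | 7]}: the root holds the
+ * minimum, i.e. the first value a better candidate will evict.
+ * </p>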
+ * + * @param rootIndex the index the start of the bucket + */ + private void heapify(long rootIndex) { + int maxParent = common.bucketSize / 2 - 1; + for (int parent = maxParent; parent >= 0; parent--) { + downHeap(rootIndex, parent); + } + } + + /** + * Correct the heap invariant of a parent and its children. This + * runs in {@code O(log n)} time. + * @param rootIndex index of the start of the bucket + * @param parent Index within the bucket of the parent to check. + * For example, 0 is the "root". + */ + private void downHeap(long rootIndex, int parent) { + while (true) { + long parentIndex = rootIndex + parent; + int worst = parent; + long worstIndex = parentIndex; + int leftChild = parent * 2 + 1; + long leftIndex = rootIndex + leftChild; + if (leftChild < common.bucketSize) { + if (betterThan(values.get(worstIndex).bytesRefView(), values.get(leftIndex).bytesRefView())) { + worst = leftChild; + worstIndex = leftIndex; + } + int rightChild = leftChild + 1; + long rightIndex = rootIndex + rightChild; + if (rightChild < common.bucketSize + && betterThan(values.get(worstIndex).bytesRefView(), values.get(rightIndex).bytesRefView())) { + + worst = rightChild; + worstIndex = rightIndex; + } + } + if (worst == parent) { + break; + } + swap(worstIndex, parentIndex); + parent = worst; + } + } + + private BreakingBytesRefBuilder clearedBytesAt(long index) { + BreakingBytesRefBuilder bytes = values.get(index); + if (bytes == null) { + bytes = new BreakingBytesRefBuilder(breaker, label); + values.set(index, bytes); + } else { + bytes.clear(); + } + return bytes; + } + + @Override + public final void close() { + Releasable allValues = values == null ? () -> {} : Releasables.wrap(LongStream.range(0, values.size()).mapToObj(i -> { + BreakingBytesRefBuilder bytes = values.get(i); + return bytes == null ? (Releasable) () -> {} : bytes; + }).toList().iterator()); + Releasables.close(allValues, values, common); + } +} diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/IpBucketedSort.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/IpBucketedSort.java index 0fd38c18d7504..4eb31ea30db22 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/IpBucketedSort.java +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/sort/IpBucketedSort.java @@ -9,7 +9,6 @@ import org.apache.lucene.util.BytesRef; import org.elasticsearch.common.util.BigArrays; -import org.elasticsearch.common.util.BitArray; import org.elasticsearch.common.util.ByteArray; import org.elasticsearch.common.util.ByteUtils; import org.elasticsearch.compute.data.Block; @@ -29,7 +28,7 @@ * See {@link BucketedSort} for more information. */ public class IpBucketedSort implements Releasable { - private static final int IP_LENGTH = 16; + private static final int IP_LENGTH = 16; // Bytes. It's ipv6. // BytesRefs used in internal methods private final BytesRef scratch1 = new BytesRef(); @@ -39,18 +38,11 @@ public class IpBucketedSort implements Releasable { */ private final byte[] scratchBytes = new byte[IP_LENGTH]; - private final BigArrays bigArrays; - private final SortOrder order; - private final int bucketSize; - /** - * {@code true} if the bucket is in heap mode, {@code false} if - * it is still gathering. - */ - private final BitArray heapMode; + private final BucketedSortCommon common; /** * An array containing all the values on all buckets. The structure is as follows: *
 * <p>
- * For each bucket, there are bucketSize elements, based on the bucket id (0, 1, 2...).
+ * For each bucket, there are {@link BucketedSortCommon#bucketSize} elements, based on the bucket id (0, 1, 2...).
 * Then, for each bucket, it can be in 2 states:
 * </p>
 * <ul>
    @@ -77,10 +69,7 @@ public class IpBucketedSort implements Releasable { private ByteArray values; public IpBucketedSort(BigArrays bigArrays, SortOrder order, int bucketSize) { - this.bigArrays = bigArrays; - this.order = order; - this.bucketSize = bucketSize; - heapMode = new BitArray(0, bigArrays); + this.common = new BucketedSortCommon(bigArrays, order, bucketSize); boolean success = false; try { @@ -101,8 +90,8 @@ public IpBucketedSort(BigArrays bigArrays, SortOrder order, int bucketSize) { */ public void collect(BytesRef value, int bucket) { assert value.length == IP_LENGTH; - long rootIndex = (long) bucket * bucketSize; - if (inHeapMode(bucket)) { + long rootIndex = common.rootIndex(bucket); + if (common.inHeapMode(bucket)) { if (betterThan(value, get(rootIndex, scratch1))) { set(rootIndex, value); downHeap(rootIndex, 0); @@ -110,49 +99,34 @@ public void collect(BytesRef value, int bucket) { return; } // Gathering mode - long requiredSize = (rootIndex + bucketSize) * IP_LENGTH; + long requiredSize = common.endIndex(rootIndex) * IP_LENGTH; if (values.size() < requiredSize) { grow(requiredSize); } int next = getNextGatherOffset(rootIndex); - assert 0 <= next && next < bucketSize - : "Expected next to be in the range of valid buckets [0 <= " + next + " < " + bucketSize + "]"; + common.assertValidNextOffset(next); long index = next + rootIndex; set(index, value); if (next == 0) { - heapMode.set(bucket); + common.enableHeapMode(bucket); heapify(rootIndex); } else { setNextGatherOffset(rootIndex, next - 1); } } - /** - * The order of the sort. - */ - public SortOrder getOrder() { - return order; - } - - /** - * The number of values to store per bucket. - */ - public int getBucketSize() { - return bucketSize; - } - /** * Get the first and last indexes (inclusive, exclusive) of the values for a bucket. * Returns [0, 0] if the bucket has never been collected. */ private Tuple getBucketValuesIndexes(int bucket) { - long rootIndex = (long) bucket * bucketSize; + long rootIndex = common.rootIndex(bucket); if (rootIndex >= values.size() / IP_LENGTH) { // We've never seen this bucket. return Tuple.tuple(0L, 0L); } - long start = inHeapMode(bucket) ? rootIndex : (rootIndex + getNextGatherOffset(rootIndex) + 1); - long end = rootIndex + bucketSize; + long start = startIndex(bucket, rootIndex); + long end = common.endIndex(rootIndex); return Tuple.tuple(start, end); } @@ -184,7 +158,7 @@ public Block toBlock(BlockFactory blockFactory, IntVector selected) { } // Used to sort the values in the bucket. - var bucketValues = new BytesRef[bucketSize]; + var bucketValues = new BytesRef[common.bucketSize]; try (var builder = blockFactory.newBytesRefBlockBuilder(selected.getPositionCount())) { for (int s = 0; s < selected.getPositionCount(); s++) { @@ -211,7 +185,7 @@ public Block toBlock(BlockFactory blockFactory, IntVector selected) { Arrays.sort(bucketValues, 0, (int) size); builder.beginPositionEntry(); - if (order == SortOrder.ASC) { + if (common.order == SortOrder.ASC) { for (int i = 0; i < size; i++) { builder.appendBytesRef(bucketValues[i]); } @@ -226,11 +200,11 @@ public Block toBlock(BlockFactory blockFactory, IntVector selected) { } } - /** - * Is this bucket a min heap {@code true} or in gathering mode {@code false}? 
- */ - private boolean inHeapMode(int bucket) { - return heapMode.get(bucket); + private long startIndex(int bucket, long rootIndex) { + if (common.inHeapMode(bucket)) { + return rootIndex; + } + return rootIndex + getNextGatherOffset(rootIndex) + 1; } /** @@ -267,7 +241,7 @@ private void setNextGatherOffset(long rootIndex, int offset) { * {@link SortOrder#ASC} and "higher" for {@link SortOrder#DESC}. */ private boolean betterThan(BytesRef lhs, BytesRef rhs) { - return getOrder().reverseMul() * lhs.compareTo(rhs) < 0; + return common.order.reverseMul() * lhs.compareTo(rhs) < 0; } /** @@ -296,17 +270,17 @@ private void swap(long lhs, long rhs) { */ private void grow(long minSize) { long oldMax = values.size() / IP_LENGTH; - values = bigArrays.grow(values, minSize); + values = common.bigArrays.grow(values, minSize); // Set the next gather offsets for all newly allocated buckets. - setNextGatherOffsets(oldMax - (oldMax % bucketSize)); + setNextGatherOffsets(oldMax - (oldMax % common.bucketSize)); } /** * Maintain the "next gather offsets" for newly allocated buckets. */ private void setNextGatherOffsets(long startingAt) { - int nextOffset = bucketSize - 1; - for (long bucketRoot = startingAt; bucketRoot < values.size() / IP_LENGTH; bucketRoot += bucketSize) { + int nextOffset = common.bucketSize - 1; + for (long bucketRoot = startingAt; bucketRoot < values.size() / IP_LENGTH; bucketRoot += common.bucketSize) { setNextGatherOffset(bucketRoot, nextOffset); } } @@ -334,7 +308,7 @@ private void setNextGatherOffsets(long startingAt) { * @param rootIndex the index the start of the bucket */ private void heapify(long rootIndex) { - int maxParent = bucketSize / 2 - 1; + int maxParent = common.bucketSize / 2 - 1; for (int parent = maxParent; parent >= 0; parent--) { downHeap(rootIndex, parent); } @@ -354,14 +328,14 @@ private void downHeap(long rootIndex, int parent) { long worstIndex = parentIndex; int leftChild = parent * 2 + 1; long leftIndex = rootIndex + leftChild; - if (leftChild < bucketSize) { + if (leftChild < common.bucketSize) { if (betterThan(get(worstIndex, scratch1), get(leftIndex, scratch2))) { worst = leftChild; worstIndex = leftIndex; } int rightChild = leftChild + 1; long rightIndex = rootIndex + rightChild; - if (rightChild < bucketSize && betterThan(get(worstIndex, scratch1), get(rightIndex, scratch2))) { + if (rightChild < common.bucketSize && betterThan(get(worstIndex, scratch1), get(rightIndex, scratch2))) { worst = rightChild; worstIndex = rightIndex; } @@ -400,6 +374,6 @@ private void set(long index, BytesRef value) { @Override public final void close() { - Releasables.close(values, heapMode); + Releasables.close(values, common); } } diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefAggregatorFunctionTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefAggregatorFunctionTests.java new file mode 100644 index 0000000000000..2815dd70e8124 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefAggregatorFunctionTests.java @@ -0,0 +1,37 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.compute.aggregation; + +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BlockFactory; +import org.elasticsearch.compute.data.BlockUtils; +import org.elasticsearch.compute.operator.SequenceBytesRefBlockSourceOperator; +import org.elasticsearch.compute.operator.SourceOperator; + +import java.util.List; +import java.util.stream.IntStream; + +import static org.hamcrest.Matchers.contains; + +abstract class AbstractTopBytesRefAggregatorFunctionTests extends AggregatorFunctionTestCase { + static final int LIMIT = 100; + + @Override + protected final SourceOperator simpleInput(BlockFactory blockFactory, int size) { + return new SequenceBytesRefBlockSourceOperator(blockFactory, IntStream.range(0, size).mapToObj(l -> randomValue())); + } + + protected abstract BytesRef randomValue(); + + @Override + public final void assertSimpleOutput(List input, Block result) { + Object[] values = input.stream().flatMap(AggregatorFunctionTestCase::allBytesRefs).sorted().limit(LIMIT).toArray(Object[]::new); + assertThat((List) BlockUtils.toJavaObject(result, 0), contains(values)); + } +} diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefGroupingAggregatorFunctionTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefGroupingAggregatorFunctionTests.java new file mode 100644 index 0000000000000..45c8a23dfc1c0 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/AbstractTopBytesRefGroupingAggregatorFunctionTests.java @@ -0,0 +1,49 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.compute.aggregation; + +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BlockFactory; +import org.elasticsearch.compute.data.BlockUtils; +import org.elasticsearch.compute.data.Page; +import org.elasticsearch.compute.operator.LongBytesRefTupleBlockSourceOperator; +import org.elasticsearch.compute.operator.SourceOperator; +import org.elasticsearch.core.Tuple; + +import java.util.List; +import java.util.stream.IntStream; + +import static org.hamcrest.Matchers.contains; +import static org.hamcrest.Matchers.equalTo; + +public abstract class AbstractTopBytesRefGroupingAggregatorFunctionTests extends GroupingAggregatorFunctionTestCase { + static final int LIMIT = 100; + + @Override + protected final SourceOperator simpleInput(BlockFactory blockFactory, int size) { + return new LongBytesRefTupleBlockSourceOperator( + blockFactory, + IntStream.range(0, size).mapToObj(l -> Tuple.tuple(randomLongBetween(0, 4), randomValue())) + ); + } + + protected abstract BytesRef randomValue(); + + @Override + protected final void assertSimpleGroup(List input, Block result, int position, Long group) { + Object[] values = input.stream().flatMap(b -> allBytesRefs(b, group)).sorted().limit(LIMIT).toArray(Object[]::new); + if (values.length == 0) { + assertThat(result.isNull(position), equalTo(true)); + } else if (values.length == 1) { + assertThat(BlockUtils.toJavaObject(result, position), equalTo(values[0])); + } else { + assertThat((List) BlockUtils.toJavaObject(result, position), contains(values)); + } + } +} diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionTests.java new file mode 100644 index 0000000000000..732229c98f9c7 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefAggregatorFunctionTests.java @@ -0,0 +1,29 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.compute.aggregation; + +import org.apache.lucene.util.BytesRef; + +import java.util.List; + +public class TopBytesRefAggregatorFunctionTests extends AbstractTopBytesRefAggregatorFunctionTests { + @Override + protected BytesRef randomValue() { + return new BytesRef(randomAlphaOfLength(10)); + } + + @Override + protected AggregatorFunctionSupplier aggregatorFunction(List inputChannels) { + return new TopBytesRefAggregatorFunctionSupplier(inputChannels, LIMIT, true); + } + + @Override + protected String expectedDescriptionOfAggregator() { + return "top of bytes"; + } +} diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunctionTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunctionTests.java new file mode 100644 index 0000000000000..4932e1abef46d --- /dev/null +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopBytesRefGroupingAggregatorFunctionTests.java @@ -0,0 +1,35 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. 
under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.compute.aggregation; + +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.xpack.esql.core.type.DataType; + +import java.util.List; + +public class TopBytesRefGroupingAggregatorFunctionTests extends AbstractTopBytesRefGroupingAggregatorFunctionTests { + @Override + protected BytesRef randomValue() { + return new BytesRef(randomAlphaOfLength(6)); + } + + @Override + protected final AggregatorFunctionSupplier aggregatorFunction(List inputChannels) { + return new TopBytesRefAggregatorFunctionSupplier(inputChannels, LIMIT, true); + } + + @Override + protected DataType acceptedDataType() { + return DataType.KEYWORD; + } + + @Override + protected String expectedDescriptionOfAggregator() { + return "top of bytes"; + } +} diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpAggregatorFunctionTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpAggregatorFunctionTests.java index 1594f66ed9fe2..840e4cf9af961 100644 --- a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpAggregatorFunctionTests.java +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpAggregatorFunctionTests.java @@ -9,26 +9,13 @@ import org.apache.lucene.document.InetAddressPoint; import org.apache.lucene.util.BytesRef; -import org.elasticsearch.compute.data.Block; -import org.elasticsearch.compute.data.BlockFactory; -import org.elasticsearch.compute.data.BlockUtils; -import org.elasticsearch.compute.operator.SequenceBytesRefBlockSourceOperator; -import org.elasticsearch.compute.operator.SourceOperator; import java.util.List; -import java.util.stream.IntStream; - -import static org.hamcrest.Matchers.contains; - -public class TopIpAggregatorFunctionTests extends AggregatorFunctionTestCase { - private static final int LIMIT = 100; +public class TopIpAggregatorFunctionTests extends AbstractTopBytesRefAggregatorFunctionTests { @Override - protected SourceOperator simpleInput(BlockFactory blockFactory, int size) { - return new SequenceBytesRefBlockSourceOperator( - blockFactory, - IntStream.range(0, size).mapToObj(l -> new BytesRef(InetAddressPoint.encode(randomIp(randomBoolean())))) - ); + protected BytesRef randomValue() { + return new BytesRef(InetAddressPoint.encode(randomIp(randomBoolean()))); } @Override @@ -40,10 +27,4 @@ protected AggregatorFunctionSupplier aggregatorFunction(List inputChann protected String expectedDescriptionOfAggregator() { return "top of ips"; } - - @Override - public void assertSimpleOutput(List input, Block result) { - Object[] values = input.stream().flatMap(b -> allBytesRefs(b)).sorted().limit(LIMIT).toArray(Object[]::new); - assertThat((List) BlockUtils.toJavaObject(result, 0), contains(values)); - } } diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpGroupingAggregatorFunctionTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpGroupingAggregatorFunctionTests.java index da55ff2d7aab3..02bf6b667192b 100644 --- a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpGroupingAggregatorFunctionTests.java +++ 
b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/aggregation/TopIpGroupingAggregatorFunctionTests.java @@ -9,36 +9,14 @@ import org.apache.lucene.document.InetAddressPoint; import org.apache.lucene.util.BytesRef; -import org.elasticsearch.compute.data.Block; -import org.elasticsearch.compute.data.BlockFactory; -import org.elasticsearch.compute.data.BlockUtils; -import org.elasticsearch.compute.data.Page; -import org.elasticsearch.compute.operator.LongBytesRefTupleBlockSourceOperator; -import org.elasticsearch.compute.operator.SourceOperator; -import org.elasticsearch.core.Tuple; import org.elasticsearch.xpack.esql.core.type.DataType; import java.util.List; -import java.util.stream.IntStream; - -import static org.hamcrest.Matchers.contains; -import static org.hamcrest.Matchers.equalTo; - -public class TopIpGroupingAggregatorFunctionTests extends GroupingAggregatorFunctionTestCase { - private static final int LIMIT = 100; +public class TopIpGroupingAggregatorFunctionTests extends AbstractTopBytesRefGroupingAggregatorFunctionTests { @Override - protected SourceOperator simpleInput(BlockFactory blockFactory, int size) { - return new LongBytesRefTupleBlockSourceOperator( - blockFactory, - IntStream.range(0, size) - .mapToObj(l -> Tuple.tuple(randomLongBetween(0, 4), new BytesRef(InetAddressPoint.encode(randomIp(randomBoolean()))))) - ); - } - - @Override - protected DataType acceptedDataType() { - return DataType.IP; + protected BytesRef randomValue() { + return new BytesRef(InetAddressPoint.encode(randomIp(randomBoolean()))); } @Override @@ -47,19 +25,12 @@ protected AggregatorFunctionSupplier aggregatorFunction(List inputChann } @Override - protected String expectedDescriptionOfAggregator() { - return "top of ips"; + protected DataType acceptedDataType() { + return DataType.IP; } @Override - protected void assertSimpleGroup(List input, Block result, int position, Long group) { - Object[] values = input.stream().flatMap(b -> allBytesRefs(b, group)).sorted().limit(LIMIT).toArray(Object[]::new); - if (values.length == 0) { - assertThat(result.isNull(position), equalTo(true)); - } else if (values.length == 1) { - assertThat(BlockUtils.toJavaObject(result, position), equalTo(values[0])); - } else { - assertThat((List) BlockUtils.toJavaObject(result, position), contains(values)); - } + protected String expectedDescriptionOfAggregator() { + return "top of ips"; } } diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSortTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSortTests.java new file mode 100644 index 0000000000000..7a4e6658cd646 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/sort/BytesRefBucketedSortTests.java @@ -0,0 +1,79 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.compute.data.sort; + +import org.apache.lucene.document.InetAddressPoint; +import org.apache.lucene.util.BytesRef; +import org.elasticsearch.common.breaker.CircuitBreaker; +import org.elasticsearch.common.util.BigArrays; +import org.elasticsearch.compute.data.Block; +import org.elasticsearch.compute.data.BlockFactory; +import org.elasticsearch.compute.data.BytesRefBlock; +import org.elasticsearch.compute.data.ElementType; +import org.elasticsearch.compute.data.IntVector; +import org.elasticsearch.search.sort.SortOrder; + +import java.util.ArrayList; +import java.util.Collections; +import java.util.List; + +import static org.hamcrest.Matchers.equalTo; + +public class BytesRefBucketedSortTests extends BucketedSortTestCase { + @Override + protected BytesRefBucketedSort build(SortOrder sortOrder, int bucketSize) { + BigArrays bigArrays = bigArrays(); + return new BytesRefBucketedSort( + bigArrays.breakerService().getBreaker(CircuitBreaker.REQUEST), + "test", + bigArrays, + sortOrder, + bucketSize + ); + } + + @Override + protected BytesRef randomValue() { + return new BytesRef(InetAddressPoint.encode(randomIp(randomBoolean()))); + } + + @Override + protected List threeSortedValues() { + List values = new ArrayList<>(); + values.add(new BytesRef(randomAlphaOfLength(10))); + values.add(new BytesRef(randomAlphaOfLength(11))); + values.add(new BytesRef(randomAlphaOfLength(1))); + Collections.sort(values); + return values; + } + + @Override + protected void collect(BytesRefBucketedSort sort, BytesRef value, int bucket) { + sort.collect(value, bucket); + } + + @Override + protected void merge(BytesRefBucketedSort sort, int groupId, BytesRefBucketedSort other, int otherGroupId) { + sort.merge(groupId, other, otherGroupId); + } + + @Override + protected Block toBlock(BytesRefBucketedSort sort, BlockFactory blockFactory, IntVector selected) { + return sort.toBlock(blockFactory, selected); + } + + @Override + protected void assertBlockTypeAndValues(Block block, List values) { + assertThat(block.elementType(), equalTo(ElementType.BYTES_REF)); + var typedBlock = (BytesRefBlock) block; + var scratch = new BytesRef(); + for (int i = 0; i < values.size(); i++) { + assertThat("expected value on block position " + i, typedBlock.getBytesRef(i, scratch), equalTo(values.get(i))); + } + } +} diff --git a/x-pack/plugin/esql/qa/server/mixed-cluster/src/javaRestTest/java/org/elasticsearch/xpack/esql/qa/mixed/MixedClusterEsqlSpecIT.java b/x-pack/plugin/esql/qa/server/mixed-cluster/src/javaRestTest/java/org/elasticsearch/xpack/esql/qa/mixed/MixedClusterEsqlSpecIT.java index d0d6d5fa49c42..08b4794b740d6 100644 --- a/x-pack/plugin/esql/qa/server/mixed-cluster/src/javaRestTest/java/org/elasticsearch/xpack/esql/qa/mixed/MixedClusterEsqlSpecIT.java +++ b/x-pack/plugin/esql/qa/server/mixed-cluster/src/javaRestTest/java/org/elasticsearch/xpack/esql/qa/mixed/MixedClusterEsqlSpecIT.java @@ -72,6 +72,10 @@ public MixedClusterEsqlSpecIT( protected void shouldSkipTest(String testName) throws IOException { super.shouldSkipTest(testName); assumeTrue("Test " + testName + " is skipped on " + bwcVersion, isEnabled(testName, instructions, bwcVersion)); + assumeFalse( + "Skip META tests on mixed version clusters because we change it too quickly", + testCase.requiredCapabilities.contains("meta") + ); if (mode == ASYNC) { assumeTrue("Async is not supported on " + bwcVersion, supportsAsync()); } diff --git 
a/x-pack/plugin/esql/qa/server/multi-clusters/src/javaRestTest/java/org/elasticsearch/xpack/esql/ccq/MultiClusterSpecIT.java b/x-pack/plugin/esql/qa/server/multi-clusters/src/javaRestTest/java/org/elasticsearch/xpack/esql/ccq/MultiClusterSpecIT.java index 3e799730f7269..8d54dc63598f0 100644 --- a/x-pack/plugin/esql/qa/server/multi-clusters/src/javaRestTest/java/org/elasticsearch/xpack/esql/ccq/MultiClusterSpecIT.java +++ b/x-pack/plugin/esql/qa/server/multi-clusters/src/javaRestTest/java/org/elasticsearch/xpack/esql/ccq/MultiClusterSpecIT.java @@ -112,6 +112,10 @@ protected void shouldSkipTest(String testName) throws IOException { ); assumeFalse("INLINESTATS not yet supported in CCS", testCase.requiredCapabilities.contains("inlinestats")); assumeFalse("INLINESTATS not yet supported in CCS", testCase.requiredCapabilities.contains("inlinestats_v2")); + assumeFalse( + "Skip META tests on mixed version clusters because we change it too quickly", + testCase.requiredCapabilities.contains("meta") + ); } private TestFeatureService remoteFeaturesService() throws IOException { diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/meta.csv-spec b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/meta.csv-spec index 6909f0aeb42f5..2b3fa9dec797d 100644 --- a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/meta.csv-spec +++ b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/meta.csv-spec @@ -1,5 +1,7 @@ -metaFunctionsSynopsis#[skip:-8.15.99] +metaFunctionsSynopsis required_capability: date_nanos_type +required_capability: meta + meta functions | keep synopsis; synopsis:keyword @@ -118,14 +120,16 @@ double tau() "keyword|text to_upper(str:keyword|text)" "version to_ver(field:keyword|text|version)" "version to_version(field:keyword|text|version)" -"boolean|double|integer|long|date|ip top(field:boolean|double|integer|long|date|ip, limit:integer, order:keyword)" +"boolean|double|integer|long|date|ip|keyword|text top(field:boolean|double|integer|long|date|ip|keyword|text, limit:integer, order:keyword)" "keyword|text trim(string:keyword|text)" "boolean|date|double|integer|ip|keyword|long|text|version values(field:boolean|date|double|integer|ip|keyword|long|text|version)" "double weighted_avg(number:double|integer|long, weight:double|integer|long)" ; -metaFunctionsArgs#[skip:-8.15.99] +metaFunctionsArgs +required_capability: meta required_capability: date_nanos_type + META functions | EVAL name = SUBSTRING(name, 0, 14) | KEEP name, argNames, argTypes, argDescriptions; @@ -246,13 +250,15 @@ to_unsigned_lo|field |"boolean|date|keyword|text|d to_upper |str |"keyword|text" |String expression. If `null`, the function returns `null`. to_ver |field |"keyword|text|version" |Input value. The input can be a single- or multi-valued column or an expression. to_version |field |"keyword|text|version" |Input value. The input can be a single- or multi-valued column or an expression. -top |[field, limit, order] |["boolean|double|integer|long|date|ip", integer, keyword] |[The field to collect the top values for.,The maximum number of values to collect.,The order to calculate the top values. Either `asc` or `desc`.] +top |[field, limit, order] |["boolean|double|integer|long|date|ip|keyword|text", integer, keyword] |[The field to collect the top values for.,The maximum number of values to collect.,The order to calculate the top values. Either `asc` or `desc`.] trim |string |"keyword|text" |String expression. If `null`, the function returns `null`. 
values |field |"boolean|date|double|integer|ip|keyword|long|text|version" |[""] weighted_avg |[number, weight] |["double|integer|long", "double|integer|long"] |[A numeric value., A numeric weight.] ; -metaFunctionsDescription#[skip:-8.15.99] +metaFunctionsDescription +required_capability: meta + META functions | EVAL name = SUBSTRING(name, 0, 14) | KEEP name, description @@ -380,8 +386,10 @@ values |Returns all values in a group as a multivalued field. The order o weighted_avg |The weighted average of a numeric expression. ; -metaFunctionsRemaining#[skip:-8.15.99] +metaFunctionsRemaining +required_capability: meta required_capability: date_nanos_type + META functions | EVAL name = SUBSTRING(name, 0, 14) | KEEP name, * @@ -504,13 +512,15 @@ to_unsigned_lo|unsigned_long to_upper |"keyword|text" |false |false |false to_ver |version |false |false |false to_version |version |false |false |false -top |"boolean|double|integer|long|date|ip" |[false, false, false] |false |true +top |"boolean|double|integer|long|date|ip|keyword|text" |[false, false, false] |false |true trim |"keyword|text" |false |false |false values |"boolean|date|double|integer|ip|keyword|long|text|version" |false |false |true weighted_avg |"double" |[false, false] |false |true ; -metaFunctionsFiltered#[skip:-8.15.99] +metaFunctionsFiltered +required_capability: meta + META FUNCTIONS | WHERE STARTS_WITH(name, "sin") ; @@ -520,7 +530,9 @@ sin |"double sin(angle:double|integer|long|unsigned_long)" |angle sinh |"double sinh(number:double|integer|long|unsigned_long)" |number |"double|integer|long|unsigned_long" | "Numeric expression. If `null`, the function returns `null`." | double | "Returns the {wikipedia}/Hyperbolic_functions[hyperbolic sine] of a number." | false | false | false ; -countFunctions#[skip:-8.15.99] +countFunctions +required_capability: meta + meta functions | stats a = count(*), b = count(*), c = count(*) | mv_expand c; a:long | b:long | c:long diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/stats_top.csv-spec b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/stats_top.csv-spec index 86f91adf506d1..80d11425c5bb6 100644 --- a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/stats_top.csv-spec +++ b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/stats_top.csv-spec @@ -224,3 +224,77 @@ a:ip | b:ip | c:ip | host:keyword [fe82::cae2:65ff:fece:fec0, fe81::cae2:65ff:fece:feb9] | [fe82::cae2:65ff:fece:fec0, fe81::cae2:65ff:fece:feb9] | [fe82::cae2:65ff:fece:fec0, fe81::cae2:65ff:fece:feb9] | epsilon [fe80::cae2:65ff:fece:feb9, fe80::cae2:65ff:fece:feb9] | [fe80::cae2:65ff:fece:feb9, fe80::cae2:65ff:fece:feb9] | [fe81::cae2:65ff:fece:feb9, 127.0.0.3] | gamma ; + +topKeywords +required_capability: agg_top +required_capability: agg_top_string_support + +FROM employees +| EVAL calc = SUBSTRING(last_name, 2) +| STATS + first_name = TOP(first_name, 3, "asc"), + last_name = TOP(calc, 3, "asc"), + evil = TOP(CASE(languages <= 2, first_name, last_name), 3, "desc"); + + first_name:keyword | last_name:keyword | evil:keyword +[Alejandro, Amabile, Anneke] | [acello, addadi, aek] | [Zschoche, Zielinski, Zhongwei] +; + +topKeywordsGrouping +required_capability: agg_top +required_capability: agg_top_string_support + +FROM employees +| EVAL calc = SUBSTRING(last_name, 2) +| STATS + first_name = TOP(first_name, 3, "asc"), + last_name = TOP(calc, 3, "asc"), + evil = TOP(CASE(languages <= 2, first_name, last_name), 3, "desc") + BY job_positions +| SORT job_positions +| LIMIT 3; + + first_name:keyword | 
last_name:keyword | evil:keyword | job_positions:keyword + [Arumugam, Bojan, Domenick] | [acello, aine, akrucki] | [Zhongwei, Yinghua, Valdiodio] | Accountant +[Alejandro, Charlene, Danel] | [andell, cAlpine, eistad] | [Stamatiou, Sluis, Sidou] | Architect + [Basil, Breannda, Hidefumi] | [aine, alabarba, ierman] | [Tramer, Syrzycki, Stamatiou] | Business Analyst +; + +topText +required_capability: agg_top +required_capability: agg_top_string_support +# we don't need MATCH, but the loader for books.csv is busted in CsvTests +required_capability: match_operator + +FROM books +| EVAL calc = TRIM(SUBSTRING(title, 2, 5)) +| STATS + title = TOP(title, 3, "desc"), + calc = TOP(calc, 3, "asc"), + evil = TOP(CASE(year < 1980, title, author), 3, "desc"); + +title:text | calc:keyword | evil:text +[Worlds of Exile and Illusion: Three Complete Novels of the Hainish Series in One Volume--Rocannon's World, Planet of Exile, City of Illusions, Woman-The Full Story: A Dynamic Celebration of Freedoms, Winter notes on summer impressions] | ["'Bria", "Gent", "HE UN"] | [William Faulkner, William Faulkner, William Faulkner] +; + +topTextGrouping +required_capability: agg_top +required_capability: agg_top_string_support +# we don't need MATCH, but the loader for books.csv is busted in CsvTests +required_capability: match_operator + +FROM books +| EVAL calc = TRIM(SUBSTRING(title, 2, 5)) +| STATS + title = TOP(title, 3, "desc"), + calc = TOP(calc, 3, "asc"), + evil = TOP(CASE(year < 1980, title, author), 3, "desc") + BY author +| SORT author +| LIMIT 3; + + title:text | calc:keyword | evil:text | author:text + A Tolkien Compass: Including J. R. R. Tolkien's Guide to the Names in The Lord of the Rings | Tolk | A Tolkien Compass: Including J. R. R. Tolkien's Guide to the Names in The Lord of the Rings | Agnes Perkins + The Lord of the Rings Poster Collection: Six Paintings by Alan Lee (No. 1) | he Lo | [J. R. R. Tolkien, Alan Lee] | Alan Lee +A Gentle Creature and Other Stories: White Nights, A Gentle Creature, and The Dream of a Ridiculous Man (The World's Classics) | Gent | [W. J. Leatherbarrow, Fyodor Dostoevsky, Alan Myers] | Alan Myers +; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java index 597c349273eb2..31a3096c13cd2 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java @@ -97,6 +97,11 @@ public enum Cap { */ AGG_TOP_IP_SUPPORT, + /** + * Support for {@code keyword} and {@code text} fields in {@code TOP} aggregation. + */ + AGG_TOP_STRING_SUPPORT, + /** * {@code CASE} properly handling multivalue conditions. */ @@ -251,6 +256,13 @@ public enum Cap { */ MATCH_OPERATOR(true), + /** + * Support for the {@code META} keyword. Tests with this tag are + * intentionally excluded from mixed version clusters because we + * continually add functions, so they constantly fail if we don't. + */ + META, + /** * Add CombineBinaryComparisons rule. 
*/ diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/function/aggregate/Top.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/function/aggregate/Top.java index 4927acc3e1cd9..cb1b0f0cad895 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/function/aggregate/Top.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/function/aggregate/Top.java @@ -13,6 +13,7 @@ import org.elasticsearch.common.lucene.BytesRefs; import org.elasticsearch.compute.aggregation.AggregatorFunctionSupplier; import org.elasticsearch.compute.aggregation.TopBooleanAggregatorFunctionSupplier; +import org.elasticsearch.compute.aggregation.TopBytesRefAggregatorFunctionSupplier; import org.elasticsearch.compute.aggregation.TopDoubleAggregatorFunctionSupplier; import org.elasticsearch.compute.aggregation.TopIntAggregatorFunctionSupplier; import org.elasticsearch.compute.aggregation.TopIpAggregatorFunctionSupplier; @@ -48,7 +49,7 @@ public class Top extends AggregateFunction implements ToAggregator, SurrogateExp private static final String ORDER_DESC = "DESC"; @FunctionInfo( - returnType = { "boolean", "double", "integer", "long", "date", "ip" }, + returnType = { "boolean", "double", "integer", "long", "date", "ip", "keyword", "text" }, description = "Collects the top values for a field. Includes repeated values.", isAggregation = true, examples = @Example(file = "stats_top", tag = "top") @@ -57,7 +58,7 @@ public Top( Source source, @Param( name = "field", - type = { "boolean", "double", "integer", "long", "date", "ip" }, + type = { "boolean", "double", "integer", "long", "date", "ip", "keyword", "text" }, description = "The field to collect the top values for." ) Expression field, @Param(name = "limit", type = { "integer" }, description = "The maximum number of values to collect.") Expression limit, @@ -125,12 +126,14 @@ protected TypeResolution resolveType() { dt -> dt == DataType.BOOLEAN || dt == DataType.DATETIME || dt == DataType.IP + || DataType.isString(dt) || (dt.isNumeric() && dt != DataType.UNSIGNED_LONG), sourceText(), FIRST, "boolean", "date", "ip", + "string", "numeric except unsigned_long or counter types" ).and(isNotNullAndFoldable(limitField(), sourceText(), SECOND)) .and(isType(limitField(), dt -> dt == DataType.INTEGER, sourceText(), SECOND, "integer")) @@ -190,6 +193,9 @@ public AggregatorFunctionSupplier supplier(List inputChannels) { if (type == DataType.IP) { return new TopIpAggregatorFunctionSupplier(inputChannels, limitValue(), orderValue()); } + if (DataType.isString(type)) { + return new TopBytesRefAggregatorFunctionSupplier(inputChannels, limitValue(), orderValue()); + } throw EsqlIllegalArgumentException.illegalDataType(type); } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/AggregateMapper.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/AggregateMapper.java index 60bf4be1d2b03..13ce9ba77cc71 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/AggregateMapper.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/AggregateMapper.java @@ -170,7 +170,7 @@ private static Stream, Tuple>> typeAndNames(Class // TODO can't we figure this out from the function itself? 
types = List.of("Int", "Long", "Double", "Boolean", "BytesRef"); } else if (Top.class.isAssignableFrom(clazz)) { - types = List.of("Boolean", "Int", "Long", "Double", "Ip"); + types = List.of("Boolean", "Int", "Long", "Double", "Ip", "BytesRef"); } else if (Rate.class.isAssignableFrom(clazz)) { types = List.of("Int", "Long", "Double"); } else if (FromPartial.class.isAssignableFrom(clazz) || ToPartial.class.isAssignableFrom(clazz)) { diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/expression/function/aggregate/TopTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/expression/function/aggregate/TopTests.java index f64d6a200a031..f7bf338caa099 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/expression/function/aggregate/TopTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/expression/function/aggregate/TopTests.java @@ -46,7 +46,9 @@ public static Iterable parameters() { MultiRowTestCaseSupplier.doubleCases(1, 1000, -Double.MAX_VALUE, Double.MAX_VALUE, true), MultiRowTestCaseSupplier.dateCases(1, 1000), MultiRowTestCaseSupplier.booleanCases(1, 1000), - MultiRowTestCaseSupplier.ipCases(1, 1000) + MultiRowTestCaseSupplier.ipCases(1, 1000), + MultiRowTestCaseSupplier.stringCases(1, 1000, DataType.KEYWORD), + MultiRowTestCaseSupplier.stringCases(1, 1000, DataType.TEXT) ) .flatMap(List::stream) .map(fieldCaseSupplier -> TopTests.makeSupplier(fieldCaseSupplier, limitCaseSupplier, order)) From 80dd56398f855923df0c0117abd098fd3023ce36 Mon Sep 17 00:00:00 2001 From: Sam Xiao Date: Mon, 23 Sep 2024 13:37:58 -0400 Subject: [PATCH 07/28] ILM: Add total_shards_per_node setting to searchable snapshot (#112972) Allows setting index total_shards_per_node in the SearchableSnapshot action of ILM to remediate hot spot in shard allocation for searchable snapshot index. Closes #112261 --- docs/changelog/112972.yaml | 6 ++ .../actions/ilm-searchable-snapshot.asciidoc | 5 +- .../org/elasticsearch/TransportVersions.java | 1 + .../xpack/core/ilm/MountSnapshotStep.java | 60 ++++++++++---- .../core/ilm/SearchableSnapshotAction.java | 42 ++++++++-- .../xpack/core/ilm/LifecyclePolicyTests.java | 6 +- .../core/ilm/MountSnapshotStepTests.java | 82 +++++++++++++++++-- .../ilm/SearchableSnapshotActionTests.java | 24 +++++- .../actions/SearchableSnapshotActionIT.java | 56 +++++++++++++ 9 files changed, 253 insertions(+), 29 deletions(-) create mode 100644 docs/changelog/112972.yaml diff --git a/docs/changelog/112972.yaml b/docs/changelog/112972.yaml new file mode 100644 index 0000000000000..5332ac13fd13f --- /dev/null +++ b/docs/changelog/112972.yaml @@ -0,0 +1,6 @@ +pr: 112972 +summary: "ILM: Add `total_shards_per_node` setting to searchable snapshot" +area: ILM+SLM +type: enhancement +issues: + - 112261 diff --git a/docs/reference/ilm/actions/ilm-searchable-snapshot.asciidoc b/docs/reference/ilm/actions/ilm-searchable-snapshot.asciidoc index 4ba4782174bef..73a77bef09bde 100644 --- a/docs/reference/ilm/actions/ilm-searchable-snapshot.asciidoc +++ b/docs/reference/ilm/actions/ilm-searchable-snapshot.asciidoc @@ -19,7 +19,7 @@ index>> prefixed with `partial-` to the frozen tier. In other phases, the action In the frozen tier, the action will ignore the setting <>, if it was present in the original index, -to account for the difference in the number of nodes between the frozen and the other tiers. +to account for the difference in the number of nodes between the frozen and the other tiers. 
To set <> for searchable snapshots, set the `total_shards_per_node` option in the frozen phase's `searchable_snapshot` action within the ILM policy. WARNING: Don't include the `searchable_snapshot` action in both the hot and cold @@ -74,6 +74,9 @@ will be performed on the hot nodes. If using a `searchable_snapshot` action in t force merge will be performed on whatever tier the index is *prior* to the `cold` phase (either `hot` or `warm`). +`total_shards_per_node`:: +The maximum number of shards (replicas and primaries) that will be allocated to a single node for the searchable snapshot index. Defaults to unbounded. + [[ilm-searchable-snapshot-ex]] ==== Examples //// diff --git a/server/src/main/java/org/elasticsearch/TransportVersions.java b/server/src/main/java/org/elasticsearch/TransportVersions.java index 55a3391976057..2cc50a85668c7 100644 --- a/server/src/main/java/org/elasticsearch/TransportVersions.java +++ b/server/src/main/java/org/elasticsearch/TransportVersions.java @@ -222,6 +222,7 @@ static TransportVersion def(int id) { public static final TransportVersion FAILURE_STORE_STATUS_IN_INDEX_RESPONSE = def(8_746_00_0); public static final TransportVersion ESQL_AGGREGATION_OPERATOR_STATUS_FINISH_NANOS = def(8_747_00_0); public static final TransportVersion ML_TELEMETRY_MEMORY_ADDED = def(8_748_00_0); + public static final TransportVersion ILM_ADD_SEARCHABLE_SNAPSHOT_TOTAL_SHARDS_PER_NODE = def(8_749_00_0); /* * STOP! READ THIS FIRST! No, really, diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStep.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStep.java index aac4d74144e95..7d045f2950e1b 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStep.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStep.java @@ -18,11 +18,13 @@ import org.elasticsearch.cluster.routing.allocation.decider.ShardsLimitAllocationDecider; import org.elasticsearch.common.Strings; import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.core.Nullable; import org.elasticsearch.core.TimeValue; import org.elasticsearch.rest.RestStatus; import org.elasticsearch.xpack.core.searchablesnapshots.MountSearchableSnapshotAction; import org.elasticsearch.xpack.core.searchablesnapshots.MountSearchableSnapshotRequest; +import java.util.ArrayList; import java.util.Objects; import java.util.Optional; @@ -37,17 +39,34 @@ public class MountSnapshotStep extends AsyncRetryDuringSnapshotActionStep { private final String restoredIndexPrefix; private final MountSearchableSnapshotRequest.Storage storageType; + @Nullable + private final Integer totalShardsPerNode; public MountSnapshotStep( StepKey key, StepKey nextStepKey, Client client, String restoredIndexPrefix, - MountSearchableSnapshotRequest.Storage storageType + MountSearchableSnapshotRequest.Storage storageType, + @Nullable Integer totalShardsPerNode ) { super(key, nextStepKey, client); this.restoredIndexPrefix = restoredIndexPrefix; this.storageType = Objects.requireNonNull(storageType, "a storage type must be specified"); + if (totalShardsPerNode != null && totalShardsPerNode < 1) { + throw new IllegalArgumentException("[" + SearchableSnapshotAction.TOTAL_SHARDS_PER_NODE.getPreferredName() + "] must be >= 1"); + } + this.totalShardsPerNode = totalShardsPerNode; + } + + public MountSnapshotStep( + StepKey key, + StepKey nextStepKey, + Client client, + String restoredIndexPrefix, + 
MountSearchableSnapshotRequest.Storage storageType + ) { + this(key, nextStepKey, client, restoredIndexPrefix, storageType, null); } @Override @@ -63,6 +82,11 @@ public MountSearchableSnapshotRequest.Storage getStorage() { return storageType; } + @Nullable + public Integer getTotalShardsPerNode() { + return totalShardsPerNode; + } + @Override void performDuringNoSnapshot(IndexMetadata indexMetadata, ClusterState currentClusterState, ActionListener listener) { String indexName = indexMetadata.getIndex().getName(); @@ -140,6 +164,9 @@ void performDuringNoSnapshot(IndexMetadata indexMetadata, ClusterState currentCl final Settings.Builder settingsBuilder = Settings.builder(); overrideTierPreference(this.getKey().phase()).ifPresent(override -> settingsBuilder.put(DataTier.TIER_PREFERENCE, override)); + if (totalShardsPerNode != null) { + settingsBuilder.put(ShardsLimitAllocationDecider.INDEX_TOTAL_SHARDS_PER_NODE_SETTING.getKey(), totalShardsPerNode); + } final MountSearchableSnapshotRequest mountSearchableSnapshotRequest = new MountSearchableSnapshotRequest( TimeValue.MAX_VALUE, @@ -148,9 +175,9 @@ void performDuringNoSnapshot(IndexMetadata indexMetadata, ClusterState currentCl snapshotName, indexName, settingsBuilder.build(), - ignoredIndexSettings(this.getKey().phase()), + ignoredIndexSettings(), // we'll not wait for the snapshot to complete in this step as the async steps are executed from threads that shouldn't - // perform expensive operations (ie. clusterStateProcessed) + // perform expensive operations (i.e. clusterStateProcessed) false, storageType ); @@ -198,23 +225,27 @@ static Optional overrideTierPreference(String phase) { * setting, the restored index would be captured by the ILM runner and, depending on what ILM execution state was captured at snapshot * time, make it's way forward from _that_ step forward in the ILM policy. We'll re-set this setting on the restored index at a later * step once we restored a deterministic execution state - * - index.routing.allocation.total_shards_per_node: It is likely that frozen tier has fewer nodes than the hot tier. - * Keeping this setting runs the risk that we will not have enough nodes to allocate all the shards in the - * frozen tier and the user does not have any way of fixing this. For this reason, we ignore this setting when moving to frozen. + * - index.routing.allocation.total_shards_per_node: It is likely that frozen tier has fewer nodes than the hot tier. If this setting + * is not specifically set in the frozen tier, keeping this setting runs the risk that we will not have enough nodes to + * allocate all the shards in the frozen tier and the user does not have any way of fixing this. For this reason, we ignore this + * setting when moving to frozen. We do not ignore this setting if it is specifically set in the mount searchable snapshot step + * of frozen tier. 
*/ - static String[] ignoredIndexSettings(String phase) { + String[] ignoredIndexSettings() { + ArrayList ignoredSettings = new ArrayList<>(); + ignoredSettings.add(LifecycleSettings.LIFECYCLE_NAME); // if we are mounting a searchable snapshot in the hot phase, then we should not change the total_shards_per_node setting - if (TimeseriesLifecycleType.FROZEN_PHASE.equals(phase)) { - return new String[] { - LifecycleSettings.LIFECYCLE_NAME, - ShardsLimitAllocationDecider.INDEX_TOTAL_SHARDS_PER_NODE_SETTING.getKey() }; + // if total_shards_per_node setting is specifically set for the frozen phase and not propagated from previous phase, + // then it should not be ignored + if (TimeseriesLifecycleType.FROZEN_PHASE.equals(this.getKey().phase()) && this.totalShardsPerNode == null) { + ignoredSettings.add(ShardsLimitAllocationDecider.INDEX_TOTAL_SHARDS_PER_NODE_SETTING.getKey()); } - return new String[] { LifecycleSettings.LIFECYCLE_NAME }; + return ignoredSettings.toArray(new String[0]); } @Override public int hashCode() { - return Objects.hash(super.hashCode(), restoredIndexPrefix, storageType); + return Objects.hash(super.hashCode(), restoredIndexPrefix, storageType, totalShardsPerNode); } @Override @@ -228,6 +259,7 @@ public boolean equals(Object obj) { MountSnapshotStep other = (MountSnapshotStep) obj; return super.equals(obj) && Objects.equals(restoredIndexPrefix, other.restoredIndexPrefix) - && Objects.equals(storageType, other.storageType); + && Objects.equals(storageType, other.storageType) + && Objects.equals(totalShardsPerNode, other.totalShardsPerNode); } } diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotAction.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotAction.java index 5b9b559b4d957..c06dcc0f083d1 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotAction.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotAction.java @@ -32,6 +32,7 @@ import java.util.List; import java.util.Objects; +import static org.elasticsearch.TransportVersions.ILM_ADD_SEARCHABLE_SNAPSHOT_TOTAL_SHARDS_PER_NODE; import static org.elasticsearch.snapshots.SearchableSnapshotsSettings.SEARCHABLE_SNAPSHOTS_REPOSITORY_NAME_SETTING_KEY; import static org.elasticsearch.snapshots.SearchableSnapshotsSettings.SEARCHABLE_SNAPSHOTS_SNAPSHOT_NAME_SETTING_KEY; import static org.elasticsearch.snapshots.SearchableSnapshotsSettings.SEARCHABLE_SNAPSHOT_PARTIAL_SETTING_KEY; @@ -49,6 +50,7 @@ public class SearchableSnapshotAction implements LifecycleAction { public static final ParseField SNAPSHOT_REPOSITORY = new ParseField("snapshot_repository"); public static final ParseField FORCE_MERGE_INDEX = new ParseField("force_merge_index"); + public static final ParseField TOTAL_SHARDS_PER_NODE = new ParseField("total_shards_per_node"); public static final String CONDITIONAL_DATASTREAM_CHECK_KEY = BranchingStep.NAME + "-on-datastream-check"; public static final String CONDITIONAL_SKIP_ACTION_STEP = BranchingStep.NAME + "-check-prerequisites"; public static final String CONDITIONAL_SKIP_GENERATE_AND_CLEAN = BranchingStep.NAME + "-check-existing-snapshot"; @@ -58,12 +60,13 @@ public class SearchableSnapshotAction implements LifecycleAction { private static final ConstructingObjectParser PARSER = new ConstructingObjectParser<>( NAME, - a -> new SearchableSnapshotAction((String) a[0], a[1] == null || (boolean) a[1]) + a -> new SearchableSnapshotAction((String) 
a[0], a[1] == null || (boolean) a[1], (Integer) a[2]) ); static { PARSER.declareString(ConstructingObjectParser.constructorArg(), SNAPSHOT_REPOSITORY); PARSER.declareBoolean(ConstructingObjectParser.optionalConstructorArg(), FORCE_MERGE_INDEX); + PARSER.declareInt(ConstructingObjectParser.optionalConstructorArg(), TOTAL_SHARDS_PER_NODE); } public static SearchableSnapshotAction parse(XContentParser parser) { @@ -72,22 +75,36 @@ public static SearchableSnapshotAction parse(XContentParser parser) { private final String snapshotRepository; private final boolean forceMergeIndex; + @Nullable + private final Integer totalShardsPerNode; - public SearchableSnapshotAction(String snapshotRepository, boolean forceMergeIndex) { + public SearchableSnapshotAction(String snapshotRepository, boolean forceMergeIndex, @Nullable Integer totalShardsPerNode) { if (Strings.hasText(snapshotRepository) == false) { throw new IllegalArgumentException("the snapshot repository must be specified"); } this.snapshotRepository = snapshotRepository; this.forceMergeIndex = forceMergeIndex; + + if (totalShardsPerNode != null && totalShardsPerNode < 1) { + throw new IllegalArgumentException("[" + TOTAL_SHARDS_PER_NODE.getPreferredName() + "] must be >= 1"); + } + this.totalShardsPerNode = totalShardsPerNode; + } + + public SearchableSnapshotAction(String snapshotRepository, boolean forceMergeIndex) { + this(snapshotRepository, forceMergeIndex, null); } public SearchableSnapshotAction(String snapshotRepository) { - this(snapshotRepository, true); + this(snapshotRepository, true, null); } public SearchableSnapshotAction(StreamInput in) throws IOException { this.snapshotRepository = in.readString(); this.forceMergeIndex = in.readBoolean(); + this.totalShardsPerNode = in.getTransportVersion().onOrAfter(ILM_ADD_SEARCHABLE_SNAPSHOT_TOTAL_SHARDS_PER_NODE) + ? 
in.readOptionalInt() + : null; } boolean isForceMergeIndex() { @@ -98,6 +115,10 @@ public String getSnapshotRepository() { return snapshotRepository; } + public Integer getTotalShardsPerNode() { + return totalShardsPerNode; + } + @Override public List toSteps(Client client, String phase, StepKey nextStepKey) { assert false; @@ -298,7 +319,8 @@ public List toSteps(Client client, String phase, StepKey nextStepKey, XPac waitForGreenRestoredIndexKey, client, getRestoredIndexPrefix(mountSnapshotKey), - storageType + storageType, + totalShardsPerNode ); WaitForIndexColorStep waitForGreenIndexHealthStep = new WaitForIndexColorStep( waitForGreenRestoredIndexKey, @@ -402,6 +424,9 @@ public String getWriteableName() { public void writeTo(StreamOutput out) throws IOException { out.writeString(snapshotRepository); out.writeBoolean(forceMergeIndex); + if (out.getTransportVersion().onOrAfter(ILM_ADD_SEARCHABLE_SNAPSHOT_TOTAL_SHARDS_PER_NODE)) { + out.writeOptionalInt(totalShardsPerNode); + } } @Override @@ -409,6 +434,9 @@ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws builder.startObject(); builder.field(SNAPSHOT_REPOSITORY.getPreferredName(), snapshotRepository); builder.field(FORCE_MERGE_INDEX.getPreferredName(), forceMergeIndex); + if (totalShardsPerNode != null) { + builder.field(TOTAL_SHARDS_PER_NODE.getPreferredName(), totalShardsPerNode); + } builder.endObject(); return builder; } @@ -422,12 +450,14 @@ public boolean equals(Object o) { return false; } SearchableSnapshotAction that = (SearchableSnapshotAction) o; - return Objects.equals(snapshotRepository, that.snapshotRepository) && Objects.equals(forceMergeIndex, that.forceMergeIndex); + return Objects.equals(snapshotRepository, that.snapshotRepository) + && Objects.equals(forceMergeIndex, that.forceMergeIndex) + && Objects.equals(totalShardsPerNode, that.totalShardsPerNode); } @Override public int hashCode() { - return Objects.hash(snapshotRepository, forceMergeIndex); + return Objects.hash(snapshotRepository, forceMergeIndex, totalShardsPerNode); } @Nullable diff --git a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/LifecyclePolicyTests.java b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/LifecyclePolicyTests.java index 66aa9a24cbcd4..7963d04e0f666 100644 --- a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/LifecyclePolicyTests.java +++ b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/LifecyclePolicyTests.java @@ -224,7 +224,11 @@ public static LifecyclePolicy randomTimeseriesLifecyclePolicy(@Nullable String l frozenTime, Collections.singletonMap( SearchableSnapshotAction.NAME, - new SearchableSnapshotAction(randomAlphaOfLength(10), randomBoolean()) + new SearchableSnapshotAction( + randomAlphaOfLength(10), + randomBoolean(), + (randomBoolean() ? 
null : randomIntBetween(1, 100)) + ) ) ) ); diff --git a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStepTests.java b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStepTests.java index 2b5a0535caa0e..8ca7a00ab0948 100644 --- a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStepTests.java +++ b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/MountSnapshotStepTests.java @@ -41,7 +41,8 @@ public MountSnapshotStep createRandomInstance() { StepKey nextStepKey = randomStepKey(); String restoredIndexPrefix = randomAlphaOfLength(10); MountSearchableSnapshotRequest.Storage storage = randomStorageType(); - return new MountSnapshotStep(stepKey, nextStepKey, client, restoredIndexPrefix, storage); + Integer totalShardsPerNode = randomTotalShardsPerNode(true); + return new MountSnapshotStep(stepKey, nextStepKey, client, restoredIndexPrefix, storage, totalShardsPerNode); } public static MountSearchableSnapshotRequest.Storage randomStorageType() { @@ -59,7 +60,8 @@ protected MountSnapshotStep copyInstance(MountSnapshotStep instance) { instance.getNextStepKey(), instance.getClient(), instance.getRestoredIndexPrefix(), - instance.getStorage() + instance.getStorage(), + instance.getTotalShardsPerNode() ); } @@ -69,7 +71,8 @@ public MountSnapshotStep mutateInstance(MountSnapshotStep instance) { StepKey nextKey = instance.getNextStepKey(); String restoredIndexPrefix = instance.getRestoredIndexPrefix(); MountSearchableSnapshotRequest.Storage storage = instance.getStorage(); - switch (between(0, 3)) { + Integer totalShardsPerNode = instance.getTotalShardsPerNode(); + switch (between(0, 4)) { case 0: key = new StepKey(key.phase(), key.action(), key.name() + randomAlphaOfLength(5)); break; @@ -88,10 +91,30 @@ public MountSnapshotStep mutateInstance(MountSnapshotStep instance) { throw new AssertionError("unknown storage type: " + storage); } break; + case 4: + totalShardsPerNode = totalShardsPerNode == null ? 
1 : totalShardsPerNode + randomIntBetween(1, 100); + break; default: throw new AssertionError("Illegal randomisation branch"); } - return new MountSnapshotStep(key, nextKey, instance.getClient(), restoredIndexPrefix, storage); + return new MountSnapshotStep(key, nextKey, instance.getClient(), restoredIndexPrefix, storage, totalShardsPerNode); + } + + public void testCreateWithInvalidTotalShardsPerNode() throws Exception { + int invalidTotalShardsPerNode = randomIntBetween(-100, 0); + + IllegalArgumentException exception = expectThrows( + IllegalArgumentException.class, + () -> new MountSnapshotStep( + randomStepKey(), + randomStepKey(), + client, + RESTORED_INDEX_PREFIX, + randomStorageType(), + invalidTotalShardsPerNode + ) + ); + assertEquals("[total_shards_per_node] must be >= 1", exception.getMessage()); } public void testPerformActionFailure() { @@ -345,7 +368,50 @@ public void testIgnoreTotalShardsPerNodeInFrozenPhase() throws Exception { randomStepKey(), client, RESTORED_INDEX_PREFIX, - randomStorageType() + randomStorageType(), + null + ); + performActionAndWait(step, indexMetadata, clusterState, null); + } + } + + public void testDoNotIgnoreTotalShardsPerNodeIfSet() throws Exception { + String indexName = randomAlphaOfLength(10); + String policyName = "test-ilm-policy"; + Map ilmCustom = new HashMap<>(); + String snapshotName = indexName + "-" + policyName; + ilmCustom.put("snapshot_name", snapshotName); + String repository = "repository"; + ilmCustom.put("snapshot_repository", repository); + + IndexMetadata.Builder indexMetadataBuilder = IndexMetadata.builder(indexName) + .settings(settings(IndexVersion.current()).put(LifecycleSettings.LIFECYCLE_NAME, policyName)) + .putCustom(LifecycleExecutionState.ILM_CUSTOM_METADATA_KEY, ilmCustom) + .numberOfShards(randomIntBetween(1, 5)) + .numberOfReplicas(randomIntBetween(0, 5)); + IndexMetadata indexMetadata = indexMetadataBuilder.build(); + + ClusterState clusterState = ClusterState.builder(emptyClusterState()) + .metadata(Metadata.builder().put(indexMetadata, true).build()) + .build(); + + try (var threadPool = createThreadPool()) { + final var client = getRestoreSnapshotRequestAssertingClient( + threadPool, + repository, + snapshotName, + indexName, + RESTORED_INDEX_PREFIX, + indexName, + new String[] { LifecycleSettings.LIFECYCLE_NAME } + ); + MountSnapshotStep step = new MountSnapshotStep( + new StepKey(TimeseriesLifecycleType.FROZEN_PHASE, randomAlphaOfLength(10), randomAlphaOfLength(10)), + randomStepKey(), + client, + RESTORED_INDEX_PREFIX, + randomStorageType(), + randomTotalShardsPerNode(false) ); performActionAndWait(step, indexMetadata, clusterState, null); } @@ -401,4 +467,10 @@ protected void } }; } + + private Integer randomTotalShardsPerNode(boolean nullable) { + Integer randomInt = randomIntBetween(1, 100); + Integer randomIntNullable = (randomBoolean() ? null : randomInt); + return nullable ? 
randomIntNullable : randomInt; + } } diff --git a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotActionTests.java b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotActionTests.java index 193d9abeec91d..ca219fdde3d57 100644 --- a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotActionTests.java +++ b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/ilm/SearchableSnapshotActionTests.java @@ -16,6 +16,7 @@ import java.util.List; import static org.elasticsearch.xpack.core.ilm.SearchableSnapshotAction.NAME; +import static org.elasticsearch.xpack.core.ilm.SearchableSnapshotAction.TOTAL_SHARDS_PER_NODE; import static org.hamcrest.Matchers.equalTo; import static org.hamcrest.Matchers.is; @@ -97,6 +98,16 @@ public void testPrefixAndStorageTypeDefaults() { ); } + public void testCreateWithInvalidTotalShardsPerNode() { + int invalidTotalShardsPerNode = randomIntBetween(-100, 0); + + IllegalArgumentException exception = expectThrows( + IllegalArgumentException.class, + () -> new SearchableSnapshotAction("test", true, invalidTotalShardsPerNode) + ); + assertEquals("[" + TOTAL_SHARDS_PER_NODE.getPreferredName() + "] must be >= 1", exception.getMessage()); + } + private List expectedStepKeysWithForceMerge(String phase) { return List.of( new StepKey(phase, NAME, SearchableSnapshotAction.CONDITIONAL_SKIP_ACTION_STEP), @@ -160,14 +171,23 @@ protected Writeable.Reader instanceReader() { @Override protected SearchableSnapshotAction mutateInstance(SearchableSnapshotAction instance) { - return switch (randomIntBetween(0, 1)) { + return switch (randomIntBetween(0, 2)) { case 0 -> new SearchableSnapshotAction(randomAlphaOfLengthBetween(5, 10), instance.isForceMergeIndex()); case 1 -> new SearchableSnapshotAction(instance.getSnapshotRepository(), instance.isForceMergeIndex() == false); + case 2 -> new SearchableSnapshotAction( + instance.getSnapshotRepository(), + instance.isForceMergeIndex(), + instance.getTotalShardsPerNode() == null ? 1 : instance.getTotalShardsPerNode() + randomIntBetween(1, 100) + ); default -> throw new IllegalArgumentException("Invalid mutation branch"); }; } static SearchableSnapshotAction randomInstance() { - return new SearchableSnapshotAction(randomAlphaOfLengthBetween(5, 10), randomBoolean()); + return new SearchableSnapshotAction( + randomAlphaOfLengthBetween(5, 10), + randomBoolean(), + (randomBoolean() ? 
null : randomIntBetween(1, 100)) + ); } } diff --git a/x-pack/plugin/ilm/qa/multi-node/src/javaRestTest/java/org/elasticsearch/xpack/ilm/actions/SearchableSnapshotActionIT.java b/x-pack/plugin/ilm/qa/multi-node/src/javaRestTest/java/org/elasticsearch/xpack/ilm/actions/SearchableSnapshotActionIT.java index 0e3d0f1b2ec40..fefeaa95319ed 100644 --- a/x-pack/plugin/ilm/qa/multi-node/src/javaRestTest/java/org/elasticsearch/xpack/ilm/actions/SearchableSnapshotActionIT.java +++ b/x-pack/plugin/ilm/qa/multi-node/src/javaRestTest/java/org/elasticsearch/xpack/ilm/actions/SearchableSnapshotActionIT.java @@ -48,6 +48,7 @@ import java.util.concurrent.TimeUnit; import static java.util.Collections.singletonMap; +import static org.elasticsearch.cluster.routing.allocation.decider.ShardsLimitAllocationDecider.INDEX_TOTAL_SHARDS_PER_NODE_SETTING; import static org.elasticsearch.xcontent.XContentFactory.jsonBuilder; import static org.elasticsearch.xpack.TimeSeriesRestDriver.createComposableTemplate; import static org.elasticsearch.xpack.TimeSeriesRestDriver.createNewSingletonPolicy; @@ -921,6 +922,61 @@ public void testSearchableSnapshotInvokesAsyncActionOnNewIndex() throws Exceptio }, 30, TimeUnit.SECONDS); } + public void testSearchableSnapshotTotalShardsPerNode() throws Exception { + String index = "myindex-" + randomAlphaOfLength(4).toLowerCase(Locale.ROOT); + Integer totalShardsPerNode = 2; + createSnapshotRepo(client(), snapshotRepo, randomBoolean()); + createPolicy( + client(), + policy, + null, + null, + new Phase( + "cold", + TimeValue.ZERO, + singletonMap(SearchableSnapshotAction.NAME, new SearchableSnapshotAction(snapshotRepo, randomBoolean())) + ), + new Phase( + "frozen", + TimeValue.ZERO, + singletonMap(SearchableSnapshotAction.NAME, new SearchableSnapshotAction(snapshotRepo, randomBoolean(), totalShardsPerNode)) + ), + null + ); + + createIndex(index, Settings.EMPTY); + ensureGreen(index); + indexDocument(client(), index, true); + + // enable ILM after we indexed a document as otherwise ILM might sometimes run so fast the indexDocument call will fail with + // `index_not_found_exception` + updateIndexSettings(index, Settings.builder().put(LifecycleSettings.LIFECYCLE_NAME, policy)); + + // wait for snapshot successfully mounted and ILM execution completed + final String searchableSnapMountedIndexName = SearchableSnapshotAction.PARTIAL_RESTORED_INDEX_PREFIX + + SearchableSnapshotAction.FULL_RESTORED_INDEX_PREFIX + index; + assertBusy(() -> { + logger.info("--> waiting for [{}] to exist...", searchableSnapMountedIndexName); + assertTrue(indexExists(searchableSnapMountedIndexName)); + }, 30, TimeUnit.SECONDS); + assertBusy(() -> { + triggerStateChange(); + Step.StepKey stepKeyForIndex = getStepKeyForIndex(client(), searchableSnapMountedIndexName); + assertThat(stepKeyForIndex.phase(), is("frozen")); + assertThat(stepKeyForIndex.name(), is(PhaseCompleteStep.NAME)); + }, 30, TimeUnit.SECONDS); + + // validate total_shards_per_node setting + Map indexSettings = getIndexSettingsAsMap(searchableSnapMountedIndexName); + assertNotNull("expected total_shards_per_node to exist", indexSettings.get(INDEX_TOTAL_SHARDS_PER_NODE_SETTING.getKey())); + Integer snapshotTotalShardsPerNode = Integer.valueOf((String) indexSettings.get(INDEX_TOTAL_SHARDS_PER_NODE_SETTING.getKey())); + assertEquals( + "expected total_shards_per_node to be " + totalShardsPerNode + ", but got: " + snapshotTotalShardsPerNode, + snapshotTotalShardsPerNode, + totalShardsPerNode + ); + } + /** * Cause a bit of cluster activity using an empty 
reroute call in case the `wait-for-index-colour` ILM step missed the * notification that partial-index is now GREEN. From 756f18eb74e17ed9cb6bde289261b903781c1b21 Mon Sep 17 00:00:00 2001 From: Stanislav Malyshev Date: Mon, 23 Sep 2024 13:21:37 -0600 Subject: [PATCH 08/28] Test fix: ensure we don't accidentally generate two identical histograms (#113322) * Test fix: looks like using one value is not random enough --- .../admin/cluster/stats/CCSTelemetrySnapshotTests.java | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java index 0bca6e57dc47b..e9188d9cb8f0d 100644 --- a/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java +++ b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java @@ -33,7 +33,7 @@ public class CCSTelemetrySnapshotTests extends AbstractWireSerializingTestCase Date: Mon, 23 Sep 2024 12:24:08 -0700 Subject: [PATCH 09/28] relax http stream logging assertions (#113229) --- .../http/netty4/Netty4IncrementalRequestHandlingIT.java | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/modules/transport-netty4/src/internalClusterTest/java/org/elasticsearch/http/netty4/Netty4IncrementalRequestHandlingIT.java b/modules/transport-netty4/src/internalClusterTest/java/org/elasticsearch/http/netty4/Netty4IncrementalRequestHandlingIT.java index 2b9c77b17bced..26d31b941f356 100644 --- a/modules/transport-netty4/src/internalClusterTest/java/org/elasticsearch/http/netty4/Netty4IncrementalRequestHandlingIT.java +++ b/modules/transport-netty4/src/internalClusterTest/java/org/elasticsearch/http/netty4/Netty4IncrementalRequestHandlingIT.java @@ -451,8 +451,7 @@ private void assertHttpBodyLogging(Function test) throws Exceptio "request end", HttpBodyTracer.class.getCanonicalName(), Level.TRACE, - "* request body (gzip compressed, base64-encoded, and split into * parts on preceding log lines; for details see " - + "https://www.elastic.co/guide/en/elasticsearch/reference/master/modules-network.html#http-rest-request-tracer)" + "* request body (gzip compressed, base64-encoded, and split into * parts on preceding log lines;*)" ) ); } From d146b27a266063d08a5923194de29e15c19e4231 Mon Sep 17 00:00:00 2001 From: Tim Brooks Date: Mon, 23 Sep 2024 14:26:48 -0600 Subject: [PATCH 10/28] Default incremental bulk functionality to false (#113416) This commit flips the incremental bulk setting to false. Additionally, it removes some test code which intermittently causes issues with security test cases. 
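For context, here is a minimal sketch (not part of this commit) of how a test or node can opt back in now that the default is flipped; it uses only the setting touched in the diff below:

    import org.elasticsearch.action.bulk.IncrementalBulkService;
    import org.elasticsearch.common.settings.Settings;

    // Incremental bulk handling is now opt-in: "rest.incremental_bulk" defaults
    // to false, so it must be enabled explicitly in the node settings.
    Settings nodeSettings = Settings.builder()
        .put(IncrementalBulkService.INCREMENTAL_BULK.getKey(), true)
        .build();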
--- .../http/IncrementalBulkRestIT.java | 8 +++ .../action/bulk/IncrementalBulkService.java | 2 +- .../elasticsearch/test/ESIntegTestCase.java | 49 ++----------------- 3 files changed, 13 insertions(+), 46 deletions(-) diff --git a/qa/smoke-test-http/src/javaRestTest/java/org/elasticsearch/http/IncrementalBulkRestIT.java b/qa/smoke-test-http/src/javaRestTest/java/org/elasticsearch/http/IncrementalBulkRestIT.java index 2b24e53874e51..da05011696274 100644 --- a/qa/smoke-test-http/src/javaRestTest/java/org/elasticsearch/http/IncrementalBulkRestIT.java +++ b/qa/smoke-test-http/src/javaRestTest/java/org/elasticsearch/http/IncrementalBulkRestIT.java @@ -29,6 +29,14 @@ @ESIntegTestCase.ClusterScope(scope = ESIntegTestCase.Scope.SUITE, supportsDedicatedMasters = false, numDataNodes = 2, numClientNodes = 0) public class IncrementalBulkRestIT extends HttpSmokeTestCase { + @Override + protected Settings nodeSettings(int nodeOrdinal, Settings otherSettings) { + return Settings.builder() + .put(super.nodeSettings(nodeOrdinal, otherSettings)) + .put(IncrementalBulkService.INCREMENTAL_BULK.getKey(), true) + .build(); + } + public void testBulkUriMatchingDoesNotMatchBulkCapabilitiesApi() throws IOException { Request request = new Request("GET", "/_capabilities?method=GET&path=%2F_bulk&capabilities=failure_store_status&pretty"); Response response = getRestClient().performRequest(request); diff --git a/server/src/main/java/org/elasticsearch/action/bulk/IncrementalBulkService.java b/server/src/main/java/org/elasticsearch/action/bulk/IncrementalBulkService.java index 7185c4d76265e..fc264de35f510 100644 --- a/server/src/main/java/org/elasticsearch/action/bulk/IncrementalBulkService.java +++ b/server/src/main/java/org/elasticsearch/action/bulk/IncrementalBulkService.java @@ -36,7 +36,7 @@ public class IncrementalBulkService { public static final Setting INCREMENTAL_BULK = boolSetting( "rest.incremental_bulk", - true, + false, Setting.Property.NodeScope, Setting.Property.Dynamic ); diff --git a/test/framework/src/main/java/org/elasticsearch/test/ESIntegTestCase.java b/test/framework/src/main/java/org/elasticsearch/test/ESIntegTestCase.java index 92e480aff3bc9..cca3443c28e3a 100644 --- a/test/framework/src/main/java/org/elasticsearch/test/ESIntegTestCase.java +++ b/test/framework/src/main/java/org/elasticsearch/test/ESIntegTestCase.java @@ -26,7 +26,6 @@ import org.elasticsearch.action.ActionRequest; import org.elasticsearch.action.ActionResponse; import org.elasticsearch.action.ActionType; -import org.elasticsearch.action.DocWriteRequest; import org.elasticsearch.action.DocWriteResponse; import org.elasticsearch.action.admin.cluster.allocation.ClusterAllocationExplainRequest; import org.elasticsearch.action.admin.cluster.allocation.ClusterAllocationExplainResponse; @@ -49,8 +48,6 @@ import org.elasticsearch.action.admin.indices.template.put.PutIndexTemplateRequestBuilder; import org.elasticsearch.action.bulk.BulkRequestBuilder; import org.elasticsearch.action.bulk.BulkResponse; -import org.elasticsearch.action.bulk.IncrementalBulkService; -import org.elasticsearch.action.index.IndexRequest; import org.elasticsearch.action.index.IndexRequestBuilder; import org.elasticsearch.action.ingest.DeletePipelineRequest; import org.elasticsearch.action.ingest.DeletePipelineTransportAction; @@ -196,7 +193,6 @@ import java.util.Random; import java.util.Set; import java.util.concurrent.Callable; -import java.util.concurrent.ConcurrentLinkedQueue; import java.util.concurrent.CountDownLatch; import 
java.util.concurrent.ExecutionException; import java.util.concurrent.Executor; @@ -1782,48 +1778,11 @@ public void indexRandom(boolean forceRefresh, boolean dummyDocuments, boolean ma logger.info("Index [{}] docs async: [{}] bulk: [{}] partitions [{}]", builders.size(), false, true, partition.size()); for (List<IndexRequestBuilder> segmented : partition) { BulkResponse actionGet; - if (randomBoolean()) { - BulkRequestBuilder bulkBuilder = client().prepareBulk(); - for (IndexRequestBuilder indexRequestBuilder : segmented) { - bulkBuilder.add(indexRequestBuilder); - } - actionGet = bulkBuilder.get(); - } else { - IncrementalBulkService bulkService = internalCluster().getInstance(IncrementalBulkService.class); - IncrementalBulkService.Handler handler = bulkService.newBulkRequest(); - - ConcurrentLinkedQueue<IndexRequest> queue = new ConcurrentLinkedQueue<>(); - segmented.forEach(b -> queue.add(b.request())); - - PlainActionFuture<BulkResponse> future = new PlainActionFuture<>(); - AtomicInteger runs = new AtomicInteger(0); - Runnable r = new Runnable() { - - @Override - public void run() { - int toRemove = Math.min(randomIntBetween(5, 10), queue.size()); - ArrayList<DocWriteRequest<?>> docs = new ArrayList<>(); - for (int i = 0; i < toRemove; i++) { - docs.add(queue.poll()); - } - - if (queue.isEmpty()) { - handler.lastItems(docs, () -> {}, future); - } else { - handler.addItems(docs, () -> {}, () -> { - // Every 10 runs dispatch to new thread to prevent stackoverflow - if (runs.incrementAndGet() % 10 == 0) { - new Thread(this).start(); - } else { - this.run(); - } - }); - } - } - }; - r.run(); - actionGet = future.actionGet(); + BulkRequestBuilder bulkBuilder = client().prepareBulk(); + for (IndexRequestBuilder indexRequestBuilder : segmented) { + bulkBuilder.add(indexRequestBuilder); } + actionGet = bulkBuilder.get(); assertThat(actionGet.hasFailures() ? actionGet.buildFailureMessage() : "", actionGet.hasFailures(), equalTo(false)); } } From 2bb8be8e28a35f38c3a4354a436920c4dc425ba5 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Tue, 24 Sep 2024 06:44:41 +1000 Subject: [PATCH 11/28] Mute org.elasticsearch.xpack.esql.EsqlAsyncSecurityIT testLimitedPrivilege #113419 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 0ceaeff67e2c5..2a2f8071482d8 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -301,6 +301,9 @@ tests: - class: org.elasticsearch.xpack.ml.integration.MlJobIT method: testDeleteJob_TimingStatsDocumentIsDeleted issue: https://github.com/elastic/elasticsearch/issues/113370 +- class: org.elasticsearch.xpack.esql.EsqlAsyncSecurityIT + method: testLimitedPrivilege + issue: https://github.com/elastic/elasticsearch/issues/113419 # Examples: # From a0c97bd969fcbf4f9b980e9d0333a79fb5ae4368 Mon Sep 17 00:00:00 2001 From: Bogdan Pintea Date: Mon, 23 Sep 2024 23:56:16 +0200 Subject: [PATCH 12/28] ESQL: add tests checking on data availability (#113292) This adds simple tests that check the shape of the data available to query, as a first step in troubleshooting some non-reproducible failures.
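To make the added coverage concrete, the new assertions boil down to two ES|QL probes against the test index (reproduced from the YAML diff that follows):

    FROM test_bucket | SORT ts             // expect the four indexed timestamps back, in order
    FROM test_bucket | STATS c = COUNT(*)  // expect c == 4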
--- .../test/esql/26_aggs_bucket.yml | 48 +++++++++++++++++++ 1 file changed, 48 insertions(+) diff --git a/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/esql/26_aggs_bucket.yml b/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/esql/26_aggs_bucket.yml index 7d0989a6e1886..ea7684fb69a09 100644 --- a/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/esql/26_aggs_bucket.yml +++ b/x-pack/plugin/src/yamlRestTest/resources/rest-api-spec/test/esql/26_aggs_bucket.yml @@ -30,6 +30,20 @@ - { "index": { "_index": "test_bucket" } } - { "ts": "2024-07-16T11:40:00Z" } + - do: + allowed_warnings_regex: + - "No limit defined, adding default limit of \\[.*\\]" + esql.query: + body: + query: 'FROM test_bucket | SORT ts' + - match: { columns.0.name: ts } + - match: { columns.0.type: date } + - length: { values: 4 } + - match: { values.0.0: "2024-07-16T08:10:00.000Z" } + - match: { values.1.0: "2024-07-16T09:20:00.000Z" } + - match: { values.2.0: "2024-07-16T10:30:00.000Z" } + - match: { values.3.0: "2024-07-16T11:40:00.000Z" } + - do: allowed_warnings_regex: - "No limit defined, adding default limit of \\[.*\\]" @@ -119,6 +133,40 @@ - { "index": { "_index": "test_bucket" } } - { "ts": "2024-09-16" } + - do: + allowed_warnings_regex: + - "No limit defined, adding default limit of \\[.*\\]" + esql.query: + body: + query: 'FROM test_bucket | STATS c = COUNT(*)' + - match: { columns.0.name: c } + - match: { columns.0.type: long } + - match: { values.0.0: 4 } + + - do: + allowed_warnings_regex: + - "No limit defined, adding default limit of \\[.*\\]" + esql.query: + body: + query: 'FROM test_bucket | SORT ts' + - match: { columns.0.name: ts } + - match: { columns.0.type: date } + - length: { values: 4 } + - match: { values.0.0: "2024-06-16T00:00:00.000Z" } + - match: { values.1.0: "2024-07-16T00:00:00.000Z" } + - match: { values.2.0: "2024-08-16T00:00:00.000Z" } + - match: { values.3.0: "2024-09-16T00:00:00.000Z" } + + - do: + allowed_warnings_regex: + - "No limit defined, adding default limit of \\[.*\\]" + esql.query: + body: + query: 'FROM test_bucket | STATS c = COUNT(*)' + - match: { columns.0.name: c } + - match: { columns.0.type: long } + - match: { values.0.0: 4 } + - do: allowed_warnings_regex: - "No limit defined, adding default limit of \\[.*\\]" From 1565c314711908d13fa074c663d1ead6a8b7fc16 Mon Sep 17 00:00:00 2001 From: Pat Whelan Date: Mon, 23 Sep 2024 18:19:40 -0400 Subject: [PATCH 13/28] [ML] Stream Inference API (#113158) Create the `POST _inference/{task_type}/{inference_id}/_stream` and `POST _inference/{inference_id}/_stream` APIs. The REST streaming API will reuse InferenceAction. For now, all services and task types will return an HTTP 405 status code and error message.
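For illustration, a streaming request takes the shape `POST _inference/completion/my-inference-id/_stream` (the task type and inference id here are hypothetical). A service would opt in per task type by overriding the new `InferenceService` default, roughly:

    import java.util.Set;

    import org.elasticsearch.inference.TaskType;

    // Hypothetical override in a service implementation: advertise streaming
    // support for completion tasks. Services keeping the default empty set get
    // the HTTP 405 response described above.
    @Override
    public Set<TaskType> supportedStreamingTasks() {
        return Set.of(TaskType.COMPLETION);
    }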
Co-authored-by: Elastic Machine --- docs/changelog/113158.yaml | 5 + .../inference/InferenceService.java | 17 ++ .../inference/action/InferenceAction.java | 18 +- .../action/InferenceActionRequestTests.java | 63 ++++-- .../AsyncInferenceResponseConsumer.java | 68 ++++++ .../inference/InferenceBaseRestTest.java | 61 +++++- .../xpack/inference/InferenceCrudIT.java | 58 +++++ .../mock/TestInferenceServicePlugin.java | 5 + ...stStreamingCompletionServiceExtension.java | 204 ++++++++++++++++++ ...search.inference.InferenceServiceExtension | 1 + .../xpack/inference/InferencePlugin.java | 2 + .../action/TransportInferenceAction.java | 65 ++++-- .../queries/SemanticQueryBuilder.java | 3 +- ...ankFeaturePhaseRankCoordinatorContext.java | 3 +- .../inference/rest/BaseInferenceAction.java | 55 +++++ .../xpack/inference/rest/Paths.java | 7 + .../inference/rest/RestInferenceAction.java | 35 +-- .../rest/RestStreamInferenceAction.java | 43 ++++ .../TextSimilarityRankTests.java | 3 +- .../TextSimilarityTestPlugin.java | 3 +- .../rest/BaseInferenceActionTests.java | 107 +++++++++ .../rest/RestInferenceActionTests.java | 40 +--- .../rest/RestStreamInferenceActionTests.java | 50 +++++ .../TransportCoordinatedInferenceAction.java | 3 +- 24 files changed, 798 insertions(+), 121 deletions(-) create mode 100644 docs/changelog/113158.yaml create mode 100644 x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/AsyncInferenceResponseConsumer.java create mode 100644 x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestStreamingCompletionServiceExtension.java create mode 100644 x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/BaseInferenceAction.java create mode 100644 x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceAction.java create mode 100644 x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/BaseInferenceActionTests.java create mode 100644 x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceActionTests.java diff --git a/docs/changelog/113158.yaml b/docs/changelog/113158.yaml new file mode 100644 index 0000000000000..d097ea11b3a23 --- /dev/null +++ b/docs/changelog/113158.yaml @@ -0,0 +1,5 @@ +pr: 113158 +summary: Adds a new Inference API for streaming responses back to the user. +area: Machine Learning +type: enhancement +issues: [] diff --git a/server/src/main/java/org/elasticsearch/inference/InferenceService.java b/server/src/main/java/org/elasticsearch/inference/InferenceService.java index a37fb3dd75673..9e9a4cf890379 100644 --- a/server/src/main/java/org/elasticsearch/inference/InferenceService.java +++ b/server/src/main/java/org/elasticsearch/inference/InferenceService.java @@ -188,4 +188,21 @@ default boolean isInClusterService() { * @return {@link TransportVersion} specifying the version */ TransportVersion getMinimalSupportedVersion(); + + /** + * The set of tasks where this service provider supports using the streaming API. + * @return set of supported task types. Defaults to empty. + */ + default Set supportedStreamingTasks() { + return Set.of(); + } + + /** + * Checks the task type against the set of supported streaming tasks returned by {@link #supportedStreamingTasks()}. 
+ * @param taskType the task that supports streaming + * @return true if the taskType is supported + */ + default boolean canStream(TaskType taskType) { + return supportedStreamingTasks().contains(taskType); + } } diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/inference/action/InferenceAction.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/inference/action/InferenceAction.java index d898f961651f1..a19edd5a08162 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/inference/action/InferenceAction.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/inference/action/InferenceAction.java @@ -92,6 +92,7 @@ public static Builder parseRequest(String inferenceEntityId, TaskType taskType, private final Map taskSettings; private final InputType inputType; private final TimeValue inferenceTimeout; + private final boolean stream; public Request( TaskType taskType, @@ -100,7 +101,8 @@ public Request( List input, Map taskSettings, InputType inputType, - TimeValue inferenceTimeout + TimeValue inferenceTimeout, + boolean stream ) { this.taskType = taskType; this.inferenceEntityId = inferenceEntityId; @@ -109,6 +111,7 @@ public Request( this.taskSettings = taskSettings; this.inputType = inputType; this.inferenceTimeout = inferenceTimeout; + this.stream = stream; } public Request(StreamInput in) throws IOException { @@ -134,6 +137,9 @@ public Request(StreamInput in) throws IOException { this.query = null; this.inferenceTimeout = DEFAULT_TIMEOUT; } + + // streaming is not supported yet for transport traffic + this.stream = false; } public TaskType getTaskType() { @@ -165,7 +171,7 @@ public TimeValue getInferenceTimeout() { } public boolean isStreaming() { - return false; + return stream; } @Override @@ -261,6 +267,7 @@ public static class Builder { private Map taskSettings = Map.of(); private String query; private TimeValue timeout = DEFAULT_TIMEOUT; + private boolean stream = false; private Builder() {} @@ -303,8 +310,13 @@ private Builder setInferenceTimeout(String inferenceTimeout) { return setInferenceTimeout(TimeValue.parseTimeValue(inferenceTimeout, TIMEOUT.getPreferredName())); } + public Builder setStream(boolean stream) { + this.stream = stream; + return this; + } + public Request build() { - return new Request(taskType, inferenceEntityId, query, input, taskSettings, inputType, timeout); + return new Request(taskType, inferenceEntityId, query, input, taskSettings, inputType, timeout, stream); } } diff --git a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/inference/action/InferenceActionRequestTests.java b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/inference/action/InferenceActionRequestTests.java index f41e117e75b9f..a9ca5e6da8720 100644 --- a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/inference/action/InferenceActionRequestTests.java +++ b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/inference/action/InferenceActionRequestTests.java @@ -46,7 +46,8 @@ protected InferenceAction.Request createTestInstance() { randomList(1, 5, () -> randomAlphaOfLength(8)), randomMap(0, 3, () -> new Tuple<>(randomAlphaOfLength(4), randomAlphaOfLength(4))), randomFrom(InputType.values()), - TimeValue.timeValueMillis(randomLongBetween(1, 2048)) + TimeValue.timeValueMillis(randomLongBetween(1, 2048)), + false ); } @@ -80,7 +81,8 @@ public void testValidation_TextEmbedding() { List.of("input"), null, null, - null + null, + false ); 
ActionRequestValidationException e = request.validate(); assertNull(e); @@ -94,7 +96,8 @@ public void testValidation_Rerank() { List.of("input"), null, null, - null + null, + false ); ActionRequestValidationException e = request.validate(); assertNull(e); @@ -108,7 +111,8 @@ public void testValidation_TextEmbedding_Null() { null, null, null, - null + null, + false ); ActionRequestValidationException inputNullError = inputNullRequest.validate(); assertNotNull(inputNullError); @@ -123,7 +127,8 @@ public void testValidation_TextEmbedding_Empty() { List.of(), null, null, - null + null, + false ); ActionRequestValidationException inputEmptyError = inputEmptyRequest.validate(); assertNotNull(inputEmptyError); @@ -138,7 +143,8 @@ public void testValidation_Rerank_Null() { List.of("input"), null, null, - null + null, + false ); ActionRequestValidationException queryNullError = queryNullRequest.validate(); assertNotNull(queryNullError); @@ -153,7 +159,8 @@ public void testValidation_Rerank_Empty() { List.of("input"), null, null, - null + null, + false ); ActionRequestValidationException queryEmptyError = queryEmptyRequest.validate(); assertNotNull(queryEmptyError); @@ -185,7 +192,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc instance.getInput(), instance.getTaskSettings(), instance.getInputType(), - instance.getInferenceTimeout() + instance.getInferenceTimeout(), + false ); } case 1 -> new InferenceAction.Request( @@ -195,7 +203,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc instance.getInput(), instance.getTaskSettings(), instance.getInputType(), - instance.getInferenceTimeout() + instance.getInferenceTimeout(), + false ); case 2 -> { var changedInputs = new ArrayList(instance.getInput()); @@ -207,7 +216,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc changedInputs, instance.getTaskSettings(), instance.getInputType(), - instance.getInferenceTimeout() + instance.getInferenceTimeout(), + false ); } case 3 -> { @@ -225,7 +235,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc instance.getInput(), taskSettings, instance.getInputType(), - instance.getInferenceTimeout() + instance.getInferenceTimeout(), + false ); } case 4 -> { @@ -237,7 +248,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc instance.getInput(), instance.getTaskSettings(), nextInputType, - instance.getInferenceTimeout() + instance.getInferenceTimeout(), + false ); } case 5 -> new InferenceAction.Request( @@ -247,7 +259,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc instance.getInput(), instance.getTaskSettings(), instance.getInputType(), - instance.getInferenceTimeout() + instance.getInferenceTimeout(), + false ); case 6 -> { var newDuration = Duration.of( @@ -262,7 +275,8 @@ protected InferenceAction.Request mutateInstance(InferenceAction.Request instanc instance.getInput(), instance.getTaskSettings(), instance.getInputType(), - TimeValue.timeValueMillis(newDuration.plus(additionalTime).toMillis()) + TimeValue.timeValueMillis(newDuration.plus(additionalTime).toMillis()), + false ); } default -> throw new UnsupportedOperationException(); @@ -279,7 +293,8 @@ protected InferenceAction.Request mutateInstanceForVersion(InferenceAction.Reque instance.getInput().subList(0, 1), instance.getTaskSettings(), InputType.UNSPECIFIED, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false 
); } else if (version.before(TransportVersions.V_8_13_0)) { return new InferenceAction.Request( @@ -289,7 +304,8 @@ protected InferenceAction.Request mutateInstanceForVersion(InferenceAction.Reque instance.getInput(), instance.getTaskSettings(), InputType.UNSPECIFIED, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); } else if (version.before(TransportVersions.V_8_13_0) && (instance.getInputType() == InputType.UNSPECIFIED @@ -302,7 +318,8 @@ protected InferenceAction.Request mutateInstanceForVersion(InferenceAction.Reque instance.getInput(), instance.getTaskSettings(), InputType.INGEST, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); } else if (version.before(TransportVersions.V_8_13_0) && (instance.getInputType() == InputType.CLUSTERING || instance.getInputType() == InputType.CLASSIFICATION)) { @@ -313,7 +330,8 @@ protected InferenceAction.Request mutateInstanceForVersion(InferenceAction.Reque instance.getInput(), instance.getTaskSettings(), InputType.UNSPECIFIED, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); } else if (version.before(TransportVersions.V_8_14_0)) { return new InferenceAction.Request( @@ -323,7 +341,8 @@ protected InferenceAction.Request mutateInstanceForVersion(InferenceAction.Reque instance.getInput(), instance.getTaskSettings(), instance.getInputType(), - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); } @@ -339,7 +358,8 @@ public void testWriteTo_WhenVersionIsOnAfterUnspecifiedAdded() throws IOExceptio List.of(), Map.of(), InputType.UNSPECIFIED, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ), TransportVersions.V_8_13_0 ); @@ -353,7 +373,8 @@ public void testWriteTo_WhenVersionIsBeforeInputTypeAdded_ShouldSetInputTypeToUn List.of(), Map.of(), InputType.INGEST, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); InferenceAction.Request deserializedInstance = copyWriteable( diff --git a/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/AsyncInferenceResponseConsumer.java b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/AsyncInferenceResponseConsumer.java new file mode 100644 index 0000000000000..eb5f3c75bab60 --- /dev/null +++ b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/AsyncInferenceResponseConsumer.java @@ -0,0 +1,68 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.xpack.inference; + +import org.apache.http.HttpEntity; +import org.apache.http.HttpResponse; +import org.apache.http.entity.ContentType; +import org.apache.http.nio.ContentDecoder; +import org.apache.http.nio.IOControl; +import org.apache.http.nio.protocol.AbstractAsyncResponseConsumer; +import org.apache.http.nio.util.SimpleInputBuffer; +import org.apache.http.protocol.HttpContext; +import org.elasticsearch.xpack.inference.external.response.streaming.ServerSentEvent; +import org.elasticsearch.xpack.inference.external.response.streaming.ServerSentEventParser; + +import java.io.IOException; +import java.util.ArrayDeque; +import java.util.Deque; +import java.util.concurrent.atomic.AtomicReference; + +class AsyncInferenceResponseConsumer extends AbstractAsyncResponseConsumer { + private final AtomicReference httpResponse = new AtomicReference<>(); + private final Deque collector = new ArrayDeque<>(); + private final ServerSentEventParser sseParser = new ServerSentEventParser(); + private final SimpleInputBuffer inputBuffer = new SimpleInputBuffer(4096); + + @Override + protected void onResponseReceived(HttpResponse httpResponse) { + this.httpResponse.set(httpResponse); + } + + @Override + protected void onContentReceived(ContentDecoder contentDecoder, IOControl ioControl) throws IOException { + inputBuffer.consumeContent(contentDecoder); + } + + @Override + protected void onEntityEnclosed(HttpEntity httpEntity, ContentType contentType) { + httpResponse.updateAndGet(response -> { + response.setEntity(httpEntity); + return response; + }); + } + + @Override + protected HttpResponse buildResult(HttpContext httpContext) { + var allBytes = new byte[inputBuffer.length()]; + try { + inputBuffer.read(allBytes); + sseParser.parse(allBytes).forEach(collector::offer); + } catch (IOException e) { + failed(e); + } + return httpResponse.get(); + } + + @Override + protected void releaseResources() {} + + Deque events() { + return collector; + } +} diff --git a/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/InferenceBaseRestTest.java b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/InferenceBaseRestTest.java index f30f2e8fe201a..c19cd916055d3 100644 --- a/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/InferenceBaseRestTest.java +++ b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/InferenceBaseRestTest.java @@ -9,7 +9,9 @@ import org.apache.http.util.EntityUtils; import org.elasticsearch.client.Request; +import org.elasticsearch.client.RequestOptions; import org.elasticsearch.client.Response; +import org.elasticsearch.client.ResponseListener; import org.elasticsearch.common.Strings; import org.elasticsearch.common.settings.SecureString; import org.elasticsearch.common.settings.Settings; @@ -19,11 +21,15 @@ import org.elasticsearch.test.cluster.ElasticsearchCluster; import org.elasticsearch.test.cluster.local.distribution.DistributionType; import org.elasticsearch.test.rest.ESRestTestCase; +import org.elasticsearch.xpack.inference.external.response.streaming.ServerSentEvent; import org.junit.ClassRule; import java.io.IOException; +import java.util.Deque; import java.util.List; import java.util.Map; +import java.util.concurrent.CountDownLatch; +import java.util.concurrent.TimeUnit; import static org.hamcrest.Matchers.anyOf; import static 
org.hamcrest.Matchers.equalTo; @@ -72,6 +78,23 @@ static String mockSparseServiceModelConfig(@Nullable TaskType taskTypeInBody) { """, taskType); } + static String mockCompletionServiceModelConfig(@Nullable TaskType taskTypeInBody) { + var taskType = taskTypeInBody == null ? "" : "\"task_type\": \"" + taskTypeInBody + "\","; + return Strings.format(""" + { + %s + "service": "streaming_completion_test_service", + "service_settings": { + "model": "my_model", + "api_key": "abc64" + }, + "task_settings": { + "temperature": 3 + } + } + """, taskType); + } + static String mockSparseServiceModelConfig(@Nullable TaskType taskTypeInBody, boolean shouldReturnHiddenField) { var taskType = taskTypeInBody == null ? "" : "\"task_type\": \"" + taskTypeInBody + "\","; return Strings.format(""" @@ -252,6 +275,32 @@ protected Map inferOnMockService(String modelId, List in return inferOnMockServiceInternal(endpoint, input); } + protected Deque streamInferOnMockService(String modelId, TaskType taskType, List input) throws Exception { + var endpoint = Strings.format("_inference/%s/%s/_stream", taskType, modelId); + return callAsync(endpoint, input); + } + + private Deque callAsync(String endpoint, List input) throws Exception { + var responseConsumer = new AsyncInferenceResponseConsumer(); + var request = new Request("POST", endpoint); + request.setJsonEntity(jsonBody(input)); + request.setOptions(RequestOptions.DEFAULT.toBuilder().setHttpAsyncResponseConsumerFactory(() -> responseConsumer).build()); + var latch = new CountDownLatch(1); + client().performRequestAsync(request, new ResponseListener() { + @Override + public void onSuccess(Response response) { + latch.countDown(); + } + + @Override + public void onFailure(Exception exception) { + latch.countDown(); + } + }); + assertTrue(latch.await(30, TimeUnit.SECONDS)); + return responseConsumer.events(); + } + protected Map inferOnMockService(String modelId, TaskType taskType, List input) throws IOException { var endpoint = Strings.format("_inference/%s/%s", taskType, modelId); return inferOnMockServiceInternal(endpoint, input); @@ -259,7 +308,13 @@ protected Map inferOnMockService(String modelId, TaskType taskTy private Map inferOnMockServiceInternal(String endpoint, List input) throws IOException { var request = new Request("POST", endpoint); + request.setJsonEntity(jsonBody(input)); + var response = client().performRequest(request); + assertOkOrCreated(response); + return entityAsMap(response); + } + private String jsonBody(List input) { var bodyBuilder = new StringBuilder("{\"input\": ["); for (var in : input) { bodyBuilder.append('"').append(in).append('"').append(','); @@ -267,11 +322,7 @@ private Map inferOnMockServiceInternal(String endpoint, List { + switch (event.name()) { + case EVENT -> assertThat(event.value(), equalToIgnoringCase("error")); + case DATA -> assertThat( + event.value(), + containsString( + "Streaming is not allowed for service [streaming_completion_test_service] and task [sparse_embedding]" + ) + ); + } + }); + } finally { + deleteModel(modelId); + } + } + + public void testSupportedStream() throws Exception { + String modelId = "streaming"; + putModel(modelId, mockCompletionServiceModelConfig(TaskType.COMPLETION)); + var singleModel = getModel(modelId); + assertEquals(modelId, singleModel.get("inference_id")); + assertEquals(TaskType.COMPLETION.toString(), singleModel.get("task_type")); + + var input = IntStream.range(0, randomInt(10)).mapToObj(i -> randomAlphaOfLength(10)).toList(); + + try { + var events = 
streamInferOnMockService(modelId, TaskType.COMPLETION, input); + + var expectedResponses = Stream.concat( + input.stream().map(String::toUpperCase).map(str -> "{\"completion\":[{\"delta\":\"" + str + "\"}]}"), + Stream.of("[DONE]") + ).iterator(); + assertThat(events.size(), equalTo((input.size() + 1) * 2)); + events.forEach(event -> { + switch (event.name()) { + case EVENT -> assertThat(event.value(), equalToIgnoringCase("message")); + case DATA -> assertThat(event.value(), equalTo(expectedResponses.next())); + } + }); + } finally { + deleteModel(modelId); + } + } } diff --git a/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestInferenceServicePlugin.java b/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestInferenceServicePlugin.java index 752472b90374b..eef0da909f529 100644 --- a/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestInferenceServicePlugin.java +++ b/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestInferenceServicePlugin.java @@ -44,6 +44,11 @@ public List getNamedWriteables() { ServiceSettings.class, TestRerankingServiceExtension.TestServiceSettings.NAME, TestRerankingServiceExtension.TestServiceSettings::new + ), + new NamedWriteableRegistry.Entry( + ServiceSettings.class, + TestStreamingCompletionServiceExtension.TestServiceSettings.NAME, + TestStreamingCompletionServiceExtension.TestServiceSettings::new ) ); } diff --git a/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestStreamingCompletionServiceExtension.java b/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestStreamingCompletionServiceExtension.java new file mode 100644 index 0000000000000..3d72b1f2729b0 --- /dev/null +++ b/x-pack/plugin/inference/qa/test-service-plugin/src/main/java/org/elasticsearch/xpack/inference/mock/TestStreamingCompletionServiceExtension.java @@ -0,0 +1,204 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.xpack.inference.mock; + +import org.elasticsearch.ElasticsearchStatusException; +import org.elasticsearch.TransportVersion; +import org.elasticsearch.action.ActionListener; +import org.elasticsearch.common.ValidationException; +import org.elasticsearch.common.collect.Iterators; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; +import org.elasticsearch.common.xcontent.ChunkedToXContent; +import org.elasticsearch.common.xcontent.ChunkedToXContentHelper; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.inference.ChunkedInferenceServiceResults; +import org.elasticsearch.inference.ChunkingOptions; +import org.elasticsearch.inference.InferenceServiceExtension; +import org.elasticsearch.inference.InferenceServiceResults; +import org.elasticsearch.inference.InputType; +import org.elasticsearch.inference.Model; +import org.elasticsearch.inference.ModelConfigurations; +import org.elasticsearch.inference.ServiceSettings; +import org.elasticsearch.inference.TaskType; +import org.elasticsearch.rest.RestStatus; +import org.elasticsearch.xcontent.ToXContentObject; +import org.elasticsearch.xcontent.XContentBuilder; +import org.elasticsearch.xpack.core.inference.results.StreamingChatCompletionResults; + +import java.io.IOException; +import java.util.List; +import java.util.Map; +import java.util.Set; +import java.util.concurrent.Flow; + +import static org.elasticsearch.xpack.core.inference.results.ChatCompletionResults.COMPLETION; + +public class TestStreamingCompletionServiceExtension implements InferenceServiceExtension { + @Override + public List getInferenceServiceFactories() { + return List.of(TestInferenceService::new); + } + + public static class TestInferenceService extends AbstractTestInferenceService { + private static final String NAME = "streaming_completion_test_service"; + private static final Set supportedStreamingTasks = Set.of(TaskType.COMPLETION); + + public TestInferenceService(InferenceServiceExtension.InferenceServiceFactoryContext context) {} + + @Override + public String name() { + return NAME; + } + + @Override + protected ServiceSettings getServiceSettingsFromMap(Map serviceSettingsMap) { + return TestServiceSettings.fromMap(serviceSettingsMap); + } + + @Override + @SuppressWarnings("unchecked") + public void parseRequestConfig( + String modelId, + TaskType taskType, + Map config, + Set platformArchitectures, + ActionListener parsedModelListener + ) { + var serviceSettingsMap = (Map) config.remove(ModelConfigurations.SERVICE_SETTINGS); + var serviceSettings = TestSparseInferenceServiceExtension.TestServiceSettings.fromMap(serviceSettingsMap); + var secretSettings = TestSecretSettings.fromMap(serviceSettingsMap); + + var taskSettingsMap = getTaskSettingsMap(config); + var taskSettings = TestTaskSettings.fromMap(taskSettingsMap); + + parsedModelListener.onResponse(new TestServiceModel(modelId, taskType, name(), serviceSettings, taskSettings, secretSettings)); + } + + @Override + public void infer( + Model model, + String query, + List input, + Map taskSettings, + InputType inputType, + TimeValue timeout, + ActionListener listener + ) { + switch (model.getConfigurations().getTaskType()) { + case COMPLETION -> listener.onResponse(makeResults(input)); + default -> listener.onFailure( + new ElasticsearchStatusException( + TaskType.unsupportedTaskTypeErrorMsg(model.getConfigurations().getTaskType(), name()), + RestStatus.BAD_REQUEST + ) + ); + } + } + + private 
StreamingChatCompletionResults makeResults(List input) { + var responseIter = input.stream().map(String::toUpperCase).iterator(); + return new StreamingChatCompletionResults(subscriber -> { + subscriber.onSubscribe(new Flow.Subscription() { + @Override + public void request(long n) { + if (responseIter.hasNext()) { + subscriber.onNext(completionChunk(responseIter.next())); + } else { + subscriber.onComplete(); + } + } + + @Override + public void cancel() {} + }); + }); + } + + private ChunkedToXContent completionChunk(String delta) { + return params -> Iterators.concat( + ChunkedToXContentHelper.startObject(), + ChunkedToXContentHelper.startArray(COMPLETION), + ChunkedToXContentHelper.startObject(), + ChunkedToXContentHelper.field("delta", delta), + ChunkedToXContentHelper.endObject(), + ChunkedToXContentHelper.endArray(), + ChunkedToXContentHelper.endObject() + ); + } + + @Override + public void chunkedInfer( + Model model, + String query, + List input, + Map taskSettings, + InputType inputType, + ChunkingOptions chunkingOptions, + TimeValue timeout, + ActionListener> listener + ) { + listener.onFailure( + new ElasticsearchStatusException( + TaskType.unsupportedTaskTypeErrorMsg(model.getConfigurations().getTaskType(), name()), + RestStatus.BAD_REQUEST + ) + ); + } + + @Override + public Set supportedStreamingTasks() { + return supportedStreamingTasks; + } + } + + public record TestServiceSettings(String modelId) implements ServiceSettings { + public static final String NAME = "streaming_completion_test_service_settings"; + + public TestServiceSettings(StreamInput in) throws IOException { + this(in.readString()); + } + + public static TestServiceSettings fromMap(Map map) { + var modelId = map.remove("model").toString(); + + if (modelId == null) { + ValidationException validationException = new ValidationException(); + validationException.addValidationError("missing model id"); + throw validationException; + } + + return new TestServiceSettings(modelId); + } + + @Override + public String getWriteableName() { + return NAME; + } + + @Override + public TransportVersion getMinimalSupportedVersion() { + return TransportVersion.current(); // fine for these tests but will not work for cluster upgrade tests + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + out.writeString(modelId()); + } + + @Override + public ToXContentObject getFilteredXContentObject() { + return this; + } + + @Override + public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException { + return builder.startObject().field("model", modelId()).endObject(); + } + } +} diff --git a/x-pack/plugin/inference/qa/test-service-plugin/src/main/resources/META-INF/services/org.elasticsearch.inference.InferenceServiceExtension b/x-pack/plugin/inference/qa/test-service-plugin/src/main/resources/META-INF/services/org.elasticsearch.inference.InferenceServiceExtension index 690168b538fb9..c996a33d1e916 100644 --- a/x-pack/plugin/inference/qa/test-service-plugin/src/main/resources/META-INF/services/org.elasticsearch.inference.InferenceServiceExtension +++ b/x-pack/plugin/inference/qa/test-service-plugin/src/main/resources/META-INF/services/org.elasticsearch.inference.InferenceServiceExtension @@ -1,3 +1,4 @@ org.elasticsearch.xpack.inference.mock.TestSparseInferenceServiceExtension org.elasticsearch.xpack.inference.mock.TestDenseInferenceServiceExtension org.elasticsearch.xpack.inference.mock.TestRerankingServiceExtension 
+org.elasticsearch.xpack.inference.mock.TestStreamingCompletionServiceExtension diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/InferencePlugin.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/InferencePlugin.java index 1cec996400a97..a6972ddc214fc 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/InferencePlugin.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/InferencePlugin.java @@ -73,6 +73,7 @@ import org.elasticsearch.xpack.inference.rest.RestGetInferenceModelAction; import org.elasticsearch.xpack.inference.rest.RestInferenceAction; import org.elasticsearch.xpack.inference.rest.RestPutInferenceModelAction; +import org.elasticsearch.xpack.inference.rest.RestStreamInferenceAction; import org.elasticsearch.xpack.inference.services.ServiceComponents; import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchService; import org.elasticsearch.xpack.inference.services.amazonbedrock.AmazonBedrockService; @@ -167,6 +168,7 @@ public List getRestHandlers( ) { return List.of( new RestInferenceAction(), + new RestStreamInferenceAction(), new RestGetInferenceModelAction(), new RestPutInferenceModelAction(), new RestDeleteInferenceEndpointAction(), diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/action/TransportInferenceAction.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/action/TransportInferenceAction.java index bfdfca166ef3a..803e8f1e07612 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/action/TransportInferenceAction.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/action/TransportInferenceAction.java @@ -17,6 +17,7 @@ import org.elasticsearch.inference.InferenceServiceRegistry; import org.elasticsearch.inference.InferenceServiceResults; import org.elasticsearch.inference.Model; +import org.elasticsearch.inference.TaskType; import org.elasticsearch.injection.guice.Inject; import org.elasticsearch.rest.RestStatus; import org.elasticsearch.tasks.Task; @@ -26,10 +27,17 @@ import org.elasticsearch.xpack.inference.registry.ModelRegistry; import org.elasticsearch.xpack.inference.telemetry.InferenceStats; +import java.util.Set; +import java.util.stream.Collectors; + +import static org.elasticsearch.core.Strings.format; + public class TransportInferenceAction extends HandledTransportAction { private static final String STREAMING_INFERENCE_TASK_TYPE = "streaming_inference"; private static final String STREAMING_TASK_ACTION = "xpack/inference/streaming_inference[n]"; + private static final Set> supportsStreaming = Set.of(); + private final ModelRegistry modelRegistry; private final InferenceServiceRegistry serviceRegistry; private final InferenceStats inferenceStats; @@ -101,15 +109,40 @@ private void inferOnService( InferenceService service, ActionListener listener ) { - service.infer( - model, - request.getQuery(), - request.getInput(), - request.getTaskSettings(), - request.getInputType(), - request.getInferenceTimeout(), - createListener(request, listener) - ); + if (request.isStreaming() == false || service.canStream(request.getTaskType())) { + service.infer( + model, + request.getQuery(), + request.getInput(), + request.getTaskSettings(), + request.getInputType(), + request.getInferenceTimeout(), + createListener(request, listener) + ); + } else { + 
listener.onFailure(unsupportedStreamingTaskException(request, service)); + } + } + + private ElasticsearchStatusException unsupportedStreamingTaskException(InferenceAction.Request request, InferenceService service) { + var supportedTasks = service.supportedStreamingTasks(); + if (supportedTasks.isEmpty()) { + return new ElasticsearchStatusException( + format("Streaming is not allowed for service [%s].", service.name()), + RestStatus.METHOD_NOT_ALLOWED + ); + } else { + var validTasks = supportedTasks.stream().map(TaskType::toString).collect(Collectors.joining(",")); + return new ElasticsearchStatusException( + format( + "Streaming is not allowed for service [%s] and task [%s]. Supported tasks: [%s]", + service.name(), + request.getTaskType(), + validTasks + ), + RestStatus.METHOD_NOT_ALLOWED + ); + } } private ActionListener createListener( @@ -118,17 +151,9 @@ private ActionListener createListener( ) { if (request.isStreaming()) { return listener.delegateFailureAndWrap((l, inferenceResults) -> { - if (inferenceResults.isStreaming()) { - var taskProcessor = streamingTaskManager.create( - STREAMING_INFERENCE_TASK_TYPE, - STREAMING_TASK_ACTION - ); - inferenceResults.publisher().subscribe(taskProcessor); - l.onResponse(new InferenceAction.Response(inferenceResults, taskProcessor)); - } else { - // if we asked for streaming but the provider doesn't support it, for now we're going to get back the single response - l.onResponse(new InferenceAction.Response(inferenceResults)); - } + var taskProcessor = streamingTaskManager.create(STREAMING_INFERENCE_TASK_TYPE, STREAMING_TASK_ACTION); + inferenceResults.publisher().subscribe(taskProcessor); + l.onResponse(new InferenceAction.Response(inferenceResults, taskProcessor)); }); } return listener.delegateFailureAndWrap((l, inferenceResults) -> l.onResponse(new InferenceAction.Response(inferenceResults))); diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/queries/SemanticQueryBuilder.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/queries/SemanticQueryBuilder.java index 8f1e28d0d8ee4..7f21f94d33276 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/queries/SemanticQueryBuilder.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/queries/SemanticQueryBuilder.java @@ -204,7 +204,8 @@ private SemanticQueryBuilder doRewriteGetInferenceResults(QueryRewriteContext qu List.of(query), Map.of(), InputType.SEARCH, - InferModelAction.Request.DEFAULT_TIMEOUT_FOR_API + InferModelAction.Request.DEFAULT_TIMEOUT_FOR_API, + false ); queryRewriteContext.registerAsyncAction( diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankFeaturePhaseRankCoordinatorContext.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankFeaturePhaseRankCoordinatorContext.java index cad11cbdc9d5b..0ff48bfd493ba 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankFeaturePhaseRankCoordinatorContext.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankFeaturePhaseRankCoordinatorContext.java @@ -144,7 +144,8 @@ protected InferenceAction.Request generateRequest(List docFeatures) { docFeatures, Map.of(), InputType.SEARCH, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + 
false ); } diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/BaseInferenceAction.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/BaseInferenceAction.java new file mode 100644 index 0000000000000..e72e68052f648 --- /dev/null +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/BaseInferenceAction.java @@ -0,0 +1,55 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.xpack.inference.rest; + +import org.elasticsearch.action.ActionListener; +import org.elasticsearch.client.internal.node.NodeClient; +import org.elasticsearch.inference.TaskType; +import org.elasticsearch.rest.BaseRestHandler; +import org.elasticsearch.rest.RestChannel; +import org.elasticsearch.rest.RestRequest; +import org.elasticsearch.xpack.core.inference.action.InferenceAction; + +import java.io.IOException; + +import static org.elasticsearch.xpack.inference.rest.Paths.INFERENCE_ID; +import static org.elasticsearch.xpack.inference.rest.Paths.TASK_TYPE_OR_INFERENCE_ID; + +abstract class BaseInferenceAction extends BaseRestHandler { + @Override + protected RestChannelConsumer prepareRequest(RestRequest restRequest, NodeClient client) throws IOException { + String inferenceEntityId; + TaskType taskType; + if (restRequest.hasParam(INFERENCE_ID)) { + inferenceEntityId = restRequest.param(INFERENCE_ID); + taskType = TaskType.fromStringOrStatusException(restRequest.param(TASK_TYPE_OR_INFERENCE_ID)); + } else { + inferenceEntityId = restRequest.param(TASK_TYPE_OR_INFERENCE_ID); + taskType = TaskType.ANY; + } + + InferenceAction.Request.Builder requestBuilder; + try (var parser = restRequest.contentParser()) { + requestBuilder = InferenceAction.Request.parseRequest(inferenceEntityId, taskType, parser); + } + + var inferTimeout = restRequest.paramAsTime( + InferenceAction.Request.TIMEOUT.getPreferredName(), + InferenceAction.Request.DEFAULT_TIMEOUT + ); + requestBuilder.setInferenceTimeout(inferTimeout); + var request = prepareInferenceRequest(requestBuilder); + return channel -> client.execute(InferenceAction.INSTANCE, request, listener(channel)); + } + + protected InferenceAction.Request prepareInferenceRequest(InferenceAction.Request.Builder builder) { + return builder.build(); + } + + protected abstract ActionListener listener(RestChannel channel); +} diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/Paths.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/Paths.java index e33931f3d2f8d..9f64b58e48b55 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/Paths.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/Paths.java @@ -15,6 +15,13 @@ public final class Paths { static final String TASK_TYPE_INFERENCE_ID_PATH = "_inference/{" + TASK_TYPE_OR_INFERENCE_ID + "}/{" + INFERENCE_ID + "}"; static final String INFERENCE_DIAGNOSTICS_PATH = "_inference/.diagnostics"; + static final String STREAM_INFERENCE_ID_PATH = "_inference/{" + TASK_TYPE_OR_INFERENCE_ID + "}/_stream"; + static final String STREAM_TASK_TYPE_INFERENCE_ID_PATH = "_inference/{" + + TASK_TYPE_OR_INFERENCE_ID + + "}/{" + + INFERENCE_ID + + "}/_stream"; + private Paths() { } diff --git 
a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestInferenceAction.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestInferenceAction.java index f5c30d0a94c54..0fbc2f8214cbb 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestInferenceAction.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestInferenceAction.java @@ -7,26 +7,21 @@ package org.elasticsearch.xpack.inference.rest; -import org.elasticsearch.client.internal.node.NodeClient; -import org.elasticsearch.inference.TaskType; -import org.elasticsearch.rest.BaseRestHandler; -import org.elasticsearch.rest.RestRequest; +import org.elasticsearch.action.ActionListener; +import org.elasticsearch.rest.RestChannel; import org.elasticsearch.rest.Scope; import org.elasticsearch.rest.ServerlessScope; import org.elasticsearch.rest.action.RestChunkedToXContentListener; import org.elasticsearch.xpack.core.inference.action.InferenceAction; -import java.io.IOException; import java.util.List; import static org.elasticsearch.rest.RestRequest.Method.POST; -import static org.elasticsearch.xpack.inference.rest.Paths.INFERENCE_ID; import static org.elasticsearch.xpack.inference.rest.Paths.INFERENCE_ID_PATH; import static org.elasticsearch.xpack.inference.rest.Paths.TASK_TYPE_INFERENCE_ID_PATH; -import static org.elasticsearch.xpack.inference.rest.Paths.TASK_TYPE_OR_INFERENCE_ID; @ServerlessScope(Scope.PUBLIC) -public class RestInferenceAction extends BaseRestHandler { +public class RestInferenceAction extends BaseInferenceAction { @Override public String getName() { return "inference_action"; @@ -38,27 +33,7 @@ public List routes() { } @Override - protected RestChannelConsumer prepareRequest(RestRequest restRequest, NodeClient client) throws IOException { - String inferenceEntityId; - TaskType taskType; - if (restRequest.hasParam(INFERENCE_ID)) { - inferenceEntityId = restRequest.param(INFERENCE_ID); - taskType = TaskType.fromStringOrStatusException(restRequest.param(TASK_TYPE_OR_INFERENCE_ID)); - } else { - inferenceEntityId = restRequest.param(TASK_TYPE_OR_INFERENCE_ID); - taskType = TaskType.ANY; - } - - InferenceAction.Request.Builder requestBuilder; - try (var parser = restRequest.contentParser()) { - requestBuilder = InferenceAction.Request.parseRequest(inferenceEntityId, taskType, parser); - } - - var inferTimeout = restRequest.paramAsTime( - InferenceAction.Request.TIMEOUT.getPreferredName(), - InferenceAction.Request.DEFAULT_TIMEOUT - ); - requestBuilder.setInferenceTimeout(inferTimeout); - return channel -> client.execute(InferenceAction.INSTANCE, requestBuilder.build(), new RestChunkedToXContentListener<>(channel)); + protected ActionListener listener(RestChannel channel) { + return new RestChunkedToXContentListener<>(channel); } } diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceAction.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceAction.java new file mode 100644 index 0000000000000..875c288da52bd --- /dev/null +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceAction.java @@ -0,0 +1,43 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. 
Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.xpack.inference.rest; + +import org.elasticsearch.action.ActionListener; +import org.elasticsearch.rest.RestChannel; +import org.elasticsearch.rest.Scope; +import org.elasticsearch.rest.ServerlessScope; +import org.elasticsearch.xpack.core.inference.action.InferenceAction; + +import java.util.List; + +import static org.elasticsearch.rest.RestRequest.Method.POST; +import static org.elasticsearch.xpack.inference.rest.Paths.STREAM_INFERENCE_ID_PATH; +import static org.elasticsearch.xpack.inference.rest.Paths.STREAM_TASK_TYPE_INFERENCE_ID_PATH; + +@ServerlessScope(Scope.PUBLIC) +public class RestStreamInferenceAction extends BaseInferenceAction { + @Override + public String getName() { + return "stream_inference_action"; + } + + @Override + public List routes() { + return List.of(new Route(POST, STREAM_INFERENCE_ID_PATH), new Route(POST, STREAM_TASK_TYPE_INFERENCE_ID_PATH)); + } + + @Override + protected InferenceAction.Request prepareInferenceRequest(InferenceAction.Request.Builder builder) { + return builder.setStream(true).build(); + } + + @Override + protected ActionListener listener(RestChannel channel) { + return new ServerSentEventsRestActionListener(channel); + } +} diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankTests.java index a26dc50097cf5..a042fca44fdb5 100644 --- a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankTests.java +++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityRankTests.java @@ -92,7 +92,8 @@ protected InferenceAction.Request generateRequest(List docFeatures) { docFeatures, Map.of("inferenceResultCount", inferenceResultCount), InputType.SEARCH, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); } }; diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityTestPlugin.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityTestPlugin.java index 6d0c15d5c0bfe..120527f489549 100644 --- a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityTestPlugin.java +++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rank/textsimilarity/TextSimilarityTestPlugin.java @@ -312,7 +312,8 @@ protected InferenceAction.Request generateRequest(List docFeatures) { docFeatures, Map.of("throwing", true), InputType.SEARCH, - InferenceAction.Request.DEFAULT_TIMEOUT + InferenceAction.Request.DEFAULT_TIMEOUT, + false ); } }; diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/BaseInferenceActionTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/BaseInferenceActionTests.java new file mode 100644 index 0000000000000..05a8d52be5df4 --- /dev/null +++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/BaseInferenceActionTests.java @@ -0,0 +1,107 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. 
Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.xpack.inference.rest; + +import org.apache.lucene.util.SetOnce; +import org.elasticsearch.action.ActionListener; +import org.elasticsearch.common.bytes.BytesArray; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.rest.RestChannel; +import org.elasticsearch.rest.RestRequest; +import org.elasticsearch.rest.action.RestChunkedToXContentListener; +import org.elasticsearch.test.rest.FakeRestRequest; +import org.elasticsearch.test.rest.RestActionTestCase; +import org.elasticsearch.xcontent.XContentType; +import org.elasticsearch.xpack.core.inference.action.InferenceAction; +import org.elasticsearch.xpack.core.inference.results.InferenceTextEmbeddingByteResults; +import org.junit.Before; + +import java.util.HashMap; +import java.util.List; +import java.util.Map; + +import static org.elasticsearch.rest.RestRequest.Method.POST; +import static org.hamcrest.CoreMatchers.is; +import static org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.instanceOf; + +public class BaseInferenceActionTests extends RestActionTestCase { + + @Before + public void setUpAction() { + controller().registerHandler(new BaseInferenceAction() { + @Override + protected ActionListener listener(RestChannel channel) { + return new RestChunkedToXContentListener<>(channel); + } + + @Override + public String getName() { + return "base_inference_action"; + } + + @Override + public List routes() { + return List.of(new Route(POST, route("{task_type_or_id}"))); + } + }); + } + + private static String route(String param) { + return "_route/" + param; + } + + public void testUsesDefaultTimeout() { + SetOnce executeCalled = new SetOnce<>(); + verifyingClient.setExecuteVerifier(((actionType, actionRequest) -> { + assertThat(actionRequest, instanceOf(InferenceAction.Request.class)); + + var request = (InferenceAction.Request) actionRequest; + assertThat(request.getInferenceTimeout(), is(InferenceAction.Request.DEFAULT_TIMEOUT)); + + executeCalled.set(true); + return createResponse(); + })); + + RestRequest inferenceRequest = new FakeRestRequest.Builder(xContentRegistry()).withMethod(RestRequest.Method.POST) + .withPath(route("test")) + .withContent(new BytesArray("{}"), XContentType.JSON) + .build(); + dispatchRequest(inferenceRequest); + assertThat(executeCalled.get(), equalTo(true)); + } + + public void testUses3SecondTimeoutFromParams() { + SetOnce executeCalled = new SetOnce<>(); + verifyingClient.setExecuteVerifier(((actionType, actionRequest) -> { + assertThat(actionRequest, instanceOf(InferenceAction.Request.class)); + + var request = (InferenceAction.Request) actionRequest; + assertThat(request.getInferenceTimeout(), is(TimeValue.timeValueSeconds(3))); + + executeCalled.set(true); + return createResponse(); + })); + + RestRequest inferenceRequest = new FakeRestRequest.Builder(xContentRegistry()).withMethod(RestRequest.Method.POST) + .withPath(route("test")) + .withParams(new HashMap<>(Map.of("timeout", "3s"))) + .withContent(new BytesArray("{}"), XContentType.JSON) + .build(); + dispatchRequest(inferenceRequest); + assertThat(executeCalled.get(), equalTo(true)); + } + + static InferenceAction.Response createResponse() { + return new InferenceAction.Response( + new InferenceTextEmbeddingByteResults( + List.of(new InferenceTextEmbeddingByteResults.InferenceByteEmbedding(new byte[] { (byte) -1 })) + ) + ); + } +} diff --git 
a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestInferenceActionTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestInferenceActionTests.java index 48e5d54a62733..1b0df1b4a20da 100644 --- a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestInferenceActionTests.java +++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestInferenceActionTests.java @@ -9,19 +9,14 @@ import org.apache.lucene.util.SetOnce; import org.elasticsearch.common.bytes.BytesArray; -import org.elasticsearch.core.TimeValue; import org.elasticsearch.rest.RestRequest; import org.elasticsearch.test.rest.FakeRestRequest; import org.elasticsearch.test.rest.RestActionTestCase; import org.elasticsearch.xcontent.XContentType; import org.elasticsearch.xpack.core.inference.action.InferenceAction; -import org.elasticsearch.xpack.core.inference.results.InferenceTextEmbeddingByteResults; import org.junit.Before; -import java.util.HashMap; -import java.util.List; -import java.util.Map; - +import static org.elasticsearch.xpack.inference.rest.BaseInferenceActionTests.createResponse; import static org.hamcrest.CoreMatchers.is; import static org.hamcrest.Matchers.equalTo; import static org.hamcrest.Matchers.instanceOf; @@ -33,13 +28,13 @@ public void setUpAction() { controller().registerHandler(new RestInferenceAction()); } - public void testUsesDefaultTimeout() { + public void testStreamIsFalse() { SetOnce executeCalled = new SetOnce<>(); verifyingClient.setExecuteVerifier(((actionType, actionRequest) -> { assertThat(actionRequest, instanceOf(InferenceAction.Request.class)); var request = (InferenceAction.Request) actionRequest; - assertThat(request.getInferenceTimeout(), is(InferenceAction.Request.DEFAULT_TIMEOUT)); + assertThat(request.isStreaming(), is(false)); executeCalled.set(true); return createResponse(); @@ -52,33 +47,4 @@ public void testUsesDefaultTimeout() { dispatchRequest(inferenceRequest); assertThat(executeCalled.get(), equalTo(true)); } - - public void testUses3SecondTimeoutFromParams() { - SetOnce executeCalled = new SetOnce<>(); - verifyingClient.setExecuteVerifier(((actionType, actionRequest) -> { - assertThat(actionRequest, instanceOf(InferenceAction.Request.class)); - - var request = (InferenceAction.Request) actionRequest; - assertThat(request.getInferenceTimeout(), is(TimeValue.timeValueSeconds(3))); - - executeCalled.set(true); - return createResponse(); - })); - - RestRequest inferenceRequest = new FakeRestRequest.Builder(xContentRegistry()).withMethod(RestRequest.Method.POST) - .withPath("_inference/test") - .withParams(new HashMap<>(Map.of("timeout", "3s"))) - .withContent(new BytesArray("{}"), XContentType.JSON) - .build(); - dispatchRequest(inferenceRequest); - assertThat(executeCalled.get(), equalTo(true)); - } - - private static InferenceAction.Response createResponse() { - return new InferenceAction.Response( - new InferenceTextEmbeddingByteResults( - List.of(new InferenceTextEmbeddingByteResults.InferenceByteEmbedding(new byte[] { (byte) -1 })) - ) - ); - } } diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceActionTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceActionTests.java new file mode 100644 index 0000000000000..b999e2c9b72f0 --- /dev/null +++ 
b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/rest/RestStreamInferenceActionTests.java @@ -0,0 +1,50 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.xpack.inference.rest; + +import org.apache.lucene.util.SetOnce; +import org.elasticsearch.common.bytes.BytesArray; +import org.elasticsearch.rest.RestRequest; +import org.elasticsearch.test.rest.FakeRestRequest; +import org.elasticsearch.test.rest.RestActionTestCase; +import org.elasticsearch.xcontent.XContentType; +import org.elasticsearch.xpack.core.inference.action.InferenceAction; +import org.junit.Before; + +import static org.elasticsearch.xpack.inference.rest.BaseInferenceActionTests.createResponse; +import static org.hamcrest.CoreMatchers.is; +import static org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.instanceOf; + +public class RestStreamInferenceActionTests extends RestActionTestCase { + + @Before + public void setUpAction() { + controller().registerHandler(new RestStreamInferenceAction()); + } + + public void testStreamIsTrue() { + SetOnce executeCalled = new SetOnce<>(); + verifyingClient.setExecuteVerifier(((actionType, actionRequest) -> { + assertThat(actionRequest, instanceOf(InferenceAction.Request.class)); + + var request = (InferenceAction.Request) actionRequest; + assertThat(request.isStreaming(), is(true)); + + executeCalled.set(true); + return createResponse(); + })); + + RestRequest inferenceRequest = new FakeRestRequest.Builder(xContentRegistry()).withMethod(RestRequest.Method.POST) + .withPath("_inference/test/_stream") + .withContent(new BytesArray("{}"), XContentType.JSON) + .build(); + dispatchRequest(inferenceRequest); + assertThat(executeCalled.get(), equalTo(true)); + } +} diff --git a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportCoordinatedInferenceAction.java b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportCoordinatedInferenceAction.java index fd13e3de4e6cd..ab5a9d43fd6d1 100644 --- a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportCoordinatedInferenceAction.java +++ b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/action/TransportCoordinatedInferenceAction.java @@ -126,7 +126,8 @@ private void doInferenceServiceModel(CoordinatedInferenceAction.Request request, request.getInputs(), request.getTaskSettings(), inputType, - request.getInferenceTimeout() + request.getInferenceTimeout(), + false ), listener.delegateFailureAndWrap((l, r) -> l.onResponse(translateInferenceServiceResponse(r.getResults()))) ); From 93236f9dedb5a3715ff39f34838de27b3bd72d2a Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Tue, 24 Sep 2024 14:41:33 +1000 Subject: [PATCH 14/28] Mute org.elasticsearch.index.mapper.extras.TokenCountFieldMapperTests testBlockLoaderFromRowStrideReaderWithSyntheticSource #113427 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 2a2f8071482d8..05e0b9862625e 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -304,6 +304,9 @@ tests: - class: org.elasticsearch.xpack.esql.EsqlAsyncSecurityIT method: testLimitedPrivilege issue: https://github.com/elastic/elasticsearch/issues/113419 +- class: 
org.elasticsearch.index.mapper.extras.TokenCountFieldMapperTests + method: testBlockLoaderFromRowStrideReaderWithSyntheticSource + issue: https://github.com/elastic/elasticsearch/issues/113427 # Examples: # From 97fcfa0854d49749de1fae18a068255d5feb69b7 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Tue, 24 Sep 2024 14:49:01 +1000 Subject: [PATCH 15/28] Mute org.elasticsearch.xpack.esql.ccq.MultiClusterSpecIT test {categorize.Categorize} #113428 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 05e0b9862625e..8ef4dd355a55b 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -307,6 +307,9 @@ tests: - class: org.elasticsearch.index.mapper.extras.TokenCountFieldMapperTests method: testBlockLoaderFromRowStrideReaderWithSyntheticSource issue: https://github.com/elastic/elasticsearch/issues/113427 +- class: org.elasticsearch.xpack.esql.ccq.MultiClusterSpecIT + method: test {categorize.Categorize} + issue: https://github.com/elastic/elasticsearch/issues/113428 # Examples: # From d9e0cbeb59638cb7476942b4cb4b9ea857a6703e Mon Sep 17 00:00:00 2001 From: Ignacio Vera Date: Tue, 24 Sep 2024 07:08:47 +0200 Subject: [PATCH 16/28] Small performance improvement in h3 library (#113385) Changing some FDIV's into FMUL's leads to performance improvements --- docs/changelog/113385.yaml | 5 +++ .../java/org/elasticsearch/h3/Constants.java | 7 +++- .../java/org/elasticsearch/h3/CoordIJK.java | 11 +++-- .../java/org/elasticsearch/h3/FastMath.java | 41 +++++++++++-------- .../main/java/org/elasticsearch/h3/Vec2d.java | 23 ++++++----- .../main/java/org/elasticsearch/h3/Vec3d.java | 2 +- 6 files changed, 57 insertions(+), 32 deletions(-) create mode 100644 docs/changelog/113385.yaml diff --git a/docs/changelog/113385.yaml b/docs/changelog/113385.yaml new file mode 100644 index 0000000000000..9cee1ebcd4f64 --- /dev/null +++ b/docs/changelog/113385.yaml @@ -0,0 +1,5 @@ +pr: 113385 +summary: Small performance improvement in h3 library +area: Geo +type: enhancement +issues: [] diff --git a/libs/h3/src/main/java/org/elasticsearch/h3/Constants.java b/libs/h3/src/main/java/org/elasticsearch/h3/Constants.java index 5192fe836e73d..570052700615f 100644 --- a/libs/h3/src/main/java/org/elasticsearch/h3/Constants.java +++ b/libs/h3/src/main/java/org/elasticsearch/h3/Constants.java @@ -33,7 +33,7 @@ final class Constants { /** * 2.0 * PI */ - public static final double M_2PI = 6.28318530717958647692528676655900576839433; + public static final double M_2PI = 2.0 * Math.PI; /** * max H3 resolution; H3 version 1 has 16 resolutions, numbered 0 through 15 */ @@ -58,6 +58,11 @@ final class Constants { * square root of 7 */ public static final double M_SQRT7 = 2.6457513110645905905016157536392604257102; + + /** + * 1 / square root of 7 + */ + public static final double M_RSQRT7 = 1.0 / M_SQRT7; /** * scaling factor from hex2d resolution 0 unit length * (or distance between adjacent cell center points diff --git a/libs/h3/src/main/java/org/elasticsearch/h3/CoordIJK.java b/libs/h3/src/main/java/org/elasticsearch/h3/CoordIJK.java index e57f681fc2eae..8aae7583ef04e 100644 --- a/libs/h3/src/main/java/org/elasticsearch/h3/CoordIJK.java +++ b/libs/h3/src/main/java/org/elasticsearch/h3/CoordIJK.java @@ -39,6 +39,9 @@ */ final class CoordIJK { + /** one seventh (1/7) **/ + private static final double M_ONESEVENTH = 1.0 / 7.0; + /** CoordIJK unit vectors corresponding to the 7 H3 digits. 
*/ private static final int[][] UNIT_VECS = { @@ -281,8 +284,8 @@ public void neighbor(int digit) { public void upAp7r() { final int i = Math.subtractExact(this.i, this.k); final int j = Math.subtractExact(this.j, this.k); - this.i = (int) Math.round((Math.addExact(Math.multiplyExact(2, i), j)) / 7.0); - this.j = (int) Math.round((Math.subtractExact(Math.multiplyExact(3, j), i)) / 7.0); + this.i = (int) Math.round((Math.addExact(Math.multiplyExact(2, i), j)) * M_ONESEVENTH); + this.j = (int) Math.round((Math.subtractExact(Math.multiplyExact(3, j), i)) * M_ONESEVENTH); this.k = 0; ijkNormalize(); } @@ -295,8 +298,8 @@ public void upAp7r() { public void upAp7() { final int i = Math.subtractExact(this.i, this.k); final int j = Math.subtractExact(this.j, this.k); - this.i = (int) Math.round((Math.subtractExact(Math.multiplyExact(3, i), j)) / 7.0); - this.j = (int) Math.round((Math.addExact(Math.multiplyExact(2, j), i)) / 7.0); + this.i = (int) Math.round((Math.subtractExact(Math.multiplyExact(3, i), j)) * M_ONESEVENTH); + this.j = (int) Math.round((Math.addExact(Math.multiplyExact(2, j), i)) * M_ONESEVENTH); this.k = 0; ijkNormalize(); } diff --git a/libs/h3/src/main/java/org/elasticsearch/h3/FastMath.java b/libs/h3/src/main/java/org/elasticsearch/h3/FastMath.java index 61d767901ae0c..760fa75535487 100644 --- a/libs/h3/src/main/java/org/elasticsearch/h3/FastMath.java +++ b/libs/h3/src/main/java/org/elasticsearch/h3/FastMath.java @@ -102,6 +102,15 @@ final class FastMath { private static final int MIN_DOUBLE_EXPONENT = -1074; private static final int MAX_DOUBLE_EXPONENT = 1023; + /** + * PI / 2.0 + */ + private static final double M_HALF_PI = Math.PI * 0.5; + /** + * PI / 4.0 + */ + private static final double M_QUARTER_PI = Math.PI * 0.25; + // -------------------------------------------------------------------------- // CONSTANTS FOR NORMALIZATIONS // -------------------------------------------------------------------------- @@ -335,7 +344,7 @@ public static double cos(double angle) { // Faster than using normalizeZeroTwoPi. angle = remainderTwoPi(angle); if (angle < 0.0) { - angle += 2 * Math.PI; + angle += Constants.M_2PI; } } // index: possibly outside tables range. @@ -366,7 +375,7 @@ public static double sin(double angle) { // Faster than using normalizeZeroTwoPi. angle = remainderTwoPi(angle); if (angle < 0.0) { - angle += 2 * Math.PI; + angle += Constants.M_2PI; } } int index = (int) (angle * SIN_COS_INDEXER + 0.5); @@ -387,9 +396,9 @@ public static double tan(double angle) { if (Math.abs(angle) > TAN_MAX_VALUE_FOR_INT_MODULO) { // Faster than using normalizeMinusHalfPiHalfPi. angle = remainderTwoPi(angle); - if (angle < -Math.PI / 2) { + if (angle < -M_HALF_PI) { angle += Math.PI; - } else if (angle > Math.PI / 2) { + } else if (angle > M_HALF_PI) { angle -= Math.PI; } } @@ -428,7 +437,7 @@ public static double tan(double angle) { * @return Value arccosine, in radians, in [0,PI]. */ public static double acos(double value) { - return Math.PI / 2 - FastMath.asin(value); + return M_HALF_PI - FastMath.asin(value); } /** @@ -468,7 +477,7 @@ public static double asin(double value) { return negateResult ? -result : result; } else { // value >= 1.0, or value is NaN if (value == 1.0) { - return negateResult ? -Math.PI / 2 : Math.PI / 2; + return negateResult ? -M_HALF_PI : M_HALF_PI; } else { return Double.NaN; } @@ -490,7 +499,7 @@ public static double atan(double value) { } if (value == 1.0) { // We want "exact" result for 1.0. - return negateResult ? 
-Math.PI / 4 : Math.PI / 4; + return negateResult ? -M_QUARTER_PI : M_QUARTER_PI; } else if (value <= ATAN_MAX_VALUE_FOR_TABS) { int index = (int) (value * ATAN_INDEXER + 0.5); double delta = value - index * ATAN_DELTA; @@ -511,7 +520,7 @@ public static double atan(double value) { if (Double.isNaN(value)) { return Double.NaN; } else { - return negateResult ? -Math.PI / 2 : Math.PI / 2; + return negateResult ? -M_HALF_PI : M_HALF_PI; } } } @@ -532,9 +541,9 @@ public static double atan2(double y, double x) { } if (x == Double.POSITIVE_INFINITY) { if (y == Double.POSITIVE_INFINITY) { - return Math.PI / 4; + return M_QUARTER_PI; } else if (y == Double.NEGATIVE_INFINITY) { - return -Math.PI / 4; + return -M_QUARTER_PI; } else if (y > 0.0) { return 0.0; } else if (y < 0.0) { @@ -551,9 +560,9 @@ public static double atan2(double y, double x) { } if (x == Double.NEGATIVE_INFINITY) { if (y == Double.POSITIVE_INFINITY) { - return 3 * Math.PI / 4; + return 3 * M_QUARTER_PI; } else if (y == Double.NEGATIVE_INFINITY) { - return -3 * Math.PI / 4; + return -3 * M_QUARTER_PI; } else if (y > 0.0) { return Math.PI; } else if (y < 0.0) { @@ -562,9 +571,9 @@ public static double atan2(double y, double x) { return Double.NaN; } } else if (y > 0.0) { - return Math.PI / 2 + FastMath.atan(-x / y); + return M_HALF_PI + FastMath.atan(-x / y); } else if (y < 0.0) { - return -Math.PI / 2 - FastMath.atan(x / y); + return -M_HALF_PI - FastMath.atan(x / y); } else { return Double.NaN; } @@ -577,9 +586,9 @@ public static double atan2(double y, double x) { } } if (y > 0.0) { - return Math.PI / 2; + return M_HALF_PI; } else if (y < 0.0) { - return -Math.PI / 2; + return -M_HALF_PI; } else { return Double.NaN; } diff --git a/libs/h3/src/main/java/org/elasticsearch/h3/Vec2d.java b/libs/h3/src/main/java/org/elasticsearch/h3/Vec2d.java index 12ce728a99967..b0c2627a5f398 100644 --- a/libs/h3/src/main/java/org/elasticsearch/h3/Vec2d.java +++ b/libs/h3/src/main/java/org/elasticsearch/h3/Vec2d.java @@ -29,8 +29,11 @@ */ final class Vec2d { - /** sin(60') */ - private static final double M_SIN60 = Constants.M_SQRT3_2; + /** 1/sin(60') **/ + private static final double M_RSIN60 = 1.0 / Constants.M_SQRT3_2; + + /** one third **/ + private static final double M_ONETHIRD = 1.0 / 3.0; private static final double VEC2D_RESOLUTION = 1e-7; @@ -133,14 +136,14 @@ static LatLng hex2dToGeo(double x, double y, int face, int res, boolean substrat // scale for current resolution length u for (int i = 0; i < res; i++) { - r /= Constants.M_SQRT7; + r *= Constants.M_RSQRT7; } // scale accordingly if this is a substrate grid if (substrate) { r /= 3.0; if (H3Index.isResolutionClassIII(res)) { - r /= Constants.M_SQRT7; + r *= Constants.M_RSQRT7; } } @@ -181,8 +184,8 @@ static CoordIJK hex2dToCoordIJK(double x, double y) { a2 = Math.abs(y); // first do a reverse conversion - x2 = a2 / M_SIN60; - x1 = a1 + x2 / 2.0; + x2 = a2 * M_RSIN60; + x1 = a1 + x2 * 0.5; // check if we have the center of a hex m1 = (int) x1; @@ -193,8 +196,8 @@ static CoordIJK hex2dToCoordIJK(double x, double y) { r2 = x2 - m2; if (r1 < 0.5) { - if (r1 < 1.0 / 3.0) { - if (r2 < (1.0 + r1) / 2.0) { + if (r1 < M_ONETHIRD) { + if (r2 < (1.0 + r1) * 0.5) { i = m1; j = m2; } else { @@ -215,7 +218,7 @@ static CoordIJK hex2dToCoordIJK(double x, double y) { } } } else { - if (r1 < 2.0 / 3.0) { + if (r1 < 2.0 * M_ONETHIRD) { if (r2 < (1.0 - r1)) { j = m2; } else { @@ -228,7 +231,7 @@ static CoordIJK hex2dToCoordIJK(double x, double y) { i = Math.incrementExact(m1); } } else { - if (r2 < (r1 
/ 2.0)) { + if (r2 < (r1 * 0.5)) { i = Math.incrementExact(m1); j = m2; } else { diff --git a/libs/h3/src/main/java/org/elasticsearch/h3/Vec3d.java b/libs/h3/src/main/java/org/elasticsearch/h3/Vec3d.java index c5c4f8975597c..5973af4b51f6f 100644 --- a/libs/h3/src/main/java/org/elasticsearch/h3/Vec3d.java +++ b/libs/h3/src/main/java/org/elasticsearch/h3/Vec3d.java @@ -96,7 +96,7 @@ static long geoToH3(int res, double lat, double lon) { } } // cos(r) = 1 - 2 * sin^2(r/2) = 1 - 2 * (sqd / 4) = 1 - sqd/2 - double r = FastMath.acos(1 - sqd / 2); + double r = FastMath.acos(1 - sqd * 0.5); if (r < Constants.EPSILON) { return FaceIJK.faceIjkToH3(res, face, new CoordIJK(0, 0, 0)); From 3b5572da715b4af00c505c1e44b1e43abece27de Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Tue, 24 Sep 2024 15:28:32 +1000 Subject: [PATCH 17/28] Mute org.elasticsearch.xpack.inference.InferenceCrudIT testSupportedStream #113430 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 8ef4dd355a55b..502f703eb7630 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -310,6 +310,9 @@ tests: - class: org.elasticsearch.xpack.esql.ccq.MultiClusterSpecIT method: test {categorize.Categorize} issue: https://github.com/elastic/elasticsearch/issues/113428 +- class: org.elasticsearch.xpack.inference.InferenceCrudIT + method: testSupportedStream + issue: https://github.com/elastic/elasticsearch/issues/113430 # Examples: # From 23299228a3bf773acb56777a17ad36a234c25b9a Mon Sep 17 00:00:00 2001 From: David Kyle Date: Tue, 24 Sep 2024 08:00:12 +0100 Subject: [PATCH 18/28] Update Javadocs about the use of prior System Index Descriptors when updating mappings (#113274) --- .../java/org/elasticsearch/indices/SystemIndexDescriptor.java | 3 +++ 1 file changed, 3 insertions(+) diff --git a/server/src/main/java/org/elasticsearch/indices/SystemIndexDescriptor.java b/server/src/main/java/org/elasticsearch/indices/SystemIndexDescriptor.java index 39119dacf29f1..08148de0591cb 100644 --- a/server/src/main/java/org/elasticsearch/indices/SystemIndexDescriptor.java +++ b/server/src/main/java/org/elasticsearch/indices/SystemIndexDescriptor.java @@ -93,6 +93,9 @@ * *

    The mappings for managed system indices are automatically upgraded when all nodes in the cluster are compatible with the * descriptor's mappings. See {@link SystemIndexMappingUpdateService} for details. + * When the mappings change, add the previous index descriptors with + * {@link SystemIndexDescriptor.Builder#setPriorSystemIndexDescriptors(List)}. In a mixed cluster setting, this enables auto-creation + * of the index with compatible mappings. + * *

    We hope to remove the currently deprecated forms of access to system indices in a future release. A newly added system index with * no backwards-compatibility requirements may opt into our desired behavior by setting isNetNew to true. A "net new system index"

From 7b7dd91f6208251a830b28f2fb24c3ac91414fc1 Mon Sep 17 00:00:00 2001
From: Valeriy Khakhutskyy <1292899+valeriy42@users.noreply.github.com>
Date: Tue, 24 Sep 2024 09:46:42 +0200
Subject: [PATCH 19/28] [ML] Add documentation for post calendar events API (#113188)

This PR updates the documentation for the extension of the POST calendar
events API implemented in #112837.
---
 .../apis/post-calendar-event.asciidoc | 64 ++++++++++++++++++-
 1 file changed, 63 insertions(+), 1 deletion(-)

diff --git a/docs/reference/ml/anomaly-detection/apis/post-calendar-event.asciidoc b/docs/reference/ml/anomaly-detection/apis/post-calendar-event.asciidoc
index 8db1eb1ae84df..46ffeab694fa3 100644
--- a/docs/reference/ml/anomaly-detection/apis/post-calendar-event.asciidoc
+++ b/docs/reference/ml/anomaly-detection/apis/post-calendar-event.asciidoc
@@ -15,7 +15,7 @@ Posts scheduled events in a calendar.
 [[ml-post-calendar-event-prereqs]]
 == {api-prereq-title}
 
-Requires the `manage_ml` cluster privilege. This privilege is included in the 
+Requires the `manage_ml` cluster privilege. This privilege is included in the
 `machine_learning_admin` built-in role.
 
 [[ml-post-calendar-event-desc]]
 == {api-description-title}
@@ -54,6 +54,22 @@ milliseconds since the epoch or ISO 8601 format.
 
 `start_time`:::
 (Required, date) The timestamp for the beginning of the scheduled event in
 milliseconds since the epoch or ISO 8601 format.
+
+`skip_result`:::
+(Optional, Boolean) If `true`, the results during the scheduled event are not created.
+The default value is `true`.
+
+`skip_model_update`:::
+(Optional, Boolean) If `true`, the model is not updated during the scheduled event.
+The default value is `true`.
+
+`force_time_shift`:::
+(Optional, integer) Allows you to shift the time within the anomaly detector
+by a specified number of seconds in a specified direction. This is useful to quickly
+adjust to known Daylight Saving Time (DST) events. For example, to account for a
+one-hour backward time shift during the fall DST event, use a value of `-3600`.
+The parameter is not set by default. The time is shifted once at the beginning of the
+scheduled event. The shift is measured in seconds. 
==== [[ml-post-calendar-event-example]] @@ -82,20 +98,66 @@ The API returns the following results: "description": "event 1", "start_time": 1513641600000, "end_time": 1513728000000, + "skip_result": true, + "skip_model_update": true, "calendar_id": "planned-outages" }, { "description": "event 2", "start_time": 1513814400000, "end_time": 1513900800000, + "skip_result": true, + "skip_model_update": true, "calendar_id": "planned-outages" }, { "description": "event 3", "start_time": 1514160000000, "end_time": 1514246400000, + "skip_result": true, + "skip_model_update": true, "calendar_id": "planned-outages" } ] } ---- + +[source,console] +-------------------------------------------------- +POST _ml/calendars/dst-germany/events +{ + "events" : [ + {"description": "Fall 2024", "start_time": 1729994400000, "end_time": 1730167200000, "skip_result": false, "skip_model_update": false, "force_time_shift": -3600}, + {"description": "Spring 2025", "start_time": 1743296400000, "end_time": 1743469200000, "skip_result": false, "skip_model_update": false, "force_time_shift": 3600} + ] +} +-------------------------------------------------- +// TEST[skip:setup:calendar_dst_addjob] + +The API returns the following results: + +[source,console-result] +---- +{ + "events": [ + { + "description": "Fall 2024", + "start_time": 1729994400000, + "end_time": 1730167200000, + "skip_result": false, + "skip_model_update": false, + "force_time_shift": -3600, + "calendar_id": "dst-germany" + }, + { + "description": "Spring 2025", + "start_time": 1743296400000, + "end_time": 1743469200000, + "skip_result": false, + "skip_model_update": false, + "force_time_shift": 3600, + "calendar_id": "dst-germany" + } + ] +} +---- From 840eecbd77fcb774421ea831753e7444ccfba9d0 Mon Sep 17 00:00:00 2001 From: David Turner Date: Tue, 24 Sep 2024 08:53:55 +0100 Subject: [PATCH 20/28] Make `UpdateSettingsClusterStateUpdateRequest` a record (#113432) No need to extend `IndicesClusterStateUpdateRequest`, this thing can be completely immutable. 
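A sketch of the resulting call-site change (illustration only: the variables
`concreteIndices`, `requestSettings`, `ackTimeout` and `masterNodeTimeout` are
assumed to be in scope, as in `TransportUpdateSettingsAction` below):

[source,java]
----
// Before: a mutable request, configured after construction via chained setters.
final var before = new UpdateSettingsClusterStateUpdateRequest()
    .indices(concreteIndices)
    .settings(requestSettings)
    .setPreserveExisting(false)
    .reopenShards(true)
    .ackTimeout(ackTimeout)
    .masterNodeTimeout(masterNodeTimeout);

// After: an immutable record; every field is fixed at construction time, and
// the two booleans become named enum values, so the API defaults (OVERWRITE,
// REJECT) are spelled out explicitly at each call site.
final var after = new UpdateSettingsClusterStateUpdateRequest(
    masterNodeTimeout,
    ackTimeout,
    requestSettings,
    UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,           // was setPreserveExisting(false)
    UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES, // was reopenShards(true)
    concreteIndices
);
----

The record also supplies `equals`, `hashCode` and `toString` for free, which is
why the handwritten `toString` override disappears in this diff.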
--- .../MetadataUpdateSettingsServiceIT.java | 133 ++++++++++-------- .../put/TransportUpdateSettingsAction.java | 31 ++-- ...dateSettingsClusterStateUpdateRequest.java | 86 +++++------ .../MetadataUpdateSettingsService.java | 4 +- .../upgrades/SystemIndexMigrator.java | 16 ++- ...TransportUpdateSecuritySettingsAction.java | 16 ++- .../TransportUpdateWatcherSettingsAction.java | 12 +- 7 files changed, 166 insertions(+), 132 deletions(-) diff --git a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java index b3b7957801cd7..c1e68040e075b 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java @@ -28,6 +28,7 @@ import java.util.List; import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicReference; +import java.util.function.Function; import static org.hamcrest.Matchers.equalTo; @@ -42,45 +43,58 @@ public void testThatNonDynamicSettingChangesTakeEffect() throws Exception { MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance( MetadataUpdateSettingsService.class ); - UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO); - List indices = new ArrayList<>(); + List indicesList = new ArrayList<>(); for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) { for (IndexService indexService : indicesService) { - indices.add(indexService.index()); + indicesList.add(indexService.index()); } } - request.indices(indices.toArray(Index.EMPTY_ARRAY)); - request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build()); + final var indices = indicesList.toArray(Index.EMPTY_ARRAY); + + final Function requestFactory = + onStaticSetting -> new UpdateSettingsClusterStateUpdateRequest( + TEST_REQUEST_TIMEOUT, + TimeValue.ZERO, + Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build(), + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + onStaticSetting, + indices + ); // First make sure it fails if reopenShards is not set on the request: AtomicBoolean expectedFailureOccurred = new AtomicBoolean(false); - metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - fail("Should have failed updating a non-dynamic setting without reopenShards set to true"); - } + metadataUpdateSettingsService.updateSettings( + requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + fail("Should have failed updating a non-dynamic setting without reopenShards set to true"); + } - @Override - public void onFailure(Exception e) { - expectedFailureOccurred.set(true); + @Override + public void onFailure(Exception e) { + expectedFailureOccurred.set(true); + } } - }); + ); assertBusy(() -> assertThat(expectedFailureOccurred.get(), equalTo(true))); // Now we set reopenShards and expect it to work: - request.reopenShards(true); AtomicBoolean success = new AtomicBoolean(false); - 
metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings( + requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); + @Override + public void onFailure(Exception e) { + fail(e); + } } - }); + ); assertBusy(() -> assertThat(success.get(), equalTo(true))); // Now we look into the IndexShard objects to make sure that the code was actually updated (vs just the setting): @@ -110,16 +124,23 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens() th MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance( MetadataUpdateSettingsService.class ); - UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO); - List indices = new ArrayList<>(); + List indicesList = new ArrayList<>(); for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) { for (IndexService indexService : indicesService) { - indices.add(indexService.index()); + indicesList.add(indexService.index()); } } - request.indices(indices.toArray(Index.EMPTY_ARRAY)); - request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build()); - request.reopenShards(true); + final var indices = indicesList.toArray(Index.EMPTY_ARRAY); + + final Function requestFactory = + settings -> new UpdateSettingsClusterStateUpdateRequest( + TEST_REQUEST_TIMEOUT, + TimeValue.ZERO, + settings.build(), + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES, + indices + ); ClusterService clusterService = internalCluster().getInstance(ClusterService.class); AtomicBoolean shardsUnassigned = new AtomicBoolean(false); @@ -142,47 +163,49 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens() th AtomicBoolean success = new AtomicBoolean(false); // Make the first request, just to set things up: - metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings( + requestFactory.apply(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData")), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); + @Override + public void onFailure(Exception e) { + fail(e); + } } - }); + ); assertBusy(() -> assertThat(success.get(), equalTo(true))); assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true))); assertThat(shardsUnassigned.get(), equalTo(true)); assertBusy(() -> assertThat(hasUnassignedShards(clusterService.state(), indexName), equalTo(false))); - // Same request, except now we'll also set the dynamic "index.max_result_window" setting: - request.settings( - Settings.builder() - .put("index.codec", "FastDecompressionCompressingStoredFieldsData") - .put("index.max_result_window", "1500") - 
.build() - ); success.set(false); expectedSettingsChangeInClusterState.set(false); shardsUnassigned.set(false); expectedSetting.set("index.max_result_window"); expectedSettingValue.set("1500"); // Making this request ought to add this new setting but not unassign the shards: - metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() { - @Override - public void onResponse(AcknowledgedResponse acknowledgedResponse) { - success.set(true); - } + metadataUpdateSettingsService.updateSettings( + // Same request, except now we'll also set the dynamic "index.max_result_window" setting: + requestFactory.apply( + Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").put("index.max_result_window", "1500") + ), + new ActionListener<>() { + @Override + public void onResponse(AcknowledgedResponse acknowledgedResponse) { + success.set(true); + } - @Override - public void onFailure(Exception e) { - fail(e); + @Override + public void onFailure(Exception e) { + fail(e); + } } - }); + ); assertBusy(() -> assertThat(success.get(), equalTo(true))); assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true))); diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java index 1d7c264065d6f..1e7f32641b86f 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java @@ -124,19 +124,24 @@ protected void masterOperation( return; } - UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices( - concreteIndices - ) - .settings(requestSettings) - .setPreserveExisting(request.isPreserveExisting()) - .reopenShards(request.reopen()) - .ackTimeout(request.ackTimeout()) - .masterNodeTimeout(request.masterNodeTimeout()); - - updateSettingsService.updateSettings(clusterStateUpdateRequest, listener.delegateResponse((l, e) -> { - logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e); - l.onFailure(e); - })); + updateSettingsService.updateSettings( + new UpdateSettingsClusterStateUpdateRequest( + request.masterNodeTimeout(), + request.ackTimeout(), + requestSettings, + request.isPreserveExisting() + ? UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE + : UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + request.reopen() + ? 
UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES + : UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + concreteIndices + ), + listener.delegateResponse((l, e) -> { + logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e); + l.onFailure(e); + }) + ); } /** diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java index 42a904c704bf3..fe8573da5fb68 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java @@ -9,70 +9,60 @@ package org.elasticsearch.action.admin.indices.settings.put; -import org.elasticsearch.cluster.ack.IndicesClusterStateUpdateRequest; import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.index.Index; -import java.util.Arrays; +import java.util.Objects; /** * Cluster state update request that allows to update settings for some indices */ -public class UpdateSettingsClusterStateUpdateRequest extends IndicesClusterStateUpdateRequest { - - private Settings settings; - - private boolean preserveExisting = false; - - private boolean reopenShards = false; - - /** - * Returns true iff the settings update should only add but not update settings. If the setting already exists - * it should not be overwritten by this update. The default is false - */ - public boolean isPreserveExisting() { - return preserveExisting; - } +public record UpdateSettingsClusterStateUpdateRequest( + TimeValue masterNodeTimeout, + TimeValue ackTimeout, + Settings settings, + OnExisting onExisting, + OnStaticSetting onStaticSetting, + Index... indices +) { /** - * Returns true if non-dynamic setting updates should go through, by automatically unassigning shards in the same cluster - * state change as the setting update. The shards will be automatically reassigned after the cluster state update is made. The - * default is false. + * Specifies the behaviour of an update-settings action on existing settings. */ - public boolean reopenShards() { - return reopenShards; - } + public enum OnExisting { + /** + * Update all the specified settings, overwriting any settings which already exist. This is the API default. + */ + OVERWRITE, - public UpdateSettingsClusterStateUpdateRequest reopenShards(boolean reopenShards) { - this.reopenShards = reopenShards; - return this; + /** + * Only add new settings, preserving the values of any settings which are already set and ignoring the new values specified in the + * request. + */ + PRESERVE } /** - * Iff set to true this settings update will only add settings not already set on an index. Existing settings remain - * unchanged. + * Specifies the behaviour of an update-settings action which is trying to adjust a non-dynamic setting. */ - public UpdateSettingsClusterStateUpdateRequest setPreserveExisting(boolean preserveExisting) { - this.preserveExisting = preserveExisting; - return this; - } + public enum OnStaticSetting { + /** + * Reject attempts to update non-dynamic settings on open indices. This is the API default. 
+ */ + REJECT, - /** - * Returns the {@link Settings} to update - */ - public Settings settings() { - return settings; - } - - /** - * Sets the {@link Settings} to update - */ - public UpdateSettingsClusterStateUpdateRequest settings(Settings settings) { - this.settings = settings; - return this; + /** + * Automatically close and reopen the shards of any open indices when updating a non-dynamic setting, forcing the shard to + * reinitialize from scratch. + */ + REOPEN_INDICES } - @Override - public String toString() { - return Arrays.toString(indices()) + settings; + public UpdateSettingsClusterStateUpdateRequest { + Objects.requireNonNull(masterNodeTimeout); + Objects.requireNonNull(ackTimeout); + Objects.requireNonNull(settings); + Objects.requireNonNull(indices); } } diff --git a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java index cee3b4c0bdac1..4fcbd4165423b 100644 --- a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java +++ b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java @@ -176,7 +176,7 @@ ClusterState execute(ClusterState currentState) { } final Settings closedSettings = settingsForClosedIndices.build(); final Settings openSettings = settingsForOpenIndices.build(); - final boolean preserveExisting = request.isPreserveExisting(); + final boolean preserveExisting = request.onExisting() == UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE; RoutingTable.Builder routingTableBuilder = null; Metadata.Builder metadataBuilder = Metadata.builder(currentState.metadata()); @@ -199,7 +199,7 @@ ClusterState execute(ClusterState currentState) { } if (skippedSettings.isEmpty() == false && openIndices.isEmpty() == false) { - if (request.reopenShards()) { + if (request.onStaticSetting() == UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES) { // We have non-dynamic settings and open indices. We will unassign all of the shards in these indices so that the new // changed settings are applied when the shards are re-assigned. 
routingTableBuilder = RoutingTable.builder( diff --git a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java index 94b856f7a22fb..a131f63cb75f3 100644 --- a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java +++ b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java @@ -19,6 +19,7 @@ import org.elasticsearch.action.admin.indices.settings.put.UpdateSettingsClusterStateUpdateRequest; import org.elasticsearch.action.support.ActiveShardCount; import org.elasticsearch.action.support.master.AcknowledgedResponse; +import org.elasticsearch.action.support.master.MasterNodeRequest; import org.elasticsearch.action.support.master.ShardsAcknowledgedResponse; import org.elasticsearch.client.internal.Client; import org.elasticsearch.client.internal.ParentTaskAssigningClient; @@ -537,11 +538,18 @@ private CheckedBiConsumer, AcknowledgedResp */ private void setWriteBlock(Index index, boolean readOnlyValue, ActionListener listener) { final Settings readOnlySettings = Settings.builder().put(IndexMetadata.INDEX_BLOCKS_WRITE_SETTING.getKey(), readOnlyValue).build(); - UpdateSettingsClusterStateUpdateRequest updateSettingsRequest = new UpdateSettingsClusterStateUpdateRequest().indices( - new Index[] { index } - ).settings(readOnlySettings).setPreserveExisting(false).ackTimeout(TimeValue.ZERO); - metadataUpdateSettingsService.updateSettings(updateSettingsRequest, listener); + metadataUpdateSettingsService.updateSettings( + new UpdateSettingsClusterStateUpdateRequest( + MasterNodeRequest.INFINITE_MASTER_NODE_TIMEOUT, + TimeValue.ZERO, + readOnlySettings, + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + index + ), + listener + ); } private void reindex(SystemIndexMigrationInfo migrationInfo, ActionListener listener) { diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java index 49f8846c36e1f..b924fe0d983bb 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java @@ -119,8 +119,8 @@ protected void masterOperation( private Optional createUpdateSettingsRequest( String indexName, Settings settingsToUpdate, - TimeValue timeout, - TimeValue masterTimeout, + TimeValue ackTimeout, + TimeValue masterNodeTimeout, ClusterState state ) { if (settingsToUpdate.isEmpty()) { @@ -136,10 +136,14 @@ private Optional createUpdateSettingsRe } return Optional.of( - new UpdateSettingsClusterStateUpdateRequest().indices(new Index[] { writeIndex }) - .settings(settingsToUpdate) - .ackTimeout(timeout) - .masterNodeTimeout(masterTimeout) + new UpdateSettingsClusterStateUpdateRequest( + masterNodeTimeout, + ackTimeout, + settingsToUpdate, + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + writeIndex + ) ); } diff --git a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java 
b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java index 378ee642cf105..0407c2db63ac6 100644 --- a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java +++ b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java @@ -24,7 +24,6 @@ import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.concurrent.EsExecutors; -import org.elasticsearch.index.Index; import org.elasticsearch.injection.guice.Inject; import org.elasticsearch.logging.LogManager; import org.elasticsearch.logging.Logger; @@ -91,9 +90,14 @@ protected void masterOperation( return; } final Settings newSettings = Settings.builder().loadFromMap(request.settings()).build(); - final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices( - new Index[] { watcherIndexMd.getIndex() } - ).settings(newSettings).ackTimeout(request.ackTimeout()).masterNodeTimeout(request.masterNodeTimeout()); + final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest( + request.masterNodeTimeout(), + request.ackTimeout(), + newSettings, + UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE, + UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT, + watcherIndexMd.getIndex() + ); updateSettingsService.updateSettings(clusterStateUpdateRequest, new ActionListener<>() { @Override From 4e5e87037074e7b4a6ccd6b729da477f99aabeae Mon Sep 17 00:00:00 2001 From: Andrei Dan Date: Tue, 24 Sep 2024 11:13:26 +0300 Subject: [PATCH 21/28] Implement `parseBytesRef` for TimeSeriesRoutingHashFieldType (#113373) This implements the `parseBytesRef` method for the `_ts_routing_hash` field so we can parse the values generated by the companion `format` method. We parse the values when fetching them from the source when the field is used as a `sort` paired with `search_after`. 
Before this change, a sort by `_ts_routing_hash` paired with `search_after` would yield an `UnsupportedOperationException`.
---
 docs/changelog/113373.yaml | 6 +++
 .../test/tsdb/25_id_generation.yml | 47 +++++++++++++++++++
 .../index/mapper/MapperFeatures.java | 3 +-
 .../TimeSeriesRoutingHashFieldMapper.java | 9 ++++
 .../search/DocValueFormatTests.java | 13 +++++
 5 files changed, 77 insertions(+), 1 deletion(-)
 create mode 100644 docs/changelog/113373.yaml

diff --git a/docs/changelog/113373.yaml b/docs/changelog/113373.yaml
new file mode 100644
index 0000000000000..cbb3829e03425
--- /dev/null
+++ b/docs/changelog/113373.yaml
@@ -0,0 +1,6 @@
+pr: 113373
+summary: Implement `parseBytesRef` for `TimeSeriesRoutingHashFieldType`
+area: TSDB
+type: bug
+issues:
+ - 112399

diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/tsdb/25_id_generation.yml b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/tsdb/25_id_generation.yml
index 973832cf3ca73..4faa0424adb43 100644
--- a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/tsdb/25_id_generation.yml
+++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/tsdb/25_id_generation.yml
@@ -65,6 +65,9 @@ setup:
 ---
 generates a consistent id:
+  - requires:
+      cluster_features: "tsdb.ts_routing_hash_doc_value_parse_byte_ref"
+      reason: _tsid routing hash doc value parsing has been fixed
   - do:
       bulk:
         refresh: true
@@ -152,6 +155,50 @@ generates a consistent id:
   - match: { hits.hits.8._source.@timestamp: 2021-04-28T18:52:04.467Z }
   - match: { hits.hits.8._source.k8s.pod.uid: 947e4ced-1786-4e53-9e0c-5c447e959507 }
 
+  - do:
+      search:
+        index: id_generation_test
+        body:
+          query:
+            match_all: {}
+          sort: ["@timestamp", "_ts_routing_hash"]
+          _source: true
+          search_after: [ "2021-04-28T18:50:03.142Z", "cn4exQ" ]
+          docvalue_fields: [_ts_routing_hash]
+
+  - match: {hits.total.value: 9}
+
+  - match: { hits.hits.0._id: cZZNs7B9sSWsyrL5AAABeRnRGTM }
+  - match: { hits.hits.0._source.@timestamp: 2021-04-28T18:50:04.467Z }
+  - match: { hits.hits.0._source.k8s.pod.uid: 947e4ced-1786-4e53-9e0c-5c447e959507 }
+
+  - match: { hits.hits.1._id: cn4excfoxSs_KdA5AAABeRnRYiY }
+  - match: { hits.hits.1._source.@timestamp: 2021-04-28T18:50:23.142Z }
+  - match: { hits.hits.1._source.k8s.pod.uid: df3145b3-0563-4d3b-a0f7-897eb2876ea9 }
+
+  - match: { hits.hits.2._id: cZZNs7B9sSWsyrL5AAABeRnRZ1M }
+  - match: { hits.hits.2._source.@timestamp: 2021-04-28T18:50:24.467Z }
+  - match: { hits.hits.2._source.k8s.pod.uid: 947e4ced-1786-4e53-9e0c-5c447e959507 }
+
+  - match: { hits.hits.3._id: cZZNs7B9sSWsyrL5AAABeRnRtXM }
+  - match: { hits.hits.3._source.@timestamp: 2021-04-28T18:50:44.467Z }
+  - match: { hits.hits.3._source.k8s.pod.uid: 947e4ced-1786-4e53-9e0c-5c447e959507 }
+
+  - match: { hits.hits.4._id: cn4excfoxSs_KdA5AAABeRnR11Y }
+  - match: { hits.hits.4._source.@timestamp: 2021-04-28T18:50:53.142Z }
+  - match: { hits.hits.4._source.k8s.pod.uid: df3145b3-0563-4d3b-a0f7-897eb2876ea9 }
+
+  - match: { hits.hits.5._id: cn4excfoxSs_KdA5AAABeRnR_mY }
+  - match: { hits.hits.5._source.@timestamp: 2021-04-28T18:51:03.142Z }
+  - match: { hits.hits.5._source.k8s.pod.uid: df3145b3-0563-4d3b-a0f7-897eb2876ea9 }
+
+  - match: { hits.hits.6._id: cZZNs7B9sSWsyrL5AAABeRnSA5M }
+  - match: { hits.hits.6._source.@timestamp: 2021-04-28T18:51:04.467Z }
+  - match: { hits.hits.6._source.k8s.pod.uid: 947e4ced-1786-4e53-9e0c-5c447e959507 }
+
+  - match: { hits.hits.7._id: cZZNs7B9sSWsyrL5AAABeRnS7fM }
+  - match: { hits.hits.7._source.@timestamp: 2021-04-28T18:52:04.467Z }
+  - match: {
hits.hits.7._source.k8s.pod.uid: 947e4ced-1786-4e53-9e0c-5c447e959507 } --- index a new document on top of an old one: - do: diff --git a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java index d2ca7a24a78fd..ac7d10abc7121 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java @@ -43,7 +43,8 @@ public Set getFeatures() { SourceFieldMapper.SYNTHETIC_SOURCE_COPY_TO_FIX, FlattenedFieldMapper.IGNORE_ABOVE_SUPPORT, IndexSettings.IGNORE_ABOVE_INDEX_LEVEL_SETTING, - SourceFieldMapper.SYNTHETIC_SOURCE_COPY_TO_INSIDE_OBJECTS_FIX + SourceFieldMapper.SYNTHETIC_SOURCE_COPY_TO_INSIDE_OBJECTS_FIX, + TimeSeriesRoutingHashFieldMapper.TS_ROUTING_HASH_FIELD_PARSES_BYTES_REF ); } } diff --git a/server/src/main/java/org/elasticsearch/index/mapper/TimeSeriesRoutingHashFieldMapper.java b/server/src/main/java/org/elasticsearch/index/mapper/TimeSeriesRoutingHashFieldMapper.java index cd0cbfeaaff7f..8b5cb08d09d16 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/TimeSeriesRoutingHashFieldMapper.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/TimeSeriesRoutingHashFieldMapper.java @@ -15,6 +15,7 @@ import org.elasticsearch.common.Strings; import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.util.ByteUtils; +import org.elasticsearch.features.NodeFeature; import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.IndexVersions; import org.elasticsearch.index.fielddata.FieldData; @@ -46,6 +47,7 @@ public class TimeSeriesRoutingHashFieldMapper extends MetadataFieldMapper { public static final TimeSeriesRoutingHashFieldMapper INSTANCE = new TimeSeriesRoutingHashFieldMapper(); public static final TypeParser PARSER = new FixedTypeParser(c -> c.getIndexSettings().getMode().timeSeriesRoutingHashFieldMapper()); + static final NodeFeature TS_ROUTING_HASH_FIELD_PARSES_BYTES_REF = new NodeFeature("tsdb.ts_routing_hash_doc_value_parse_byte_ref"); static final class TimeSeriesRoutingHashFieldType extends MappedFieldType { @@ -65,6 +67,13 @@ public Object format(BytesRef value) { return Uid.decodeId(value.bytes, value.offset, value.length); } + @Override + public BytesRef parseBytesRef(Object value) { + if (value instanceof BytesRef valueAsBytesRef) { + return valueAsBytesRef; + } + return Uid.encodeId(value.toString()); + } }; private TimeSeriesRoutingHashFieldType() { diff --git a/server/src/test/java/org/elasticsearch/search/DocValueFormatTests.java b/server/src/test/java/org/elasticsearch/search/DocValueFormatTests.java index 0a830b598817d..6b42dbbb39c9f 100644 --- a/server/src/test/java/org/elasticsearch/search/DocValueFormatTests.java +++ b/server/src/test/java/org/elasticsearch/search/DocValueFormatTests.java @@ -20,6 +20,7 @@ import org.elasticsearch.common.time.DateFormatter; import org.elasticsearch.index.mapper.DateFieldMapper.Resolution; import org.elasticsearch.index.mapper.TimeSeriesIdFieldMapper.TimeSeriesIdBuilder; +import org.elasticsearch.index.mapper.TimeSeriesRoutingHashFieldMapper; import org.elasticsearch.test.ESTestCase; import java.io.IOException; @@ -33,6 +34,8 @@ import static org.elasticsearch.search.aggregations.bucket.geogrid.GeoTileUtils.longEncode; import static org.hamcrest.Matchers.containsString; import static org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.instanceOf; +import static 
org.hamcrest.Matchers.is; public class DocValueFormatTests extends ESTestCase { @@ -388,4 +391,14 @@ public void testParseTsid() throws IOException { Object tsidBase64 = Base64.getUrlEncoder().withoutPadding().encodeToString(expectedBytes); assertEquals(tsidFormat, tsidBase64); } + + public void testFormatAndParseTsRoutingHash() throws IOException { + BytesRef tsRoutingHashInput = new BytesRef("cn4exQ"); + DocValueFormat docValueFormat = TimeSeriesRoutingHashFieldMapper.INSTANCE.fieldType().docValueFormat(null, ZoneOffset.UTC); + Object formattedValue = docValueFormat.format(tsRoutingHashInput); + // the format method takes BytesRef as input and outputs a String + assertThat(formattedValue, instanceOf(String.class)); + // the parse method will output the BytesRef input + assertThat(docValueFormat.parseBytesRef(formattedValue), is(tsRoutingHashInput)); + } } From 6cdd59bfd80af4e205973e5e053296ace183d4a3 Mon Sep 17 00:00:00 2001 From: Nikolaj Volgushev Date: Tue, 24 Sep 2024 10:22:05 +0200 Subject: [PATCH 22/28] Move expensive role building off transport thread (#113020) This PR moves role building off the transport thread to the generic thread pool, since role building can be expensive depending on role structure. Role building is CPU bound so this PR uses a `ThrottledTaskRunner` to limit the number of concurrent requests. I will explore adding a max queue limit in a follow up. Resolves: ES-9505 --- .../xpack/security/Security.java | 27 ++++ .../authz/store/CompositeRolesStore.java | 80 +++++++++-- .../authz/IndicesAndAliasesResolverTests.java | 2 + .../authz/store/CompositeRolesStoreTests.java | 126 ++++++++++++++++++ 4 files changed, 225 insertions(+), 10 deletions(-) diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/Security.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/Security.java index 7e44d6d8b1c99..79a00fa1293bd 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/Security.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/Security.java @@ -54,12 +54,15 @@ import org.elasticsearch.common.transport.BoundTransportAddress; import org.elasticsearch.common.util.BigArrays; import org.elasticsearch.common.util.PageCacheRecycler; +import org.elasticsearch.common.util.concurrent.AbstractRunnable; import org.elasticsearch.common.util.concurrent.EsExecutors; import org.elasticsearch.common.util.concurrent.ListenableFuture; import org.elasticsearch.common.util.concurrent.ThreadContext; +import org.elasticsearch.common.util.concurrent.ThrottledTaskRunner; import org.elasticsearch.common.util.set.Sets; import org.elasticsearch.core.IOUtils; import org.elasticsearch.core.Nullable; +import org.elasticsearch.core.Releasable; import org.elasticsearch.env.Environment; import org.elasticsearch.env.NodeMetadata; import org.elasticsearch.features.FeatureService; @@ -1036,6 +1039,7 @@ Collection createComponents( serviceAccountService, dlsBitsetCache.get(), restrictedIndices, + buildRoleBuildingExecutor(threadPool, settings), new DeprecationRoleDescriptorConsumer(clusterService, threadPool) ); systemIndices.getMainIndexManager().addStateListener(allRolesStore::onSecurityIndexStateChange); @@ -1267,6 +1271,29 @@ private void submitPersistentMigrationTask(int migrationsVersion, boolean securi ); } + private static Executor buildRoleBuildingExecutor(ThreadPool threadPool, Settings settings) { + final int allocatedProcessors = EsExecutors.allocatedProcessors(settings); + final 
ThrottledTaskRunner throttledTaskRunner = new ThrottledTaskRunner("build_roles", allocatedProcessors, threadPool.generic()); + return r -> throttledTaskRunner.enqueueTask(new ActionListener<>() { + @Override + public void onResponse(Releasable releasable) { + try (releasable) { + r.run(); + } + } + + @Override + public void onFailure(Exception e) { + if (r instanceof AbstractRunnable abstractRunnable) { + abstractRunnable.onFailure(e); + } + // should be impossible, GENERIC pool doesn't reject anything + logger.error("unexpected failure running " + r, e); + assert false : new AssertionError("unexpected failure running " + r, e); + } + }); + } + private AuthorizationEngine getAuthorizationEngine() { return findValueFromExtensions("authorization engine", extension -> extension.getAuthorizationEngine(settings)); } diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStore.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStore.java index d9778fda6e486..d79a3e31c1bc9 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStore.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStore.java @@ -10,6 +10,7 @@ import org.apache.logging.log4j.Logger; import org.elasticsearch.ElasticsearchException; import org.elasticsearch.action.ActionListener; +import org.elasticsearch.action.ActionRunnable; import org.elasticsearch.common.Strings; import org.elasticsearch.common.bytes.BytesReference; import org.elasticsearch.common.cache.Cache; @@ -65,6 +66,7 @@ import java.util.Objects; import java.util.Optional; import java.util.Set; +import java.util.concurrent.Executor; import java.util.concurrent.atomic.AtomicLong; import java.util.function.Consumer; import java.util.stream.Collectors; @@ -91,6 +93,11 @@ public class CompositeRolesStore { Property.NodeScope ); private static final Logger logger = LogManager.getLogger(CompositeRolesStore.class); + /** + * See {@link #shouldForkRoleBuilding(Set)} + */ + private static final int ROLE_DESCRIPTOR_FORK_THRESHOLD = 100; + private static final int INDEX_PRIVILEGE_FORK_THRESHOLD = 1000; private final RoleProviders roleProviders; private final NativePrivilegeStore privilegeStore; @@ -106,6 +113,7 @@ public class CompositeRolesStore { private final Map internalUserRoles; private final RestrictedIndices restrictedIndices; private final ThreadContext threadContext; + private final Executor roleBuildingExecutor; public CompositeRolesStore( Settings settings, @@ -118,6 +126,7 @@ public CompositeRolesStore( ServiceAccountService serviceAccountService, DocumentSubsetBitsetCache dlsBitsetCache, RestrictedIndices restrictedIndices, + Executor roleBuildingExecutor, Consumer> effectiveRoleDescriptorsConsumer ) { this.roleProviders = roleProviders; @@ -179,6 +188,7 @@ public void providersChanged() { ); this.anonymousUser = new AnonymousUser(settings); this.threadContext = threadContext; + this.roleBuildingExecutor = roleBuildingExecutor; } public void getRoles(Authentication authentication, ActionListener> roleActionListener) { @@ -276,14 +286,31 @@ public void buildRoleFromRoleReference(RoleReference roleReference, ActionListen } else if (RolesRetrievalResult.SUPERUSER == rolesRetrievalResult) { roleActionListener.onResponse(superuserRole); } else { - buildThenMaybeCacheRole( - roleKey, - rolesRetrievalResult.getRoleDescriptors(), - 
rolesRetrievalResult.getMissingRoles(), - rolesRetrievalResult.isSuccess(), - invalidationCounter, - ActionListener.wrap(roleActionListener::onResponse, failureHandler) - ); + final ActionListener wrapped = ActionListener.wrap(roleActionListener::onResponse, failureHandler); + if (shouldForkRoleBuilding(rolesRetrievalResult.getRoleDescriptors())) { + roleBuildingExecutor.execute( + ActionRunnable.wrap( + wrapped, + l -> buildThenMaybeCacheRole( + roleKey, + rolesRetrievalResult.getRoleDescriptors(), + rolesRetrievalResult.getMissingRoles(), + rolesRetrievalResult.isSuccess(), + invalidationCounter, + l + ) + ) + ); + } else { + buildThenMaybeCacheRole( + roleKey, + rolesRetrievalResult.getRoleDescriptors(), + rolesRetrievalResult.getMissingRoles(), + rolesRetrievalResult.isSuccess(), + invalidationCounter, + wrapped + ); + } } }, failureHandler)); } else { @@ -291,6 +318,38 @@ public void buildRoleFromRoleReference(RoleReference roleReference, ActionListen } } + /** + * Uses heuristics such as presence of application privileges to determine if role building will be expensive + * and therefore warrants forking. + * Package-private for testing. + */ + boolean shouldForkRoleBuilding(Set roleDescriptors) { + // A role with many role descriptors is likely expensive to build + if (roleDescriptors.size() > ROLE_DESCRIPTOR_FORK_THRESHOLD) { + return true; + } + int totalIndexPrivileges = 0; + int totalRemoteIndexPrivileges = 0; + for (RoleDescriptor roleDescriptor : roleDescriptors) { + // Application privileges can also result in big automata; it's difficult to determine how big application privileges + // are so err on the side of caution + if (roleDescriptor.hasApplicationPrivileges()) { + return true; + } + // Index privilege names or remote index privilege names can result in big and complex automata + totalIndexPrivileges += roleDescriptor.getIndicesPrivileges().length; + totalRemoteIndexPrivileges += roleDescriptor.getRemoteIndicesPrivileges().length; + if (totalIndexPrivileges > INDEX_PRIVILEGE_FORK_THRESHOLD || totalRemoteIndexPrivileges > INDEX_PRIVILEGE_FORK_THRESHOLD) { + return true; + } + // Likewise for FLS/DLS + if (roleDescriptor.isUsingDocumentOrFieldLevelSecurity()) { + return true; + } + } + return false; + } + private static boolean includesSuperuserRole(RoleReference roleReference) { if (roleReference instanceof RoleReference.NamedRoleReference namedRoles) { return Arrays.asList(namedRoles.getRoleNames()).contains(ReservedRolesStore.SUPERUSER_ROLE_DESCRIPTOR.getName()); @@ -313,10 +372,11 @@ private void buildThenMaybeCacheRole( ActionListener listener ) { logger.trace( - "Building role from descriptors [{}] for names [{}] from source [{}]", + "Building role from descriptors [{}] for names [{}] from source [{}] on [{}]", roleDescriptors, roleKey.getNames(), - roleKey.getSource() + roleKey.getSource(), + Thread.currentThread().getName() ); buildRoleFromDescriptors( roleDescriptors, diff --git a/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/IndicesAndAliasesResolverTests.java b/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/IndicesAndAliasesResolverTests.java index 73a5ce8177153..904fb1cff820a 100644 --- a/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/IndicesAndAliasesResolverTests.java +++ b/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/IndicesAndAliasesResolverTests.java @@ -47,6 +47,7 @@ import org.elasticsearch.common.settings.ClusterSettings; import 
org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.time.DateFormatter; +import org.elasticsearch.common.util.concurrent.EsExecutors; import org.elasticsearch.common.util.concurrent.ThreadContext; import org.elasticsearch.core.Tuple; import org.elasticsearch.index.Index; @@ -242,6 +243,7 @@ public void setup() { mock(ServiceAccountService.class), new DocumentSubsetBitsetCache(Settings.EMPTY, mock(ThreadPool.class)), RESTRICTED_INDICES, + EsExecutors.DIRECT_EXECUTOR_SERVICE, rds -> {} ) ); diff --git a/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStoreTests.java b/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStoreTests.java index 1886a945cbf38..9587533d87d86 100644 --- a/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStoreTests.java +++ b/x-pack/plugin/security/src/test/java/org/elasticsearch/xpack/security/authz/store/CompositeRolesStoreTests.java @@ -35,6 +35,8 @@ import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.settings.ClusterSettings; import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.common.util.concurrent.AbstractRunnable; +import org.elasticsearch.common.util.concurrent.EsExecutors; import org.elasticsearch.common.util.concurrent.ThreadContext; import org.elasticsearch.common.util.set.Sets; import org.elasticsearch.common.xcontent.XContentHelper; @@ -112,6 +114,9 @@ import org.hamcrest.Description; import org.hamcrest.Matcher; import org.hamcrest.Matchers; +import org.junit.After; +import org.junit.Before; +import org.mockito.Mockito; import java.io.IOException; import java.time.Clock; @@ -127,6 +132,7 @@ import java.util.Map; import java.util.Set; import java.util.concurrent.ExecutionException; +import java.util.concurrent.Executor; import java.util.concurrent.atomic.AtomicInteger; import java.util.concurrent.atomic.AtomicReference; import java.util.function.BiConsumer; @@ -166,6 +172,7 @@ import static org.mockito.ArgumentMatchers.anyString; import static org.mockito.ArgumentMatchers.eq; import static org.mockito.ArgumentMatchers.isA; +import static org.mockito.Mockito.clearInvocations; import static org.mockito.Mockito.doAnswer; import static org.mockito.Mockito.doCallRealMethod; import static org.mockito.Mockito.mock; @@ -186,6 +193,23 @@ public class CompositeRolesStoreTests extends ESTestCase { TestRestrictedIndices.INTERNAL_SECURITY_MAIN_INDEX_7 ); + private Executor mockRoleBuildingExecutor; + + @Before + public void setup() { + mockRoleBuildingExecutor = mock(Executor.class); + Mockito.doAnswer(invocationOnMock -> { + final AbstractRunnable actionRunnable = (AbstractRunnable) invocationOnMock.getArguments()[0]; + actionRunnable.run(); + return null; + }).when(mockRoleBuildingExecutor).execute(any(Runnable.class)); + } + + @After + public void clear() { + clearInvocations(mockRoleBuildingExecutor); + } + public void testRolesWhenDlsFlsUnlicensed() throws IOException { MockLicenseState licenseState = mock(MockLicenseState.class); when(licenseState.isAllowed(DOCUMENT_LEVEL_SECURITY_FEATURE)).thenReturn(false); @@ -686,6 +710,62 @@ public void testNegativeLookupsCacheDisabled() { verifyNoMoreInteractions(fileRolesStore, reservedRolesStore, nativeRolesStore); } + public void testShouldForkRoleBuilding() { + final CompositeRolesStore compositeRolesStore = new CompositeRolesStore( + SECURITY_ENABLED_SETTINGS, + mock(RoleProviders.class), + 
mock(NativePrivilegeStore.class), + new ThreadContext(SECURITY_ENABLED_SETTINGS), + mock(), + cache, + mock(ApiKeyService.class), + mock(ServiceAccountService.class), + buildBitsetCache(), + TestRestrictedIndices.RESTRICTED_INDICES, + EsExecutors.DIRECT_EXECUTOR_SERVICE, + mock() + ); + + assertFalse(compositeRolesStore.shouldForkRoleBuilding(Set.of())); + assertFalse( + compositeRolesStore.shouldForkRoleBuilding( + Set.of( + randomValueOtherThanMany( + rd -> rd.isUsingDocumentOrFieldLevelSecurity() || rd.hasApplicationPrivileges(), + RoleDescriptorTestHelper::randomRoleDescriptor + ) + ) + ) + ); + + assertTrue(compositeRolesStore.shouldForkRoleBuilding(generateRoleDescriptors(101))); // RD count above threshold + assertTrue( + compositeRolesStore.shouldForkRoleBuilding( + Set.of( + randomValueOtherThanMany( + rd -> false == rd.isUsingDocumentOrFieldLevelSecurity(), + RoleDescriptorTestHelper::randomRoleDescriptor + ) + ) + ) + ); + assertTrue( + compositeRolesStore.shouldForkRoleBuilding( + Set.of( + randomValueOtherThanMany(rd -> false == rd.hasApplicationPrivileges(), RoleDescriptorTestHelper::randomRoleDescriptor) + ) + ) + ); + } + + private static Set generateRoleDescriptors(int numRoleDescriptors) { + Set roleDescriptors = new HashSet<>(); + for (int i = 0; i < numRoleDescriptors; i++) { + roleDescriptors.add(RoleDescriptorTestHelper.randomRoleDescriptor()); + } + return roleDescriptors; + } + public void testNegativeLookupsAreNotCachedWithFailures() { final FileRolesStore fileRolesStore = mock(FileRolesStore.class); doCallRealMethod().when(fileRolesStore).accept(anySet(), anyActionListener()); @@ -715,6 +795,7 @@ public void testNegativeLookupsAreNotCachedWithFailures() { mock(ServiceAccountService.class), documentSubsetBitsetCache, TestRestrictedIndices.RESTRICTED_INDICES, + EsExecutors.DIRECT_EXECUTOR_SERVICE, effectiveRoleDescriptors::set ); verify(fileRolesStore).addListener(anyConsumer()); // adds a listener in ctor @@ -2318,6 +2399,7 @@ public void testGetRoleForWorkflowWithRestriction() { mock(ServiceAccountService.class), buildBitsetCache(), TestRestrictedIndices.RESTRICTED_INDICES, + EsExecutors.DIRECT_EXECUTOR_SERVICE, rds -> {} ); @@ -2431,6 +2513,7 @@ public void testGetRoleForWorkflowWithoutRestriction() { mock(ServiceAccountService.class), buildBitsetCache(), TestRestrictedIndices.RESTRICTED_INDICES, + EsExecutors.DIRECT_EXECUTOR_SERVICE, rds -> {} ); @@ -2868,6 +2951,48 @@ public void testGetRoleDescriptorsListForInternalUsers() { } } + public void testForkOnExpensiveRole() { + final RoleDescriptor expectedRoleDescriptor = randomValueOtherThanMany( + rd -> false == rd.hasApplicationPrivileges(), + // skip workflow restrictions since these can produce empty, nameless roles + () -> RoleDescriptorTestHelper.builder().allowRestriction(false).build() + ); + final Consumer> rolesHandler = callback -> { + callback.onResponse(RoleRetrievalResult.success(Set.of(expectedRoleDescriptor))); + }; + final Consumer>> privilegesHandler = callback -> callback.onResponse( + Collections.emptyList() + ); + final CompositeRolesStore compositeRolesStore = setupRolesStore(rolesHandler, privilegesHandler); + + final PlainActionFuture future = new PlainActionFuture<>(); + getRoleForRoleNames(compositeRolesStore, List.of(expectedRoleDescriptor.getName()), future); + assertThat(future.actionGet().names(), equalTo(new String[] { expectedRoleDescriptor.getName() })); + + verify(mockRoleBuildingExecutor, times(1)).execute(any()); + } + + public void testDoNotForkOnInexpensiveRole() { + final 
RoleDescriptor expectedRoleDescriptor = randomValueOtherThanMany(
+            rd -> rd.isUsingDocumentOrFieldLevelSecurity() || rd.hasApplicationPrivileges(),
+            // skip workflow restrictions since these can produce empty, nameless roles
+            () -> RoleDescriptorTestHelper.builder().allowRestriction(false).build()
+        );
+        final Consumer<ActionListener<RoleRetrievalResult>> rolesHandler = callback -> {
+            callback.onResponse(RoleRetrievalResult.success(Set.of(expectedRoleDescriptor)));
+        };
+        final Consumer<ActionListener<Collection<ApplicationPrivilegeDescriptor>>> privilegesHandler = callback -> callback.onResponse(
+            Collections.emptyList()
+        );
+        final CompositeRolesStore compositeRolesStore = setupRolesStore(rolesHandler, privilegesHandler);
+
+        final PlainActionFuture<Role> future = new PlainActionFuture<>();
+        getRoleForRoleNames(compositeRolesStore, List.of(expectedRoleDescriptor.getName()), future);
+        assertThat(future.actionGet().names(), equalTo(new String[] { expectedRoleDescriptor.getName() }));
+
+        verify(mockRoleBuildingExecutor, never()).execute(any());
+    }
+
     public void testGetRoleDescriptorsListUsesRoleStoreToResolveRoleWithInternalRoleName() {
         String roleName = AuthenticationTestHelper.randomInternalRoleName();
         RoleDescriptor expectedRoleDescriptor = new RoleDescriptor(roleName, null, null, null);
@@ -3024,6 +3149,7 @@ private CompositeRolesStore buildCompositeRolesStore(
             serviceAccountService,
             documentSubsetBitsetCache,
             TestRestrictedIndices.RESTRICTED_INDICES,
+            mockRoleBuildingExecutor,
             roleConsumer
         ) {
             @Override

From ed9a3bf1a401aa235b5bfbca3165d228f76020fb Mon Sep 17 00:00:00 2001
From: David Turner
Date: Tue, 24 Sep 2024 09:29:11 +0100
Subject: [PATCH 23/28] Revert "Make `UpdateSettingsClusterStateUpdateRequest` a record (#113432)"

This reverts commit 840eecbd77fcb774421ea831753e7444ccfba9d0.

---
 .../MetadataUpdateSettingsServiceIT.java      | 133 ++++++++----------
 .../put/TransportUpdateSettingsAction.java    |  31 ++--
 ...dateSettingsClusterStateUpdateRequest.java |  86 ++++++-----
 .../MetadataUpdateSettingsService.java        |   4 +-
 .../upgrades/SystemIndexMigrator.java         |  16 +--
 ...TransportUpdateSecuritySettingsAction.java |  16 +--
 .../TransportUpdateWatcherSettingsAction.java |  12 +-
 7 files changed, 132 insertions(+), 166 deletions(-)

diff --git a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java
index c1e68040e075b..b3b7957801cd7 100644
--- a/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java
+++ b/server/src/internalClusterTest/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsServiceIT.java
@@ -28,7 +28,6 @@
 import java.util.List;
 import java.util.concurrent.atomic.AtomicBoolean;
 import java.util.concurrent.atomic.AtomicReference;
-import java.util.function.Function;

 import static org.hamcrest.Matchers.equalTo;

@@ -43,58 +42,45 @@ public void testThatNonDynamicSettingChangesTakeEffect() throws Exception {
         MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance(
             MetadataUpdateSettingsService.class
         );
-        List<Index> indicesList = new ArrayList<>();
+        UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO);
+        List<Index> indices = new ArrayList<>();
         for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) {
             for (IndexService indexService : indicesService) {
-                indicesList.add(indexService.index());
+                indices.add(indexService.index());
             }
         }
-        final var indices = indicesList.toArray(Index.EMPTY_ARRAY);
-
-        final Function<UpdateSettingsClusterStateUpdateRequest.OnStaticSetting, UpdateSettingsClusterStateUpdateRequest> requestFactory =
-            onStaticSetting -> new UpdateSettingsClusterStateUpdateRequest(
-                TEST_REQUEST_TIMEOUT,
-                TimeValue.ZERO,
-                Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build(),
-                UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
-                onStaticSetting,
-                indices
-            );
+        request.indices(indices.toArray(Index.EMPTY_ARRAY));
+        request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build());

         // First make sure it fails if reopenShards is not set on the request:
         AtomicBoolean expectedFailureOccurred = new AtomicBoolean(false);
-        metadataUpdateSettingsService.updateSettings(
-            requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT),
-            new ActionListener<>() {
-                @Override
-                public void onResponse(AcknowledgedResponse acknowledgedResponse) {
-                    fail("Should have failed updating a non-dynamic setting without reopenShards set to true");
-                }
+        metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() {
+            @Override
+            public void onResponse(AcknowledgedResponse acknowledgedResponse) {
+                fail("Should have failed updating a non-dynamic setting without reopenShards set to true");
+            }

-                @Override
-                public void onFailure(Exception e) {
-                    expectedFailureOccurred.set(true);
-                }
+            @Override
+            public void onFailure(Exception e) {
+                expectedFailureOccurred.set(true);
             }
-        );
+        });
         assertBusy(() -> assertThat(expectedFailureOccurred.get(), equalTo(true)));

         // Now we set reopenShards and expect it to work:
+        request.reopenShards(true);
         AtomicBoolean success = new AtomicBoolean(false);
-        metadataUpdateSettingsService.updateSettings(
-            requestFactory.apply(UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES),
-            new ActionListener<>() {
-                @Override
-                public void onResponse(AcknowledgedResponse acknowledgedResponse) {
-                    success.set(true);
-                }
+        metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() {
+            @Override
+            public void onResponse(AcknowledgedResponse acknowledgedResponse) {
+                success.set(true);
+            }

-                @Override
-                public void onFailure(Exception e) {
-                    fail(e);
-                }
+            @Override
+            public void onFailure(Exception e) {
+                fail(e);
             }
-        );
+        });
         assertBusy(() -> assertThat(success.get(), equalTo(true)));

         // Now we look into the IndexShard objects to make sure that the code was actually updated (vs just the setting):
@@ -124,23 +110,16 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens th
         MetadataUpdateSettingsService metadataUpdateSettingsService = internalCluster().getCurrentMasterNodeInstance(
             MetadataUpdateSettingsService.class
         );
-        List<Index> indicesList = new ArrayList<>();
+        UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest().ackTimeout(TimeValue.ZERO);
+        List<Index> indices = new ArrayList<>();
         for (IndicesService indicesService : internalCluster().getInstances(IndicesService.class)) {
             for (IndexService indexService : indicesService) {
-                indicesList.add(indexService.index());
+                indices.add(indexService.index());
             }
         }
-        final var indices = indicesList.toArray(Index.EMPTY_ARRAY);
-
-        final Function<Settings.Builder, UpdateSettingsClusterStateUpdateRequest> requestFactory =
-            settings -> new UpdateSettingsClusterStateUpdateRequest(
-                TEST_REQUEST_TIMEOUT,
-                TimeValue.ZERO,
-                settings.build(),
-                UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
-                UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES,
-                indices
-            );
+        request.indices(indices.toArray(Index.EMPTY_ARRAY));
+        request.settings(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").build());
+        request.reopenShards(true);

         ClusterService clusterService = internalCluster().getInstance(ClusterService.class);
         AtomicBoolean shardsUnassigned = new AtomicBoolean(false);
@@ -163,49 +142,47 @@ public void testThatNonDynamicSettingChangesDoNotUnncessesarilyCauseReopens th
         AtomicBoolean success = new AtomicBoolean(false);

         // Make the first request, just to set things up:
-        metadataUpdateSettingsService.updateSettings(
-            requestFactory.apply(Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData")),
-            new ActionListener<>() {
-                @Override
-                public void onResponse(AcknowledgedResponse acknowledgedResponse) {
-                    success.set(true);
-                }
+        metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() {
+            @Override
+            public void onResponse(AcknowledgedResponse acknowledgedResponse) {
+                success.set(true);
+            }

-                @Override
-                public void onFailure(Exception e) {
-                    fail(e);
-                }
+            @Override
+            public void onFailure(Exception e) {
+                fail(e);
             }
-        );
+        });
         assertBusy(() -> assertThat(success.get(), equalTo(true)));
         assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true)));
         assertThat(shardsUnassigned.get(), equalTo(true));

         assertBusy(() -> assertThat(hasUnassignedShards(clusterService.state(), indexName), equalTo(false)));

+        // Same request, except now we'll also set the dynamic "index.max_result_window" setting:
+        request.settings(
+            Settings.builder()
+                .put("index.codec", "FastDecompressionCompressingStoredFieldsData")
+                .put("index.max_result_window", "1500")
+                .build()
+        );
         success.set(false);
         expectedSettingsChangeInClusterState.set(false);
         shardsUnassigned.set(false);
         expectedSetting.set("index.max_result_window");
         expectedSettingValue.set("1500");
         // Making this request ought to add this new setting but not unassign the shards:
-        metadataUpdateSettingsService.updateSettings(
-            // Same request, except now we'll also set the dynamic "index.max_result_window" setting:
-            requestFactory.apply(
-                Settings.builder().put("index.codec", "FastDecompressionCompressingStoredFieldsData").put("index.max_result_window", "1500")
-            ),
-            new ActionListener<>() {
-                @Override
-                public void onResponse(AcknowledgedResponse acknowledgedResponse) {
-                    success.set(true);
-                }
+        metadataUpdateSettingsService.updateSettings(request, new ActionListener<>() {
+            @Override
+            public void onResponse(AcknowledgedResponse acknowledgedResponse) {
+                success.set(true);
+            }

-                @Override
-                public void onFailure(Exception e) {
-                    fail(e);
-                }
+            @Override
+            public void onFailure(Exception e) {
+                fail(e);
             }
-        );
+        });
         assertBusy(() -> assertThat(success.get(), equalTo(true)));
         assertBusy(() -> assertThat(expectedSettingsChangeInClusterState.get(), equalTo(true)));
diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java
index 1e7f32641b86f..1d7c264065d6f 100644
--- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java
+++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/TransportUpdateSettingsAction.java
@@ -124,24 +124,19 @@ protected void masterOperation(
             return;
         }

-        updateSettingsService.updateSettings(
-            new UpdateSettingsClusterStateUpdateRequest(
-                request.masterNodeTimeout(),
-                request.ackTimeout(),
-                requestSettings,
-                request.isPreserveExisting()
-                    ? UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE
-                    : UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
-                request.reopen()
-                    ? UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES
-                    : UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT,
-                concreteIndices
-            ),
-            listener.delegateResponse((l, e) -> {
-                logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e);
-                l.onFailure(e);
-            })
-        );
+        UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices(
+            concreteIndices
+        )
+            .settings(requestSettings)
+            .setPreserveExisting(request.isPreserveExisting())
+            .reopenShards(request.reopen())
+            .ackTimeout(request.ackTimeout())
+            .masterNodeTimeout(request.masterNodeTimeout());
+
+        updateSettingsService.updateSettings(clusterStateUpdateRequest, listener.delegateResponse((l, e) -> {
+            logger.debug(() -> "failed to update settings on indices [" + Arrays.toString(concreteIndices) + "]", e);
+            l.onFailure(e);
+        }));
     }

     /**
diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java
index fe8573da5fb68..42a904c704bf3 100644
--- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java
+++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java
@@ -9,60 +9,70 @@

 package org.elasticsearch.action.admin.indices.settings.put;

+import org.elasticsearch.cluster.ack.IndicesClusterStateUpdateRequest;
 import org.elasticsearch.common.settings.Settings;
-import org.elasticsearch.core.TimeValue;
-import org.elasticsearch.index.Index;

-import java.util.Objects;
+import java.util.Arrays;

 /**
  * Cluster state update request that allows to update settings for some indices
  */
-public record UpdateSettingsClusterStateUpdateRequest(
-    TimeValue masterNodeTimeout,
-    TimeValue ackTimeout,
-    Settings settings,
-    OnExisting onExisting,
-    OnStaticSetting onStaticSetting,
-    Index... indices
-) {
+public class UpdateSettingsClusterStateUpdateRequest extends IndicesClusterStateUpdateRequest {
+
+    private Settings settings;
+
+    private boolean preserveExisting = false;
+
+    private boolean reopenShards = false;
+
+    /**
+     * Returns <code>true</code> iff the settings update should only add but not update settings. If the setting already exists
+     * it should not be overwritten by this update. The default is <code>false</code>
+     */
+    public boolean isPreserveExisting() {
+        return preserveExisting;
+    }

     /**
-     * Specifies the behaviour of an update-settings action on existing settings.
+     * Returns <code>true</code> if non-dynamic setting updates should go through, by automatically unassigning shards in the same cluster
+     * state change as the setting update. The shards will be automatically reassigned after the cluster state update is made. The
+     * default is <code>false</code>.
     */
-    public enum OnExisting {
-        /**
-         * Update all the specified settings, overwriting any settings which already exist. This is the API default.
-         */
-        OVERWRITE,
+    public boolean reopenShards() {
+        return reopenShards;
+    }

-        /**
-         * Only add new settings, preserving the values of any settings which are already set and ignoring the new values specified in the
-         * request.
-         */
-        PRESERVE
+    public UpdateSettingsClusterStateUpdateRequest reopenShards(boolean reopenShards) {
+        this.reopenShards = reopenShards;
+        return this;
     }

     /**
-     * Specifies the behaviour of an update-settings action which is trying to adjust a non-dynamic setting.
+     * Iff set to <code>true</code> this settings update will only add settings not already set on an index. Existing settings remain
+     * unchanged.
     */
-    public enum OnStaticSetting {
-        /**
-         * Reject attempts to update non-dynamic settings on open indices. This is the API default.
-         */
-        REJECT,
+    public UpdateSettingsClusterStateUpdateRequest setPreserveExisting(boolean preserveExisting) {
+        this.preserveExisting = preserveExisting;
+        return this;
+    }

-        /**
-         * Automatically close and reopen the shards of any open indices when updating a non-dynamic setting, forcing the shard to
-         * reinitialize from scratch.
-         */
-        REOPEN_INDICES
+    /**
+     * Returns the {@link Settings} to update
+     */
+    public Settings settings() {
+        return settings;
+    }
+
+    /**
+     * Sets the {@link Settings} to update
+     */
+    public UpdateSettingsClusterStateUpdateRequest settings(Settings settings) {
+        this.settings = settings;
+        return this;
     }

-    public UpdateSettingsClusterStateUpdateRequest {
-        Objects.requireNonNull(masterNodeTimeout);
-        Objects.requireNonNull(ackTimeout);
-        Objects.requireNonNull(settings);
-        Objects.requireNonNull(indices);
+    @Override
+    public String toString() {
+        return Arrays.toString(indices()) + settings;
     }
 }
diff --git a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java
index 4fcbd4165423b..cee3b4c0bdac1 100644
--- a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java
+++ b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataUpdateSettingsService.java
@@ -176,7 +176,7 @@ ClusterState execute(ClusterState currentState) {
                 }
                 final Settings closedSettings = settingsForClosedIndices.build();
                 final Settings openSettings = settingsForOpenIndices.build();
-                final boolean preserveExisting = request.onExisting() == UpdateSettingsClusterStateUpdateRequest.OnExisting.PRESERVE;
+                final boolean preserveExisting = request.isPreserveExisting();

                 RoutingTable.Builder routingTableBuilder = null;
                 Metadata.Builder metadataBuilder = Metadata.builder(currentState.metadata());
@@ -199,7 +199,7 @@ ClusterState execute(ClusterState currentState) {
                 }

                 if (skippedSettings.isEmpty() == false && openIndices.isEmpty() == false) {
-                    if (request.onStaticSetting() == UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REOPEN_INDICES) {
+                    if (request.reopenShards()) {
                         // We have non-dynamic settings and open indices. We will unassign all of the shards in these indices so that the new
                         // changed settings are applied when the shards are re-assigned.
                         routingTableBuilder = RoutingTable.builder(
diff --git a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java
index a131f63cb75f3..94b856f7a22fb 100644
--- a/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java
+++ b/server/src/main/java/org/elasticsearch/upgrades/SystemIndexMigrator.java
@@ -19,7 +19,6 @@
 import org.elasticsearch.action.admin.indices.settings.put.UpdateSettingsClusterStateUpdateRequest;
 import org.elasticsearch.action.support.ActiveShardCount;
 import org.elasticsearch.action.support.master.AcknowledgedResponse;
-import org.elasticsearch.action.support.master.MasterNodeRequest;
 import org.elasticsearch.action.support.master.ShardsAcknowledgedResponse;
 import org.elasticsearch.client.internal.Client;
 import org.elasticsearch.client.internal.ParentTaskAssigningClient;
@@ -538,18 +537,11 @@ private CheckedBiConsumer<ActionListener<AcknowledgedResponse>, AcknowledgedResp
      */
     private void setWriteBlock(Index index, boolean readOnlyValue, ActionListener<AcknowledgedResponse> listener) {
         final Settings readOnlySettings = Settings.builder().put(IndexMetadata.INDEX_BLOCKS_WRITE_SETTING.getKey(), readOnlyValue).build();
+        UpdateSettingsClusterStateUpdateRequest updateSettingsRequest = new UpdateSettingsClusterStateUpdateRequest().indices(
+            new Index[] { index }
+        ).settings(readOnlySettings).setPreserveExisting(false).ackTimeout(TimeValue.ZERO);

-        metadataUpdateSettingsService.updateSettings(
-            new UpdateSettingsClusterStateUpdateRequest(
-                MasterNodeRequest.INFINITE_MASTER_NODE_TIMEOUT,
-                TimeValue.ZERO,
-                readOnlySettings,
-                UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
-                UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT,
-                index
-            ),
-            listener
-        );
+        metadataUpdateSettingsService.updateSettings(updateSettingsRequest, listener);
     }

     private void reindex(SystemIndexMigrationInfo migrationInfo, ActionListener<BulkByScrollResponse> listener) {
diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java
index b924fe0d983bb..49f8846c36e1f 100644
--- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java
+++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportUpdateSecuritySettingsAction.java
@@ -119,8 +119,8 @@ protected void masterOperation(
     private Optional<UpdateSettingsClusterStateUpdateRequest> createUpdateSettingsRequest(
         String indexName,
         Settings settingsToUpdate,
-        TimeValue ackTimeout,
-        TimeValue masterNodeTimeout,
+        TimeValue timeout,
+        TimeValue masterTimeout,
         ClusterState state
     ) {
         if (settingsToUpdate.isEmpty()) {
@@ -136,14 +136,10 @@ private Optional<UpdateSettingsClusterStateUpdateRequest> createUpdateSettingsRe
         }

         return Optional.of(
-            new UpdateSettingsClusterStateUpdateRequest(
-                masterNodeTimeout,
-                ackTimeout,
-                settingsToUpdate,
-                UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
-                UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT,
-                writeIndex
-            )
+            new UpdateSettingsClusterStateUpdateRequest().indices(new Index[] { writeIndex })
+                .settings(settingsToUpdate)
+                .ackTimeout(timeout)
+                .masterNodeTimeout(masterTimeout)
         );
     }

diff --git a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java
index 0407c2db63ac6..378ee642cf105 100644
--- a/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java
+++ b/x-pack/plugin/watcher/src/main/java/org/elasticsearch/xpack/watcher/transport/actions/TransportUpdateWatcherSettingsAction.java
@@ -24,6 +24,7 @@
 import org.elasticsearch.cluster.service.ClusterService;
 import org.elasticsearch.common.settings.Settings;
 import org.elasticsearch.common.util.concurrent.EsExecutors;
+import org.elasticsearch.index.Index;
 import org.elasticsearch.injection.guice.Inject;
 import org.elasticsearch.logging.LogManager;
 import org.elasticsearch.logging.Logger;
@@ -90,14 +91,9 @@ protected void masterOperation(
             return;
         }
         final Settings newSettings = Settings.builder().loadFromMap(request.settings()).build();
-        final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest(
-            request.masterNodeTimeout(),
-            request.ackTimeout(),
-            newSettings,
-            UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
-            UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT,
-            watcherIndexMd.getIndex()
-        );
+        final UpdateSettingsClusterStateUpdateRequest clusterStateUpdateRequest = new UpdateSettingsClusterStateUpdateRequest().indices(
+            new Index[] { watcherIndexMd.getIndex() }
+        ).settings(newSettings).ackTimeout(request.ackTimeout()).masterNodeTimeout(request.masterNodeTimeout());

         updateSettingsService.updateSettings(clusterStateUpdateRequest, new ActionListener<>() {
             @Override

From d582db22b717cd19553ebb98490a1d4e62907008 Mon Sep 17 00:00:00 2001
From: Simon Cooper
Date: Tue, 24 Sep 2024 09:54:39 +0100
Subject: [PATCH 24/28] Change default locale of date processors to ENGLISH (#112796)

It is English in the docs, so this fixes the code to match the docs. Note that
this only really impacts Elasticsearch when run on JDK 23 with the CLDR locale
database, as in the COMPAT database used before JDK 23, root and en are
essentially the same.

---
 .../java/org/elasticsearch/ingest/common/DateProcessor.java | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/modules/ingest-common/src/main/java/org/elasticsearch/ingest/common/DateProcessor.java b/modules/ingest-common/src/main/java/org/elasticsearch/ingest/common/DateProcessor.java
index bfdf87f417b60..22db5a330fb45 100644
--- a/modules/ingest-common/src/main/java/org/elasticsearch/ingest/common/DateProcessor.java
+++ b/modules/ingest-common/src/main/java/org/elasticsearch/ingest/common/DateProcessor.java
@@ -98,7 +98,7 @@ private static ZoneId newDateTimeZone(String timezone) {
     }

     private static Locale newLocale(String locale) {
-        return locale == null ? Locale.ROOT : LocaleUtils.parse(locale);
+        return locale == null ? Locale.ENGLISH : LocaleUtils.parse(locale);
     }

     @Override

From 449aff35bc1d45eb8d37a5bfbf4fd7ad109bf061 Mon Sep 17 00:00:00 2001
From: Armin Braun
Date: Tue, 24 Sep 2024 11:08:19 +0200
Subject: [PATCH 25/28] Fix unnecessary locking on refreshIfNeeded mutex (#113334)

This spot is very hot (or rather "cold") when running tests. No need for a
costly lock on this thing when trace logging is not active.
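In outline, the fix guards the trace statement so its argument, which takes the
costly lock, is only computed when TRACE is actually enabled. A minimal sketch
of the idiom, where expensiveEstimate() is a hypothetical stand-in for the real
computation, not an actual Elasticsearch method:

    // Guarded trace logging: the argument expression is only evaluated
    // when TRACE is active, so the lock is never taken otherwise.
    if (logger.isTraceEnabled()) {
        logger.trace("snapshot for recovery; current size is [{}]", expensiveEstimate());
    }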
---
 .../elasticsearch/indices/recovery/RecoverySourceHandler.java | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/server/src/main/java/org/elasticsearch/indices/recovery/RecoverySourceHandler.java b/server/src/main/java/org/elasticsearch/indices/recovery/RecoverySourceHandler.java
index 3f57c2bce5228..3b0e4e048613c 100644
--- a/server/src/main/java/org/elasticsearch/indices/recovery/RecoverySourceHandler.java
+++ b/server/src/main/java/org/elasticsearch/indices/recovery/RecoverySourceHandler.java
@@ -315,7 +315,9 @@ && isTargetSameHistory()
                 cancellableThreads,
                 ActionListener.wrap(ignored -> {
                     final long endingSeqNo = shard.seqNoStats().getMaxSeqNo();
-                    logger.trace("snapshot for recovery; current size is [{}]", estimateNumberOfHistoryOperations(startingSeqNo));
+                    if (logger.isTraceEnabled()) {
+                        logger.trace("snapshot for recovery; current size is [{}]", estimateNumberOfHistoryOperations(startingSeqNo));
+                    }
                     final Translog.Snapshot phase2Snapshot = shard.newChangesSnapshot(
                         "peer-recovery",
                         startingSeqNo,

From 11d968d173bb0f4e29bafd6dee8d99a7a254c6d5 Mon Sep 17 00:00:00 2001
From: Pooya Salehi
Date: Tue, 24 Sep 2024 11:11:48 +0200
Subject: [PATCH 26/28] Remove test logging from PrevalidateShardPathIT#testCheckShards (#113434)

Relates https://github.com/elastic/elasticsearch/pull/113107
Closes https://github.com/elastic/elasticsearch/issues/111134

---
 .../elasticsearch/cluster/PrevalidateShardPathIT.java | 10 ----------
 1 file changed, 10 deletions(-)

diff --git a/server/src/internalClusterTest/java/org/elasticsearch/cluster/PrevalidateShardPathIT.java b/server/src/internalClusterTest/java/org/elasticsearch/cluster/PrevalidateShardPathIT.java
index 062f4adb27120..87943dedc708b 100644
--- a/server/src/internalClusterTest/java/org/elasticsearch/cluster/PrevalidateShardPathIT.java
+++ b/server/src/internalClusterTest/java/org/elasticsearch/cluster/PrevalidateShardPathIT.java
@@ -21,7 +21,6 @@
 import org.elasticsearch.common.settings.Settings;
 import org.elasticsearch.index.shard.ShardId;
 import org.elasticsearch.test.ESIntegTestCase;
-import org.elasticsearch.test.junit.annotations.TestIssueLogging;

 import java.util.HashSet;
 import java.util.Set;
@@ -41,15 +40,6 @@
 @ESIntegTestCase.ClusterScope(scope = ESIntegTestCase.Scope.TEST, numDataNodes = 0)
 public class PrevalidateShardPathIT extends ESIntegTestCase {

-    @TestIssueLogging(
-        value = "org.elasticsearch.cluster.service.MasterService:DEBUG,"
-            + "org.elasticsearch.indices.store.IndicesStore:TRACE,"
-            + "org.elasticsearch.indices.cluster.IndicesClusterStateService:DEBUG,"
-            + "org.elasticsearch.indices.IndicesService:TRACE,"
-            + "org.elasticsearch.index.IndexService:TRACE,"
-            + "org.elasticsearch.env.NodeEnvironment:TRACE",
-        issueUrl = "https://github.com/elastic/elasticsearch/issues/111134"
-    )
     public void testCheckShards() throws Exception {
         internalCluster().startMasterOnlyNode();
         String node1 = internalCluster().startDataOnlyNode();

From 4309eaa6026ad18fc2135b0797736857045b78dd Mon Sep 17 00:00:00 2001
From: David Turner
Date: Tue, 24 Sep 2024 12:28:50 +0100
Subject: [PATCH 27/28] Prepare for making `UpdateSettingsClusterStateUpdateRequest` a record (#113441)

A preliminary PR to maintain source compatibility while the serverless change
is still in flight. See #113432 or #113353 for the actual change.
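As a sketch of what this enables (assuming settings, indices and the two
timeouts are in scope; this snippet is illustrative rather than code from the
PR itself), callers can already construct the request in the record style that
#113432 will eventually require:

    UpdateSettingsClusterStateUpdateRequest request = new UpdateSettingsClusterStateUpdateRequest(
        masterNodeTimeout,
        ackTimeout,
        settings,
        UpdateSettingsClusterStateUpdateRequest.OnExisting.OVERWRITE,
        UpdateSettingsClusterStateUpdateRequest.OnStaticSetting.REJECT,
        indices
    );

The compatibility constructor added below simply forwards to the existing
fluent setters, so both construction styles behave identically until the
record migration lands.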
---
 ...dateSettingsClusterStateUpdateRequest.java | 53 +++++++++++++++++++
 1 file changed, 53 insertions(+)

diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java
index 42a904c704bf3..6850c40307910 100644
--- a/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java
+++ b/server/src/main/java/org/elasticsearch/action/admin/indices/settings/put/UpdateSettingsClusterStateUpdateRequest.java
@@ -11,6 +11,8 @@

 import org.elasticsearch.cluster.ack.IndicesClusterStateUpdateRequest;
 import org.elasticsearch.common.settings.Settings;
+import org.elasticsearch.core.TimeValue;
+import org.elasticsearch.index.Index;

 import java.util.Arrays;

@@ -19,12 +21,63 @@
  */
 public class UpdateSettingsClusterStateUpdateRequest extends IndicesClusterStateUpdateRequest {

+    /**
+     * Specifies the behaviour of an update-settings action on existing settings.
+     */
+    public enum OnExisting {
+        /**
+         * Update all the specified settings, overwriting any settings which already exist. This is the API default.
+         */
+        OVERWRITE,
+
+        /**
+         * Only add new settings, preserving the values of any settings which are already set and ignoring the new values specified in the
+         * request.
+         */
+        PRESERVE
+    }
+
+    /**
+     * Specifies the behaviour of an update-settings action which is trying to adjust a non-dynamic setting.
+     */
+    public enum OnStaticSetting {
+        /**
+         * Reject attempts to update non-dynamic settings on open indices. This is the API default.
+         */
+        REJECT,
+
+        /**
+         * Automatically close and reopen the shards of any open indices when updating a non-dynamic setting, forcing the shard to
+         * reinitialize from scratch.
+         */
+        REOPEN_INDICES
+    }
+
     private Settings settings;

     private boolean preserveExisting = false;

     private boolean reopenShards = false;

+    public UpdateSettingsClusterStateUpdateRequest() {}
+
+    @SuppressWarnings("this-escape")
+    public UpdateSettingsClusterStateUpdateRequest(
+        TimeValue masterNodeTimeout,
+        TimeValue ackTimeout,
+        Settings settings,
+        OnExisting onExisting,
+        OnStaticSetting onStaticSetting,
+        Index... indices
+    ) {
+        masterNodeTimeout(masterNodeTimeout);
+        ackTimeout(ackTimeout);
+        settings(settings);
+        setPreserveExisting(onExisting == OnExisting.PRESERVE);
+        reopenShards(onStaticSetting == OnStaticSetting.REOPEN_INDICES);
+        indices(indices);
+    }
+
     /**
      * Returns <code>true</code> iff the settings update should only add but not update settings. If the setting already exists
      * it should not be overwritten by this update. The default is <code>false</code>

From a3806cd8e1c4548633a2c4fad8d5beb272b7b856 Mon Sep 17 00:00:00 2001
From: Ignacio Vera
Date: Tue, 24 Sep 2024 14:46:25 +0200
Subject: [PATCH 28/28] Account for DelayedBucket before reduction (#113013)

This commit moves the accounting for a DelayedBucket to before reduction, so in
some adversarial cases we should exit much sooner.
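Concretely, the circuit-breaker accounting moves ahead of the reduction work.
A simplified view of the AbstractInternalTerms hunk below (not a complete
method body):

    if (result.size() < getRequiredSize()) {
        // charge the breaker for this bucket first; an over-budget request
        // now fails before paying for the reduction itself
        reduceContext.consumeBucketsAndMaybeBreak(1);
        result.add(bucket.reduced(AbstractInternalTerms.this::reduceBucket, reduceContext));
    } else {
        otherDocCount[0] += bucket.getDocCount();
    }

DelayedBucket#reduced no longer charges for the bucket itself, only for its
sub-buckets, and TopBucketBuilder charges one bucket per entry that actually
makes it into the final result.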
---
 docs/changelog/113013.yaml                    |  5 ++
 .../search/aggregations/DelayedBucket.java    |  9 ++--
 .../search/aggregations/TopBucketBuilder.java |  6 +++
 .../bucket/terms/AbstractInternalTerms.java   | 10 ++--
 .../aggregations/DelayedBucketTests.java      | 49 ++++++++++++++++++-
 5 files changed, 70 insertions(+), 9 deletions(-)
 create mode 100644 docs/changelog/113013.yaml

diff --git a/docs/changelog/113013.yaml b/docs/changelog/113013.yaml
new file mode 100644
index 0000000000000..1cec31074e806
--- /dev/null
+++ b/docs/changelog/113013.yaml
@@ -0,0 +1,5 @@
+pr: 113013
+summary: Account for `DelayedBucket` before reduction
+area: Aggregations
+type: enhancement
+issues: []
diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/DelayedBucket.java b/server/src/main/java/org/elasticsearch/search/aggregations/DelayedBucket.java
index fa8fe9e4628d7..017d87df52092 100644
--- a/server/src/main/java/org/elasticsearch/search/aggregations/DelayedBucket.java
+++ b/server/src/main/java/org/elasticsearch/search/aggregations/DelayedBucket.java
@@ -15,6 +15,10 @@
 /**
  * A wrapper around reducing buckets with the same key that can delay that reduction
  * as long as possible. It's stateful and not even close to thread safe.
+ *
+ * It is the responsibility of the caller to account for buckets created using DelayedBucket.
+ * It should call {@link #nonCompetitive} to release any possible sub-bucket creation if
+ * a bucket is rejected from the final response.
  */
 public final class DelayedBucket<B extends InternalMultiBucketAggregation.InternalBucket> {
     /**
@@ -45,7 +49,6 @@ public DelayedBucket(List<B> toReduce)
      */
     public B reduced(BiFunction<List<B>, AggregationReduceContext, B> reduce, AggregationReduceContext reduceContext) {
         if (reduced == null) {
-            reduceContext.consumeBucketsAndMaybeBreak(1);
             reduced = reduce.apply(toReduce, reduceContext);
             toReduce = null;
         }
@@ -95,8 +98,8 @@ public String toString() {
      */
     void nonCompetitive(AggregationReduceContext reduceContext) {
         if (reduced != null) {
-            // -1 for itself, -countInnerBucket for all the sub-buckets.
-            reduceContext.consumeBucketsAndMaybeBreak(-1 - InternalMultiBucketAggregation.countInnerBucket(reduced));
+            // -countInnerBucket for all the sub-buckets.
+            reduceContext.consumeBucketsAndMaybeBreak(-InternalMultiBucketAggregation.countInnerBucket(reduced));
         }
     }
 }
diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/TopBucketBuilder.java b/server/src/main/java/org/elasticsearch/search/aggregations/TopBucketBuilder.java
index a3d04ecc2074d..0389b7e105a58 100644
--- a/server/src/main/java/org/elasticsearch/search/aggregations/TopBucketBuilder.java
+++ b/server/src/main/java/org/elasticsearch/search/aggregations/TopBucketBuilder.java
@@ -132,7 +132,11 @@ public void add(DelayedBucket<B> bucket) {
             DelayedBucket<B> removed = queue.insertWithOverflow(bucket);
             if (removed != null) {
                 nonCompetitive.accept(removed);
+                // release any created sub-buckets
                 removed.nonCompetitive(reduceContext);
+            } else {
+                // add one bucket to the final result
+                reduceContext.consumeBucketsAndMaybeBreak(1);
             }
         }

@@ -183,6 +187,8 @@ public void add(DelayedBucket<B> bucket) {
                 next.add(bucket);
                 return;
             }
+            // add one bucket to the final result
+            reduceContext.consumeBucketsAndMaybeBreak(1);
             buffer.add(bucket);
             if (buffer.size() < size) {
                 return;
diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/terms/AbstractInternalTerms.java b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/terms/AbstractInternalTerms.java
index 71a06fb020344..5c422a9dd4e32 100644
--- a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/terms/AbstractInternalTerms.java
+++ b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/terms/AbstractInternalTerms.java
@@ -290,6 +290,7 @@ public InternalAggregation get() {
                 result = new ArrayList<>();
                 thisReduceOrder = reduceBuckets(bucketsList, getThisReduceOrder(), bucket -> {
                     if (result.size() < getRequiredSize()) {
+                        reduceContext.consumeBucketsAndMaybeBreak(1);
                         result.add(bucket.reduced(AbstractInternalTerms.this::reduceBucket, reduceContext));
                     } else {
                         otherDocCount[0] += bucket.getDocCount();
@@ -311,11 +312,10 @@ public InternalAggregation get() {
                 result = top.build();
             } else {
                 result = new ArrayList<>();
-                thisReduceOrder = reduceBuckets(
-                    bucketsList,
-                    getThisReduceOrder(),
-                    bucket -> result.add(bucket.reduced(AbstractInternalTerms.this::reduceBucket, reduceContext))
-                );
+                thisReduceOrder = reduceBuckets(bucketsList, getThisReduceOrder(), bucket -> {
+                    reduceContext.consumeBucketsAndMaybeBreak(1);
+                    result.add(bucket.reduced(AbstractInternalTerms.this::reduceBucket, reduceContext));
+                });
             }
             for (B r : result) {
                 if (sumDocCountError == -1) {
diff --git a/server/src/test/java/org/elasticsearch/search/aggregations/DelayedBucketTests.java b/server/src/test/java/org/elasticsearch/search/aggregations/DelayedBucketTests.java
index b5a35098e0073..70d5692b6dcf7 100644
--- a/server/src/test/java/org/elasticsearch/search/aggregations/DelayedBucketTests.java
+++ b/server/src/test/java/org/elasticsearch/search/aggregations/DelayedBucketTests.java
@@ -25,6 +25,8 @@
 import static org.hamcrest.Matchers.greaterThan;
 import static org.hamcrest.Matchers.lessThan;
 import static org.hamcrest.Matchers.sameInstance;
+import static org.mockito.Mockito.mock;
+import static org.mockito.Mockito.when;

 public class DelayedBucketTests extends ESTestCase {
     public void testToString() {
@@ -40,6 +42,23 @@ public void testReduced() {
         assertThat(b.reduced(reduce, context), sameInstance(b.reduced(reduce, context)));
         assertThat(b.reduced(reduce, context).getKeyAsString(), equalTo("test"));
         assertThat(b.reduced(reduce, context).getDocCount(), equalTo(3L));
+        // it only accounts for sub-buckets
+        assertEquals(0, buckets.get());
+    }
+
+    public void testReducedSubAggregation() {
+        AtomicInteger buckets = new AtomicInteger();
+        AggregationReduceContext context = new AggregationReduceContext.ForFinal(null, null, () -> false, null, buckets::addAndGet);
+        BiFunction<List<InternalBucket>, AggregationReduceContext, InternalBucket> reduce = mockReduce(context);
+        DelayedBucket<InternalBucket> b = new DelayedBucket<>(
+            List.of(bucket("test", 1, mockMultiBucketAgg()), bucket("test", 2, mockMultiBucketAgg()))
+        );
+
+        assertThat(b.getDocCount(), equalTo(3L));
+        assertThat(b.reduced(reduce, context), sameInstance(b.reduced(reduce, context)));
+        assertThat(b.reduced(reduce, context).getKeyAsString(), equalTo("test"));
+        assertThat(b.reduced(reduce, context).getDocCount(), equalTo(3L));
+        // it only accounts for sub-buckets
         assertEquals(1, buckets.get());
     }

@@ -76,6 +95,19 @@ public void testNonCompetitiveReduced() {
         BiFunction<List<InternalBucket>, AggregationReduceContext, InternalBucket> reduce = mockReduce(context);
         DelayedBucket<InternalBucket> b = new DelayedBucket<>(List.of(bucket("test", 1)));
         b.reduced(reduce, context);
+        // only account for sub-aggregations
+        assertEquals(0, buckets.get());
+        b.nonCompetitive(context);
+        assertEquals(0, buckets.get());
+    }
+
+    public void testNonCompetitiveReducedSubAggregation() {
+        AtomicInteger buckets = new AtomicInteger();
+        AggregationReduceContext context = new AggregationReduceContext.ForFinal(null, null, () -> false, null, buckets::addAndGet);
+        BiFunction<List<InternalBucket>, AggregationReduceContext, InternalBucket> reduce = mockReduce(context);
+        DelayedBucket<InternalBucket> b = new DelayedBucket<>(List.of(bucket("test", 1, mockMultiBucketAgg())));
+        b.reduced(reduce, context);
+        // only account for sub-aggregations
         assertEquals(1, buckets.get());
         b.nonCompetitive(context);
         assertEquals(0, buckets.get());
     }

@@ -85,10 +117,25 @@ private static InternalBucket bucket(String key, long docCount) {
         return new StringTerms.Bucket(new BytesRef(key), docCount, InternalAggregations.EMPTY, false, 0, DocValueFormat.RAW);
     }

+    private static InternalBucket bucket(String key, long docCount, InternalAggregations subAggregations) {
+        return new StringTerms.Bucket(new BytesRef(key), docCount, subAggregations, false, 0, DocValueFormat.RAW);
+    }
+
     static BiFunction<List<InternalBucket>, AggregationReduceContext, InternalBucket> mockReduce(AggregationReduceContext context) {
         return (l, c) -> {
             assertThat(c, sameInstance(context));
-            return bucket(l.get(0).getKeyAsString(), l.stream().mapToLong(Bucket::getDocCount).sum());
+            context.consumeBucketsAndMaybeBreak(l.get(0).getAggregations().asList().size());
+            return bucket(l.get(0).getKeyAsString(), l.stream().mapToLong(Bucket::getDocCount).sum(), l.get(0).getAggregations());
         };
     }
+
+    @SuppressWarnings("unchecked")
+    private InternalAggregations mockMultiBucketAgg() {
+        List<InternalBucket> buckets = List.of(bucket("sub", 1));
+        InternalMultiBucketAggregation<?, InternalBucket> mock = (InternalMultiBucketAggregation<?, InternalBucket>) mock(
+            InternalMultiBucketAggregation.class
+        );
+        when(mock.getBuckets()).thenReturn(buckets);
+        return InternalAggregations.from(List.of(mock));
+    }
 }