From f0982c7c736928831bed7fca6fbfa8dd0b2f6c11 Mon Sep 17 00:00:00 2001 From: Panagiotis Bailis Date: Wed, 28 Aug 2024 15:03:55 +0300 Subject: [PATCH 001/144] Removing trace logging for SearchProgressActionListenerIT (#112275) --- .../action/search/SearchProgressActionListenerIT.java | 5 ----- 1 file changed, 5 deletions(-) diff --git a/server/src/internalClusterTest/java/org/elasticsearch/action/search/SearchProgressActionListenerIT.java b/server/src/internalClusterTest/java/org/elasticsearch/action/search/SearchProgressActionListenerIT.java index 428e116ecd1ca..88d934973fc49 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/action/search/SearchProgressActionListenerIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/action/search/SearchProgressActionListenerIT.java @@ -25,7 +25,6 @@ import org.elasticsearch.search.sort.SortOrder; import org.elasticsearch.tasks.TaskId; import org.elasticsearch.test.ESSingleNodeTestCase; -import org.elasticsearch.test.junit.annotations.TestIssueLogging; import java.util.ArrayList; import java.util.Arrays; @@ -41,10 +40,6 @@ import static org.hamcrest.Matchers.equalTo; import static org.hamcrest.Matchers.lessThan; -@TestIssueLogging( - issueUrl = "https://github.com/elastic/elasticsearch/issues/109830", - value = "org.elasticsearch.action.search:TRACE," + "org.elasticsearch.search.SearchService:TRACE" -) public class SearchProgressActionListenerIT extends ESSingleNodeTestCase { private List shards; From 2ad66007861714234a9262edbd9376e559eae785 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Wed, 28 Aug 2024 22:24:40 +1000 Subject: [PATCH 002/144] Mute org.elasticsearch.search.query.ScriptScoreQueryTests testScriptTermStatsAvailable #112278 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 5199221c25aaf..26bded1d09dc8 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -163,6 +163,9 @@ tests: - class: org.elasticsearch.backwards.MixedClusterClientYamlTestSuiteIT method: test {p0=indices.create/20_synthetic_source/stored field under object with store_array_source} issue: https://github.com/elastic/elasticsearch/issues/112264 +- class: org.elasticsearch.search.query.ScriptScoreQueryTests + method: testScriptTermStatsAvailable + issue: https://github.com/elastic/elasticsearch/issues/112278 # Examples: # From defda1900ebd987bc30218d1e33509dc21fb2551 Mon Sep 17 00:00:00 2001 From: Simon Cooper Date: Wed, 28 Aug 2024 13:38:23 +0100 Subject: [PATCH 003/144] Fix toReleaseVersion() when called on the current version id (#112242) --- docs/changelog/112242.yaml | 5 +++++ .../src/main/java/org/elasticsearch/ReleaseVersions.java | 9 ++++++--- .../main/java/org/elasticsearch/TransportVersions.java | 2 +- .../main/java/org/elasticsearch/index/IndexVersions.java | 2 +- .../java/org/elasticsearch/ReleaseVersionsTests.java | 7 ++++--- .../java/org/elasticsearch/TransportVersionTests.java | 4 ++++ 6 files changed, 21 insertions(+), 8 deletions(-) create mode 100644 docs/changelog/112242.yaml diff --git a/docs/changelog/112242.yaml b/docs/changelog/112242.yaml new file mode 100644 index 0000000000000..7292a00166de2 --- /dev/null +++ b/docs/changelog/112242.yaml @@ -0,0 +1,5 @@ +pr: 112242 +summary: Fix toReleaseVersion() when called on the current version id +area: Infra/Core +type: bug +issues: [111900] diff --git a/server/src/main/java/org/elasticsearch/ReleaseVersions.java 
b/server/src/main/java/org/elasticsearch/ReleaseVersions.java index 7b5c8d1d42382..cacdca1c5b528 100644 --- a/server/src/main/java/org/elasticsearch/ReleaseVersions.java +++ b/server/src/main/java/org/elasticsearch/ReleaseVersions.java @@ -41,7 +41,7 @@ public class ReleaseVersions { private static final Pattern VERSION_LINE = Pattern.compile("(\\d+\\.\\d+\\.\\d+),(\\d+)"); - public static IntFunction generateVersionsLookup(Class versionContainer) { + public static IntFunction generateVersionsLookup(Class versionContainer, int current) { if (USES_VERSIONS == false) return Integer::toString; try { @@ -52,6 +52,9 @@ public static IntFunction generateVersionsLookup(Class versionContain } NavigableMap> versions = new TreeMap<>(); + // add the current version id, which won't be in the csv + versions.put(current, List.of(Version.CURRENT)); + try (BufferedReader reader = new BufferedReader(new InputStreamReader(versionsFile, StandardCharsets.UTF_8))) { String line; while ((line = reader.readLine()) != null) { @@ -121,8 +124,8 @@ private static IntFunction lookupFunction(NavigableMap getAllVersions() { return VERSION_IDS.values(); } - static final IntFunction VERSION_LOOKUP = ReleaseVersions.generateVersionsLookup(TransportVersions.class); + static final IntFunction VERSION_LOOKUP = ReleaseVersions.generateVersionsLookup(TransportVersions.class, LATEST_DEFINED.id()); // no instance private TransportVersions() {} diff --git a/server/src/main/java/org/elasticsearch/index/IndexVersions.java b/server/src/main/java/org/elasticsearch/index/IndexVersions.java index fa40c0316fdcc..608d88fdef664 100644 --- a/server/src/main/java/org/elasticsearch/index/IndexVersions.java +++ b/server/src/main/java/org/elasticsearch/index/IndexVersions.java @@ -221,7 +221,7 @@ static Collection getAllVersions() { return VERSION_IDS.values(); } - static final IntFunction VERSION_LOOKUP = ReleaseVersions.generateVersionsLookup(IndexVersions.class); + static final IntFunction VERSION_LOOKUP = ReleaseVersions.generateVersionsLookup(IndexVersions.class, LATEST_DEFINED.id()); // no instance private IndexVersions() {} diff --git a/server/src/test/java/org/elasticsearch/ReleaseVersionsTests.java b/server/src/test/java/org/elasticsearch/ReleaseVersionsTests.java index b80e953bd8aea..3b5f5eea57f66 100644 --- a/server/src/test/java/org/elasticsearch/ReleaseVersionsTests.java +++ b/server/src/test/java/org/elasticsearch/ReleaseVersionsTests.java @@ -17,19 +17,20 @@ public class ReleaseVersionsTests extends ESTestCase { public void testReleaseVersions() { - IntFunction versions = ReleaseVersions.generateVersionsLookup(ReleaseVersionsTests.class); + IntFunction versions = ReleaseVersions.generateVersionsLookup(ReleaseVersionsTests.class, 23); assertThat(versions.apply(10), equalTo("8.0.0")); assertThat(versions.apply(14), equalTo("8.1.0-8.1.1")); assertThat(versions.apply(21), equalTo("8.2.0")); assertThat(versions.apply(22), equalTo("8.2.1")); + assertThat(versions.apply(23), equalTo(Version.CURRENT.toString())); } public void testReturnsRange() { - IntFunction versions = ReleaseVersions.generateVersionsLookup(ReleaseVersionsTests.class); + IntFunction versions = ReleaseVersions.generateVersionsLookup(ReleaseVersionsTests.class, 23); assertThat(versions.apply(17), equalTo("8.1.2-8.2.0")); assertThat(versions.apply(9), equalTo("0.0.0")); - assertThat(versions.apply(24), equalTo("8.2.2-snapshot[24]")); + assertThat(versions.apply(24), equalTo(new Version(Version.CURRENT.id + 100) + "-[24]")); } } diff --git 
a/server/src/test/java/org/elasticsearch/TransportVersionTests.java b/server/src/test/java/org/elasticsearch/TransportVersionTests.java index 2de973622248b..a3728f20a23d4 100644 --- a/server/src/test/java/org/elasticsearch/TransportVersionTests.java +++ b/server/src/test/java/org/elasticsearch/TransportVersionTests.java @@ -186,6 +186,10 @@ public void testCURRENTIsLatest() { assertThat(Collections.max(TransportVersions.getAllVersions()), is(TransportVersion.current())); } + public void testToReleaseVersion() { + assertThat(TransportVersion.current().toReleaseVersion(), equalTo(Version.CURRENT.toString())); + } + public void testToString() { assertEquals("5000099", TransportVersion.fromId(5_00_00_99).toString()); assertEquals("2030099", TransportVersion.fromId(2_03_00_99).toString()); From 7c5c471904c042b5a548ac1aa454ab9f2bce8b00 Mon Sep 17 00:00:00 2001 From: David Turner Date: Wed, 28 Aug 2024 14:31:25 +0100 Subject: [PATCH 004/144] Upgrade `repository-azure` dependencies (#112277) `azure-core-1.51.0` includes fixes for a handful of bugs we reported. This commit upgrades the `azure-storage-blob` and `azure-identity` dependencies to pick up this new fixed version of `azure-core`. --- docs/changelog/112277.yaml | 5 +++ gradle/verification-metadata.xml | 65 ++++++++++++++------------- modules/repository-azure/build.gradle | 22 ++++----- 3 files changed, 51 insertions(+), 41 deletions(-) create mode 100644 docs/changelog/112277.yaml diff --git a/docs/changelog/112277.yaml b/docs/changelog/112277.yaml new file mode 100644 index 0000000000000..eac474555999a --- /dev/null +++ b/docs/changelog/112277.yaml @@ -0,0 +1,5 @@ +pr: 112277 +summary: Upgrade `repository-azure` dependencies +area: Snapshot/Restore +type: upgrade +issues: [] diff --git a/gradle/verification-metadata.xml b/gradle/verification-metadata.xml index 261e210cdbe11..fd514103449c1 100644 --- a/gradle/verification-metadata.xml +++ b/gradle/verification-metadata.xml @@ -119,44 +119,44 @@ - - - + + + - - - + + + - - - + + + - - - + + + - - - + + + - - - + + + - - - + + + - - - + + + @@ -411,9 +411,9 @@ - - - + + + @@ -901,9 +901,9 @@ - - - + + + @@ -3394,6 +3394,11 @@ + + + + + diff --git a/modules/repository-azure/build.gradle b/modules/repository-azure/build.gradle index 9c63304e8267b..6334e5ae6a195 100644 --- a/modules/repository-azure/build.gradle +++ b/modules/repository-azure/build.gradle @@ -24,16 +24,16 @@ versions << [ dependencies { // Microsoft - api "com.azure:azure-core-http-netty:1.15.1" - api "com.azure:azure-core:1.50.0" - api "com.azure:azure-identity:1.13.1" - api "com.azure:azure-json:1.1.0" - api "com.azure:azure-storage-blob:12.26.1" - api "com.azure:azure-storage-common:12.26.0" - api "com.azure:azure-storage-internal-avro:12.11.1" - api "com.azure:azure-xml:1.0.0" + api "com.azure:azure-core-http-netty:1.15.3" + api "com.azure:azure-core:1.51.0" + api "com.azure:azure-identity:1.13.2" + api "com.azure:azure-json:1.2.0" + api "com.azure:azure-storage-blob:12.27.1" + api "com.azure:azure-storage-common:12.26.1" + api "com.azure:azure-storage-internal-avro:12.12.1" + api "com.azure:azure-xml:1.1.0" api "com.microsoft.azure:msal4j-persistence-extension:1.3.0" - api "com.microsoft.azure:msal4j:1.16.1" + api "com.microsoft.azure:msal4j:1.16.2" // Jackson api "com.fasterxml.jackson.core:jackson-core:${versions.jackson}" @@ -57,7 +57,7 @@ dependencies { api "org.reactivestreams:reactive-streams:1.0.4" // Others - api "com.fasterxml.woodstox:woodstox-core:6.4.0" + api "com.fasterxml.woodstox:woodstox-core:6.7.0" api 
"com.github.stephenc.jcip:jcip-annotations:1.0-1" api "com.nimbusds:content-type:2.3" api "com.nimbusds:lang-tag:1.7" @@ -69,7 +69,7 @@ dependencies { api "net.java.dev.jna:jna:${versions.jna}" // Maven says 5.14.0 but this aligns with the Elasticsearch-wide version api "net.minidev:accessors-smart:2.5.0" api "net.minidev:json-smart:2.5.0" - api "org.codehaus.woodstox:stax2-api:4.2.1" + api "org.codehaus.woodstox:stax2-api:4.2.2" api "org.ow2.asm:asm:9.3" runtimeOnly "com.google.crypto.tink:tink:1.14.0" From 046d6ee7544bac7a5ced7d38431b4c6374efa279 Mon Sep 17 00:00:00 2001 From: Nhat Nguyen Date: Wed, 28 Aug 2024 07:59:13 -0700 Subject: [PATCH 005/144] Avoid wrapping rejection exception in exchange (#112178) We should avoid wrapping EsRejectedExecutionException in an ElasticsearchException as it would change the status code from 429 to 500. Ideally, we should avoid wrapping exceptions altogether, but that would require bigger changes. Closes #112106 --- docs/changelog/112178.yaml | 6 ++ .../compute/operator/AsyncOperator.java | 2 +- .../exchange/ExchangeSourceHandler.java | 2 +- .../xpack/esql/action/EnrichIT.java | 25 ++++++++ .../xpack/esql/action/ManyShardsIT.java | 60 +++++++++++++++++++ 5 files changed, 93 insertions(+), 2 deletions(-) create mode 100644 docs/changelog/112178.yaml diff --git a/docs/changelog/112178.yaml b/docs/changelog/112178.yaml new file mode 100644 index 0000000000000..f1011291542b8 --- /dev/null +++ b/docs/changelog/112178.yaml @@ -0,0 +1,6 @@ +pr: 112178 +summary: Avoid wrapping rejection exception in exchange +area: ES|QL +type: bug +issues: + - 112106 diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/AsyncOperator.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/AsyncOperator.java index 92213eca7b477..2c36b42dee277 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/AsyncOperator.java +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/AsyncOperator.java @@ -146,7 +146,7 @@ private void checkFailure() { Exception e = failureCollector.getFailure(); if (e != null) { discardPages(); - throw ExceptionsHelper.convertToElastic(e); + throw ExceptionsHelper.convertToRuntime(e); } } diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/exchange/ExchangeSourceHandler.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/exchange/ExchangeSourceHandler.java index 406dc4494208c..e3fc0e26e34e0 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/exchange/ExchangeSourceHandler.java +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/operator/exchange/ExchangeSourceHandler.java @@ -54,7 +54,7 @@ private class ExchangeSourceImpl implements ExchangeSource { private void checkFailure() { Exception e = failure.getFailure(); if (e != null) { - throw ExceptionsHelper.convertToElastic(e); + throw ExceptionsHelper.convertToRuntime(e); } } diff --git a/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/EnrichIT.java b/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/EnrichIT.java index e7bb054221c89..dab99a0f719dd 100644 --- a/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/EnrichIT.java +++ b/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/EnrichIT.java @@ -7,6 +7,7 @@ package 
org.elasticsearch.xpack.esql.action; +import org.elasticsearch.ExceptionsHelper; import org.elasticsearch.action.ActionType; import org.elasticsearch.action.support.ActionFilters; import org.elasticsearch.action.support.TransportAction; @@ -16,6 +17,7 @@ import org.elasticsearch.common.settings.Setting; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.unit.ByteSizeValue; +import org.elasticsearch.common.util.concurrent.EsRejectedExecutionException; import org.elasticsearch.compute.data.BlockFactory; import org.elasticsearch.compute.operator.DriverProfile; import org.elasticsearch.compute.operator.DriverStatus; @@ -30,6 +32,9 @@ import org.elasticsearch.protocol.xpack.XPackInfoRequest; import org.elasticsearch.protocol.xpack.XPackInfoResponse; import org.elasticsearch.reindex.ReindexPlugin; +import org.elasticsearch.rest.RestStatus; +import org.elasticsearch.test.transport.MockTransportService; +import org.elasticsearch.transport.RemoteTransportException; import org.elasticsearch.transport.TransportService; import org.elasticsearch.xpack.core.LocalStateCompositeXPackPlugin; import org.elasticsearch.xpack.core.XPackSettings; @@ -43,6 +48,7 @@ import org.elasticsearch.xpack.enrich.EnrichPlugin; import org.elasticsearch.xpack.esql.EsqlTestUtils; import org.elasticsearch.xpack.esql.core.type.DataType; +import org.elasticsearch.xpack.esql.enrich.EnrichLookupService; import org.elasticsearch.xpack.esql.plan.logical.Enrich; import org.elasticsearch.xpack.esql.plugin.EsqlPlugin; import org.junit.After; @@ -82,6 +88,7 @@ protected Collection> nodePlugins() { plugins.add(IngestCommonPlugin.class); plugins.add(ReindexPlugin.class); plugins.add(InternalTransportSettingPlugin.class); + plugins.add(MockTransportService.TestPlugin.class); return plugins; } @@ -420,6 +427,24 @@ public void testManyDocuments() { } } + public void testRejection() { + for (var ts : internalCluster().getInstances(TransportService.class)) { + ((MockTransportService) ts).addRequestHandlingBehavior(EnrichLookupService.LOOKUP_ACTION_NAME, (h, r, channel, t) -> { + EsRejectedExecutionException ex = new EsRejectedExecutionException("test", false); + channel.sendResponse(new RemoteTransportException("test", ex)); + }); + } + try { + String query = "FROM listen* | " + enrichSongCommand(); + Exception error = expectThrows(Exception.class, () -> run(query).close()); + assertThat(ExceptionsHelper.status(error), equalTo(RestStatus.TOO_MANY_REQUESTS)); + } finally { + for (var ts : internalCluster().getInstances(TransportService.class)) { + ((MockTransportService) ts).clearAllRules(); + } + } + } + public static class LocalStateEnrich extends LocalStateCompositeXPackPlugin { public LocalStateEnrich(final Settings settings, final Path configPath) throws Exception { diff --git a/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/ManyShardsIT.java b/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/ManyShardsIT.java index fb598cb855013..1ce92ded8acc6 100644 --- a/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/ManyShardsIT.java +++ b/x-pack/plugin/esql/src/internalClusterTest/java/org/elasticsearch/xpack/esql/action/ManyShardsIT.java @@ -8,14 +8,24 @@ package org.elasticsearch.xpack.esql.action; import org.apache.lucene.tests.util.LuceneTestCase; +import org.elasticsearch.ExceptionsHelper; +import org.elasticsearch.action.ActionListener; import org.elasticsearch.action.bulk.BulkRequestBuilder; import 
org.elasticsearch.action.index.IndexRequest; import org.elasticsearch.action.support.WriteRequest; import org.elasticsearch.cluster.metadata.IndexMetadata; import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.common.util.concurrent.EsRejectedExecutionException; +import org.elasticsearch.compute.operator.exchange.ExchangeService; import org.elasticsearch.plugins.Plugin; +import org.elasticsearch.rest.RestStatus; import org.elasticsearch.search.MockSearchService; import org.elasticsearch.search.SearchService; +import org.elasticsearch.test.transport.MockTransportService; +import org.elasticsearch.transport.RemoteTransportException; +import org.elasticsearch.transport.TransportChannel; +import org.elasticsearch.transport.TransportResponse; +import org.elasticsearch.transport.TransportService; import org.elasticsearch.xpack.esql.plugin.QueryPragmas; import org.hamcrest.Matchers; import org.junit.Before; @@ -27,6 +37,10 @@ import java.util.concurrent.CountDownLatch; import java.util.concurrent.TimeUnit; import java.util.concurrent.atomic.AtomicInteger; +import java.util.concurrent.atomic.AtomicReference; + +import static org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.instanceOf; /** * Make sures that we can run many concurrent requests with large number of shards with any data_partitioning. @@ -38,6 +52,7 @@ public class ManyShardsIT extends AbstractEsqlIntegTestCase { protected Collection> getMockPlugins() { var plugins = new ArrayList<>(super.getMockPlugins()); plugins.add(MockSearchService.TestPlugin.class); + plugins.add(MockTransportService.TestPlugin.class); return plugins; } @@ -97,6 +112,51 @@ public void testConcurrentQueries() throws Exception { } } + public void testRejection() throws Exception { + String[] nodes = internalCluster().getNodeNames(); + for (String node : nodes) { + MockTransportService ts = (MockTransportService) internalCluster().getInstance(TransportService.class, node); + ts.addRequestHandlingBehavior(ExchangeService.EXCHANGE_ACTION_NAME, (handler, request, channel, task) -> { + handler.messageReceived(request, new TransportChannel() { + @Override + public String getProfileName() { + return channel.getProfileName(); + } + + @Override + public void sendResponse(TransportResponse response) { + channel.sendResponse(new RemoteTransportException("simulated", new EsRejectedExecutionException("test queue"))); + } + + @Override + public void sendResponse(Exception exception) { + channel.sendResponse(exception); + } + }, task); + }); + } + try { + AtomicReference failure = new AtomicReference<>(); + EsqlQueryRequest request = new EsqlQueryRequest(); + request.query("from test-* | stats count(user) by tags"); + request.acceptedPragmaRisks(true); + request.pragmas(randomPragmas()); + CountDownLatch queryLatch = new CountDownLatch(1); + client().execute(EsqlQueryAction.INSTANCE, request, ActionListener.runAfter(ActionListener.wrap(r -> { + r.close(); + throw new AssertionError("expected failure"); + }, failure::set), queryLatch::countDown)); + assertTrue(queryLatch.await(10, TimeUnit.SECONDS)); + assertThat(failure.get(), instanceOf(EsRejectedExecutionException.class)); + assertThat(ExceptionsHelper.status(failure.get()), equalTo(RestStatus.TOO_MANY_REQUESTS)); + assertThat(failure.get().getMessage(), equalTo("test queue")); + } finally { + for (String node : nodes) { + ((MockTransportService) internalCluster().getInstance(TransportService.class, node)).clearAllRules(); + } + } + } + static class SearchContextCounter { private final 
int maxAllowed; private final AtomicInteger current = new AtomicInteger(); From 50871a3d28b413ff846497393459a3af1e937d3a Mon Sep 17 00:00:00 2001 From: Patrick Doyle <810052+prdoyle@users.noreply.github.com> Date: Wed, 28 Aug 2024 11:13:47 -0400 Subject: [PATCH 006/144] New injector (#111722) * Initial new injector * Allow createComponents to return classes * Downsample injection * Remove more vestiges of subtype handling * Lowercase logger * Respond to code review comments * Only one object per class * Some additional cleanup incl spotless * PR feedback * Missed one * Rename workQueue * Remove Injector.addRecordContents * TelemetryProvider requires us to inject an object using a supertype * Address Simon's comments * Clarify the reason for SuppressForbidden * Make log indentation code less intrusive --- server/src/main/java/module-info.java | 1 + .../org/elasticsearch/injection/Injector.java | 314 ++++++++++++++++++ .../injection/PlanInterpreter.java | 108 ++++++ .../org/elasticsearch/injection/Planner.java | 128 +++++++ .../elasticsearch/injection/api/Inject.java | 23 ++ .../elasticsearch/injection/package-info.java | 41 +++ .../injection/spec/ExistingInstanceSpec.java | 17 + .../injection/spec/InjectionSpec.java | 13 + .../injection/spec/MethodHandleSpec.java | 30 ++ .../injection/spec/ParameterSpec.java | 24 ++ .../injection/spec/package-info.java | 25 ++ .../injection/step/InjectionStep.java | 11 + .../injection/step/InstantiateStep.java | 17 + .../injection/step/package-info.java | 15 + .../elasticsearch/node/NodeConstruction.java | 70 ++-- .../node/PluginServiceInstances.java | 52 +++ .../injection/InjectorTests.java | 154 +++++++++ .../xpack/downsample/Downsample.java | 2 +- .../xpack/downsample/DownsampleMetrics.java | 5 +- 19 files changed, 1025 insertions(+), 25 deletions(-) create mode 100644 server/src/main/java/org/elasticsearch/injection/Injector.java create mode 100644 server/src/main/java/org/elasticsearch/injection/PlanInterpreter.java create mode 100644 server/src/main/java/org/elasticsearch/injection/Planner.java create mode 100644 server/src/main/java/org/elasticsearch/injection/api/Inject.java create mode 100644 server/src/main/java/org/elasticsearch/injection/package-info.java create mode 100644 server/src/main/java/org/elasticsearch/injection/spec/ExistingInstanceSpec.java create mode 100644 server/src/main/java/org/elasticsearch/injection/spec/InjectionSpec.java create mode 100644 server/src/main/java/org/elasticsearch/injection/spec/MethodHandleSpec.java create mode 100644 server/src/main/java/org/elasticsearch/injection/spec/ParameterSpec.java create mode 100644 server/src/main/java/org/elasticsearch/injection/spec/package-info.java create mode 100644 server/src/main/java/org/elasticsearch/injection/step/InjectionStep.java create mode 100644 server/src/main/java/org/elasticsearch/injection/step/InstantiateStep.java create mode 100644 server/src/main/java/org/elasticsearch/injection/step/package-info.java create mode 100644 server/src/main/java/org/elasticsearch/node/PluginServiceInstances.java create mode 100644 server/src/test/java/org/elasticsearch/injection/InjectorTests.java diff --git a/server/src/main/java/module-info.java b/server/src/main/java/module-info.java index d412748ed4e57..086bfece87172 100644 --- a/server/src/main/java/module-info.java +++ b/server/src/main/java/module-info.java @@ -190,6 +190,7 @@ exports org.elasticsearch.common.file; exports org.elasticsearch.common.geo; exports org.elasticsearch.common.hash; + exports 
org.elasticsearch.injection.api; exports org.elasticsearch.injection.guice; exports org.elasticsearch.injection.guice.binder; exports org.elasticsearch.injection.guice.internal; diff --git a/server/src/main/java/org/elasticsearch/injection/Injector.java b/server/src/main/java/org/elasticsearch/injection/Injector.java new file mode 100644 index 0000000000000..03fcf18509fcc --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/Injector.java @@ -0,0 +1,314 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection; + +import org.elasticsearch.injection.api.Inject; +import org.elasticsearch.injection.spec.ExistingInstanceSpec; +import org.elasticsearch.injection.spec.InjectionSpec; +import org.elasticsearch.injection.spec.MethodHandleSpec; +import org.elasticsearch.injection.spec.ParameterSpec; +import org.elasticsearch.injection.step.InjectionStep; +import org.elasticsearch.logging.LogManager; +import org.elasticsearch.logging.Logger; + +import java.lang.invoke.MethodHandle; +import java.lang.invoke.MethodHandles; +import java.lang.reflect.Constructor; +import java.util.ArrayDeque; +import java.util.Collection; +import java.util.HashSet; +import java.util.LinkedHashMap; +import java.util.List; +import java.util.Map; +import java.util.Queue; +import java.util.Set; +import java.util.stream.Stream; + +import static java.util.function.Predicate.not; +import static java.util.stream.Collectors.joining; +import static java.util.stream.Collectors.toCollection; +import static java.util.stream.Collectors.toMap; + +/** + * The main object for dependency injection. + *
+ * Allows the user to specify the requirements, then call {@link #inject} to create an object plus all its dependencies. + *
+ * Implementation note: this class itself contains logic for specifying the injection requirements; + * the actual injection operations are performed in other classes like {@link Planner} and {@link PlanInterpreter}, + */ +public final class Injector { + private static final Logger logger = LogManager.getLogger(Injector.class); + + /** + * The specifications supplied by the user, as opposed to those inferred by the injector. + */ + private final Map, InjectionSpec> seedSpecs; + + Injector(Map, InjectionSpec> seedSpecs) { + this.seedSpecs = seedSpecs; + } + + public static Injector create() { + return new Injector(new LinkedHashMap<>()); + } + + /** + * Instructs the injector to instantiate classToProcess + * in accordance with whatever annotations may be present on that class. + *
+     * There are only three ways the injector can find out that it must instantiate some class:
+     * <ol>
+     *     <li>This method</li>
+     *     <li>The parameter passed to {@link #inject}</li>
+     *     <li>A constructor parameter of some other class being instantiated,
+     *         having exactly the right class (not a supertype)</li>
+     * </ol>
+ * + * @return this + */ + public Injector addClass(Class classToProcess) { + MethodHandleSpec methodHandleSpec = methodHandleSpecFor(classToProcess); + var existing = seedSpecs.put(classToProcess, methodHandleSpec); + if (existing != null) { + throw new IllegalArgumentException("class " + classToProcess.getSimpleName() + " has already been added"); + } + return this; + } + + /** + * Equivalent to multiple chained calls to {@link #addClass}. + */ + public Injector addClasses(Collection> classesToProcess) { + classesToProcess.forEach(this::addClass); + return this; + } + + /** + * Equivalent to {@link #addInstance addInstance(object.getClass(), object)}. + */ + public Injector addInstance(Object object) { + @SuppressWarnings("unchecked") + Class actualClass = (Class) object.getClass(); // Whatever the runtime type is, it's represented by T + return addInstance(actualClass, actualClass.cast(object)); + } + + /** + * Equivalent to multiple calls to {@link #addInstance(Object)}. + */ + public Injector addInstances(Collection objects) { + for (var x : objects) { + addInstance(x); + } + return this; + } + + /** + * Indicates that object is to be injected for parameters of type type. + * The given object is treated as though it had been instantiated by the injector. + */ + public Injector addInstance(Class type, T object) { + assert type.isInstance(object); // No unchecked casting shenanigans allowed + var existing = seedSpecs.put(type, new ExistingInstanceSpec(type, object)); + if (existing != null) { + throw new IllegalStateException("There's already an object for " + type); + } + return this; + } + + /** + * Main entry point. Causes objects to be constructed. + * @return {@link Map} whose keys are all the requested resultTypes and whose values are all the instances of those types. + */ + public Map, Object> inject(Collection> resultTypes) { + resultTypes.forEach(this::ensureClassIsSpecified); + PlanInterpreter i = doInjection(); + return resultTypes.stream().collect(toMap(c -> c, i::theInstanceOf)); + } + + private void ensureClassIsSpecified(Class resultType) { + if (seedSpecs.containsKey(resultType) == false) { + addClass(resultType); + } + } + + private PlanInterpreter doInjection() { + logger.debug("Starting injection"); + Map, InjectionSpec> specMap = specClosure(seedSpecs); + Map, Object> existingInstances = new LinkedHashMap<>(); + specMap.values().forEach((spec) -> { + if (spec instanceof ExistingInstanceSpec e) { + existingInstances.put(e.requestedType(), e.instance()); + } + }); + PlanInterpreter interpreter = new PlanInterpreter(existingInstances); + interpreter.executePlan(injectionPlan(seedSpecs.keySet(), specMap)); + logger.debug("Done injection"); + return interpreter; + } + + /** + * Finds an {@link InjectionSpec} for every class the injector is capable of injecting. + *
+ * We do this once the injector is fully configured, with all calls to {@link #addClass} and {@link #addInstance} finished, + * so that we can easily build the complete picture of how injection should occur. + *
+ * This is not part of the planning process; it's just discovering all the things + * the injector needs to know about. This logic isn't concerned with ordering or dependency cycles. + * + * @param seedMap the injections the user explicitly asked for + * @return an {@link InjectionSpec} for every class the injector is capable of injecting. + */ + private static Map, InjectionSpec> specClosure(Map, InjectionSpec> seedMap) { + assert seedMapIsValid(seedMap); + + // For convenience, we pretend there's a gigantic method out there that takes + // all the seed types as parameters. + Queue workQueue = seedMap.values() + .stream() + .map(InjectionSpec::requestedType) + .map(Injector::syntheticParameterSpec) + .collect(toCollection(ArrayDeque::new)); + + // This map doubles as a checklist of classes we're already finished processing + Map, InjectionSpec> result = new LinkedHashMap<>(); + + ParameterSpec p; + while ((p = workQueue.poll()) != null) { + Class c = p.injectableType(); + InjectionSpec existingResult = result.get(c); + if (existingResult != null) { + logger.trace("Spec for {} already exists", c.getSimpleName()); + continue; + } + + InjectionSpec spec = seedMap.get(c); + if (spec instanceof ExistingInstanceSpec) { + // simple! + result.put(c, spec); + continue; + } + + // At this point, we know we'll need a MethodHandleSpec + MethodHandleSpec methodHandleSpec; + if (spec == null) { + // The user didn't specify this class; we must infer it now + spec = methodHandleSpec = methodHandleSpecFor(c); + } else if (spec instanceof MethodHandleSpec m) { + methodHandleSpec = m; + } else { + throw new AssertionError("Unexpected spec: " + spec); + } + + logger.trace("Inspecting parameters for constructor of {}", c); + for (var ps : methodHandleSpec.parameters()) { + logger.trace("Enqueue {}", ps); + workQueue.add(ps); + } + + registerSpec(spec, result); + } + + if (logger.isTraceEnabled()) { + logger.trace("Specs: {}", result.values().stream().map(Object::toString).collect(joining("\n\t", "\n\t", ""))); + } + return result; + } + + private static MethodHandleSpec methodHandleSpecFor(Class c) { + Constructor constructor = getSuitableConstructorIfAny(c); + if (constructor == null) { + throw new IllegalStateException("No suitable constructor for " + c); + } + + MethodHandle ctorHandle; + try { + ctorHandle = lookup().unreflectConstructor(constructor); + } catch (IllegalAccessException e) { + throw new IllegalStateException(e); + } + + List parameters = Stream.of(constructor.getParameters()).map(ParameterSpec::from).toList(); + + return new MethodHandleSpec(c, ctorHandle, parameters); + } + + /** + * @return true (unless an assertion fails). Never returns false. 
+ */ + private static boolean seedMapIsValid(Map, InjectionSpec> seed) { + seed.forEach( + (c, s) -> { assert s.requestedType().equals(c) : "Spec must be associated with its requestedType, not " + c + ": " + s; } + ); + return true; + } + + /** + * For the classes we've been explicitly asked to inject, + * pretend there's some massive method taking all of them as parameters + */ + private static ParameterSpec syntheticParameterSpec(Class c) { + return new ParameterSpec("synthetic_" + c.getSimpleName(), c, c); + } + + private static Constructor getSuitableConstructorIfAny(Class type) { + var constructors = Stream.of(type.getConstructors()).filter(not(Constructor::isSynthetic)).toList(); + if (constructors.size() == 1) { + return constructors.get(0); + } + var injectConstructors = constructors.stream().filter(c -> c.isAnnotationPresent(Inject.class)).toList(); + if (injectConstructors.size() == 1) { + return injectConstructors.get(0); + } + logger.trace("No suitable constructor for {}", type); + return null; + } + + private static void registerSpec(InjectionSpec spec, Map, InjectionSpec> specsByClass) { + Class requestedType = spec.requestedType(); + var existing = specsByClass.put(requestedType, spec); + if (existing == null || existing.equals(spec)) { + logger.trace("Register spec: {}", spec); + } else { + throw new IllegalStateException("Ambiguous specifications for " + requestedType + ": " + existing + " and " + spec); + } + } + + private List injectionPlan(Set> requiredClasses, Map, InjectionSpec> specsByClass) { + logger.trace("Constructing instantiation plan"); + Set> allParameterTypes = new HashSet<>(); + specsByClass.values().forEach(spec -> { + if (spec instanceof MethodHandleSpec m) { + m.parameters().stream().map(ParameterSpec::injectableType).forEachOrdered(allParameterTypes::add); + } + }); + + var plan = new Planner(specsByClass, requiredClasses, allParameterTypes).injectionPlan(); + if (logger.isDebugEnabled()) { + logger.debug("Injection plan: {}", plan.stream().map(Object::toString).collect(joining("\n\t", "\n\t", ""))); + } + return plan; + } + + /** + * Evolution note: there may be cases in the where we allow the user to + * supply a {@link java.lang.invoke.MethodHandles.Lookup} for convenience, + * so that they aren't required to make things public just to participate in injection. + */ + private static MethodHandles.Lookup lookup() { + return MethodHandles.publicLookup(); + } + +} diff --git a/server/src/main/java/org/elasticsearch/injection/PlanInterpreter.java b/server/src/main/java/org/elasticsearch/injection/PlanInterpreter.java new file mode 100644 index 0000000000000..cf38dbcb24b7d --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/PlanInterpreter.java @@ -0,0 +1,108 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.injection; + +import org.elasticsearch.core.SuppressForbidden; +import org.elasticsearch.injection.spec.MethodHandleSpec; +import org.elasticsearch.injection.spec.ParameterSpec; +import org.elasticsearch.injection.step.InjectionStep; +import org.elasticsearch.injection.step.InstantiateStep; +import org.elasticsearch.logging.LogManager; +import org.elasticsearch.logging.Logger; + +import java.util.LinkedHashMap; +import java.util.List; +import java.util.Map; + +/** + * Performs the actual injection operations by running the {@link InjectionStep}s. + *
+ * The intent is that this logic is as simple as possible so that we don't run complex injection + * logic alongside the user-supplied constructor logic. All the injector complexity is already + * supposed to have happened in the planning phase. In particular, no injection-related errors + * are supposed to be detected during execution; they should be detected during planning and validation. + * All exceptions thrown during execution are supposed to be caused by user-supplied code. + * + *
+ * Execution model: + * The state of the injector during injection comprises a map from classes to objects. + * Before any steps execute, the map is pre-populated by object instances added via + * {@link Injector#addInstance(Object)} Injector.addInstance}, + * and then the steps begin to execute, reading and writing from this map. + * Some steps create objects and add them to this map; others manipulate the map itself. + */ +final class PlanInterpreter { + private static final Logger logger = LogManager.getLogger(PlanInterpreter.class); + private final Map, Object> instances = new LinkedHashMap<>(); + + PlanInterpreter(Map, Object> existingInstances) { + existingInstances.forEach(this::addInstance); + } + + /** + * Main entry point. Contains the implementation logic for each {@link InjectionStep}. + */ + void executePlan(List plan) { + int numConstructorCalls = 0; + for (InjectionStep step : plan) { + if (step instanceof InstantiateStep i) { + MethodHandleSpec spec = i.spec(); + logger.trace("Instantiating {}", spec.requestedType().getSimpleName()); + addInstance(spec.requestedType(), instantiate(spec)); + ++numConstructorCalls; + } else { + // TODO: switch patterns would make this unnecessary + assert false : "Unexpected step type: " + step.getClass().getSimpleName(); + throw new IllegalStateException("Unexpected step type: " + step.getClass().getSimpleName()); + } + } + logger.debug("Instantiated {} objects", numConstructorCalls); + } + + /** + * @return the list element corresponding to instances.get(type).get(0), + * assuming that instances.get(type) has exactly one element. + * @throws IllegalStateException if instances.get(type) does not have exactly one element + */ + public T theInstanceOf(Class type) { + Object instance = instances.get(type); + if (instance == null) { + throw new IllegalStateException("No object of type " + type.getSimpleName()); + } + return type.cast(instance); + } + + private void addInstance(Class requestedType, Object instance) { + Object old = instances.put(requestedType, instance); + if (old != null) { + throw new IllegalStateException("Multiple objects for " + requestedType); + } + } + + /** + * @throws IllegalStateException if the MethodHandle throws. + */ + @SuppressForbidden( + reason = "Can't call invokeExact because we don't know the method argument types statically, " + + "since each constructor has a different signature" + ) + private Object instantiate(MethodHandleSpec spec) { + Object[] args = spec.parameters().stream().map(this::parameterValue).toArray(); + try { + return spec.methodHandle().invokeWithArguments(args); + } catch (Throwable e) { + throw new IllegalStateException("Unexpected exception while instantiating {}" + spec, e); + } + } + + private Object parameterValue(ParameterSpec parameterSpec) { + return theInstanceOf(parameterSpec.formalType()); + } + +} diff --git a/server/src/main/java/org/elasticsearch/injection/Planner.java b/server/src/main/java/org/elasticsearch/injection/Planner.java new file mode 100644 index 0000000000000..4b6af05d57c04 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/Planner.java @@ -0,0 +1,128 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.injection; + +import org.elasticsearch.injection.spec.ExistingInstanceSpec; +import org.elasticsearch.injection.spec.InjectionSpec; +import org.elasticsearch.injection.spec.MethodHandleSpec; +import org.elasticsearch.injection.step.InjectionStep; +import org.elasticsearch.injection.step.InstantiateStep; +import org.elasticsearch.logging.LogManager; +import org.elasticsearch.logging.Logger; + +import java.util.ArrayList; +import java.util.HashSet; +import java.util.List; +import java.util.Map; +import java.util.Set; +import java.util.function.Supplier; + +import static java.util.Collections.unmodifiableMap; +import static java.util.Collections.unmodifiableSet; + +/** + * Evolution note: the intent is to plan one domain/subsystem at a time. + */ +final class Planner { + private static final Logger logger = LogManager.getLogger(Planner.class); + + final List plan; + final Map, InjectionSpec> specsByClass; + final Set> requiredTypes; // The injector's job is to ensure there is an instance of these; this is like the "root set" + final Set> allParameterTypes; // All the injectable types in all dependencies (recursively) of all required types + final Set startedPlanning; + final Set finishedPlanning; + final Set> alreadyProxied; + + /** + * @param specsByClass an {@link InjectionSpec} indicating how each class should be injected + * @param requiredTypes the classes of which we need instances + * @param allParameterTypes the classes that appear as the type of any parameter of any constructor we might call + */ + Planner(Map, InjectionSpec> specsByClass, Set> requiredTypes, Set> allParameterTypes) { + this.requiredTypes = requiredTypes; + this.plan = new ArrayList<>(); + this.specsByClass = unmodifiableMap(specsByClass); + this.allParameterTypes = unmodifiableSet(allParameterTypes); + this.startedPlanning = new HashSet<>(); + this.finishedPlanning = new HashSet<>(); + this.alreadyProxied = new HashSet<>(); + } + + /** + * Intended to be called once. + *
+ * Note that not all proxies are resolved once this plan has been executed. + *
+ * + * Evolution note: in a world with multiple domains/subsystems, + * it will become necessary to defer proxy resolution until after other plans + * have been executed, because they could create additional objects that ought + * to be included in the proxies created by this plan. + * + * @return the {@link InjectionStep} objects listed in execution order. + */ + List injectionPlan() { + for (Class c : requiredTypes) { + planForClass(c, 0); + } + return plan; + } + + /** + * Recursive procedure that determines what effect requestedClass + * should have on the plan under construction. + * + * @param depth is used just for indenting the logs + */ + private void planForClass(Class requestedClass, int depth) { + InjectionSpec spec = specsByClass.get(requestedClass); + if (spec == null) { + throw new IllegalStateException("Cannot instantiate " + requestedClass + ": no specification provided"); + } + planForSpec(spec, depth); + } + + private void planForSpec(InjectionSpec spec, int depth) { + if (finishedPlanning.contains(spec)) { + logger.trace("{}Already planned {}", indent(depth), spec); + return; + } + + logger.trace("{}Planning for {}", indent(depth), spec); + if (startedPlanning.add(spec) == false) { + // TODO: Better cycle detection and reporting. Use SCCs + throw new IllegalStateException("Cyclic dependency involving " + spec); + } + + if (spec instanceof MethodHandleSpec m) { + for (var p : m.parameters()) { + logger.trace("{}- Recursing into {} for actual parameter {}", indent(depth), p.injectableType(), p); + planForClass(p.injectableType(), depth + 1); + } + addStep(new InstantiateStep(m), depth); + } else if (spec instanceof ExistingInstanceSpec e) { + logger.trace("{}- Plan {}", indent(depth), e); + // Nothing to do. The injector will already have the required object. + } else { + throw new AssertionError("Unexpected injection spec: " + spec); + } + + finishedPlanning.add(spec); + } + + private void addStep(InjectionStep newStep, int depth) { + logger.trace("{}- Add step {}", indent(depth), newStep); + plan.add(newStep); + } + + private static Supplier indent(int depth) { + return () -> "\t".repeat(depth); + } +} diff --git a/server/src/main/java/org/elasticsearch/injection/api/Inject.java b/server/src/main/java/org/elasticsearch/injection/api/Inject.java new file mode 100644 index 0000000000000..d5c57d1e5e2e2 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/api/Inject.java @@ -0,0 +1,23 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.api; + +import java.lang.annotation.Retention; +import java.lang.annotation.Target; + +import static java.lang.annotation.ElementType.CONSTRUCTOR; +import static java.lang.annotation.RetentionPolicy.RUNTIME; + +/** + * Designates a constructor to be called by the injector. 
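+ * <p>
+ * A minimal sketch of the intended use, where a class has more than one public constructor
+ * (the class and parameter names here are illustrative, not part of this change):
+ * <pre>{@code
+ * public class ExampleComponent {
+ *     @Inject
+ *     public ExampleComponent(ExampleDependency dependency) {
+ *         // the injector calls this constructor, because it is annotated
+ *     }
+ *
+ *     public ExampleComponent() {
+ *         // not used by the injector while the annotated constructor is present
+ *     }
+ * }
+ * }</pre>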
+ */ +@Target(CONSTRUCTOR) +@Retention(RUNTIME) +public @interface Inject { +} diff --git a/server/src/main/java/org/elasticsearch/injection/package-info.java b/server/src/main/java/org/elasticsearch/injection/package-info.java new file mode 100644 index 0000000000000..01dd1e878651c --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/package-info.java @@ -0,0 +1,41 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +/** + * Our dependency injection technologies: our bespoke injector, plus our legacy vendored version of Google Guice. + *
+ * <h2>Usage</h2>
+ * The new injector is {@link org.elasticsearch.injection.Injector}. + * You create an instance using {@link org.elasticsearch.injection.Injector#create()}, + * call various methods like {@link org.elasticsearch.injection.Injector#addClass} to configure it, + * then call {@link org.elasticsearch.injection.Injector#inject} to cause the constructors to be called. + * + *
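+ * <p>
+ * A minimal usage sketch ({@code SomeService}, {@code Settings} and the {@code settings} instance
+ * are hypothetical stand-ins, not part of this change):
+ * <pre>{@code
+ * Injector injector = Injector.create();
+ * injector.addClass(SomeService.class);            // instantiated by calling its constructor
+ * injector.addInstance(Settings.class, settings);  // supplied ready-made, injected as-is
+ * Map<Class<?>, Object> components = injector.inject(List.of(SomeService.class));
+ * SomeService service = (SomeService) components.get(SomeService.class);
+ * }</pre>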
+ * <h2>Operation</h2>
+ * Injection proceeds in three phases:
+ * <ol>
+ *     <li>Configuration: the {@link org.elasticsearch.injection.Injector} captures the user's
+ *         intent in the form of {@link org.elasticsearch.injection.spec.InjectionSpec} objects,
+ *         one for each class.</li>
+ *     <li>Planning: the {@link org.elasticsearch.injection.Planner} analyzes the
+ *         {@link org.elasticsearch.injection.spec.InjectionSpec} objects, validates them,
+ *         and generates a plan in the form of a list of {@link org.elasticsearch.injection.step.InjectionStep} objects.</li>
+ *     <li>Execution: the {@link org.elasticsearch.injection.PlanInterpreter} runs
+ *         the steps in the plan, in sequence, to actually instantiate the objects and pass them
+ *         to each other's constructors.</li>
+ * </ol>
+ * + *
+ * <h2>Google Guice</h2>
+ * The older injector, based on Google Guice, is in the {@code guice} package. + * The new injector is unrelated to Guice, and is intended to replace Guice eventually. + */ +package org.elasticsearch.injection; diff --git a/server/src/main/java/org/elasticsearch/injection/spec/ExistingInstanceSpec.java b/server/src/main/java/org/elasticsearch/injection/spec/ExistingInstanceSpec.java new file mode 100644 index 0000000000000..f443e045442c9 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/spec/ExistingInstanceSpec.java @@ -0,0 +1,17 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.spec; + +public record ExistingInstanceSpec(Class requestedType, Object instance) implements InjectionSpec { + @Override + public String toString() { + // Don't call instance.toString; who knows what that will return + return "ExistingInstanceSpec[" + "requestedType=" + requestedType + ']'; + } +} diff --git a/server/src/main/java/org/elasticsearch/injection/spec/InjectionSpec.java b/server/src/main/java/org/elasticsearch/injection/spec/InjectionSpec.java new file mode 100644 index 0000000000000..552d2c2ba9ebb --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/spec/InjectionSpec.java @@ -0,0 +1,13 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.spec; + +public sealed interface InjectionSpec permits MethodHandleSpec, ExistingInstanceSpec { + Class requestedType(); +} diff --git a/server/src/main/java/org/elasticsearch/injection/spec/MethodHandleSpec.java b/server/src/main/java/org/elasticsearch/injection/spec/MethodHandleSpec.java new file mode 100644 index 0000000000000..06c4cd0faac63 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/spec/MethodHandleSpec.java @@ -0,0 +1,30 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.spec; + +import java.lang.invoke.MethodHandle; +import java.util.List; +import java.util.Objects; + +/** + * Indicates that a type should be instantiated by calling the given {@link java.lang.invoke.MethodHandle}. + *
+ * Design note: the intent is that the semantics are fully specified by this record, + * and no additional reflection logic is required to determine how the object should be injected. + * Roughly speaking: all the reflection should be finished, and the results should be stored in this object. + */ +public record MethodHandleSpec(Class requestedType, MethodHandle methodHandle, List parameters) implements InjectionSpec { + public MethodHandleSpec { + assert Objects.equals(methodHandle.type().parameterList(), parameters.stream().map(ParameterSpec::formalType).toList()) + : "MethodHandle parameter types must match the supplied parameter info; " + + methodHandle.type().parameterList() + + " vs " + + parameters; + } +} diff --git a/server/src/main/java/org/elasticsearch/injection/spec/ParameterSpec.java b/server/src/main/java/org/elasticsearch/injection/spec/ParameterSpec.java new file mode 100644 index 0000000000000..da15bd024fbf4 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/spec/ParameterSpec.java @@ -0,0 +1,24 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.spec; + +import java.lang.reflect.Parameter; + +/** + * Captures the pertinent info required to inject one of the arguments of a constructor. + * @param name is for troubleshooting; it's not strictly needed + * @param formalType is the declared class of the parameter + * @param injectableType is the target type of the injection dependency + */ +public record ParameterSpec(String name, Class formalType, Class injectableType) { + public static ParameterSpec from(Parameter parameter) { + // We currently have no cases where the formal and injectable types are different. + return new ParameterSpec(parameter.getName(), parameter.getType(), parameter.getType()); + } +} diff --git a/server/src/main/java/org/elasticsearch/injection/spec/package-info.java b/server/src/main/java/org/elasticsearch/injection/spec/package-info.java new file mode 100644 index 0000000000000..26cb1e8ff8543 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/spec/package-info.java @@ -0,0 +1,25 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +/** + * Objects that describe the means by which an object instance is created for (or associated with) some given type. + *
+ * The hierarchy is rooted at {@link org.elasticsearch.injection.spec.InjectionSpec}. + *
+ * Differs from {@link org.elasticsearch.injection.step.InjectionStep InjectionStep} in that:
+ * <ul>
+ *     <li>this describes the requirements, while InjectionStep describes the solution</li>
+ *     <li>this is declarative, while InjectionStep is imperative</li>
+ * </ul>
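+ * <p>
+ * As a sketch (the {@code Foo} and {@code Bar} classes and {@code fooConstructorHandle} are
+ * hypothetical): a constructor {@code Foo(Bar bar)} is described by
+ * <pre>{@code
+ * new MethodHandleSpec(Foo.class, fooConstructorHandle, List.of(new ParameterSpec("bar", Bar.class, Bar.class)))
+ * }</pre>
+ * while an object registered up front via {@code Injector.addInstance} is described by an
+ * {@code ExistingInstanceSpec} holding the instance itself.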
+ */ +package org.elasticsearch.injection.spec; diff --git a/server/src/main/java/org/elasticsearch/injection/step/InjectionStep.java b/server/src/main/java/org/elasticsearch/injection/step/InjectionStep.java new file mode 100644 index 0000000000000..6e27f45b4f4df --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/step/InjectionStep.java @@ -0,0 +1,11 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.step; + +public sealed interface InjectionStep permits InstantiateStep {} diff --git a/server/src/main/java/org/elasticsearch/injection/step/InstantiateStep.java b/server/src/main/java/org/elasticsearch/injection/step/InstantiateStep.java new file mode 100644 index 0000000000000..2342978dcfdb0 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/step/InstantiateStep.java @@ -0,0 +1,17 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.injection.step; + +import org.elasticsearch.injection.spec.MethodHandleSpec; + +/** + * Constructs a new object by invoking a {@link java.lang.invoke.MethodHandle} + * as specified by a given {@link MethodHandleSpec}. + */ +public record InstantiateStep(MethodHandleSpec spec) implements InjectionStep {} diff --git a/server/src/main/java/org/elasticsearch/injection/step/package-info.java b/server/src/main/java/org/elasticsearch/injection/step/package-info.java new file mode 100644 index 0000000000000..c0a3e05cb53f6 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/injection/step/package-info.java @@ -0,0 +1,15 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +/** + * Objects that describe one operation to be performed by the PlanInterpreter. + * Injection is achieved by executing the steps in order. + *
+ * <p>
+ * See PlanInterpreter for more details on the execution model. + */ +package org.elasticsearch.injection.step; diff --git a/server/src/main/java/org/elasticsearch/node/NodeConstruction.java b/server/src/main/java/org/elasticsearch/node/NodeConstruction.java index ec0d293dc0064..eb9ef08b329ab 100644 --- a/server/src/main/java/org/elasticsearch/node/NodeConstruction.java +++ b/server/src/main/java/org/elasticsearch/node/NodeConstruction.java @@ -80,6 +80,7 @@ import org.elasticsearch.common.util.BigArrays; import org.elasticsearch.common.util.PageCacheRecycler; import org.elasticsearch.core.IOUtils; +import org.elasticsearch.core.SuppressForbidden; import org.elasticsearch.core.TimeValue; import org.elasticsearch.core.Tuple; import org.elasticsearch.discovery.DiscoveryModule; @@ -216,6 +217,7 @@ import java.util.ArrayList; import java.util.Arrays; import java.util.Collection; +import java.util.IdentityHashMap; import java.util.LinkedHashSet; import java.util.List; import java.util.Locale; @@ -228,6 +230,9 @@ import java.util.stream.Collectors; import java.util.stream.Stream; +import static java.lang.invoke.MethodHandles.lookup; +import static java.util.Collections.newSetFromMap; +import static java.util.function.Predicate.not; import static org.elasticsearch.core.Types.forciblyCast; /** @@ -831,27 +836,6 @@ private void construct( metadataCreateIndexService ); - record PluginServiceInstances( - Client client, - ClusterService clusterService, - RerouteService rerouteService, - ThreadPool threadPool, - ResourceWatcherService resourceWatcherService, - ScriptService scriptService, - NamedXContentRegistry xContentRegistry, - Environment environment, - NodeEnvironment nodeEnvironment, - NamedWriteableRegistry namedWriteableRegistry, - IndexNameExpressionResolver indexNameExpressionResolver, - RepositoriesService repositoriesService, - TelemetryProvider telemetryProvider, - AllocationService allocationService, - IndicesService indicesService, - FeatureService featureService, - SystemIndices systemIndices, - DataStreamGlobalRetentionSettings dataStreamGlobalRetentionSettings, - DocumentParsingProvider documentParsingProvider - ) implements Plugin.PluginServices {} PluginServiceInstances pluginServices = new PluginServiceInstances( client, clusterService, @@ -874,7 +858,30 @@ record PluginServiceInstances( documentParsingProvider ); - Collection pluginComponents = pluginsService.flatMap(p -> p.createComponents(pluginServices)).toList(); + Collection pluginComponents = pluginsService.flatMap(plugin -> { + Collection allItems = plugin.createComponents(pluginServices); + List componentObjects = allItems.stream().filter(not(x -> x instanceof Class)).toList(); + List> classes = allItems.stream().filter(x -> x instanceof Class).map(x -> (Class) x).toList(); + + // Then, injection + Collection componentsFromInjector; + if (classes.isEmpty()) { + componentsFromInjector = Set.of(); + } else { + logger.debug("Using injector to instantiate classes for {}: {}", plugin.getClass().getSimpleName(), classes); + var injector = org.elasticsearch.injection.Injector.create(); + injector.addInstances(componentObjects); + addRecordContents(injector, pluginServices); + var resultMap = injector.inject(classes); + // For now, assume we want all components added to the Guice injector + var distinctObjects = newSetFromMap(new IdentityHashMap<>()); + distinctObjects.addAll(resultMap.values()); + componentsFromInjector = distinctObjects; + } + + // Return both + return Stream.of(componentObjects, 
componentsFromInjector).flatMap(Collection::stream).toList(); + }).toList(); var terminationHandlers = pluginsService.loadServiceProviders(TerminationHandlerProvider.class) .stream() @@ -1175,6 +1182,24 @@ record PluginServiceInstances( postInjection(clusterModule, actionModule, clusterService, transportService, featureService); } + /** + * For each "component" (getter) c of a {@link Record}, + * calls {@link org.elasticsearch.injection.Injector#addInstance(Object) Injector.addInstance} + * to register the value with the component's declared type. + */ + @SuppressForbidden(reason = "Can't call invokeExact because we don't know the exact Record subtype statically") + private static void addRecordContents(org.elasticsearch.injection.Injector injector, Record r) { + for (var c : r.getClass().getRecordComponents()) { + try { + @SuppressWarnings("unchecked") + Class type = (Class) c.getType(); // T represents the declared type of the record component, whatever it is + injector.addInstance(type, type.cast(lookup().unreflect(c.getAccessor()).invoke(r))); + } catch (Throwable e) { + throw new IllegalStateException("Unable to read record component " + c, e); + } + } + } + private ClusterService createClusterService(SettingsModule settingsModule, ThreadPool threadPool, TaskManager taskManager) { ClusterService clusterService = new ClusterService( settingsModule.getSettings(), @@ -1595,4 +1620,5 @@ private Module loadPersistentTasksService( b.bind(PersistentTasksClusterService.class).toInstance(persistentTasksClusterService); }; } + } diff --git a/server/src/main/java/org/elasticsearch/node/PluginServiceInstances.java b/server/src/main/java/org/elasticsearch/node/PluginServiceInstances.java new file mode 100644 index 0000000000000..7c8775502fd64 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/node/PluginServiceInstances.java @@ -0,0 +1,52 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.node; + +import org.elasticsearch.client.internal.Client; +import org.elasticsearch.cluster.metadata.DataStreamGlobalRetentionSettings; +import org.elasticsearch.cluster.metadata.IndexNameExpressionResolver; +import org.elasticsearch.cluster.routing.RerouteService; +import org.elasticsearch.cluster.routing.allocation.AllocationService; +import org.elasticsearch.cluster.service.ClusterService; +import org.elasticsearch.common.io.stream.NamedWriteableRegistry; +import org.elasticsearch.env.Environment; +import org.elasticsearch.env.NodeEnvironment; +import org.elasticsearch.features.FeatureService; +import org.elasticsearch.indices.IndicesService; +import org.elasticsearch.indices.SystemIndices; +import org.elasticsearch.plugins.Plugin; +import org.elasticsearch.plugins.internal.DocumentParsingProvider; +import org.elasticsearch.repositories.RepositoriesService; +import org.elasticsearch.script.ScriptService; +import org.elasticsearch.telemetry.TelemetryProvider; +import org.elasticsearch.threadpool.ThreadPool; +import org.elasticsearch.watcher.ResourceWatcherService; +import org.elasticsearch.xcontent.NamedXContentRegistry; + +public record PluginServiceInstances( + Client client, + ClusterService clusterService, + RerouteService rerouteService, + ThreadPool threadPool, + ResourceWatcherService resourceWatcherService, + ScriptService scriptService, + NamedXContentRegistry xContentRegistry, + Environment environment, + NodeEnvironment nodeEnvironment, + NamedWriteableRegistry namedWriteableRegistry, + IndexNameExpressionResolver indexNameExpressionResolver, + RepositoriesService repositoriesService, + TelemetryProvider telemetryProvider, + AllocationService allocationService, + IndicesService indicesService, + FeatureService featureService, + SystemIndices systemIndices, + DataStreamGlobalRetentionSettings dataStreamGlobalRetentionSettings, + DocumentParsingProvider documentParsingProvider +) implements Plugin.PluginServices {} diff --git a/server/src/test/java/org/elasticsearch/injection/InjectorTests.java b/server/src/test/java/org/elasticsearch/injection/InjectorTests.java new file mode 100644 index 0000000000000..025596e640896 --- /dev/null +++ b/server/src/test/java/org/elasticsearch/injection/InjectorTests.java @@ -0,0 +1,154 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.injection; + +import org.elasticsearch.test.ESTestCase; + +import java.lang.invoke.MethodHandles; +import java.util.List; +import java.util.Set; + +public class InjectorTests extends ESTestCase { + + public record First() {} + + public record Second(First first) {} + + public record Third(First first, Second second) {} + + public record ExistingInstances(First first, Second second) {} + + public void testMultipleResultsMap() { + Injector injector = Injector.create().addClasses(List.of(Service1.class, Component3.class)); + var resultMap = injector.inject(List.of(Service1.class, Component3.class)); + assertEquals(Set.of(Service1.class, Component3.class), resultMap.keySet()); + Service1 service1 = (Service1) resultMap.get(Service1.class); + Component3 component3 = (Component3) resultMap.get(Component3.class); + assertSame(service1, component3.service1()); + } + + /** + * In most cases, if there are two objects that are instances of a class, that's ambiguous. + * However, if a concrete (non-abstract) superclass is configured directly, that is not ambiguous: + * the instance of that superclass takes precedence over any instances of any subclasses. + */ + public void testConcreteSubclass() { + MethodHandles.lookup(); + assertEquals( + Superclass.class, + Injector.create() + .addClasses(List.of(Superclass.class, Subclass.class)) // Superclass first + .inject(List.of(Superclass.class)) + .get(Superclass.class) + .getClass() + ); + MethodHandles.lookup(); + assertEquals( + Superclass.class, + Injector.create() + .addClasses(List.of(Subclass.class, Superclass.class)) // Subclass first + .inject(List.of(Superclass.class)) + .get(Superclass.class) + .getClass() + ); + MethodHandles.lookup(); + assertEquals( + Superclass.class, + Injector.create() + .addClasses(List.of(Subclass.class)) + .inject(List.of(Superclass.class)) // Superclass is not mentioned until here + .get(Superclass.class) + .getClass() + ); + } + + // + // Sad paths + // + + public void testBadInterfaceClass() { + assertThrows(IllegalStateException.class, () -> { + MethodHandles.lookup(); + Injector.create().addClass(Listener.class).inject(List.of()); + }); + } + + public void testBadUnknownType() { + // Injector knows only about Component4, discovers Listener, but can't find any subtypes + MethodHandles.lookup(); + Injector injector = Injector.create().addClass(Component4.class); + + assertThrows(IllegalStateException.class, () -> injector.inject(List.of())); + } + + public void testBadCircularDependency() { + assertThrows(IllegalStateException.class, () -> { + MethodHandles.lookup(); + Injector injector = Injector.create(); + injector.addClasses(List.of(Circular1.class, Circular2.class)).inject(List.of()); + }); + } + + /** + * For this one, we don't explicitly tell the injector about the classes involved in the cycle; + * it finds them on its own. 
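+ * (Discovery happens through constructor parameter types: {@code UsesCircular1} references
+ * {@code Circular1}, which refers back to itself via {@code Circular2}.)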
+ */ + public void testBadCircularDependencyViaParameter() { + record UsesCircular1(Circular1 circular1) {} + assertThrows(IllegalStateException.class, () -> { + MethodHandles.lookup(); + Injector.create().addClass(UsesCircular1.class).inject(List.of()); + }); + } + + public void testBadCircularDependencyViaSupertype() { + interface Service1 {} + record Service2(Service1 service1) {} + record Service3(Service2 service2) implements Service1 {} + assertThrows(IllegalStateException.class, () -> { + MethodHandles.lookup(); + Injector injector = Injector.create(); + injector.addClasses(List.of(Service2.class, Service3.class)).inject(List.of()); + }); + } + + // Common injectable things + + public record Service1() {} + + public interface Listener {} + + public record Component1() implements Listener {} + + public record Component2(Component1 component1) {} + + public record Component3(Service1 service1) {} + + public record Component4(Listener listener) {} + + public record GoodService(List components) {} + + public record BadService(List components) { + public BadService { + // Shouldn't be using the component list here! + assert components.isEmpty() == false; + } + } + + public record MultiService(List component1s, List component2s) {} + + public record Circular1(Circular2 service2) {} + + public record Circular2(Circular1 service2) {} + + public static class Superclass {} + + public static class Subclass extends Superclass {} + +} diff --git a/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/Downsample.java b/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/Downsample.java index a6ba4346b1a25..7dcda9c2b0032 100644 --- a/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/Downsample.java +++ b/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/Downsample.java @@ -137,6 +137,6 @@ public List getNamedWriteables() { @Override public Collection createComponents(PluginServices services) { - return List.of(new DownsampleMetrics(services.telemetryProvider().getMeterRegistry())); + return List.of(DownsampleMetrics.class); } } diff --git a/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/DownsampleMetrics.java b/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/DownsampleMetrics.java index c950658b411ed..b5ac4b0ae37a3 100644 --- a/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/DownsampleMetrics.java +++ b/x-pack/plugin/downsample/src/main/java/org/elasticsearch/xpack/downsample/DownsampleMetrics.java @@ -8,6 +8,7 @@ package org.elasticsearch.xpack.downsample; import org.elasticsearch.common.component.AbstractLifecycleComponent; +import org.elasticsearch.telemetry.TelemetryProvider; import org.elasticsearch.telemetry.metric.MeterRegistry; import java.io.IOException; @@ -36,8 +37,8 @@ public class DownsampleMetrics extends AbstractLifecycleComponent { private final MeterRegistry meterRegistry; - public DownsampleMetrics(MeterRegistry meterRegistry) { - this.meterRegistry = meterRegistry; + public DownsampleMetrics(TelemetryProvider telemetryProvider) { + this.meterRegistry = telemetryProvider.getMeterRegistry(); } @Override From 3dc21f99b6ceb0a4c233c3723a5a81ec40c0a9d6 Mon Sep 17 00:00:00 2001 From: Henning Andersen <33268011+henningandersen@users.noreply.github.com> Date: Wed, 28 Aug 2024 17:20:54 +0200 Subject: [PATCH 007/144] Avoid cache io field volatile accesses (#112184) The blob cache has an io field per region that is declared 
volatile, since it is originally null and then later initialized. However, during "tryRead" we do not need the volatile access. This commit changes the field to be non-volatile and use proper volatile accesses only when needed. --- .../shared/SharedBlobCacheService.java | 159 +++++++++++------- .../shared/SharedBlobCacheServiceTests.java | 9 +- 2 files changed, 105 insertions(+), 63 deletions(-) diff --git a/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java b/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java index 6a55738b864d1..3dfece0a9b20e 100644 --- a/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java +++ b/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java @@ -311,9 +311,9 @@ private CacheEntry(T chunk) { private final int numRegions; private final ConcurrentLinkedQueue freeRegions = new ConcurrentLinkedQueue<>(); - private final Cache cache; + private final Cache> cache; - private final ConcurrentHashMap regionOwners; // to assert exclusive access of regions + private final ConcurrentHashMap> regionOwners; // to assert exclusive access of regions private final LongAdder writeCount = new LongAdder(); private final LongAdder writeBytes = new LongAdder(); @@ -471,7 +471,7 @@ public int getRegionSize() { return regionSize; } - CacheFileRegion get(KeyType cacheKey, long fileLength, int region) { + CacheFileRegion get(KeyType cacheKey, long fileLength, int region) { return cache.get(cacheKey, fileLength, region).chunk; } @@ -516,7 +516,7 @@ public boolean maybeFetchFullEntry( return true; } final ActionListener regionListener = refCountingListener.acquire(ignored -> {}); - final CacheFileRegion entry; + final CacheFileRegion entry; try { entry = get(cacheKey, length, region); } catch (AlreadyClosedException e) { @@ -583,7 +583,7 @@ public void maybeFetchRegion( listener.onResponse(false); return; } - final CacheFileRegion entry = get(cacheKey, blobLength, region); + final CacheFileRegion entry = get(cacheKey, blobLength, region); entry.populate(regionRange, writer, fetchExecutor, listener); } catch (Exception e) { listener.onFailure(e); @@ -631,7 +631,7 @@ public void maybeFetchRange( listener.onResponse(false); return; } - final CacheFileRegion entry = get(cacheKey, blobLength, region); + final CacheFileRegion entry = get(cacheKey, blobLength, region); entry.populate( regionRange, writerWithOffset(writer, Math.toIntExact(range.start() - getRegionStart(region))), @@ -705,7 +705,7 @@ public int forceEvict(Predicate cacheKeyPredicate) { } // used by tests - int getFreq(CacheFileRegion cacheFileRegion) { + int getFreq(CacheFileRegion cacheFileRegion) { if (cache instanceof LFUCache lfuCache) { return lfuCache.getFreq(cacheFileRegion); } @@ -787,25 +787,45 @@ protected boolean assertOffsetsWithinFileLength(long offset, long length, long f /** * While this class has incRef and tryIncRef methods, incRefEnsureOpen and tryIncrefEnsureOpen should * always be used, ensuring the right ordering between incRef/tryIncRef and ensureOpen - * (see {@link LFUCache#maybeEvictAndTakeForFrequency(Runnable, int)}) + * (see {@link SharedBlobCacheService.LFUCache#maybeEvictAndTakeForFrequency(Runnable, int)}) */ - class CacheFileRegion extends EvictableRefCounted { + static class CacheFileRegion extends EvictableRefCounted { + + private static final VarHandle VH_IO = findIOVarHandle(); + + private static 
VarHandle findIOVarHandle() { + try { + return MethodHandles.lookup().in(CacheFileRegion.class).findVarHandle(CacheFileRegion.class, "io", SharedBytes.IO.class); + } catch (NoSuchFieldException | IllegalAccessException e) { + throw new RuntimeException(e); + } + } + + final SharedBlobCacheService blobCacheService; final RegionKey regionKey; final SparseFileTracker tracker; // io can be null when not init'ed or after evict/take - volatile SharedBytes.IO io = null; - - CacheFileRegion(RegionKey regionKey, int regionSize) { + // io does not need volatile access on the read path, since it goes from null to a single value (and then possbily back to null). + // "cache.get" never returns a `CacheFileRegion` without checking the value is non-null (with a volatile read, ensuring the value is + // visible in that thread). + // We assume any IndexInput passing among threads is done with proper happens-before semantics (otherwise they'd themselves break). + // In general, assertions should use `nonVolatileIO` (when they can) to access this over `volatileIO` to avoid memory visibility + // side effects + private SharedBytes.IO io = null; + + CacheFileRegion(SharedBlobCacheService blobCacheService, RegionKey regionKey, int regionSize) { + this.blobCacheService = blobCacheService; this.regionKey = regionKey; assert regionSize > 0; // NOTE we use a constant string for description to avoid consume extra heap space tracker = new SparseFileTracker("file", regionSize); } - public long physicalStartOffset() { - var ioRef = io; - return ioRef == null ? -1L : (long) regionKey.region * regionSize; + // only used for logging + private long physicalStartOffset() { + var ioRef = nonVolatileIO(); + return ioRef == null ? -1L : (long) regionKey.region * blobCacheService.regionSize; } public boolean tryIncRefEnsureOpen() { @@ -832,10 +852,10 @@ private void ensureOpenOrDecRef() { // tries to evict this chunk if noone is holding onto its resources anymore // visible for tests. boolean tryEvict() { - assert Thread.holdsLock(SharedBlobCacheService.this) : "must hold lock when evicting"; + assert Thread.holdsLock(blobCacheService) : "must hold lock when evicting"; if (refCount() <= 1 && evict()) { logger.trace("evicted {} with channel offset {}", regionKey, physicalStartOffset()); - evictCount.increment(); + blobCacheService.evictCount.increment(); decRef(); return true; } @@ -843,10 +863,10 @@ boolean tryEvict() { } boolean tryEvictNoDecRef() { - assert Thread.holdsLock(SharedBlobCacheService.this) : "must hold lock when evicting"; + assert Thread.holdsLock(blobCacheService) : "must hold lock when evicting"; if (refCount() <= 1 && evict()) { logger.trace("evicted and take {} with channel offset {}", regionKey, physicalStartOffset()); - evictCount.increment(); + blobCacheService.evictCount.increment(); return true; } @@ -854,10 +874,10 @@ boolean tryEvictNoDecRef() { } public boolean forceEvict() { - assert Thread.holdsLock(SharedBlobCacheService.this) : "must hold lock when evicting"; + assert Thread.holdsLock(blobCacheService) : "must hold lock when evicting"; if (evict()) { logger.trace("force evicted {} with channel offset {}", regionKey, physicalStartOffset()); - evictCount.increment(); + blobCacheService.evictCount.increment(); decRef(); return true; } @@ -868,9 +888,10 @@ public boolean forceEvict() { protected void closeInternal() { // now actually free the region associated with this chunk // we held the "this" lock when this was evicted, hence if io is not filled in, chunk will never be registered. 
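+ // (This volatile read pairs with the volatile write in assignToSlot: a null io here means
+ // the region was never published, so there is nothing to hand back to freeRegions.)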
+ SharedBytes.IO io = volatileIO(); if (io != null) { - assert regionOwners.remove(io) == this; - freeRegions.add(io); + assert blobCacheService.regionOwners.remove(io) == this; + blobCacheService.freeRegions.add(io); } logger.trace("closed {} with channel offset {}", regionKey, physicalStartOffset()); } @@ -879,14 +900,31 @@ private static void throwAlreadyEvicted() { throwAlreadyClosed("File chunk is evicted"); } + private SharedBytes.IO volatileIO() { + return (SharedBytes.IO) VH_IO.getVolatile(this); + } + + private void volatileIO(SharedBytes.IO io) { + VH_IO.setVolatile(this, io); + } + + private SharedBytes.IO nonVolatileIO() { + return io; + } + + // for use in tests *only* + SharedBytes.IO testOnlyNonVolatileIO() { + return io; + } + /** * Optimistically try to read from the region * @return true if successful, i.e., not evicted and data available, false if evicted */ boolean tryRead(ByteBuffer buf, long offset) throws IOException { - SharedBytes.IO ioRef = this.io; + SharedBytes.IO ioRef = nonVolatileIO(); if (ioRef != null) { - int readBytes = ioRef.read(buf, getRegionRelativePosition(offset)); + int readBytes = ioRef.read(buf, blobCacheService.getRegionRelativePosition(offset)); if (isEvicted()) { buf.position(buf.position() - readBytes); return false; @@ -922,7 +960,7 @@ void populate( rangeToWrite, rangeToWrite, Assertions.ENABLED ? ActionListener.releaseAfter(ActionListener.running(() -> { - assert regionOwners.get(io) == this; + assert blobCacheService.regionOwners.get(nonVolatileIO()) == this; }), refs.acquire()) : refs.acquireListener() ); if (gaps.isEmpty()) { @@ -958,8 +996,8 @@ void populateAndRead( rangeToWrite, rangeToRead, ActionListener.releaseAfter(listener, refs.acquire()).delegateFailureAndWrap((l, success) -> { - var ioRef = io; - assert regionOwners.get(ioRef) == this; + var ioRef = nonVolatileIO(); + assert blobCacheService.regionOwners.get(ioRef) == this; final int start = Math.toIntExact(rangeToRead.start()); final int read = reader.onRangeAvailable(ioRef, start, start, Math.toIntExact(rangeToRead.length())); assert read == rangeToRead.length() @@ -970,7 +1008,7 @@ void populateAndRead( + '-' + rangeToRead.start() + ']'; - readCount.increment(); + blobCacheService.readCount.increment(); l.onResponse(read); }) ); @@ -1016,8 +1054,8 @@ private Runnable fillGapRunnable( ActionListener listener ) { return () -> ActionListener.run(listener, l -> { - var ioRef = io; - assert regionOwners.get(ioRef) == CacheFileRegion.this; + var ioRef = nonVolatileIO(); + assert blobCacheService.regionOwners.get(ioRef) == CacheFileRegion.this; assert CacheFileRegion.this.hasReferences() : CacheFileRegion.this; int start = Math.toIntExact(gap.start()); writer.fillCacheRange( @@ -1028,9 +1066,9 @@ private Runnable fillGapRunnable( Math.toIntExact(gap.end() - start), progress -> gap.onProgress(start + progress), l.map(unused -> { - assert regionOwners.get(ioRef) == CacheFileRegion.this; + assert blobCacheService.regionOwners.get(ioRef) == CacheFileRegion.this; assert CacheFileRegion.this.hasReferences() : CacheFileRegion.this; - writeCount.increment(); + blobCacheService.writeCount.increment(); gap.onCompletion(); return null; }).delegateResponse((delegate, e) -> failGapAndListener(gap, delegate, e)) @@ -1058,7 +1096,7 @@ public class CacheFile { private final KeyType cacheKey; private final long length; - private CacheEntry lastAccessedRegion; + private CacheEntry> lastAccessedRegion; private CacheFile(KeyType cacheKey, long length) { this.cacheKey = cacheKey; @@ -1161,7 +1199,7 @@ 
private int readSingleRegion( int region ) throws InterruptedException, ExecutionException { final PlainActionFuture readFuture = new PlainActionFuture<>(); - final CacheFileRegion fileRegion = get(cacheKey, length, region); + final CacheFileRegion fileRegion = get(cacheKey, length, region); final long regionStart = getRegionStart(region); fileRegion.populateAndRead( mapSubRangeToRegion(rangeToWrite, region), @@ -1193,7 +1231,7 @@ private int readMultiRegions( } ActionListener listener = listeners.acquire(i -> bytesRead.updateAndGet(j -> Math.addExact(i, j))); try { - final CacheFileRegion fileRegion = get(cacheKey, length, region); + final CacheFileRegion fileRegion = get(cacheKey, length, region); final long regionStart = getRegionStart(region); fileRegion.populateAndRead( mapSubRangeToRegion(rangeToWrite, region), @@ -1213,7 +1251,7 @@ private int readMultiRegions( return bytesRead.get(); } - private RangeMissingHandler writerWithOffset(RangeMissingHandler writer, CacheFileRegion fileRegion, int writeOffset) { + private RangeMissingHandler writerWithOffset(RangeMissingHandler writer, CacheFileRegion fileRegion, int writeOffset) { final RangeMissingHandler adjustedWriter; if (writeOffset == 0) { // no need to allocate a new capturing lambda if the offset isn't adjusted @@ -1263,8 +1301,8 @@ public void fillCacheRange( len, progressUpdater, Assertions.ENABLED ? ActionListener.runBefore(completionListener, () -> { - assert regionOwners.get(fileRegion.io) == fileRegion - : "File chunk [" + fileRegion.regionKey + "] no longer owns IO [" + fileRegion.io + "]"; + assert regionOwners.get(fileRegion.nonVolatileIO()) == fileRegion + : "File chunk [" + fileRegion.regionKey + "] no longer owns IO [" + fileRegion.nonVolatileIO() + "]"; }) : completionListener ); } @@ -1274,7 +1312,7 @@ public void fillCacheRange( return adjustedWriter; } - private RangeAvailableHandler readerWithOffset(RangeAvailableHandler reader, CacheFileRegion fileRegion, int readOffset) { + private RangeAvailableHandler readerWithOffset(RangeAvailableHandler reader, CacheFileRegion fileRegion, int readOffset) { final RangeAvailableHandler adjustedReader = (channel, channelPos, relativePos, len) -> reader.onRangeAvailable( channel, channelPos, @@ -1285,18 +1323,18 @@ private RangeAvailableHandler readerWithOffset(RangeAvailableHandler reader, Cac return (channel, channelPos, relativePos, len) -> { assert assertValidRegionAndLength(fileRegion, channelPos, len); final int bytesRead = adjustedReader.onRangeAvailable(channel, channelPos, relativePos, len); - assert regionOwners.get(fileRegion.io) == fileRegion - : "File chunk [" + fileRegion.regionKey + "] no longer owns IO [" + fileRegion.io + "]"; + assert regionOwners.get(fileRegion.nonVolatileIO()) == fileRegion + : "File chunk [" + fileRegion.regionKey + "] no longer owns IO [" + fileRegion.nonVolatileIO() + "]"; return bytesRead; }; } return adjustedReader; } - private boolean assertValidRegionAndLength(CacheFileRegion fileRegion, int channelPos, int len) { - assert fileRegion.io != null; + private boolean assertValidRegionAndLength(CacheFileRegion fileRegion, int channelPos, int len) { + assert fileRegion.nonVolatileIO() != null; assert fileRegion.hasReferences(); - assert regionOwners.get(fileRegion.io) == fileRegion; + assert regionOwners.get(fileRegion.nonVolatileIO()) == fileRegion; assert channelPos >= 0 && channelPos + len <= regionSize; return true; } @@ -1421,15 +1459,15 @@ public record Stats( public static final Stats EMPTY = new Stats(0, 0L, 0L, 0L, 0L, 0L, 0L, 
0L); } - private class LFUCache implements Cache { + private class LFUCache implements Cache> { - class LFUCacheEntry extends CacheEntry { + class LFUCacheEntry extends CacheEntry> { LFUCacheEntry prev; LFUCacheEntry next; int freq; volatile long lastAccessedEpoch; - LFUCacheEntry(CacheFileRegion chunk, long lastAccessed) { + LFUCacheEntry(CacheFileRegion chunk, long lastAccessed) { super(chunk); this.lastAccessedEpoch = lastAccessed; // todo: consider whether freq=1 is still right for new entries. @@ -1467,7 +1505,7 @@ public void close() { decayAndNewEpochTask.close(); } - int getFreq(CacheFileRegion cacheFileRegion) { + int getFreq(CacheFileRegion cacheFileRegion) { return keyMapping.get(cacheFileRegion.regionKey).freq; } @@ -1480,12 +1518,15 @@ public LFUCacheEntry get(KeyType cacheKey, long fileLength, int region) { var entry = keyMapping.get(regionKey); if (entry == null) { final int effectiveRegionSize = computeCacheFileRegionSize(fileLength, region); - entry = keyMapping.computeIfAbsent(regionKey, key -> new LFUCacheEntry(new CacheFileRegion(key, effectiveRegionSize), now)); + entry = keyMapping.computeIfAbsent( + regionKey, + key -> new LFUCacheEntry(new CacheFileRegion(SharedBlobCacheService.this, key, effectiveRegionSize), now) + ); } - // io is volatile, double locking is fine, as long as we assign it last. - if (entry.chunk.io == null) { + // checks using volatile, double locking is fine, as long as we assign io last. + if (entry.chunk.volatileIO() == null) { synchronized (entry.chunk) { - if (entry.chunk.io == null && entry.chunk.isEvicted() == false) { + if (entry.chunk.volatileIO() == null && entry.chunk.isEvicted() == false) { return initChunk(entry); } } @@ -1515,7 +1556,7 @@ public int forceEvict(Predicate cacheKeyPredicate) { for (LFUCacheEntry entry : matchingEntries) { int frequency = entry.freq; boolean evicted = entry.chunk.forceEvict(); - if (evicted && entry.chunk.io != null) { + if (evicted && entry.chunk.volatileIO() != null) { unlink(entry); keyMapping.remove(entry.chunk.regionKey, entry); evictedCount++; @@ -1576,7 +1617,7 @@ private void assignToSlot(LFUCacheEntry entry, SharedBytes.IO freeSlot) { } pushEntryToBack(entry); // assign io only when chunk is ready for use. Under lock to avoid concurrent tryEvict. - entry.chunk.io = freeSlot; + entry.chunk.volatileIO(freeSlot); } } @@ -1641,7 +1682,7 @@ private boolean assertChunkActiveOrEvicted(LFUCacheEntry entry) { assert entry.prev != null || entry.chunk.isEvicted(); } - SharedBytes.IO io = entry.chunk.io; + SharedBytes.IO io = entry.chunk.nonVolatileIO(); assert io != null || entry.chunk.isEvicted(); assert io == null || regionOwners.get(io) == entry.chunk || entry.chunk.isEvicted(); return true; @@ -1764,13 +1805,13 @@ private SharedBytes.IO maybeEvictAndTakeForFrequency(Runnable evictedNotificatio boolean evicted = entry.chunk.tryEvictNoDecRef(); if (evicted) { try { - SharedBytes.IO ioRef = entry.chunk.io; + SharedBytes.IO ioRef = entry.chunk.volatileIO(); if (ioRef != null) { try { if (entry.chunk.refCount() == 1) { // we own that one refcount (since we CAS'ed evicted to 1) // grab io, rely on incref'ers also checking evicted field. 
- entry.chunk.io = null; + entry.chunk.volatileIO(null); assert regionOwners.remove(ioRef) == entry.chunk; return ioRef; } @@ -1809,7 +1850,7 @@ public boolean maybeEvictLeastUsed() { synchronized (SharedBlobCacheService.this) { for (LFUCacheEntry entry = freqs[0]; entry != null; entry = entry.next) { boolean evicted = entry.chunk.tryEvict(); - if (evicted && entry.chunk.io != null) { + if (evicted && entry.chunk.volatileIO() != null) { unlink(entry); keyMapping.remove(entry.chunk.regionKey, entry); return true; diff --git a/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java b/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java index 597180a1d1c31..d7e8ad19382e5 100644 --- a/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java +++ b/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java @@ -149,7 +149,7 @@ public void testBasicEviction() throws IOException { } } - private static boolean tryEvict(SharedBlobCacheService.CacheFileRegion region1) { + private static boolean tryEvict(SharedBlobCacheService.CacheFileRegion region1) { if (randomBoolean()) { return region1.tryEvict(); } else { @@ -486,7 +486,7 @@ public void testGetMultiThreaded() throws IOException { ready.await(); for (int i = 0; i < iterations; ++i) { try { - SharedBlobCacheService.CacheFileRegion cacheFileRegion; + SharedBlobCacheService.CacheFileRegion cacheFileRegion; try { cacheFileRegion = cacheService.get(cacheKeys[i], fileLength, regions[i]); } catch (AlreadyClosedException e) { @@ -497,6 +497,7 @@ public void testGetMultiThreaded() throws IOException { if (yield[i] == 0) { Thread.yield(); } + assertNotNull(cacheFileRegion.testOnlyNonVolatileIO()); cacheFileRegion.decRef(); } if (evict[i] == 0) { @@ -865,7 +866,7 @@ public void testMaybeEvictLeastUsed() throws Exception { final DeterministicTaskQueue taskQueue = new DeterministicTaskQueue(); try ( NodeEnvironment environment = new NodeEnvironment(settings, TestEnvironment.newEnvironment(settings)); - var cacheService = new SharedBlobCacheService<>( + var cacheService = new SharedBlobCacheService( environment, settings, taskQueue.getThreadPool(), @@ -873,7 +874,7 @@ public void testMaybeEvictLeastUsed() throws Exception { BlobCacheMetrics.NOOP ) ) { - final Map.CacheFileRegion> cacheEntries = new HashMap<>(); + final Map> cacheEntries = new HashMap<>(); assertThat("All regions are free", cacheService.freeRegionCount(), equalTo(numRegions)); assertThat("Cache has no entries", cacheService.maybeEvictLeastUsed(), is(false)); From b20b8012d5437e51f966a4ac5abc05a2710367ba Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Thu, 29 Aug 2024 01:32:17 +1000 Subject: [PATCH 008/144] Mute org.elasticsearch.search.query.ScriptScoreQueryTests testScriptTermStatsNotAvailable #112290 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 26bded1d09dc8..6498413e33cf5 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -166,6 +166,9 @@ tests: - class: org.elasticsearch.search.query.ScriptScoreQueryTests method: testScriptTermStatsAvailable issue: https://github.com/elastic/elasticsearch/issues/112278 +- class: org.elasticsearch.search.query.ScriptScoreQueryTests + method: testScriptTermStatsNotAvailable + issue: 
https://github.com/elastic/elasticsearch/issues/112290 # Examples: # From d832e6ee0cda82ecffde9fc28c9dd90c629e29e1 Mon Sep 17 00:00:00 2001 From: David Turner Date: Wed, 28 Aug 2024 17:36:29 +0100 Subject: [PATCH 009/144] Extract `BlobStoreCorruptionUtils` (#112229) Makes these utility methods available to other test suites (to be added in future PRs). Relates #111954 --- .../blobstore/BlobStoreCorruptionIT.java | 68 +------------- .../blobstore/BlobStoreCorruptionUtils.java | 89 +++++++++++++++++++ 2 files changed, 90 insertions(+), 67 deletions(-) create mode 100644 test/framework/src/main/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionUtils.java diff --git a/server/src/internalClusterTest/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionIT.java b/server/src/internalClusterTest/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionIT.java index 422696d6b61c6..4665dc486a904 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionIT.java @@ -8,7 +8,6 @@ package org.elasticsearch.repositories.blobstore; -import org.apache.lucene.tests.mockfile.ExtrasFS; import org.elasticsearch.ElasticsearchException; import org.elasticsearch.action.ActionListener; import org.elasticsearch.action.admin.cluster.snapshots.restore.RestoreSnapshotResponse; @@ -23,18 +22,10 @@ import org.elasticsearch.repositories.fs.FsRepository; import org.elasticsearch.snapshots.AbstractSnapshotIntegTestCase; import org.elasticsearch.snapshots.SnapshotState; -import org.elasticsearch.test.ESTestCase; import org.elasticsearch.test.hamcrest.ElasticsearchAssertions; import org.junit.Before; -import java.io.IOException; -import java.nio.file.FileVisitResult; -import java.nio.file.Files; -import java.nio.file.Path; -import java.nio.file.SimpleFileVisitor; -import java.nio.file.attribute.BasicFileAttributes; import java.util.ArrayList; -import java.util.Base64; import java.util.List; public class BlobStoreCorruptionIT extends AbstractSnapshotIntegTestCase { @@ -57,7 +48,7 @@ public void testCorruptionDetection() throws Exception { flushAndRefresh(indexName); createSnapshot(repositoryName, snapshotName, List.of(indexName)); - final var corruptedFile = corruptRandomFile(repositoryRootPath); + final var corruptedFile = BlobStoreCorruptionUtils.corruptRandomFile(repositoryRootPath); final var corruptedFileType = RepositoryFileType.getRepositoryFileType(repositoryRootPath, corruptedFile); final var corruptionDetectors = new ArrayList, ?>>(); @@ -126,61 +117,4 @@ public void testCorruptionDetection() throws Exception { logger.info(Strings.format("--> corrupted [%s] and caught exception", corruptedFile), exception); } } - - private static Path corruptRandomFile(Path repositoryRootPath) throws IOException { - final var corruptedFileType = getRandomCorruptibleFileType(); - final var corruptedFile = getRandomFileToCorrupt(repositoryRootPath, corruptedFileType); - if (randomBoolean()) { - logger.info("--> deleting [{}]", corruptedFile); - Files.delete(corruptedFile); - } else { - corruptFileContents(corruptedFile); - } - return corruptedFile; - } - - private static void corruptFileContents(Path fileToCorrupt) throws IOException { - final var oldFileContents = Files.readAllBytes(fileToCorrupt); - logger.info("--> contents of [{}] before corruption: [{}]", fileToCorrupt, Base64.getEncoder().encodeToString(oldFileContents)); - final byte[] 
newFileContents = new byte[randomBoolean() ? oldFileContents.length : between(0, oldFileContents.length)]; - System.arraycopy(oldFileContents, 0, newFileContents, 0, newFileContents.length); - if (newFileContents.length == oldFileContents.length) { - final var corruptionPosition = between(0, newFileContents.length - 1); - newFileContents[corruptionPosition] = randomValueOtherThan(oldFileContents[corruptionPosition], ESTestCase::randomByte); - logger.info( - "--> updating byte at position [{}] from [{}] to [{}]", - corruptionPosition, - oldFileContents[corruptionPosition], - newFileContents[corruptionPosition] - ); - } else { - logger.info("--> truncating file from length [{}] to length [{}]", oldFileContents.length, newFileContents.length); - } - Files.write(fileToCorrupt, newFileContents); - logger.info("--> contents of [{}] after corruption: [{}]", fileToCorrupt, Base64.getEncoder().encodeToString(newFileContents)); - } - - private static RepositoryFileType getRandomCorruptibleFileType() { - return randomValueOtherThanMany( - // these blob types do not have reliable corruption detection, so we must skip them - t -> t == RepositoryFileType.ROOT_INDEX_N || t == RepositoryFileType.ROOT_INDEX_LATEST, - () -> randomFrom(RepositoryFileType.values()) - ); - } - - private static Path getRandomFileToCorrupt(Path repositoryRootPath, RepositoryFileType corruptedFileType) throws IOException { - final var corruptibleFiles = new ArrayList(); - Files.walkFileTree(repositoryRootPath, new SimpleFileVisitor<>() { - @Override - public FileVisitResult visitFile(Path filePath, BasicFileAttributes attrs) throws IOException { - if (ExtrasFS.isExtra(filePath.getFileName().toString()) == false - && RepositoryFileType.getRepositoryFileType(repositoryRootPath, filePath) == corruptedFileType) { - corruptibleFiles.add(filePath); - } - return super.visitFile(filePath, attrs); - } - }); - return randomFrom(corruptibleFiles); - } - } diff --git a/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionUtils.java b/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionUtils.java new file mode 100644 index 0000000000000..3670013f571e0 --- /dev/null +++ b/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/BlobStoreCorruptionUtils.java @@ -0,0 +1,89 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.repositories.blobstore; + +import org.apache.lucene.tests.mockfile.ExtrasFS; +import org.elasticsearch.logging.LogManager; +import org.elasticsearch.logging.Logger; +import org.elasticsearch.test.ESTestCase; + +import java.io.IOException; +import java.nio.file.FileVisitResult; +import java.nio.file.Files; +import java.nio.file.Path; +import java.nio.file.SimpleFileVisitor; +import java.nio.file.attribute.BasicFileAttributes; +import java.util.ArrayList; +import java.util.Base64; + +import static org.elasticsearch.test.ESTestCase.between; +import static org.elasticsearch.test.ESTestCase.randomBoolean; +import static org.elasticsearch.test.ESTestCase.randomFrom; +import static org.elasticsearch.test.ESTestCase.randomValueOtherThan; +import static org.elasticsearch.test.ESTestCase.randomValueOtherThanMany; + +public class BlobStoreCorruptionUtils { + private static final Logger logger = LogManager.getLogger(BlobStoreCorruptionUtils.class); + + public static Path corruptRandomFile(Path repositoryRootPath) throws IOException { + final var corruptedFileType = getRandomCorruptibleFileType(); + final var corruptedFile = getRandomFileToCorrupt(repositoryRootPath, corruptedFileType); + if (randomBoolean()) { + logger.info("--> deleting [{}]", corruptedFile); + Files.delete(corruptedFile); + } else { + corruptFileContents(corruptedFile); + } + return corruptedFile; + } + + public static void corruptFileContents(Path fileToCorrupt) throws IOException { + final var oldFileContents = Files.readAllBytes(fileToCorrupt); + logger.info("--> contents of [{}] before corruption: [{}]", fileToCorrupt, Base64.getEncoder().encodeToString(oldFileContents)); + final byte[] newFileContents = new byte[randomBoolean() ? oldFileContents.length : between(0, oldFileContents.length)]; + System.arraycopy(oldFileContents, 0, newFileContents, 0, newFileContents.length); + if (newFileContents.length == oldFileContents.length) { + final var corruptionPosition = between(0, newFileContents.length - 1); + newFileContents[corruptionPosition] = randomValueOtherThan(oldFileContents[corruptionPosition], ESTestCase::randomByte); + logger.info( + "--> updating byte at position [{}] from [{}] to [{}]", + corruptionPosition, + oldFileContents[corruptionPosition], + newFileContents[corruptionPosition] + ); + } else { + logger.info("--> truncating file from length [{}] to length [{}]", oldFileContents.length, newFileContents.length); + } + Files.write(fileToCorrupt, newFileContents); + logger.info("--> contents of [{}] after corruption: [{}]", fileToCorrupt, Base64.getEncoder().encodeToString(newFileContents)); + } + + public static RepositoryFileType getRandomCorruptibleFileType() { + return randomValueOtherThanMany( + // these blob types do not have reliable corruption detection, so we must skip them + t -> t == RepositoryFileType.ROOT_INDEX_N || t == RepositoryFileType.ROOT_INDEX_LATEST, + () -> randomFrom(RepositoryFileType.values()) + ); + } + + public static Path getRandomFileToCorrupt(Path repositoryRootPath, RepositoryFileType corruptedFileType) throws IOException { + final var corruptibleFiles = new ArrayList(); + Files.walkFileTree(repositoryRootPath, new SimpleFileVisitor<>() { + @Override + public FileVisitResult visitFile(Path filePath, BasicFileAttributes attrs) throws IOException { + if (ExtrasFS.isExtra(filePath.getFileName().toString()) == false + && RepositoryFileType.getRepositoryFileType(repositoryRootPath, filePath) == corruptedFileType) { + corruptibleFiles.add(filePath); + } + return 
super.visitFile(filePath, attrs); + } + }); + return randomFrom(corruptibleFiles); + } +} From 32374dbfe046cbf7283af6b02b333b45fe3dfc90 Mon Sep 17 00:00:00 2001 From: Ankita Kumar Date: Wed, 28 Aug 2024 13:05:58 -0400 Subject: [PATCH 010/144] Metrics for Reindexing (#111845) This PR adds metrics for the Reindexing plugin, to measure the end-to-end time taken by a reindex request, update-by-query request and delete-by-query request. --- .../index/reindex/ReindexPluginMetricsIT.java | 216 ++++++++++++++++++ .../reindex/DeleteByQueryMetrics.java | 33 +++ .../elasticsearch/reindex/ReindexMetrics.java | 32 +++ .../elasticsearch/reindex/ReindexPlugin.java | 8 +- .../org/elasticsearch/reindex/Reindexer.java | 16 +- .../reindex/TransportDeleteByQueryAction.java | 25 +- .../reindex/TransportReindexAction.java | 12 +- .../reindex/TransportUpdateByQueryAction.java | 25 +- .../reindex/UpdateByQueryMetrics.java | 33 +++ .../reindex/DeleteByQueryMetricsTests.java | 39 ++++ .../reindex/ReindexMetricsTests.java | 40 ++++ .../reindex/UpdateByQueryMetricsTests.java | 40 ++++ .../reindex/UpdateByQueryWithScriptTests.java | 1 + .../action/TransportEnrichReindexAction.java | 3 +- 14 files changed, 507 insertions(+), 16 deletions(-) create mode 100644 modules/reindex/src/internalClusterTest/java/org/elasticsearch/index/reindex/ReindexPluginMetricsIT.java create mode 100644 modules/reindex/src/main/java/org/elasticsearch/reindex/DeleteByQueryMetrics.java create mode 100644 modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexMetrics.java create mode 100644 modules/reindex/src/main/java/org/elasticsearch/reindex/UpdateByQueryMetrics.java create mode 100644 modules/reindex/src/test/java/org/elasticsearch/reindex/DeleteByQueryMetricsTests.java create mode 100644 modules/reindex/src/test/java/org/elasticsearch/reindex/ReindexMetricsTests.java create mode 100644 modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryMetricsTests.java diff --git a/modules/reindex/src/internalClusterTest/java/org/elasticsearch/index/reindex/ReindexPluginMetricsIT.java b/modules/reindex/src/internalClusterTest/java/org/elasticsearch/index/reindex/ReindexPluginMetricsIT.java new file mode 100644 index 0000000000000..e7d26b0808a48 --- /dev/null +++ b/modules/reindex/src/internalClusterTest/java/org/elasticsearch/index/reindex/ReindexPluginMetricsIT.java @@ -0,0 +1,216 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.index.reindex; + +import org.elasticsearch.index.query.QueryBuilders; +import org.elasticsearch.plugins.Plugin; +import org.elasticsearch.plugins.PluginsService; +import org.elasticsearch.reindex.BulkIndexByScrollResponseMatcher; +import org.elasticsearch.reindex.ReindexPlugin; +import org.elasticsearch.search.sort.SortOrder; +import org.elasticsearch.telemetry.Measurement; +import org.elasticsearch.telemetry.TestTelemetryPlugin; +import org.elasticsearch.test.ESIntegTestCase; + +import java.util.Arrays; +import java.util.Collection; +import java.util.List; + +import static org.elasticsearch.index.query.QueryBuilders.termQuery; +import static org.elasticsearch.reindex.DeleteByQueryMetrics.DELETE_BY_QUERY_TIME_HISTOGRAM; +import static org.elasticsearch.reindex.ReindexMetrics.REINDEX_TIME_HISTOGRAM; +import static org.elasticsearch.reindex.UpdateByQueryMetrics.UPDATE_BY_QUERY_TIME_HISTOGRAM; +import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertHitCount; +import static org.hamcrest.Matchers.equalTo; + +@ESIntegTestCase.ClusterScope(numDataNodes = 0, numClientNodes = 0, scope = ESIntegTestCase.Scope.TEST) +public class ReindexPluginMetricsIT extends ESIntegTestCase { + @Override + protected Collection> nodePlugins() { + return Arrays.asList(ReindexPlugin.class, TestTelemetryPlugin.class); + } + + protected ReindexRequestBuilder reindex() { + return new ReindexRequestBuilder(client()); + } + + protected UpdateByQueryRequestBuilder updateByQuery() { + return new UpdateByQueryRequestBuilder(client()); + } + + protected DeleteByQueryRequestBuilder deleteByQuery() { + return new DeleteByQueryRequestBuilder(client()); + } + + public static BulkIndexByScrollResponseMatcher matcher() { + return new BulkIndexByScrollResponseMatcher(); + } + + public void testReindexMetrics() throws Exception { + final String dataNodeName = internalCluster().startNode(); + + indexRandom( + true, + prepareIndex("source").setId("1").setSource("foo", "a"), + prepareIndex("source").setId("2").setSource("foo", "a"), + prepareIndex("source").setId("3").setSource("foo", "b"), + prepareIndex("source").setId("4").setSource("foo", "c") + ); + assertHitCount(prepareSearch("source").setSize(0), 4); + + final TestTelemetryPlugin testTelemetryPlugin = internalCluster().getInstance(PluginsService.class, dataNodeName) + .filterPlugins(TestTelemetryPlugin.class) + .findFirst() + .orElseThrow(); + + // Copy all the docs + reindex().source("source").destination("dest").get(); + // Use assertBusy to wait for all threads to complete so we get deterministic results + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(REINDEX_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(1)); + }); + + // Now none of them + createIndex("none"); + reindex().source("source").destination("none").filter(termQuery("foo", "no_match")).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(REINDEX_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(2)); + }); + + // Now half of them + reindex().source("source").destination("dest_half").filter(termQuery("foo", "a")).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(REINDEX_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(3)); + }); + + // Limit with maxDocs + 
reindex().source("source").destination("dest_size_one").maxDocs(1).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(REINDEX_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(4)); + }); + } + + public void testDeleteByQueryMetrics() throws Exception { + final String dataNodeName = internalCluster().startNode(); + + indexRandom( + true, + prepareIndex("test").setId("1").setSource("foo", "a"), + prepareIndex("test").setId("2").setSource("foo", "a"), + prepareIndex("test").setId("3").setSource("foo", "b"), + prepareIndex("test").setId("4").setSource("foo", "c"), + prepareIndex("test").setId("5").setSource("foo", "d"), + prepareIndex("test").setId("6").setSource("foo", "e"), + prepareIndex("test").setId("7").setSource("foo", "f") + ); + + assertHitCount(prepareSearch("test").setSize(0), 7); + + final TestTelemetryPlugin testTelemetryPlugin = internalCluster().getInstance(PluginsService.class, dataNodeName) + .filterPlugins(TestTelemetryPlugin.class) + .findFirst() + .orElseThrow(); + + // Deletes two docs that matches "foo:a" + deleteByQuery().source("test").filter(termQuery("foo", "a")).refresh(true).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(DELETE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(1)); + }); + + // Deletes the two first docs with limit by size + DeleteByQueryRequestBuilder request = deleteByQuery().source("test").filter(QueryBuilders.matchAllQuery()).size(2).refresh(true); + request.source().addSort("foo.keyword", SortOrder.ASC); + request.get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(DELETE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(2)); + }); + + // Deletes but match no docs + deleteByQuery().source("test").filter(termQuery("foo", "no_match")).refresh(true).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(DELETE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(3)); + }); + + // Deletes all remaining docs + deleteByQuery().source("test").filter(QueryBuilders.matchAllQuery()).refresh(true).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(DELETE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(4)); + }); + } + + public void testUpdateByQueryMetrics() throws Exception { + final String dataNodeName = internalCluster().startNode(); + + indexRandom( + true, + prepareIndex("test").setId("1").setSource("foo", "a"), + prepareIndex("test").setId("2").setSource("foo", "a"), + prepareIndex("test").setId("3").setSource("foo", "b"), + prepareIndex("test").setId("4").setSource("foo", "c") + ); + assertHitCount(prepareSearch("test").setSize(0), 4); + assertEquals(1, client().prepareGet("test", "1").get().getVersion()); + assertEquals(1, client().prepareGet("test", "4").get().getVersion()); + + final TestTelemetryPlugin testTelemetryPlugin = internalCluster().getInstance(PluginsService.class, dataNodeName) + .filterPlugins(TestTelemetryPlugin.class) + .findFirst() + .orElseThrow(); + + // Reindex all the docs + updateByQuery().source("test").refresh(true).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = 
testTelemetryPlugin.getLongHistogramMeasurement(UPDATE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(1)); + }); + + // Now none of them + updateByQuery().source("test").filter(termQuery("foo", "no_match")).refresh(true).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(UPDATE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(2)); + }); + + // Now half of them + updateByQuery().source("test").filter(termQuery("foo", "a")).refresh(true).get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(UPDATE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(3)); + }); + + // Limit with size + UpdateByQueryRequestBuilder request = updateByQuery().source("test").size(3).refresh(true); + request.source().addSort("foo.keyword", SortOrder.ASC); + request.get(); + assertBusy(() -> { + testTelemetryPlugin.collect(); + List measurements = testTelemetryPlugin.getLongHistogramMeasurement(UPDATE_BY_QUERY_TIME_HISTOGRAM); + assertThat(measurements.size(), equalTo(4)); + }); + } +} diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/DeleteByQueryMetrics.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/DeleteByQueryMetrics.java new file mode 100644 index 0000000000000..2cedf0d5f5823 --- /dev/null +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/DeleteByQueryMetrics.java @@ -0,0 +1,33 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.reindex; + +import org.elasticsearch.telemetry.metric.LongHistogram; +import org.elasticsearch.telemetry.metric.MeterRegistry; + +public class DeleteByQueryMetrics { + public static final String DELETE_BY_QUERY_TIME_HISTOGRAM = "es.delete_by_query.duration.histogram"; + + private final LongHistogram deleteByQueryTimeSecsHistogram; + + public DeleteByQueryMetrics(MeterRegistry meterRegistry) { + this( + meterRegistry.registerLongHistogram(DELETE_BY_QUERY_TIME_HISTOGRAM, "Time taken to execute Delete by Query request", "seconds") + ); + } + + private DeleteByQueryMetrics(LongHistogram deleteByQueryTimeSecsHistogram) { + this.deleteByQueryTimeSecsHistogram = deleteByQueryTimeSecsHistogram; + } + + public long recordTookTime(long tookTime) { + deleteByQueryTimeSecsHistogram.record(tookTime); + return tookTime; + } +} diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexMetrics.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexMetrics.java new file mode 100644 index 0000000000000..3025357aa6538 --- /dev/null +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexMetrics.java @@ -0,0 +1,32 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + + package org.elasticsearch.reindex; + + import org.elasticsearch.telemetry.metric.LongHistogram; + import org.elasticsearch.telemetry.metric.MeterRegistry; + + public class ReindexMetrics { + + public static final String REINDEX_TIME_HISTOGRAM = "es.reindex.duration.histogram"; + + private final LongHistogram reindexTimeSecsHistogram; + + public ReindexMetrics(MeterRegistry meterRegistry) { + this(meterRegistry.registerLongHistogram(REINDEX_TIME_HISTOGRAM, "Time to reindex by search", "seconds")); + } + + private ReindexMetrics(LongHistogram reindexTimeSecsHistogram) { + this.reindexTimeSecsHistogram = reindexTimeSecsHistogram; + } + + public long recordTookTime(long tookTime) { + reindexTimeSecsHistogram.record(tookTime); + return tookTime; + } +} diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexPlugin.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexPlugin.java index 1a40f77250e5f..3169d4c4ee1fb 100644 --- a/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexPlugin.java +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/ReindexPlugin.java @@ -34,7 +34,6 @@ import java.util.ArrayList; import java.util.Arrays; import java.util.Collection; -import java.util.Collections; import java.util.List; import java.util.function.Predicate; import java.util.function.Supplier; @@ -85,8 +84,11 @@ public List getRestHandlers( @Override public Collection createComponents(PluginServices services) { - return Collections.singletonList( - new ReindexSslConfig(services.environment().settings(), services.environment(), services.resourceWatcherService()) + return List.of( + new ReindexSslConfig(services.environment().settings(), services.environment(), services.resourceWatcherService()), + new ReindexMetrics(services.telemetryProvider().getMeterRegistry()), + new UpdateByQueryMetrics(services.telemetryProvider().getMeterRegistry()), + new DeleteByQueryMetrics(services.telemetryProvider().getMeterRegistry()) ); } diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/Reindexer.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/Reindexer.java index dbe1968bb076a..cb393a42f52a1 100644 --- a/modules/reindex/src/main/java/org/elasticsearch/reindex/Reindexer.java +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/Reindexer.java @@ -37,6 +37,7 @@ import org.elasticsearch.common.lucene.uid.Versions; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.xcontent.XContentHelper; +import org.elasticsearch.core.Nullable; import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.IndexSettings; import org.elasticsearch.index.VersionType; @@ -65,6 +66,7 @@ import java.util.ArrayList; import java.util.List; import java.util.Map; +import java.util.concurrent.TimeUnit; import java.util.concurrent.atomic.AtomicInteger; import java.util.function.BiFunction; import java.util.function.LongSupplier; @@ -82,19 +84,22 @@ public class Reindexer { private final ThreadPool threadPool; private final ScriptService scriptService; private final ReindexSslConfig reindexSslConfig; + private final ReindexMetrics reindexMetrics; Reindexer( ClusterService clusterService, Client client, ThreadPool threadPool, ScriptService scriptService, - ReindexSslConfig reindexSslConfig + ReindexSslConfig reindexSslConfig, + @Nullable ReindexMetrics reindexMetrics ) { this.clusterService = clusterService; this.client = client; this.threadPool = threadPool; this.scriptService = scriptService;
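+        // reindexMetrics may be null: callers outside the reindex plugin (such as the enrich
+        // module's TransportEnrichReindexAction and some unit tests later in this patch) pass
+        // null, which is why every recording site below guards with a null check.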
this.reindexSslConfig = reindexSslConfig; + this.reindexMetrics = reindexMetrics; } public void initTask(BulkByScrollTask task, ReindexRequest request, ActionListener listener) { @@ -102,6 +107,8 @@ public void initTask(BulkByScrollTask task, ReindexRequest request, ActionListen } public void execute(BulkByScrollTask task, ReindexRequest request, Client bulkClient, ActionListener listener) { + long startTime = System.nanoTime(); + BulkByScrollParallelizationHelper.executeSlicedAction( task, request, @@ -122,7 +129,12 @@ public void execute(BulkByScrollTask task, ReindexRequest request, Client bulkCl clusterService.state(), reindexSslConfig, request, - listener + ActionListener.runAfter(listener, () -> { + long elapsedTime = TimeUnit.NANOSECONDS.toSeconds(System.nanoTime() - startTime); + if (reindexMetrics != null) { + reindexMetrics.recordTookTime(elapsedTime); + } + }) ); searchAction.start(); } diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportDeleteByQueryAction.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportDeleteByQueryAction.java index 755587feb47d3..53381c33d7f78 100644 --- a/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportDeleteByQueryAction.java +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportDeleteByQueryAction.java @@ -15,6 +15,7 @@ import org.elasticsearch.client.internal.ParentTaskAssigningClient; import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.util.concurrent.EsExecutors; +import org.elasticsearch.core.Nullable; import org.elasticsearch.index.reindex.BulkByScrollResponse; import org.elasticsearch.index.reindex.BulkByScrollTask; import org.elasticsearch.index.reindex.DeleteByQueryAction; @@ -25,12 +26,15 @@ import org.elasticsearch.threadpool.ThreadPool; import org.elasticsearch.transport.TransportService; +import java.util.concurrent.TimeUnit; + public class TransportDeleteByQueryAction extends HandledTransportAction { private final ThreadPool threadPool; private final Client client; private final ScriptService scriptService; private final ClusterService clusterService; + private final DeleteByQueryMetrics deleteByQueryMetrics; @Inject public TransportDeleteByQueryAction( @@ -39,18 +43,21 @@ public TransportDeleteByQueryAction( Client client, TransportService transportService, ScriptService scriptService, - ClusterService clusterService + ClusterService clusterService, + @Nullable DeleteByQueryMetrics deleteByQueryMetrics ) { super(DeleteByQueryAction.NAME, transportService, actionFilters, DeleteByQueryRequest::new, EsExecutors.DIRECT_EXECUTOR_SERVICE); this.threadPool = threadPool; this.client = client; this.scriptService = scriptService; this.clusterService = clusterService; + this.deleteByQueryMetrics = deleteByQueryMetrics; } @Override public void doExecute(Task task, DeleteByQueryRequest request, ActionListener listener) { BulkByScrollTask bulkByScrollTask = (BulkByScrollTask) task; + long startTime = System.nanoTime(); BulkByScrollParallelizationHelper.startSlicedAction( request, bulkByScrollTask, @@ -64,8 +71,20 @@ public void doExecute(Task task, DeleteByQueryRequest request, ActionListener { + long elapsedTime = TimeUnit.NANOSECONDS.toSeconds(System.nanoTime() - startTime); + if (deleteByQueryMetrics != null) { + deleteByQueryMetrics.recordTookTime(elapsedTime); + } + }) + ).start(); } ); } diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportReindexAction.java 
b/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportReindexAction.java index a86af2ca2b83e..821a137ac7566 100644 --- a/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportReindexAction.java +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportReindexAction.java @@ -19,6 +19,7 @@ import org.elasticsearch.common.settings.Setting.Property; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.concurrent.EsExecutors; +import org.elasticsearch.core.Nullable; import org.elasticsearch.index.reindex.BulkByScrollResponse; import org.elasticsearch.index.reindex.BulkByScrollTask; import org.elasticsearch.index.reindex.ReindexAction; @@ -53,7 +54,8 @@ public TransportReindexAction( AutoCreateIndex autoCreateIndex, Client client, TransportService transportService, - ReindexSslConfig sslConfig + ReindexSslConfig sslConfig, + @Nullable ReindexMetrics reindexMetrics ) { this( ReindexAction.NAME, @@ -66,7 +68,8 @@ public TransportReindexAction( autoCreateIndex, client, transportService, - sslConfig + sslConfig, + reindexMetrics ); } @@ -81,12 +84,13 @@ protected TransportReindexAction( AutoCreateIndex autoCreateIndex, Client client, TransportService transportService, - ReindexSslConfig sslConfig + ReindexSslConfig sslConfig, + @Nullable ReindexMetrics reindexMetrics ) { super(name, transportService, actionFilters, ReindexRequest::new, EsExecutors.DIRECT_EXECUTOR_SERVICE); this.client = client; this.reindexValidator = new ReindexValidator(settings, clusterService, indexNameExpressionResolver, autoCreateIndex); - this.reindexer = new Reindexer(clusterService, client, threadPool, scriptService, sslConfig); + this.reindexer = new Reindexer(clusterService, client, threadPool, scriptService, sslConfig, reindexMetrics); } @Override diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportUpdateByQueryAction.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportUpdateByQueryAction.java index fc0bfa3c8a214..997d4d32fe042 100644 --- a/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportUpdateByQueryAction.java +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/TransportUpdateByQueryAction.java @@ -18,6 +18,7 @@ import org.elasticsearch.cluster.ClusterState; import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.util.concurrent.EsExecutors; +import org.elasticsearch.core.Nullable; import org.elasticsearch.index.reindex.BulkByScrollResponse; import org.elasticsearch.index.reindex.BulkByScrollTask; import org.elasticsearch.index.reindex.ScrollableHitSource; @@ -35,6 +36,7 @@ import org.elasticsearch.transport.TransportService; import java.util.Map; +import java.util.concurrent.TimeUnit; import java.util.function.BiFunction; import java.util.function.LongSupplier; @@ -44,6 +46,7 @@ public class TransportUpdateByQueryAction extends HandledTransportAction listener) { BulkByScrollTask bulkByScrollTask = (BulkByScrollTask) task; + long startTime = System.nanoTime(); BulkByScrollParallelizationHelper.startSlicedAction( request, bulkByScrollTask, @@ -78,8 +84,21 @@ protected void doExecute(Task task, UpdateByQueryRequest request, ActionListener clusterService.localNode(), bulkByScrollTask ); - new AsyncIndexBySearchAction(bulkByScrollTask, logger, assigningClient, threadPool, scriptService, request, state, listener) - .start(); + new AsyncIndexBySearchAction( + bulkByScrollTask, + logger, + assigningClient, + threadPool, + scriptService, + request, + 
state, + ActionListener.runAfter(listener, () -> { + long elapsedTime = TimeUnit.NANOSECONDS.toSeconds(System.nanoTime() - startTime); + if (updateByQueryMetrics != null) { + updateByQueryMetrics.recordTookTime(elapsedTime); + } + }) + ).start(); } ); } diff --git a/modules/reindex/src/main/java/org/elasticsearch/reindex/UpdateByQueryMetrics.java b/modules/reindex/src/main/java/org/elasticsearch/reindex/UpdateByQueryMetrics.java new file mode 100644 index 0000000000000..6ca52769a1ba9 --- /dev/null +++ b/modules/reindex/src/main/java/org/elasticsearch/reindex/UpdateByQueryMetrics.java @@ -0,0 +1,33 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.reindex; + +import org.elasticsearch.telemetry.metric.LongHistogram; +import org.elasticsearch.telemetry.metric.MeterRegistry; + +public class UpdateByQueryMetrics { + public static final String UPDATE_BY_QUERY_TIME_HISTOGRAM = "es.update_by_query.duration.histogram"; + + private final LongHistogram updateByQueryTimeSecsHistogram; + + public UpdateByQueryMetrics(MeterRegistry meterRegistry) { + this( + meterRegistry.registerLongHistogram(UPDATE_BY_QUERY_TIME_HISTOGRAM, "Time taken to execute Update by Query request", "seconds") + ); + } + + private UpdateByQueryMetrics(LongHistogram updateByQueryTimeSecsHistogram) { + this.updateByQueryTimeSecsHistogram = updateByQueryTimeSecsHistogram; + } + + public long recordTookTime(long tookTime) { + updateByQueryTimeSecsHistogram.record(tookTime); + return tookTime; + } +} diff --git a/modules/reindex/src/test/java/org/elasticsearch/reindex/DeleteByQueryMetricsTests.java b/modules/reindex/src/test/java/org/elasticsearch/reindex/DeleteByQueryMetricsTests.java new file mode 100644 index 0000000000000..58adc6aebaa9b --- /dev/null +++ b/modules/reindex/src/test/java/org/elasticsearch/reindex/DeleteByQueryMetricsTests.java @@ -0,0 +1,39 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.reindex; + +import org.elasticsearch.telemetry.InstrumentType; +import org.elasticsearch.telemetry.Measurement; +import org.elasticsearch.telemetry.RecordingMeterRegistry; +import org.elasticsearch.test.ESTestCase; +import org.junit.Before; + +import java.util.List; + +import static org.elasticsearch.reindex.DeleteByQueryMetrics.DELETE_BY_QUERY_TIME_HISTOGRAM; + +public class DeleteByQueryMetricsTests extends ESTestCase { + private RecordingMeterRegistry recordingMeterRegistry; + private DeleteByQueryMetrics metrics; + + @Before + public void createMetrics() { + recordingMeterRegistry = new RecordingMeterRegistry(); + metrics = new DeleteByQueryMetrics(recordingMeterRegistry); + } + + public void testRecordTookTime() { + int secondsTaken = randomIntBetween(1, 50); + metrics.recordTookTime(secondsTaken); + List measurements = recordingMeterRegistry.getRecorder() + .getMeasurements(InstrumentType.LONG_HISTOGRAM, DELETE_BY_QUERY_TIME_HISTOGRAM); + assertEquals(measurements.size(), 1); + assertEquals(measurements.get(0).getLong(), secondsTaken); + } +} diff --git a/modules/reindex/src/test/java/org/elasticsearch/reindex/ReindexMetricsTests.java b/modules/reindex/src/test/java/org/elasticsearch/reindex/ReindexMetricsTests.java new file mode 100644 index 0000000000000..4711530585817 --- /dev/null +++ b/modules/reindex/src/test/java/org/elasticsearch/reindex/ReindexMetricsTests.java @@ -0,0 +1,40 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.reindex; + +import org.elasticsearch.telemetry.InstrumentType; +import org.elasticsearch.telemetry.Measurement; +import org.elasticsearch.telemetry.RecordingMeterRegistry; +import org.elasticsearch.test.ESTestCase; +import org.junit.Before; + +import java.util.List; + +import static org.elasticsearch.reindex.ReindexMetrics.REINDEX_TIME_HISTOGRAM; + +public class ReindexMetricsTests extends ESTestCase { + + private RecordingMeterRegistry recordingMeterRegistry; + private ReindexMetrics metrics; + + @Before + public void createMetrics() { + recordingMeterRegistry = new RecordingMeterRegistry(); + metrics = new ReindexMetrics(recordingMeterRegistry); + } + + public void testRecordTookTime() { + int secondsTaken = randomIntBetween(1, 50); + metrics.recordTookTime(secondsTaken); + List measurements = recordingMeterRegistry.getRecorder() + .getMeasurements(InstrumentType.LONG_HISTOGRAM, REINDEX_TIME_HISTOGRAM); + assertEquals(measurements.size(), 1); + assertEquals(measurements.get(0).getLong(), secondsTaken); + } +} diff --git a/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryMetricsTests.java b/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryMetricsTests.java new file mode 100644 index 0000000000000..548d18d202984 --- /dev/null +++ b/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryMetricsTests.java @@ -0,0 +1,40 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. 
Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.reindex; + +import org.elasticsearch.telemetry.InstrumentType; +import org.elasticsearch.telemetry.Measurement; +import org.elasticsearch.telemetry.RecordingMeterRegistry; +import org.elasticsearch.test.ESTestCase; +import org.junit.Before; + +import java.util.List; + +import static org.elasticsearch.reindex.UpdateByQueryMetrics.UPDATE_BY_QUERY_TIME_HISTOGRAM; + +public class UpdateByQueryMetricsTests extends ESTestCase { + + private RecordingMeterRegistry recordingMeterRegistry; + private UpdateByQueryMetrics metrics; + + @Before + public void createMetrics() { + recordingMeterRegistry = new RecordingMeterRegistry(); + metrics = new UpdateByQueryMetrics(recordingMeterRegistry); + } + + public void testRecordTookTime() { + int secondsTaken = randomIntBetween(1, 50); + metrics.recordTookTime(secondsTaken); + List measurements = recordingMeterRegistry.getRecorder() + .getMeasurements(InstrumentType.LONG_HISTOGRAM, UPDATE_BY_QUERY_TIME_HISTOGRAM); + assertEquals(measurements.size(), 1); + assertEquals(measurements.get(0).getLong(), secondsTaken); + } +} diff --git a/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryWithScriptTests.java b/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryWithScriptTests.java index 876ddefda161b..c4d591f804750 100644 --- a/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryWithScriptTests.java +++ b/modules/reindex/src/test/java/org/elasticsearch/reindex/UpdateByQueryWithScriptTests.java @@ -60,6 +60,7 @@ protected TransportUpdateByQueryAction.AsyncIndexBySearchAction action(ScriptSer null, transportService, scriptService, + null, null ); return new TransportUpdateByQueryAction.AsyncIndexBySearchAction( diff --git a/x-pack/plugin/enrich/src/main/java/org/elasticsearch/xpack/enrich/action/TransportEnrichReindexAction.java b/x-pack/plugin/enrich/src/main/java/org/elasticsearch/xpack/enrich/action/TransportEnrichReindexAction.java index 0eeb85f4574f7..cc42199ab1019 100644 --- a/x-pack/plugin/enrich/src/main/java/org/elasticsearch/xpack/enrich/action/TransportEnrichReindexAction.java +++ b/x-pack/plugin/enrich/src/main/java/org/elasticsearch/xpack/enrich/action/TransportEnrichReindexAction.java @@ -61,7 +61,8 @@ public TransportEnrichReindexAction( autoCreateIndex, client, transportService, - new ReindexSslConfig(settings, environment, watcherService) + new ReindexSslConfig(settings, environment, watcherService), + null ); this.bulkClient = new OriginSettingClient(client, ENRICH_ORIGIN); } From e7c0ba953a2f03ecdea9e848478356054689c137 Mon Sep 17 00:00:00 2001 From: Victor Martinez Date: Wed, 28 Aug 2024 19:18:58 +0200 Subject: [PATCH 011/144] Update IronBank docker image base to ubi:9.4 (#111743) --- distribution/docker/src/docker/Dockerfile | 2 +- .../docker/src/docker/iron_bank/hardening_manifest.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/distribution/docker/src/docker/Dockerfile b/distribution/docker/src/docker/Dockerfile index 32f35b05015b9..2a2a77a6df820 100644 --- a/distribution/docker/src/docker/Dockerfile +++ b/distribution/docker/src/docker/Dockerfile @@ -22,7 +22,7 @@ <% if (docker_base == 'iron_bank') { %> ARG BASE_REGISTRY=registry1.dso.mil ARG BASE_IMAGE=ironbank/redhat/ubi/ubi9 -ARG BASE_TAG=9.3 +ARG 
BASE_TAG=9.4 <% } %> ################################################################################ diff --git a/distribution/docker/src/docker/iron_bank/hardening_manifest.yaml b/distribution/docker/src/docker/iron_bank/hardening_manifest.yaml index 38ce16a413af2..f4364c5008c09 100644 --- a/distribution/docker/src/docker/iron_bank/hardening_manifest.yaml +++ b/distribution/docker/src/docker/iron_bank/hardening_manifest.yaml @@ -14,7 +14,7 @@ tags: # Build args passed to Dockerfile ARGs args: BASE_IMAGE: "redhat/ubi/ubi9" - BASE_TAG: "9.3" + BASE_TAG: "9.4" # Docker image labels labels: From 68b7b7f7fb520056ec9fcbbe5b6b66bce51027d2 Mon Sep 17 00:00:00 2001 From: Nik Everett Date: Wed, 28 Aug 2024 13:42:31 -0400 Subject: [PATCH 012/144] ESQL: Migrate more physical plan writeable (#112248) Migrates a few more of our physical plan nodes to `NamedWriteable`. --- .../xpack/esql/io/stream/PlanNamedTypes.java | 76 +-------------- .../xpack/esql/plan/logical/EsRelation.java | 21 ++++- .../xpack/esql/plan/physical/EsQueryExec.java | 60 +++++++++++- .../esql/plan/physical/EsSourceExec.java | 5 +- .../xpack/esql/plan/physical/EvalExec.java | 28 ++++++ .../esql/plan/physical/PhysicalPlan.java | 2 +- .../esql/io/stream/PlanNamedTypesTests.java | 68 -------------- ...bstractPhysicalPlanSerializationTests.java | 4 +- .../EsQueryExecSerializationTests.java | 94 +++++++++++++++++++ .../physical/EvalExecSerializationTests.java | 61 ++++++++++++ 10 files changed, 268 insertions(+), 151 deletions(-) create mode 100644 x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExecSerializationTests.java create mode 100644 x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EvalExecSerializationTests.java diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java index 77d982453203c..af82ceb4bf809 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java @@ -12,16 +12,13 @@ import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.util.iterable.Iterables; -import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.query.QueryBuilder; import org.elasticsearch.transport.RemoteClusterAware; import org.elasticsearch.xpack.esql.core.expression.Alias; import org.elasticsearch.xpack.esql.core.expression.Attribute; import org.elasticsearch.xpack.esql.core.expression.Expression; -import org.elasticsearch.xpack.esql.core.expression.FieldAttribute; import org.elasticsearch.xpack.esql.core.expression.NamedExpression; import org.elasticsearch.xpack.esql.core.tree.Source; -import org.elasticsearch.xpack.esql.expression.Order; import org.elasticsearch.xpack.esql.index.EsIndex; import org.elasticsearch.xpack.esql.plan.logical.Enrich; import org.elasticsearch.xpack.esql.plan.logical.Grok; @@ -56,8 +53,6 @@ import java.util.Set; import static org.elasticsearch.xpack.esql.io.stream.PlanNameRegistry.Entry.of; -import static org.elasticsearch.xpack.esql.io.stream.PlanNameRegistry.PlanReader.readerFromPlanReader; -import static org.elasticsearch.xpack.esql.io.stream.PlanNameRegistry.PlanWriter.writerFromPlanWriter; /** * A utility class that consists solely of static methods that describe how to serialize 
and @@ -93,9 +88,9 @@ public static List namedTypeEntries() { // Physical Plan Nodes of(PhysicalPlan.class, AggregateExec.ENTRY), of(PhysicalPlan.class, DissectExec.ENTRY), - of(PhysicalPlan.class, EsQueryExec.class, PlanNamedTypes::writeEsQueryExec, PlanNamedTypes::readEsQueryExec), + of(PhysicalPlan.class, EsQueryExec.ENTRY), of(PhysicalPlan.class, EsSourceExec.ENTRY), - of(PhysicalPlan.class, EvalExec.class, PlanNamedTypes::writeEvalExec, PlanNamedTypes::readEvalExec), + of(PhysicalPlan.class, EvalExec.ENTRY), of(PhysicalPlan.class, EnrichExec.class, PlanNamedTypes::writeEnrichExec, PlanNamedTypes::readEnrichExec), of(PhysicalPlan.class, ExchangeExec.class, PlanNamedTypes::writeExchangeExec, PlanNamedTypes::readExchangeExec), of(PhysicalPlan.class, ExchangeSinkExec.class, PlanNamedTypes::writeExchangeSinkExec, PlanNamedTypes::readExchangeSinkExec), @@ -123,57 +118,6 @@ public static List namedTypeEntries() { } // -- physical plan nodes - static EsQueryExec readEsQueryExec(PlanStreamInput in) throws IOException { - return new EsQueryExec( - Source.readFrom(in), - new EsIndex(in), - readIndexMode(in), - in.readNamedWriteableCollectionAsList(Attribute.class), - in.readOptionalNamedWriteable(QueryBuilder.class), - in.readOptionalNamed(Expression.class), - in.readOptionalCollectionAsList(readerFromPlanReader(PlanNamedTypes::readFieldSort)), - in.readOptionalVInt() - ); - } - - static void writeEsQueryExec(PlanStreamOutput out, EsQueryExec esQueryExec) throws IOException { - assert esQueryExec.children().size() == 0; - Source.EMPTY.writeTo(out); - esQueryExec.index().writeTo(out); - writeIndexMode(out, esQueryExec.indexMode()); - out.writeNamedWriteableCollection(esQueryExec.output()); - out.writeOptionalNamedWriteable(esQueryExec.query()); - out.writeOptionalNamedWriteable(esQueryExec.limit()); - out.writeOptionalCollection(esQueryExec.sorts(), writerFromPlanWriter(PlanNamedTypes::writeFieldSort)); - out.writeOptionalInt(esQueryExec.estimatedRowSize()); - } - - public static IndexMode readIndexMode(StreamInput in) throws IOException { - if (in.getTransportVersion().onOrAfter(TransportVersions.ESQL_ADD_INDEX_MODE_TO_SOURCE)) { - return IndexMode.fromString(in.readString()); - } else { - return IndexMode.STANDARD; - } - } - - public static void writeIndexMode(StreamOutput out, IndexMode indexMode) throws IOException { - if (out.getTransportVersion().onOrAfter(TransportVersions.ESQL_ADD_INDEX_MODE_TO_SOURCE)) { - out.writeString(indexMode.getName()); - } else if (indexMode != IndexMode.STANDARD) { - throw new IllegalStateException("not ready to support index mode [" + indexMode + "]"); - } - } - - static EvalExec readEvalExec(PlanStreamInput in) throws IOException { - return new EvalExec(Source.readFrom(in), in.readPhysicalPlanNode(), in.readCollectionAsList(Alias::new)); - } - - static void writeEvalExec(PlanStreamOutput out, EvalExec evalExec) throws IOException { - Source.EMPTY.writeTo(out); - out.writePhysicalPlanNode(evalExec.child()); - out.writeCollection(evalExec.fields()); - } - static EnrichExec readEnrichExec(PlanStreamInput in) throws IOException { final Source source = Source.readFrom(in); final PhysicalPlan child = in.readPhysicalPlanNode(); @@ -426,20 +370,4 @@ static void writeTopNExec(PlanStreamOutput out, TopNExec topNExec) throws IOExce out.writeNamedWriteable(topNExec.limit()); out.writeOptionalVInt(topNExec.estimatedRowSize()); } - - // -- ancillary supporting classes of plan nodes, etc - - static EsQueryExec.FieldSort readFieldSort(PlanStreamInput in) throws IOException { 
- return new EsQueryExec.FieldSort( - FieldAttribute.readFrom(in), - in.readEnum(Order.OrderDirection.class), - in.readEnum(Order.NullsPosition.class) - ); - } - - static void writeFieldSort(PlanStreamOutput out, EsQueryExec.FieldSort fieldSort) throws IOException { - fieldSort.field().writeTo(out); - out.writeEnum(fieldSort.direction()); - out.writeEnum(fieldSort.nulls()); - } } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/logical/EsRelation.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/logical/EsRelation.java index 56c253f166762..b080c425d2312 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/logical/EsRelation.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/logical/EsRelation.java @@ -19,7 +19,6 @@ import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.EsField; import org.elasticsearch.xpack.esql.index.EsIndex; -import org.elasticsearch.xpack.esql.io.stream.PlanNamedTypes; import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; import java.io.IOException; @@ -67,7 +66,7 @@ private static EsRelation readFrom(StreamInput in) throws IOException { in.readOptionalString(); in.readOptionalString(); } - IndexMode indexMode = PlanNamedTypes.readIndexMode(in); + IndexMode indexMode = readIndexMode(in); boolean frozen = in.readBoolean(); return new EsRelation(source, esIndex, attributes, indexMode, frozen); } @@ -83,7 +82,7 @@ public void writeTo(StreamOutput out) throws IOException { out.writeOptionalString(null); out.writeOptionalString(null); } - PlanNamedTypes.writeIndexMode(out, indexMode()); + writeIndexMode(out, indexMode()); out.writeBoolean(frozen()); } @@ -174,4 +173,20 @@ public boolean equals(Object obj) { public String nodeString() { return nodeName() + "[" + index + "]" + NodeUtils.limitedToString(attrs); } + + public static IndexMode readIndexMode(StreamInput in) throws IOException { + if (in.getTransportVersion().onOrAfter(TransportVersions.ESQL_ADD_INDEX_MODE_TO_SOURCE)) { + return IndexMode.fromString(in.readString()); + } else { + return IndexMode.STANDARD; + } + } + + public static void writeIndexMode(StreamOutput out, IndexMode indexMode) throws IOException { + if (out.getTransportVersion().onOrAfter(TransportVersions.ESQL_ADD_INDEX_MODE_TO_SOURCE)) { + out.writeString(indexMode.getName()); + } else if (indexMode != IndexMode.STANDARD) { + throw new IllegalStateException("not ready to support index mode [" + indexMode + "]"); + } + } } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExec.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExec.java index 5901d42abbc82..21aa2cb7d1860 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExec.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExec.java @@ -8,6 +8,10 @@ package org.elasticsearch.xpack.esql.plan.physical; import org.elasticsearch.common.Strings; +import org.elasticsearch.common.io.stream.NamedWriteableRegistry; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; +import org.elasticsearch.common.io.stream.Writeable; import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.query.QueryBuilder; import org.elasticsearch.search.sort.FieldSortBuilder; @@ -22,12 +26,21 @@ import 
org.elasticsearch.xpack.esql.core.type.EsField; import org.elasticsearch.xpack.esql.expression.Order; import org.elasticsearch.xpack.esql.index.EsIndex; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; +import org.elasticsearch.xpack.esql.plan.logical.EsRelation; +import java.io.IOException; import java.util.List; import java.util.Map; import java.util.Objects; public class EsQueryExec extends LeafExec implements EstimatesRowSize { + public static final NamedWriteableRegistry.Entry ENTRY = new NamedWriteableRegistry.Entry( + PhysicalPlan.class, + "EsQueryExec", + EsQueryExec::new + ); + public static final EsField DOC_ID_FIELD = new EsField("_doc", DataType.DOC_DATA_TYPE, Map.of(), false); private final EsIndex index; @@ -43,7 +56,7 @@ public class EsQueryExec extends LeafExec implements EstimatesRowSize { */ private final Integer estimatedRowSize; - public record FieldSort(FieldAttribute field, Order.OrderDirection direction, Order.NullsPosition nulls) { + public record FieldSort(FieldAttribute field, Order.OrderDirection direction, Order.NullsPosition nulls) implements Writeable { public FieldSortBuilder fieldSortBuilder() { FieldSortBuilder builder = new FieldSortBuilder(field.name()); builder.order(Direction.from(direction).asOrder()); @@ -51,6 +64,21 @@ public FieldSortBuilder fieldSortBuilder() { builder.unmappedType(field.dataType().esType()); return builder; } + + private static FieldSort readFrom(StreamInput in) throws IOException { + return new EsQueryExec.FieldSort( + FieldAttribute.readFrom(in), + in.readEnum(Order.OrderDirection.class), + in.readEnum(Order.NullsPosition.class) + ); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + field().writeTo(out); + out.writeEnum(direction()); + out.writeEnum(nulls()); + } } public EsQueryExec(Source source, EsIndex index, IndexMode indexMode, List attributes, QueryBuilder query) { @@ -77,6 +105,36 @@ public EsQueryExec( this.estimatedRowSize = estimatedRowSize; } + private EsQueryExec(StreamInput in) throws IOException { + this( + Source.readFrom((PlanStreamInput) in), + new EsIndex(in), + EsRelation.readIndexMode(in), + in.readNamedWriteableCollectionAsList(Attribute.class), + in.readOptionalNamedWriteable(QueryBuilder.class), + in.readOptionalNamedWriteable(Expression.class), + in.readOptionalCollectionAsList(FieldSort::readFrom), + in.readOptionalVInt() + ); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + Source.EMPTY.writeTo(out); + index().writeTo(out); + EsRelation.writeIndexMode(out, indexMode()); + out.writeNamedWriteableCollection(output()); + out.writeOptionalNamedWriteable(query()); + out.writeOptionalNamedWriteable(limit()); + out.writeOptionalCollection(sorts()); + out.writeOptionalVInt(estimatedRowSize()); + } + + @Override + public String getWriteableName() { + return ENTRY.name; + } + public static boolean isSourceAttribute(Attribute attr) { return DOC_ID_FIELD.getName().equals(attr.name()); } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsSourceExec.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsSourceExec.java index 275f1182ff97c..cd167b4683493 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsSourceExec.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EsSourceExec.java @@ -17,7 +17,6 @@ import org.elasticsearch.xpack.esql.core.tree.NodeUtils; import 
org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.index.EsIndex; -import org.elasticsearch.xpack.esql.io.stream.PlanNamedTypes; import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; import org.elasticsearch.xpack.esql.plan.logical.EsRelation; @@ -55,7 +54,7 @@ private EsSourceExec(StreamInput in) throws IOException { new EsIndex(in), in.readNamedWriteableCollectionAsList(Attribute.class), in.readOptionalNamedWriteable(QueryBuilder.class), - PlanNamedTypes.readIndexMode(in) + EsRelation.readIndexMode(in) ); } @@ -65,7 +64,7 @@ public void writeTo(StreamOutput out) throws IOException { index().writeTo(out); out.writeNamedWriteableCollection(output()); out.writeOptionalNamedWriteable(query()); - PlanNamedTypes.writeIndexMode(out, indexMode()); + EsRelation.writeIndexMode(out, indexMode()); } @Override diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EvalExec.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EvalExec.java index 3876891b27752..97b81914f8889 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EvalExec.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/EvalExec.java @@ -7,17 +7,29 @@ package org.elasticsearch.xpack.esql.plan.physical; +import org.elasticsearch.common.io.stream.NamedWriteableRegistry; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.xpack.esql.core.expression.Alias; import org.elasticsearch.xpack.esql.core.expression.Attribute; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamOutput; +import java.io.IOException; import java.util.List; import java.util.Objects; import static org.elasticsearch.xpack.esql.expression.NamedExpressions.mergeOutputAttributes; public class EvalExec extends UnaryExec implements EstimatesRowSize { + public static final NamedWriteableRegistry.Entry ENTRY = new NamedWriteableRegistry.Entry( + PhysicalPlan.class, + "EvalExec", + EvalExec::new + ); + private final List fields; public EvalExec(Source source, PhysicalPlan child, List fields) { @@ -25,6 +37,22 @@ public EvalExec(Source source, PhysicalPlan child, List fields) { this.fields = fields; } + private EvalExec(StreamInput in) throws IOException { + this(Source.readFrom((PlanStreamInput) in), ((PlanStreamInput) in).readPhysicalPlanNode(), in.readCollectionAsList(Alias::new)); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + Source.EMPTY.writeTo(out); + ((PlanStreamOutput) out).writePhysicalPlanNode(child()); + out.writeCollection(fields()); + } + + @Override + public String getWriteableName() { + return ENTRY.name; + } + public List fields() { return fields; } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java index 42a97802038a2..60e44a5140dfa 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java @@ -23,7 +23,7 @@ */ public abstract class PhysicalPlan extends QueryPlan { public static List 
getNamedWriteables() { - return List.of(AggregateExec.ENTRY, DissectExec.ENTRY, EsSourceExec.ENTRY); + return List.of(AggregateExec.ENTRY, DissectExec.ENTRY, EsQueryExec.ENTRY, EsSourceExec.ENTRY, EvalExec.ENTRY); } public PhysicalPlan(Source source, List children) { diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypesTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypesTests.java index 56ab1bd41693e..a3d1e70e558d6 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypesTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypesTests.java @@ -20,24 +20,9 @@ import org.elasticsearch.xpack.esql.core.expression.FieldAttribute; import org.elasticsearch.xpack.esql.core.expression.NameId; import org.elasticsearch.xpack.esql.core.expression.Nullability; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.ArithmeticOperation; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.DataType; import org.elasticsearch.xpack.esql.core.type.EsField; -import org.elasticsearch.xpack.esql.core.type.KeywordEsField; -import org.elasticsearch.xpack.esql.expression.Order; -import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Add; -import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Div; -import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Mod; -import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Mul; -import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Sub; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.Equals; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.EsqlBinaryComparison; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.GreaterThan; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.GreaterThanOrEqual; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.LessThan; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.LessThanOrEqual; -import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.NotEquals; import org.elasticsearch.xpack.esql.plan.physical.AggregateExec; import org.elasticsearch.xpack.esql.plan.physical.DissectExec; import org.elasticsearch.xpack.esql.plan.physical.EnrichExec; @@ -137,15 +122,6 @@ public void testWrappedStreamSimple() throws IOException { assertThat(in.readVInt(), equalTo(11_345)); } - public void testFieldSortSimple() throws IOException { - var orig = new EsQueryExec.FieldSort(field("val", DataType.LONG), Order.OrderDirection.ASC, Order.NullsPosition.FIRST); - BytesStreamOutput bso = new BytesStreamOutput(); - PlanStreamOutput out = new PlanStreamOutput(bso, planNameRegistry, null); - PlanNamedTypes.writeFieldSort(out, orig); - var deser = PlanNamedTypes.readFieldSort(planStreamInput(bso)); - EqualsHashCodeTestUtils.checkEqualsAndHashCode(orig, unused -> deser); - } - static FieldAttribute randomFieldAttributeOrNull() { return randomBoolean() ? 
randomFieldAttribute() : null; } @@ -163,46 +139,6 @@ static FieldAttribute randomFieldAttribute() { ); } - static KeywordEsField randomKeywordEsField() { - return new KeywordEsField( - randomAlphaOfLength(randomIntBetween(1, 25)), // name - randomProperties(), - randomBoolean(), // hasDocValues - randomIntBetween(1, 12), // precision - randomBoolean(), // normalized - randomBoolean() // alias - ); - } - - static EsqlBinaryComparison randomBinaryComparison() { - int v = randomIntBetween(0, 5); - var left = field(randomName(), randomDataType()); - var right = field(randomName(), randomDataType()); - return switch (v) { - case 0 -> new Equals(Source.EMPTY, left, right); - case 1 -> new NotEquals(Source.EMPTY, left, right); - case 2 -> new GreaterThan(Source.EMPTY, left, right); - case 3 -> new GreaterThanOrEqual(Source.EMPTY, left, right); - case 4 -> new LessThan(Source.EMPTY, left, right); - case 5 -> new LessThanOrEqual(Source.EMPTY, left, right); - default -> throw new AssertionError(v); - }; - } - - static ArithmeticOperation randomArithmeticOperation() { - int v = randomIntBetween(0, 4); - var left = field(randomName(), randomDataType()); - var right = field(randomName(), randomDataType()); - return switch (v) { - case 0 -> new Add(Source.EMPTY, left, right); - case 1 -> new Sub(Source.EMPTY, left, right); - case 2 -> new Mul(Source.EMPTY, left, right); - case 3 -> new Div(Source.EMPTY, left, right); - case 4 -> new Mod(Source.EMPTY, left, right); - default -> throw new AssertionError(v); - }; - } - static NameId nameIdOrNull() { return randomBoolean() ? new NameId() : null; } @@ -231,10 +167,6 @@ static EsField randomEsField(int depth) { ); } - static Map randomProperties() { - return randomProperties(0); - } - static Map randomProperties(int depth) { if (depth > 2) { return Map.of(); // prevent infinite recursion (between EsField and properties) diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java index 7a0d125ad85ba..2a05c472328e5 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java @@ -16,6 +16,7 @@ import org.elasticsearch.xpack.esql.core.expression.NamedExpression; import org.elasticsearch.xpack.esql.core.tree.Node; import org.elasticsearch.xpack.esql.expression.function.aggregate.AggregateFunction; +import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Add; import org.elasticsearch.xpack.esql.plan.AbstractNodeSerializationTests; import java.util.ArrayList; @@ -47,7 +48,8 @@ protected final NamedWriteableRegistry getNamedWriteableRegistry() { entries.addAll(Attribute.getNamedWriteables()); entries.addAll(Block.getNamedWriteables()); entries.addAll(NamedExpression.getNamedWriteables()); - entries.addAll(new SearchModule(Settings.EMPTY, List.of()).getNamedWriteables()); + entries.addAll(new SearchModule(Settings.EMPTY, List.of()).getNamedWriteables()); // Query builders + entries.add(Add.ENTRY); // Used by the eval tests return new NamedWriteableRegistry(entries); } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExecSerializationTests.java 
b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExecSerializationTests.java new file mode 100644 index 0000000000000..6bb5111b154e6 --- /dev/null +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EsQueryExecSerializationTests.java @@ -0,0 +1,94 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.xpack.esql.plan.physical; + +import org.elasticsearch.index.IndexMode; +import org.elasticsearch.index.query.MatchAllQueryBuilder; +import org.elasticsearch.index.query.QueryBuilder; +import org.elasticsearch.index.query.TermQueryBuilder; +import org.elasticsearch.xpack.esql.core.expression.Attribute; +import org.elasticsearch.xpack.esql.core.expression.Expression; +import org.elasticsearch.xpack.esql.core.expression.FieldAttribute; +import org.elasticsearch.xpack.esql.core.expression.Literal; +import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.core.type.DataType; +import org.elasticsearch.xpack.esql.expression.Order; +import org.elasticsearch.xpack.esql.expression.function.FieldAttributeTests; +import org.elasticsearch.xpack.esql.index.EsIndex; +import org.elasticsearch.xpack.esql.index.EsIndexSerializationTests; + +import java.io.IOException; +import java.util.List; + +import static org.elasticsearch.xpack.esql.plan.logical.AbstractLogicalPlanSerializationTests.randomFieldAttributes; + +public class EsQueryExecSerializationTests extends AbstractPhysicalPlanSerializationTests { + public static EsQueryExec randomEsQueryExec() { + Source source = randomSource(); + EsIndex index = EsIndexSerializationTests.randomEsIndex(); + IndexMode indexMode = randomFrom(IndexMode.values()); + List attrs = randomFieldAttributes(1, 10, false); + QueryBuilder query = randomQuery(); + Expression limit = new Literal(randomSource(), between(0, Integer.MAX_VALUE), DataType.INTEGER); + List sorts = randomFieldSorts(); + Integer estimatedRowSize = randomEstimatedRowSize(); + return new EsQueryExec(source, index, indexMode, attrs, query, limit, sorts, estimatedRowSize); + } + + public static QueryBuilder randomQuery() { + return randomBoolean() ? 
new MatchAllQueryBuilder() : new TermQueryBuilder(randomAlphaOfLength(4), randomAlphaOfLength(4)); + } + + public static List randomFieldSorts() { + return randomList(0, 4, EsQueryExecSerializationTests::randomFieldSort); + } + + public static EsQueryExec.FieldSort randomFieldSort() { + FieldAttribute field = FieldAttributeTests.createFieldAttribute(0, false); + Order.OrderDirection direction = randomFrom(Order.OrderDirection.values()); + Order.NullsPosition nulls = randomFrom(Order.NullsPosition.values()); + return new EsQueryExec.FieldSort(field, direction, nulls); + } + + @Override + protected EsQueryExec createTestInstance() { + return randomEsQueryExec(); + } + + @Override + protected EsQueryExec mutateInstance(EsQueryExec instance) throws IOException { + EsIndex index = instance.index(); + IndexMode indexMode = instance.indexMode(); + List attrs = instance.attrs(); + QueryBuilder query = instance.query(); + Expression limit = instance.limit(); + List sorts = instance.sorts(); + Integer estimatedRowSize = instance.estimatedRowSize(); + switch (between(0, 6)) { + case 0 -> index = randomValueOtherThan(index, EsIndexSerializationTests::randomEsIndex); + case 1 -> indexMode = randomValueOtherThan(indexMode, () -> randomFrom(IndexMode.values())); + case 2 -> attrs = randomValueOtherThan(attrs, () -> randomFieldAttributes(1, 10, false)); + case 3 -> query = randomValueOtherThan(query, EsQueryExecSerializationTests::randomQuery); + case 4 -> limit = randomValueOtherThan( + limit, + () -> new Literal(randomSource(), between(0, Integer.MAX_VALUE), DataType.INTEGER) + ); + case 5 -> sorts = randomValueOtherThan(sorts, EsQueryExecSerializationTests::randomFieldSorts); + case 6 -> estimatedRowSize = randomValueOtherThan( + estimatedRowSize, + AbstractPhysicalPlanSerializationTests::randomEstimatedRowSize + ); + } + return new EsQueryExec(instance.source(), index, indexMode, attrs, query, limit, sorts, estimatedRowSize); + } + + @Override + protected boolean alwaysEmptySource() { + return true; + } +} diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EvalExecSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EvalExecSerializationTests.java new file mode 100644 index 0000000000000..45baf4822b1d2 --- /dev/null +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/EvalExecSerializationTests.java @@ -0,0 +1,61 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.xpack.esql.plan.physical; + +import org.elasticsearch.xpack.esql.core.expression.Alias; +import org.elasticsearch.xpack.esql.core.expression.Expression; +import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.expression.function.FieldAttributeTests; +import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Add; + +import java.io.IOException; +import java.util.List; + +public class EvalExecSerializationTests extends AbstractPhysicalPlanSerializationTests { + public static EvalExec randomEvalExec(int depth) { + Source source = randomSource(); + PhysicalPlan child = randomChild(depth); + List fields = randomFields(); + return new EvalExec(source, child, fields); + } + + public static List randomFields() { + return randomList(1, 10, EvalExecSerializationTests::randomField); + } + + public static Alias randomField() { + Expression child = new Add( + randomSource(), + FieldAttributeTests.createFieldAttribute(0, true), + FieldAttributeTests.createFieldAttribute(0, true) + ); + return new Alias(randomSource(), randomAlphaOfLength(5), child); + } + + @Override + protected EvalExec createTestInstance() { + return randomEvalExec(0); + } + + @Override + protected EvalExec mutateInstance(EvalExec instance) throws IOException { + PhysicalPlan child = instance.child(); + List fields = instance.fields(); + if (randomBoolean()) { + child = randomValueOtherThan(child, () -> randomChild(0)); + } else { + fields = randomValueOtherThan(fields, EvalExecSerializationTests::randomFields); + } + return new EvalExec(instance.source(), child, fields); + } + + @Override + protected boolean alwaysEmptySource() { + return true; + } +} From 3cbb5264f5e7a2cc5d85b27b1ec72834ef85bcfc Mon Sep 17 00:00:00 2001 From: Costin Leau Date: Wed, 28 Aug 2024 10:46:36 -0700 Subject: [PATCH 013/144] ESQL: use this. prefix in grammar semantic predicate (#112291) Fix #112285 --- .../esql/src/main/antlr/EsqlBaseLexer.g4 | 14 ++++++------- .../esql/src/main/antlr/EsqlBaseParser.g4 | 10 +++++----- .../xpack/esql/parser/EsqlBaseLexer.java | 10 +++++----- .../xpack/esql/parser/EsqlBaseParser.java | 20 +++++++++---------- 4 files changed, 27 insertions(+), 27 deletions(-) diff --git a/x-pack/plugin/esql/src/main/antlr/EsqlBaseLexer.g4 b/x-pack/plugin/esql/src/main/antlr/EsqlBaseLexer.g4 index 897bfa5e1ce15..6570a25469971 100644 --- a/x-pack/plugin/esql/src/main/antlr/EsqlBaseLexer.g4 +++ b/x-pack/plugin/esql/src/main/antlr/EsqlBaseLexer.g4 @@ -29,7 +29,7 @@ options { * * Since the tokens/modes are in development, simply define them under the * "// in development section" and follow the section comments in that section. - * That is use the DEV_ prefix and use the {isDevVersion()}? conditional. + * That is use the DEV_ prefix and use the {this.isDevVersion()}? conditional. * They are defined at the end of the file, to minimize the impact on the existing * token types. * @@ -80,15 +80,15 @@ WHERE : 'where' -> pushMode(EXPRESSION_MODE); // Before adding a new in-development command, to sandbox the behavior when running in production environments // // For example: to add myCommand use the following declaration: -// DEV_MYCOMMAND : {isDevVersion()}? 'mycommand' -> ... +// DEV_MYCOMMAND : {this.isDevVersion()}? 'mycommand' -> ... // // Once the command has been stabilized, remove the DEV_ prefix and the {}? conditional and move the command to the // main section while preserving alphabetical order: // MYCOMMAND : 'mycommand' -> ... 
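// Note: the Java expression inside a {...}? semantic predicate is emitted verbatim into the
// generated sempred methods of EsqlBaseLexer.java/EsqlBaseParser.java (updated further below
// in this patch), so it must read as valid Java in that generated context — hence the
// explicit this. prefix on isDevVersion().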
-DEV_INLINESTATS : {isDevVersion()}? 'inlinestats' -> pushMode(EXPRESSION_MODE); -DEV_LOOKUP : {isDevVersion()}? 'lookup' -> pushMode(LOOKUP_MODE); -DEV_MATCH : {isDevVersion()}? 'match' -> pushMode(EXPRESSION_MODE); -DEV_METRICS : {isDevVersion()}? 'metrics' -> pushMode(METRICS_MODE); +DEV_INLINESTATS : {this.isDevVersion()}? 'inlinestats' -> pushMode(EXPRESSION_MODE); +DEV_LOOKUP : {this.isDevVersion()}? 'lookup' -> pushMode(LOOKUP_MODE); +DEV_MATCH : {this.isDevVersion()}? 'match' -> pushMode(EXPRESSION_MODE); +DEV_METRICS : {this.isDevVersion()}? 'metrics' -> pushMode(METRICS_MODE); // // Catch-all for unrecognized commands - don't define any beyond this line @@ -211,7 +211,7 @@ SLASH : '/'; PERCENT : '%'; // move it in the main section if the feature gets promoted -DEV_MATCH_OP : {isDevVersion()}? DEV_MATCH -> type(DEV_MATCH); +DEV_MATCH_OP : {this.isDevVersion()}? DEV_MATCH -> type(DEV_MATCH); NAMED_OR_POSITIONAL_PARAM : PARAM (LETTER | UNDERSCORE) UNQUOTED_ID_BODY* diff --git a/x-pack/plugin/esql/src/main/antlr/EsqlBaseParser.g4 b/x-pack/plugin/esql/src/main/antlr/EsqlBaseParser.g4 index ce748b3af03d1..a3ef2471d4e56 100644 --- a/x-pack/plugin/esql/src/main/antlr/EsqlBaseParser.g4 +++ b/x-pack/plugin/esql/src/main/antlr/EsqlBaseParser.g4 @@ -36,7 +36,7 @@ sourceCommand | rowCommand | showCommand // in development - | {isDevVersion()}? metricsCommand + | {this.isDevVersion()}? metricsCommand ; processingCommand @@ -53,9 +53,9 @@ processingCommand | enrichCommand | mvExpandCommand // in development - | {isDevVersion()}? inlinestatsCommand - | {isDevVersion()}? lookupCommand - | {isDevVersion()}? matchCommand + | {this.isDevVersion()}? inlinestatsCommand + | {this.isDevVersion()}? lookupCommand + | {this.isDevVersion()}? matchCommand ; whereCommand @@ -70,7 +70,7 @@ booleanExpression | left=booleanExpression operator=OR right=booleanExpression #logicalBinary | valueExpression (NOT)? IN LP valueExpression (COMMA valueExpression)* RP #logicalIn | valueExpression IS NOT? NULL #isNull - | {isDevVersion()}? matchBooleanExpression #matchExpression + | {this.isDevVersion()}? 
matchBooleanExpression #matchExpression ; regexBooleanExpression diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseLexer.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseLexer.java index 5fc5ab20810a6..a746a0d49004f 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseLexer.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseLexer.java @@ -238,35 +238,35 @@ public boolean sempred(RuleContext _localctx, int ruleIndex, int predIndex) { private boolean DEV_INLINESTATS_sempred(RuleContext _localctx, int predIndex) { switch (predIndex) { case 0: - return isDevVersion(); + return this.isDevVersion(); } return true; } private boolean DEV_LOOKUP_sempred(RuleContext _localctx, int predIndex) { switch (predIndex) { case 1: - return isDevVersion(); + return this.isDevVersion(); } return true; } private boolean DEV_MATCH_sempred(RuleContext _localctx, int predIndex) { switch (predIndex) { case 2: - return isDevVersion(); + return this.isDevVersion(); } return true; } private boolean DEV_METRICS_sempred(RuleContext _localctx, int predIndex) { switch (predIndex) { case 3: - return isDevVersion(); + return this.isDevVersion(); } return true; } private boolean DEV_MATCH_OP_sempred(RuleContext _localctx, int predIndex) { switch (predIndex) { case 4: - return isDevVersion(); + return this.isDevVersion(); } return true; } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseParser.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseParser.java index 359abbc701dd3..fb63e31a37c90 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseParser.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/parser/EsqlBaseParser.java @@ -447,7 +447,7 @@ public final SourceCommandContext sourceCommand() throws RecognitionException { enterOuterAlt(_localctx, 6); { setState(141); - if (!(isDevVersion())) throw new FailedPredicateException(this, "isDevVersion()"); + if (!(this.isDevVersion())) throw new FailedPredicateException(this, "this.isDevVersion()"); setState(142); metricsCommand(); } @@ -627,7 +627,7 @@ public final ProcessingCommandContext processingCommand() throws RecognitionExce enterOuterAlt(_localctx, 13); { setState(157); - if (!(isDevVersion())) throw new FailedPredicateException(this, "isDevVersion()"); + if (!(this.isDevVersion())) throw new FailedPredicateException(this, "this.isDevVersion()"); setState(158); inlinestatsCommand(); } @@ -636,7 +636,7 @@ public final ProcessingCommandContext processingCommand() throws RecognitionExce enterOuterAlt(_localctx, 14); { setState(159); - if (!(isDevVersion())) throw new FailedPredicateException(this, "isDevVersion()"); + if (!(this.isDevVersion())) throw new FailedPredicateException(this, "this.isDevVersion()"); setState(160); lookupCommand(); } @@ -645,7 +645,7 @@ public final ProcessingCommandContext processingCommand() throws RecognitionExce enterOuterAlt(_localctx, 15); { setState(161); - if (!(isDevVersion())) throw new FailedPredicateException(this, "isDevVersion()"); + if (!(this.isDevVersion())) throw new FailedPredicateException(this, "this.isDevVersion()"); setState(162); matchCommand(); } @@ -1018,7 +1018,7 @@ private BooleanExpressionContext booleanExpression(int _p) throws RecognitionExc _ctx = _localctx; _prevctx = _localctx; setState(196); - if (!(isDevVersion())) throw new 
FailedPredicateException(this, "isDevVersion()"); + if (!(this.isDevVersion())) throw new FailedPredicateException(this, "this.isDevVersion()"); setState(197); matchBooleanExpression(); } @@ -5339,25 +5339,25 @@ private boolean query_sempred(QueryContext _localctx, int predIndex) { private boolean sourceCommand_sempred(SourceCommandContext _localctx, int predIndex) { switch (predIndex) { case 1: - return isDevVersion(); + return this.isDevVersion(); } return true; } private boolean processingCommand_sempred(ProcessingCommandContext _localctx, int predIndex) { switch (predIndex) { case 2: - return isDevVersion(); + return this.isDevVersion(); case 3: - return isDevVersion(); + return this.isDevVersion(); case 4: - return isDevVersion(); + return this.isDevVersion(); } return true; } private boolean booleanExpression_sempred(BooleanExpressionContext _localctx, int predIndex) { switch (predIndex) { case 5: - return isDevVersion(); + return this.isDevVersion(); case 6: return precpred(_ctx, 5); case 7: From 7b4443016fbd15b431a6382200c0043d57e682cc Mon Sep 17 00:00:00 2001 From: Ryan Ernst Date: Wed, 28 Aug 2024 12:10:24 -0700 Subject: [PATCH 014/144] Use test util for finding platform dir (#112286) The native platform dir can be found using a TestUtil method, but benchmarks was trying to construct it on its own. This commit switches to using the util method. --- benchmarks/build.gradle | 16 +++++----------- 1 file changed, 5 insertions(+), 11 deletions(-) diff --git a/benchmarks/build.gradle b/benchmarks/build.gradle index e2511438e7f95..b16621aaaa471 100644 --- a/benchmarks/build.gradle +++ b/benchmarks/build.gradle @@ -1,4 +1,5 @@ import org.elasticsearch.gradle.internal.info.BuildParams +import org.elasticsearch.gradle.internal.test.TestUtil /* * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one @@ -29,6 +30,7 @@ tasks.named("javadoc").configure { enabled = false } configurations { expression painless + nativeLib } dependencies { @@ -45,6 +47,7 @@ dependencies { implementation project(path: ':libs:elasticsearch-simdvec') expression(project(path: ':modules:lang-expression', configuration: 'zip')) painless(project(path: ':modules:lang-painless', configuration: 'zip')) + nativeLib(project(':libs:elasticsearch-native')) api "org.openjdk.jmh:jmh-core:$versions.jmh" annotationProcessor "org.openjdk.jmh:jmh-generator-annprocess:$versions.jmh" // Dependencies of JMH @@ -76,17 +79,8 @@ tasks.register("copyPainless", Copy) { tasks.named("run").configure { executable = "${BuildParams.runtimeJavaHome}/bin/java" args << "-Dplugins.dir=${buildDir}/plugins" << "-Dtests.index=${buildDir}/index" - dependsOn "copyExpression", "copyPainless" - systemProperty 'es.nativelibs.path', file("../libs/native/libraries/build/platform/${platformName()}-${os.arch}") -} - -String platformName() { - String name = System.getProperty("os.name"); - if (name.startsWith("Mac")) { - return "darwin"; - } else { - return name.toLowerCase(Locale.ROOT); - } + dependsOn "copyExpression", "copyPainless", configurations.nativeLib + systemProperty 'es.nativelibs.path', TestUtil.getTestLibraryPath(file("../libs/native/libraries/build/platform/").toString()) } spotless { From b776cf6460c136fd1ae67810c042dfde6a675c52 Mon Sep 17 00:00:00 2001 From: Parker Timmins Date: Wed, 28 Aug 2024 14:18:50 -0500 Subject: [PATCH 015/144] Do not treat replica as unassigned if new and below time threshold. (#112066) Changes the way we calculate if all replicas are unassigned when primary is recently created. 
This change will only be used in serverless, not in stateful. When a primary is new, if the primary is active, but the replica is unassigned for less than a buffer time period, do not treat it as unassigned. Control the time period through the health.shards_availability.replica_unassigned_buffer_time setting. --- docs/changelog/112066.yaml | 6 + ...rdsAvailabilityHealthIndicatorService.java | 69 ++++- .../common/settings/ClusterSettings.java | 4 +- .../ShardsAvailabilityActionGuideTests.java | 14 +- ...ailabilityHealthIndicatorServiceTests.java | 258 +++++++++++++----- 5 files changed, 271 insertions(+), 80 deletions(-) create mode 100644 docs/changelog/112066.yaml diff --git a/docs/changelog/112066.yaml b/docs/changelog/112066.yaml new file mode 100644 index 0000000000000..5dd846766bc8e --- /dev/null +++ b/docs/changelog/112066.yaml @@ -0,0 +1,6 @@ +pr: 112066 +summary: Do not treat replica as unassigned if primary recently created and unassigned + time is below a threshold +area: Health +type: enhancement +issues: [] diff --git a/server/src/main/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorService.java b/server/src/main/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorService.java index 8fb91d89417e0..b6c19f331c712 100644 --- a/server/src/main/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorService.java +++ b/server/src/main/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorService.java @@ -40,9 +40,11 @@ import org.elasticsearch.cluster.routing.allocation.decider.ShardsLimitAllocationDecider; import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.settings.ClusterSettings; +import org.elasticsearch.common.settings.Setting; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.set.Sets; import org.elasticsearch.core.Nullable; +import org.elasticsearch.core.TimeValue; import org.elasticsearch.health.Diagnosis; import org.elasticsearch.health.HealthIndicatorDetails; import org.elasticsearch.health.HealthIndicatorImpact; @@ -56,6 +58,7 @@ import org.elasticsearch.snapshots.SearchableSnapshotsSettings; import org.elasticsearch.snapshots.SnapshotShardSizeInfo; +import java.time.Instant; import java.util.ArrayList; import java.util.HashMap; import java.util.HashSet; @@ -108,11 +111,29 @@ public class ShardsAvailabilityHealthIndicatorService implements HealthIndicator private static final String DATA_TIER_ALLOCATION_DECIDER_NAME = "data_tier"; + /** + * Changes the behavior of isNewlyCreatedAndInitializingReplica so that the + * shard_availability health indicator returns YELLOW if a primary + * is STARTED, but a replica is still INITIALIZING and the replica has been + * unassigned for less than the value of this setting. This function is + * only used in serverless, so this setting has no effect in stateful.
+ */ + public static final Setting REPLICA_UNASSIGNED_BUFFER_TIME = Setting.timeSetting( + "health.shards_availability.replica_unassigned_buffer_time", + TimeValue.timeValueSeconds(3), + TimeValue.timeValueSeconds(0), + TimeValue.timeValueSeconds(20), + Setting.Property.NodeScope, + Setting.Property.Dynamic + ); + private final ClusterService clusterService; private final AllocationService allocationService; private final SystemIndices systemIndices; + private volatile TimeValue replicaUnassignedBufferTime = TimeValue.timeValueSeconds(0); + public ShardsAvailabilityHealthIndicatorService( ClusterService clusterService, AllocationService allocationService, @@ -121,6 +142,11 @@ public ShardsAvailabilityHealthIndicatorService( this.clusterService = clusterService; this.allocationService = allocationService; this.systemIndices = systemIndices; + clusterService.getClusterSettings().addSettingsUpdateConsumer(REPLICA_UNASSIGNED_BUFFER_TIME, this::setReplicaUnassignedBufferTime); + } + + private void setReplicaUnassignedBufferTime(TimeValue replicaUnassignedBufferTime) { + this.replicaUnassignedBufferTime = replicaUnassignedBufferTime; } @Override @@ -144,7 +170,7 @@ public HealthIndicatorResult calculate(boolean verbose, int maxAffectedResources var state = clusterService.state(); var shutdown = state.getMetadata().custom(NodesShutdownMetadata.TYPE, NodesShutdownMetadata.EMPTY); var status = createNewStatus(state.getMetadata()); - updateShardAllocationStatus(status, state, shutdown, verbose); + updateShardAllocationStatus(status, state, shutdown, verbose, replicaUnassignedBufferTime); return createIndicator( status.getStatus(), status.getSymptom(), @@ -158,14 +184,15 @@ static void updateShardAllocationStatus( ShardAllocationStatus status, ClusterState state, NodesShutdownMetadata shutdown, - boolean verbose + boolean verbose, + TimeValue replicaUnassignedBufferTime ) { for (IndexRoutingTable indexShardRouting : state.routingTable()) { for (int i = 0; i < indexShardRouting.size(); i++) { IndexShardRoutingTable shardRouting = indexShardRouting.shard(i); status.addPrimary(shardRouting.primaryShard(), state, shutdown, verbose); for (ShardRouting replicaShard : shardRouting.replicaShards()) { - status.addReplica(replicaShard, state, shutdown, verbose); + status.addReplica(replicaShard, state, shutdown, verbose, replicaUnassignedBufferTime); } } } @@ -438,11 +465,18 @@ public class ShardAllocationCounts { public SearchableSnapshotsState searchableSnapshotsState = new SearchableSnapshotsState(); final Map> diagnosisDefinitions = new HashMap<>(); - public void increment(ShardRouting routing, ClusterState state, NodesShutdownMetadata shutdowns, boolean verbose) { + public void increment( + ShardRouting routing, + ClusterState state, + NodesShutdownMetadata shutdowns, + boolean verbose, + TimeValue replicaUnassignedBufferTime + ) { boolean isNew = isUnassignedDueToNewInitialization(routing, state); boolean isRestarting = isUnassignedDueToTimelyRestart(routing, shutdowns); + long replicaUnassignedCutoffTime = Instant.now().toEpochMilli() - replicaUnassignedBufferTime.millis(); boolean allUnavailable = areAllShardsOfThisTypeUnavailable(routing, state) - && isNewlyCreatedAndInitializingReplica(routing, state) == false; + && isNewlyCreatedAndInitializingReplica(routing, state, replicaUnassignedCutoffTime) == false; if (allUnavailable) { indicesWithAllShardsUnavailable.add(routing.getIndexName()); } @@ -520,7 +554,7 @@ boolean areAllShardsOfThisTypeUnavailable(ShardRouting routing, ClusterState sta * (a newly 
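// A quick illustration (not part of this patch) of how the setting declared
// above behaves: Setting.timeSetting falls back to the 3s default when unset,
// and rejects values outside the declared 0s..20s bounds. Standalone sketch:
import org.elasticsearch.cluster.routing.allocation.shards.ShardsAvailabilityHealthIndicatorService;
import org.elasticsearch.common.settings.Settings;
import org.elasticsearch.core.TimeValue;

class ReplicaUnassignedBufferTimeSketch {
    static void demo() {
        var setting = ShardsAvailabilityHealthIndicatorService.REPLICA_UNASSIGNED_BUFFER_TIME;
        // Unset: the 3s default declared above applies.
        TimeValue byDefault = setting.get(Settings.EMPTY);
        assert byDefault.equals(TimeValue.timeValueSeconds(3));
        // Explicit value; the setting is declared Dynamic, so it can also be
        // changed at runtime through the cluster settings API.
        Settings configured = Settings.builder()
            .put("health.shards_availability.replica_unassigned_buffer_time", "5s")
            .build();
        assert setting.get(configured).equals(TimeValue.timeValueSeconds(5));
        // A value above the 20s maximum (or below 0s) is rejected by the
        // setting's validator with an IllegalArgumentException.
    }
}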
created index having unassigned replicas for example), we don't want the cluster * to turn "unhealthy" for the tiny amount of time before the shards are allocated. */ - static boolean isNewlyCreatedAndInitializingReplica(ShardRouting routing, ClusterState state) { + static boolean isNewlyCreatedAndInitializingReplica(ShardRouting routing, ClusterState state, long replicaUnassignedCutoffTime) { if (routing.active()) { return false; } @@ -528,10 +562,15 @@ static boolean isNewlyCreatedAndInitializingReplica(ShardRouting routing, Cluste return false; } ShardRouting primary = state.routingTable().shardRoutingTable(routing.shardId()).primaryShard(); - if (primary.active()) { - return false; + if (primary.active() == false) { + return ClusterShardHealth.getInactivePrimaryHealth(primary) == ClusterHealthStatus.YELLOW; } - return ClusterShardHealth.getInactivePrimaryHealth(primary) == ClusterHealthStatus.YELLOW; + + Optional ui = Optional.ofNullable(routing.unassignedInfo()); + return ui.filter(info -> info.failedAllocations() == 0) + .filter(info -> info.lastAllocationStatus() != UnassignedInfo.AllocationStatus.DECIDERS_NO) + .filter(info -> info.unassignedTimeMillis() > replicaUnassignedCutoffTime) + .isPresent(); } private static boolean isUnassignedDueToTimelyRestart(ShardRouting routing, NodesShutdownMetadata shutdowns) { @@ -910,11 +949,17 @@ public ShardAllocationStatus(Metadata clusterMetadata) { } void addPrimary(ShardRouting routing, ClusterState state, NodesShutdownMetadata shutdowns, boolean verbose) { - primaries.increment(routing, state, shutdowns, verbose); + primaries.increment(routing, state, shutdowns, verbose, TimeValue.MINUS_ONE); } - void addReplica(ShardRouting routing, ClusterState state, NodesShutdownMetadata shutdowns, boolean verbose) { - replicas.increment(routing, state, shutdowns, verbose); + void addReplica( + ShardRouting routing, + ClusterState state, + NodesShutdownMetadata shutdowns, + boolean verbose, + TimeValue replicaUnassignedBufferTime + ) { + replicas.increment(routing, state, shutdowns, verbose, replicaUnassignedBufferTime); } void updateSearchableSnapshotsOfAvailableIndices() { diff --git a/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java b/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java index 8d9d8452b12bb..3c60d63f78991 100644 --- a/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java +++ b/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java @@ -55,6 +55,7 @@ import org.elasticsearch.cluster.routing.allocation.decider.SameShardAllocationDecider; import org.elasticsearch.cluster.routing.allocation.decider.ShardsLimitAllocationDecider; import org.elasticsearch.cluster.routing.allocation.decider.ThrottlingAllocationDecider; +import org.elasticsearch.cluster.routing.allocation.shards.ShardsAvailabilityHealthIndicatorService; import org.elasticsearch.cluster.service.ClusterApplierService; import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.cluster.service.MasterService; @@ -598,6 +599,7 @@ public void apply(Settings value, Settings current, Settings previous) { MergePolicyConfig.DEFAULT_MAX_TIME_BASED_MERGED_SEGMENT_SETTING, TransportService.ENABLE_STACK_OVERFLOW_AVOIDANCE, DataStreamGlobalRetentionSettings.DATA_STREAMS_DEFAULT_RETENTION_SETTING, - DataStreamGlobalRetentionSettings.DATA_STREAMS_MAX_RETENTION_SETTING + DataStreamGlobalRetentionSettings.DATA_STREAMS_MAX_RETENTION_SETTING, + 
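// To make the cutoff arithmetic above concrete, here is a condensed,
// self-contained rendering of the replica-buffer check (simplified types;
// the real predicate additionally consults the primary's health and the
// replica's allocation status, as shown in the diff). Illustration only:
import java.time.Instant;

class ReplicaBufferWindowSketch {
    // Mirrors: replicaUnassignedCutoffTime = now - replicaUnassignedBufferTime
    static boolean withinBufferWindow(long unassignedTimeMillis, long bufferMillis) {
        long cutoff = Instant.now().toEpochMilli() - bufferMillis;
        // A replica that became unassigned *after* the cutoff is still "new"
        // and is not yet reported as unavailable.
        return unassignedTimeMillis > cutoff;
    }

    static void demo() {
        long now = Instant.now().toEpochMilli();
        assert withinBufferWindow(now - 1_000, 3_000);           // 1s ago, 3s buffer: ignored
        assert withinBufferWindow(now - 10_000, 3_000) == false; // 10s ago, 3s buffer: counted
    }
}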
ShardsAvailabilityHealthIndicatorService.REPLICA_UNASSIGNED_BUFFER_TIME ); } diff --git a/server/src/test/java/org/elasticsearch/cluster/routing/allocation/ShardsAvailabilityActionGuideTests.java b/server/src/test/java/org/elasticsearch/cluster/routing/allocation/ShardsAvailabilityActionGuideTests.java index b731fd79c82fe..994e892e3ac3c 100644 --- a/server/src/test/java/org/elasticsearch/cluster/routing/allocation/ShardsAvailabilityActionGuideTests.java +++ b/server/src/test/java/org/elasticsearch/cluster/routing/allocation/ShardsAvailabilityActionGuideTests.java @@ -10,6 +10,7 @@ import org.elasticsearch.cluster.routing.allocation.shards.ShardsAvailabilityHealthIndicatorService; import org.elasticsearch.cluster.service.ClusterService; +import org.elasticsearch.common.settings.ClusterSettings; import org.elasticsearch.indices.SystemIndices; import org.elasticsearch.test.ESTestCase; @@ -33,14 +34,17 @@ import static org.elasticsearch.cluster.routing.allocation.shards.ShardsAvailabilityHealthIndicatorService.TIER_CAPACITY_ACTION_GUIDE; import static org.hamcrest.Matchers.is; import static org.mockito.Mockito.mock; +import static org.mockito.Mockito.when; public class ShardsAvailabilityActionGuideTests extends ESTestCase { - private final ShardsAvailabilityHealthIndicatorService service = new ShardsAvailabilityHealthIndicatorService( - mock(ClusterService.class), - mock(AllocationService.class), - mock(SystemIndices.class) - ); + private final ShardsAvailabilityHealthIndicatorService service; + + public ShardsAvailabilityActionGuideTests() { + ClusterService clusterService = mock(ClusterService.class); + when(clusterService.getClusterSettings()).thenReturn(ClusterSettings.createBuiltInClusterSettings()); + service = new ShardsAvailabilityHealthIndicatorService(clusterService, mock(AllocationService.class), mock(SystemIndices.class)); + } public void testRestoreFromSnapshotAction() { assertThat(ACTION_RESTORE_FROM_SNAPSHOT.helpURL(), is(RESTORE_FROM_SNAPSHOT_ACTION_GUIDE)); diff --git a/server/src/test/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorServiceTests.java b/server/src/test/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorServiceTests.java index 0e3041dda9853..ad30c79a01334 100644 --- a/server/src/test/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorServiceTests.java +++ b/server/src/test/java/org/elasticsearch/cluster/routing/allocation/shards/ShardsAvailabilityHealthIndicatorServiceTests.java @@ -42,6 +42,8 @@ import org.elasticsearch.common.settings.ClusterSettings; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.core.Nullable; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.core.Tuple; import org.elasticsearch.health.Diagnosis; import org.elasticsearch.health.HealthIndicatorDetails; import org.elasticsearch.health.HealthIndicatorImpact; @@ -61,9 +63,9 @@ import org.elasticsearch.snapshots.SearchableSnapshotsSettings; import org.elasticsearch.test.ESTestCase; import org.elasticsearch.threadpool.ThreadPool; -import org.mockito.Mockito; import org.mockito.stubbing.Answer; +import java.time.Instant; import java.util.ArrayList; import java.util.Collections; import java.util.HashMap; @@ -104,6 +106,7 @@ import static org.elasticsearch.cluster.routing.allocation.shards.ShardsAvailabilityHealthIndicatorServiceTests.ShardState.UNAVAILABLE; import static org.elasticsearch.common.util.CollectionUtils.concatLists; import 
static org.elasticsearch.core.TimeValue.timeValueSeconds; +import static org.elasticsearch.core.Tuple.tuple; import static org.elasticsearch.health.Diagnosis.Resource.Type.FEATURE_STATE; import static org.elasticsearch.health.Diagnosis.Resource.Type.INDEX; import static org.elasticsearch.health.HealthStatus.GREEN; @@ -337,7 +340,8 @@ public void testAllReplicasUnassigned() { status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); assertFalse(status.replicas.doAnyIndicesHaveAllUnavailable()); } @@ -359,7 +363,8 @@ public void testAllReplicasUnassigned() { status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); assertFalse(status.replicas.doAnyIndicesHaveAllUnavailable()); } @@ -381,7 +386,8 @@ public void testAllReplicasUnassigned() { status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); assertTrue(status.replicas.doAnyIndicesHaveAllUnavailable()); } @@ -398,13 +404,15 @@ public void testAllReplicasUnassigned() { ), List.of() ); + var service = createShardsAvailabilityIndicatorService(clusterState); ShardAllocationStatus status = service.createNewStatus(clusterState.metadata()); ShardsAvailabilityHealthIndicatorService.updateShardAllocationStatus( status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); assertTrue(status.replicas.doAnyIndicesHaveAllUnavailable()); } @@ -440,7 +448,8 @@ public void testAllReplicasUnassigned() { status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); // Here because the replica is unassigned due to the primary being created, it's treated as though the replica can be ignored. assertFalse( @@ -469,7 +478,8 @@ public void testAllReplicasUnassigned() { status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); var shardRouting = routingTable.shardsWithState(ShardRoutingState.UNASSIGNED).get(0); assertTrue(service.areAllShardsOfThisTypeUnavailable(shardRouting, clusterState)); @@ -492,7 +502,8 @@ public void testAllReplicasUnassigned() { status, clusterState, NodesShutdownMetadata.EMPTY, - randomBoolean() + randomBoolean(), + timeValueSeconds(0) ); var shardRouting = clusterState.routingTable().index("myindex").shardsWithState(ShardRoutingState.UNASSIGNED).get(0); assertFalse(service.areAllShardsOfThisTypeUnavailable(shardRouting, clusterState)); @@ -922,7 +933,7 @@ public void testRestoreFromSnapshotReportsFeatureStates() { ); HealthIndicatorResult result = service.calculate(true, HealthInfo.EMPTY_HEALTH_INFO); - assertThat(result.status(), is(HealthStatus.RED)); + assertThat(result.status(), is(RED)); assertThat(result.diagnosisList().size(), is(1)); Diagnosis diagnosis = result.diagnosisList().get(0); List affectedResources = diagnosis.affectedResources(); @@ -1925,7 +1936,7 @@ private SystemIndices getSystemIndices( // We expose the indicator name and the diagnoses in the x-pack usage API. In order to index them properly in a telemetry index // they need to be declared in the health-api-indexer.edn in the telemetry repository. 
public void testMappedFieldsForTelemetry() { - assertThat(ShardsAvailabilityHealthIndicatorService.NAME, equalTo("shards_availability")); + assertThat(NAME, equalTo("shards_availability")); assertThat( ACTION_RESTORE_FROM_SNAPSHOT.getUniqueId(), equalTo("elasticsearch:health:shards_availability:diagnosis:restore_from_snapshot") @@ -1970,8 +1981,10 @@ public void testMappedFieldsForTelemetry() { DIAGNOSIS_WAIT_FOR_INITIALIZATION.getUniqueId(), equalTo("elasticsearch:health:shards_availability:diagnosis:initializing_shards") ); + ClusterService clusterService = mock(ClusterService.class); + when(clusterService.getClusterSettings()).thenReturn(ClusterSettings.createBuiltInClusterSettings()); var service = new ShardsAvailabilityHealthIndicatorService( - mock(ClusterService.class), + clusterService, mock(AllocationService.class), mock(SystemIndices.class) ); @@ -2004,6 +2017,7 @@ public void testMappedFieldsForTelemetry() { } public void testIsNewlyCreatedAndInitializingReplica() { + ShardId id = new ShardId("index", "uuid", 0); IndexMetadata idxMeta = IndexMetadata.builder("index") .numberOfShards(1) @@ -2017,56 +2031,156 @@ public void testIsNewlyCreatedAndInitializingReplica() { .build() ) .build(); - ShardRouting primary = createShardRouting(id, true, new ShardAllocation("node", AVAILABLE)); - var state = createClusterStateWith(List.of(index("index", new ShardAllocation("node", AVAILABLE))), List.of()); - assertFalse(ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica(primary, state)); - - ShardRouting replica = createShardRouting(id, false, new ShardAllocation("node", AVAILABLE)); - state = createClusterStateWith(List.of(index("index", new ShardAllocation("node", AVAILABLE))), List.of()); - assertFalse(ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica(replica, state)); - - ShardRouting unassignedReplica = createShardRouting(id, false, new ShardAllocation("node", UNAVAILABLE)); - state = createClusterStateWith( - List.of(idxMeta), - List.of(index("index", "uuid", new ShardAllocation("node", UNAVAILABLE))), - List.of(), - List.of() - ); - assertFalse(ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica(unassignedReplica, state)); - UnassignedInfo.Reason reason = randomFrom(UnassignedInfo.Reason.NODE_LEFT, UnassignedInfo.Reason.NODE_RESTARTING); - ShardAllocation allocation = new ShardAllocation( - "node", - UNAVAILABLE, - new UnassignedInfo( - reason, - "message", - null, - 0, - 0, - 0, - randomBoolean(), - randomFrom(UnassignedInfo.AllocationStatus.values()), - Set.of(), - reason == UnassignedInfo.Reason.NODE_LEFT ? 
null : randomAlphaOfLength(20) - ) - ); - ShardRouting unallocatedReplica = createShardRouting(id, false, allocation); - state = createClusterStateWith( - List.of(idxMeta), - List.of(index(idxMeta, new ShardAllocation("node", UNAVAILABLE), allocation)), - List.of(), - List.of() - ); - assertFalse(ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica(unallocatedReplica, state)); + ClusterState state; - state = createClusterStateWith( - List.of(idxMeta), - List.of(index(idxMeta, new ShardAllocation("node", CREATING), allocation)), - List.of(), - List.of() - ); - assertTrue(ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica(unallocatedReplica, state)); + // --------- Test conditions that don't depend on threshold --------- + + TimeValue replicaUnassignedThreshold = randomFrom(timeValueSeconds(3), timeValueSeconds(0)); + { + // active, whether primary or replica + boolean primary = randomBoolean(); + ShardAllocation primaryAllocation = new ShardAllocation("node", AVAILABLE); + ShardRouting shard = createShardRouting(id, primary, primaryAllocation); + state = createClusterStateWith(List.of(index("index", primaryAllocation)), List.of()); + assertFalse( + ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica( + shard, + state, + Instant.now().toEpochMilli() - replicaUnassignedThreshold.millis() + ) + ); + } + + { // primary, but not active + var primaryAllocation = new ShardAllocation("node", INITIALIZING); + ShardRouting primary = createShardRouting(id, true, primaryAllocation); + state = createClusterStateWith(List.of(index("index", primaryAllocation)), List.of()); + assertFalse( + ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica( + primary, + state, + Instant.now().toEpochMilli() - replicaUnassignedThreshold.millis() + ) + ); + } + + // --------- Test conditions that depend on threshold, but with threshold of 0 --------- + replicaUnassignedThreshold = timeValueSeconds(0); + long now = Instant.now().toEpochMilli(); + TimeValue afterCutoffTime = TimeValue.timeValueMillis(now); + { + var unassignedInfo = randomFrom(decidersNo(afterCutoffTime), unassignedInfoNoFailures(afterCutoffTime)); + var replicaAllocation = new ShardAllocation("node", UNAVAILABLE, unassignedInfo); + var primaryAllocation = new ShardAllocation("node", randomFrom(INITIALIZING, UNAVAILABLE, AVAILABLE, RESTARTING)); + + ShardRouting unallocatedReplica = createShardRouting(id, false, replicaAllocation); + state = createClusterStateWith( + List.of(idxMeta), + List.of(index(idxMeta, primaryAllocation, replicaAllocation)), + List.of(), + List.of() + ); + assertFalse( + ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica( + unallocatedReplica, + state, + now - replicaUnassignedThreshold.millis() + ) + ); + } + + { + var unassignedInfo = randomFrom(decidersNo(afterCutoffTime), unassignedInfoNoFailures(afterCutoffTime)); + var replicaAllocation = new ShardAllocation("node", UNAVAILABLE, unassignedInfo); + var primaryAllocation = new ShardAllocation("node", CREATING); + + ShardRouting unallocatedReplica = createShardRouting(id, false, replicaAllocation); + state = createClusterStateWith( + List.of(idxMeta), + List.of(index(idxMeta, primaryAllocation, replicaAllocation)), + List.of(), + List.of() + ); + assertTrue( + ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica( + unallocatedReplica, + state, + now - replicaUnassignedThreshold.millis() + ) + ); + } + + // --------- Test 
conditions that do depend on threshold, but with non-zero threshold --------- + + replicaUnassignedThreshold = timeValueSeconds(3); + afterCutoffTime = TimeValue.timeValueMillis(now - 3000); + TimeValue beforeCutoffTime = TimeValue.timeValueMillis(now - 2999); + { + List> configs = new ArrayList<>(); + + // return false if primary is not creating and if unassigned info has failed allocations or is after cutoff + var uis = List.of(decidersNo(afterCutoffTime), decidersNo(beforeCutoffTime), unassignedInfoNoFailures(afterCutoffTime)); + var shardStates = List.of(UNAVAILABLE, INITIALIZING, RESTARTING, AVAILABLE); + for (var shardState : shardStates) { + for (var ui : uis) { + configs.add(tuple(shardState, ui)); + } + } + // return false if primary is not creating or available and unassigned time is before cutoff + for (var shardState : List.of(UNAVAILABLE, INITIALIZING, RESTARTING)) { + configs.add(tuple(shardState, unassignedInfoNoFailures(beforeCutoffTime))); + } + + for (var config : configs) { + var replicaAllocation = new ShardAllocation("node", UNAVAILABLE, config.v2()); + var primaryAllocation = new ShardAllocation("node", config.v1()); + ShardRouting unallocatedReplica = createShardRouting(id, false, replicaAllocation); + state = createClusterStateWith( + List.of(idxMeta), + List.of(index(idxMeta, primaryAllocation, replicaAllocation)), + List.of(), + List.of() + ); + assertFalse( + ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica( + unallocatedReplica, + state, + now - replicaUnassignedThreshold.millis() + ) + ); + } + } + + { + var configs = List.of( + // return true because primary is still creating + tuple(CREATING, decidersNo(afterCutoffTime)), + tuple(CREATING, decidersNo(beforeCutoffTime)), + tuple(CREATING, unassignedInfoNoFailures(afterCutoffTime)), + tuple(CREATING, unassignedInfoNoFailures(beforeCutoffTime)), + + // returns true because unassigned time is before cutoff, and no failedAllocations + tuple(AVAILABLE, unassignedInfoNoFailures(beforeCutoffTime)) + ); + + for (var config : configs) { + var replicaAllocation = new ShardAllocation("node", UNAVAILABLE, config.v2()); + var primaryAllocation = new ShardAllocation("node", config.v1()); + + ShardRouting unallocatedReplica = createShardRouting(id, false, replicaAllocation); + IndexRoutingTable index = index(idxMeta, primaryAllocation, replicaAllocation); + + state = createClusterStateWith(List.of(idxMeta), List.of(index), List.of(), List.of()); + assertTrue( + ShardsAvailabilityHealthIndicatorService.isNewlyCreatedAndInitializingReplica( + unallocatedReplica, + state, + now - replicaUnassignedThreshold.millis() + ) + ); + } + } } private HealthIndicatorResult createExpectedResult( @@ -2373,14 +2487,34 @@ private static UnassignedInfo nodeLeft() { ); } + private static UnassignedInfo unassignedInfoNoFailures(TimeValue unassignedTime) { + UnassignedInfo.Reason reason = randomFrom(UnassignedInfo.Reason.NODE_LEFT, UnassignedInfo.Reason.NODE_RESTARTING); + return new UnassignedInfo( + reason, + "message", + null, + 0, + unassignedTime.nanos(), + unassignedTime.millis(), + randomBoolean(), + randomValueOtherThan(UnassignedInfo.AllocationStatus.DECIDERS_NO, () -> randomFrom(UnassignedInfo.AllocationStatus.values())), + Set.of(), + reason == UnassignedInfo.Reason.NODE_LEFT ? 
null : randomAlphaOfLength(20) + ); + } + private static UnassignedInfo decidersNo() { + return decidersNo(TimeValue.timeValueMillis(0)); + } + + private static UnassignedInfo decidersNo(TimeValue unassignedTime) { return new UnassignedInfo( UnassignedInfo.Reason.ALLOCATION_FAILED, null, null, 1, - 0, - 0, + unassignedTime.nanos(), + unassignedTime.millis(), false, UnassignedInfo.AllocationStatus.DECIDERS_NO, Collections.emptySet(), @@ -2423,7 +2557,7 @@ private static ShardsAvailabilityHealthIndicatorService createAllocationHealthIn when(clusterService.state()).thenReturn(clusterState); var clusterSettings = new ClusterSettings(nodeSettings, ClusterSettings.BUILT_IN_CLUSTER_SETTINGS); when(clusterService.getClusterSettings()).thenReturn(clusterSettings); - var allocationService = Mockito.mock(AllocationService.class); + var allocationService = mock(AllocationService.class); when(allocationService.explainShardAllocation(any(), any())).thenAnswer((Answer) invocation -> { ShardRouting shardRouting = invocation.getArgument(0); var key = new ShardRoutingKey(shardRouting.getIndexName(), shardRouting.getId(), shardRouting.primary()); From 67d2380cbd94bf300f686b00d7ea94d707f2f0af Mon Sep 17 00:00:00 2001 From: Stanislav Malyshev Date: Wed, 28 Aug 2024 13:36:16 -0600 Subject: [PATCH 016/144] Collecting CCS usage telemetry stats (#111905) * This creates the new CCSUsage and CCSUsageTelemetry classes and wires them up to the UsageService. An initial set of telemetry metrics is now being gathered in TransportSearchAction. Many more will be added later to meet all the requirements for the CCS Telemetry epic of work. Co-authored-by: Michael Peterson --- .../search/ccs/CCSUsageTelemetryIT.java | 708 ++++++++++++++++++ .../cluster/stats/CCSTelemetrySnapshot.java | 404 ++++++++++ .../action/admin/cluster/stats/CCSUsage.java | 246 ++++++ .../cluster/stats/CCSUsageTelemetry.java | 246 ++++++ .../admin/cluster/stats/LongMetric.java | 126 ++++ .../action/search/SearchResponse.java | 9 + .../action/search/TransportSearchAction.java | 246 ++++-- .../org/elasticsearch/usage/UsageService.java | 7 + .../cluster/stats/ApproximateMatcher.java | 46 ++ .../stats/CCSTelemetrySnapshotTests.java | 324 ++++++++ .../cluster/stats/CCSUsageTelemetryTests.java | 342 +++++++++ .../search/TransportSearchActionTests.java | 4 +- .../snapshots/SnapshotResiliencyTests.java | 7 +- .../admin/cluster/stats/telemetry_test.json | 67 ++ .../CCSUsageTelemetryAsyncSearchIT.java | 370 +++++++++ 15 files changed, 3092 insertions(+), 60 deletions(-) create mode 100644 server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java create mode 100644 server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshot.java create mode 100644 server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsage.java create mode 100644 server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetry.java create mode 100644 server/src/main/java/org/elasticsearch/action/admin/cluster/stats/LongMetric.java create mode 100644 server/src/test/java/org/elasticsearch/action/admin/cluster/stats/ApproximateMatcher.java create mode 100644 server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java create mode 100644 server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetryTests.java create mode 100644 server/src/test/resources/org/elasticsearch/action/admin/cluster/stats/telemetry_test.json create mode 100644
x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java diff --git a/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java b/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java new file mode 100644 index 0000000000000..40d98b2b5ea71 --- /dev/null +++ b/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java @@ -0,0 +1,708 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.search.ccs; + +import org.apache.logging.log4j.LogManager; +import org.apache.logging.log4j.Logger; +import org.elasticsearch.action.admin.cluster.stats.CCSTelemetrySnapshot; +import org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.Result; +import org.elasticsearch.action.search.ClosePointInTimeRequest; +import org.elasticsearch.action.search.OpenPointInTimeRequest; +import org.elasticsearch.action.search.SearchRequest; +import org.elasticsearch.action.search.SearchResponse; +import org.elasticsearch.action.search.TransportClosePointInTimeAction; +import org.elasticsearch.action.search.TransportOpenPointInTimeAction; +import org.elasticsearch.action.search.TransportSearchAction; +import org.elasticsearch.action.support.PlainActionFuture; +import org.elasticsearch.client.internal.Client; +import org.elasticsearch.common.bytes.BytesReference; +import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.common.util.CollectionUtils; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.index.query.MatchAllQueryBuilder; +import org.elasticsearch.plugins.Plugin; +import org.elasticsearch.search.builder.PointInTimeBuilder; +import org.elasticsearch.search.builder.SearchSourceBuilder; +import org.elasticsearch.search.query.SlowRunningQueryBuilder; +import org.elasticsearch.search.query.ThrowingQueryBuilder; +import org.elasticsearch.tasks.Task; +import org.elasticsearch.test.AbstractMultiClustersTestCase; +import org.elasticsearch.test.InternalTestCluster; +import org.elasticsearch.usage.UsageService; +import org.junit.Assert; +import org.junit.Rule; +import org.junit.rules.TestRule; +import org.junit.runner.Description; +import org.junit.runners.model.Statement; + +import java.lang.annotation.ElementType; +import java.lang.annotation.Retention; +import java.lang.annotation.RetentionPolicy; +import java.lang.annotation.Target; +import java.util.Arrays; +import java.util.Collection; +import java.util.HashMap; +import java.util.List; +import java.util.Map; +import java.util.concurrent.ExecutionException; +import java.util.concurrent.TimeUnit; +import java.util.function.Function; +import java.util.stream.Collectors; + +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.ASYNC_FEATURE; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.MRT_FEATURE; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.WILDCARD_FEATURE; +import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertAcked; +import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertResponse; +import static 
org.hamcrest.Matchers.equalTo; + +public class CCSUsageTelemetryIT extends AbstractMultiClustersTestCase { + private static final Logger LOGGER = LogManager.getLogger(CCSUsageTelemetryIT.class); + private static final String REMOTE1 = "cluster-a"; + private static final String REMOTE2 = "cluster-b"; + + @Override + protected boolean reuseClusters() { + return false; + } + + @Override + protected Collection remoteClusterAlias() { + return List.of(REMOTE1, REMOTE2); + } + + @Rule + public SkipUnavailableRule skipOverride = new SkipUnavailableRule(REMOTE1, REMOTE2); + + @Override + protected Map skipUnavailableForRemoteClusters() { + var map = skipOverride.getMap(); + LOGGER.info("Using skip_unavailable map: [{}]", map); + return map; + } + + @Override + protected Collection> nodePlugins(String clusterAlias) { + return CollectionUtils.appendToCopy(super.nodePlugins(clusterAlias), CrossClusterSearchIT.TestQueryBuilderPlugin.class); + } + + private SearchRequest makeSearchRequest(String... indices) { + SearchRequest searchRequest = new SearchRequest(indices); + searchRequest.allowPartialSearchResults(false); + searchRequest.setBatchedReduceSize(randomIntBetween(3, 20)); + searchRequest.setCcsMinimizeRoundtrips(randomBoolean()); + if (randomBoolean()) { + searchRequest.setPreFilterShardSize(1); + } + searchRequest.source(new SearchSourceBuilder().query(new MatchAllQueryBuilder()).size(10)); + return searchRequest; + } + + /** + * Run search request and get telemetry from it + */ + private CCSTelemetrySnapshot getTelemetryFromSearch(SearchRequest searchRequest) throws ExecutionException, InterruptedException { + // We want to send search to a specific node (we don't care which one) so that we could + // collect the CCS telemetry from it later + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + // We don't care here too much about the response, we just want to trigger the telemetry collection. + // So we check it's not null and leave the rest to other tests. + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + return getTelemetrySnapshot(nodeName); + } + + private CCSTelemetrySnapshot getTelemetryFromFailedSearch(SearchRequest searchRequest) throws Exception { + // We want to send search to a specific node (we don't care which one) so that we could + // collect the CCS telemetry from it later + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + PlainActionFuture queryFuture = new PlainActionFuture<>(); + cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest, queryFuture); + assertBusy(() -> assertTrue(queryFuture.isDone())); + + // We expect failure, but we don't care too much which failure it is in this test + ExecutionException ee = expectThrows(ExecutionException.class, queryFuture::get); + assertNotNull(ee.getCause()); + + return getTelemetrySnapshot(nodeName); + } + + /** + * Create search request for indices and get telemetry from it + */ + private CCSTelemetrySnapshot getTelemetryFromSearch(String... 
indices) throws ExecutionException, InterruptedException { + return getTelemetryFromSearch(makeSearchRequest(indices)); + } + + /** + * Search on all remotes + */ + public void testAllRemotesSearch() throws ExecutionException, InterruptedException { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(localIndex, "*:" + remoteIndex); + boolean minimizeRoundtrips = TransportSearchAction.shouldMinimizeRoundtrips(searchRequest); + + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + assertResponse( + cluster(LOCAL_CLUSTER).client(nodeName) + .filterWithHeader(Map.of(Task.X_ELASTIC_PRODUCT_ORIGIN_HTTP_HEADER, "kibana")) + .search(searchRequest), + Assert::assertNotNull + ); + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + assertThat(telemetry.getFailureReasons().size(), equalTo(0)); + assertThat(telemetry.getTook().count(), equalTo(1L)); + assertThat(telemetry.getTookMrtTrue().count(), equalTo(minimizeRoundtrips ? 1L : 0L)); + assertThat(telemetry.getTookMrtFalse().count(), equalTo(minimizeRoundtrips ? 0L : 1L)); + assertThat(telemetry.getRemotesPerSearchAvg(), equalTo(2.0)); + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(2L)); + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(0L)); + assertThat(telemetry.getClientCounts().size(), equalTo(1)); + assertThat(telemetry.getClientCounts().get("kibana"), equalTo(1L)); + if (minimizeRoundtrips) { + assertThat(telemetry.getFeatureCounts().get(MRT_FEATURE), equalTo(1L)); + } else { + assertThat(telemetry.getFeatureCounts().get(MRT_FEATURE), equalTo(null)); + } + assertThat(telemetry.getFeatureCounts().get(ASYNC_FEATURE), equalTo(null)); + + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(3)); + for (String clusterAlias : remoteClusterAlias()) { + var clusterTelemetry = perCluster.get(clusterAlias); + assertThat(clusterTelemetry.getCount(), equalTo(1L)); + assertThat(clusterTelemetry.getSkippedCount(), equalTo(0L)); + assertThat(clusterTelemetry.getTook().count(), equalTo(1L)); + } + + // another search + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(2L)); + assertThat(telemetry.getSuccessCount(), equalTo(2L)); + assertThat(telemetry.getFailureReasons().size(), equalTo(0)); + assertThat(telemetry.getTook().count(), equalTo(2L)); + assertThat(telemetry.getTookMrtTrue().count(), equalTo(minimizeRoundtrips ? 2L : 0L)); + assertThat(telemetry.getTookMrtFalse().count(), equalTo(minimizeRoundtrips ? 
0L : 2L)); + assertThat(telemetry.getRemotesPerSearchAvg(), equalTo(2.0)); + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(2L)); + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(0L)); + assertThat(telemetry.getClientCounts().size(), equalTo(1)); + assertThat(telemetry.getClientCounts().get("kibana"), equalTo(1L)); + perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(3)); + for (String clusterAlias : remoteClusterAlias()) { + var clusterTelemetry = perCluster.get(clusterAlias); + assertThat(clusterTelemetry.getCount(), equalTo(2L)); + assertThat(clusterTelemetry.getSkippedCount(), equalTo(0L)); + assertThat(clusterTelemetry.getTook().count(), equalTo(2L)); + } + } + + /** + * Search on a specific remote + */ + public void testOneRemoteSearch() throws ExecutionException, InterruptedException { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + // Make request to cluster a + SearchRequest searchRequest = makeSearchRequest(localIndex, REMOTE1 + ":" + remoteIndex); + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(2)); + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2), equalTo(null)); + assertThat(telemetry.getClientCounts().size(), equalTo(0)); + + // Make request to cluster b + searchRequest = makeSearchRequest(localIndex, REMOTE2 + ":" + remoteIndex); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(2L)); + assertThat(telemetry.getSuccessCount(), equalTo(2L)); + perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(3)); + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2).getTook().count(), equalTo(1L)); + } + + /** + * Local search should not produce any telemetry at all + */ + public void testLocalOnlySearch() throws ExecutionException, InterruptedException { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + + CCSTelemetrySnapshot telemetry = getTelemetryFromSearch(localIndex); + assertThat(telemetry.getTotalCount(), equalTo(0L)); + } + + /** + * Search on remotes only, without local index + */ + public void testRemoteOnlySearch() throws ExecutionException, InterruptedException { + Map testClusterInfo = setupClusters(); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + CCSTelemetrySnapshot telemetry = getTelemetryFromSearch("*:" + remoteIndex); + var perCluster = telemetry.getByRemoteCluster(); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + assertThat(telemetry.getFailureReasons().size(), equalTo(0)); + assertThat(telemetry.getTook().count(), equalTo(1L)); + assertThat(perCluster.size(), equalTo(2)); + 
assertThat(telemetry.getClientCounts().size(), equalTo(0)); + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getSkippedCount(), equalTo(0L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2).getSkippedCount(), equalTo(0L)); + assertThat(perCluster.get(REMOTE2).getTook().count(), equalTo(1L)); + } + + /** + * Count wildcard searches. Only wildcards in index names (not in cluster names) are counted. + */ + public void testWildcardSearch() throws ExecutionException, InterruptedException { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(localIndex, "*:" + remoteIndex); + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getFeatureCounts().get(WILDCARD_FEATURE), equalTo(null)); + + searchRequest = makeSearchRequest("*", REMOTE1 + ":" + remoteIndex); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(2L)); + assertThat(telemetry.getFeatureCounts().get(WILDCARD_FEATURE), equalTo(1L)); + + searchRequest = makeSearchRequest(localIndex, REMOTE2 + ":*"); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(3L)); + assertThat(telemetry.getFeatureCounts().get(WILDCARD_FEATURE), equalTo(2L)); + + // Wildcards in cluster name do not count + searchRequest = makeSearchRequest(localIndex, "*:" + remoteIndex); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(4L)); + assertThat(telemetry.getFeatureCounts().get(WILDCARD_FEATURE), equalTo(2L)); + + // Wildcard in the middle of the index name counts + searchRequest = makeSearchRequest(localIndex, REMOTE2 + ":rem*"); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(5L)); + assertThat(telemetry.getFeatureCounts().get(WILDCARD_FEATURE), equalTo(3L)); + + // Wildcard only counted once per search + searchRequest = makeSearchRequest("*", REMOTE1 + ":rem*", REMOTE2 + ":remote*"); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(6L)); + assertThat(telemetry.getFeatureCounts().get(WILDCARD_FEATURE), equalTo(4L)); + } + + /** + * Test complete search failure + */ + public void testFailedSearch() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = 
makeSearchRequest(localIndex, "*:" + remoteIndex); + // shardId -1 means to throw the Exception on all shards, so should result in complete search failure + ThrowingQueryBuilder queryBuilder = new ThrowingQueryBuilder(randomLong(), new IllegalStateException("index corrupted"), -1); + searchRequest.source(new SearchSourceBuilder().query(queryBuilder).size(10)); + searchRequest.allowPartialSearchResults(true); + + CCSTelemetrySnapshot telemetry = getTelemetryFromFailedSearch(searchRequest); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(0L)); + assertThat(telemetry.getTook().count(), equalTo(0L)); + assertThat(telemetry.getTookMrtTrue().count(), equalTo(0L)); + assertThat(telemetry.getTookMrtFalse().count(), equalTo(0L)); + Map expectedFailures = Map.of(Result.UNKNOWN.getName(), 1L); + assertThat(telemetry.getFailureReasons(), equalTo(expectedFailures)); + } + + /** + * Search when all the remotes failed and skipped + */ + public void testSkippedAllRemotesSearch() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(localIndex, "*:" + remoteIndex); + // throw Exception on all shards of remoteIndex, but not against localIndex + ThrowingQueryBuilder queryBuilder = new ThrowingQueryBuilder( + randomLong(), + new IllegalStateException("index corrupted"), + remoteIndex + ); + searchRequest.source(new SearchSourceBuilder().query(queryBuilder).size(10)); + searchRequest.allowPartialSearchResults(true); + + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + // Note that this counts how many searches had skipped remotes, not how many remotes are skipped + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(1L)); + // Still count the remote that failed + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(2L)); + assertThat(telemetry.getTook().count(), equalTo(1L)); + // Each remote will have its skipped count bumped + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(3)); + for (String remote : remoteClusterAlias()) { + assertThat(perCluster.get(remote).getCount(), equalTo(0L)); + assertThat(perCluster.get(remote).getSkippedCount(), equalTo(1L)); + assertThat(perCluster.get(remote).getTook().count(), equalTo(0L)); + } + } + + public void testSkippedOneRemoteSearch() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + // Remote1 will fail, Remote2 will just do nothing but it counts as success + SearchRequest searchRequest = makeSearchRequest(localIndex, REMOTE1 + ":" + remoteIndex, REMOTE2 + ":" + "nosuchindex*"); + // throw Exception on all shards of remoteIndex, but not against localIndex + ThrowingQueryBuilder queryBuilder = new ThrowingQueryBuilder( + randomLong(), + new IllegalStateException("index corrupted"), + remoteIndex + ); + searchRequest.source(new SearchSourceBuilder().query(queryBuilder).size(10)); + searchRequest.allowPartialSearchResults(true); + + 
String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + assertResponse(cluster(LOCAL_CLUSTER).client(nodeName).search(searchRequest), Assert::assertNotNull); + + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + // Note that this counts how many searches had skipped remotes, not how many remotes are skipped + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(1L)); + // Still count the remote that failed + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(2L)); + assertThat(telemetry.getTook().count(), equalTo(1L)); + // Each remote will have its skipped count bumped + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(3)); + // This one is skipped + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(0L)); + assertThat(perCluster.get(REMOTE1).getSkippedCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(0L)); + // This one is OK + assertThat(perCluster.get(REMOTE2).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2).getSkippedCount(), equalTo(0L)); + assertThat(perCluster.get(REMOTE2).getTook().count(), equalTo(1L)); + } + + /** + * Test what happens if remote times out - it should be skipped + */ + public void testRemoteTimesOut() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(localIndex, REMOTE1 + ":" + remoteIndex); + // This works only with minimize_roundtrips enabled, since otherwise timed out shards will be counted as + // partial failure, and we disable partial results.. + searchRequest.setCcsMinimizeRoundtrips(true); + + TimeValue searchTimeout = new TimeValue(200, TimeUnit.MILLISECONDS); + // query builder that will sleep for the specified amount of time in the query phase + SlowRunningQueryBuilder slowRunningQueryBuilder = new SlowRunningQueryBuilder(searchTimeout.millis() * 5, remoteIndex); + SearchSourceBuilder sourceBuilder = new SearchSourceBuilder().query(slowRunningQueryBuilder).timeout(searchTimeout); + searchRequest.source(sourceBuilder); + + CCSTelemetrySnapshot telemetry = getTelemetryFromSearch(searchRequest); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(1L)); + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(1L)); + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(2)); + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(0L)); + assertThat(perCluster.get(REMOTE1).getSkippedCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(0L)); + assertThat(perCluster.get(REMOTE2), equalTo(null)); + } + + /** + * Test what happens if remote times out and there's no local - it should be skipped + */ + public void testRemoteOnlyTimesOut() throws Exception { + Map testClusterInfo = setupClusters(); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(REMOTE1 + ":" + remoteIndex); + // This works only with minimize_roundtrips enabled, since otherwise timed out shards will be counted as + // partial failure, and we disable partial results... 
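// For reference: the getTelemetrySnapshot(nodeName) helper used throughout
// these tests is defined further down the file, beyond this excerpt. Per the
// commit message, the metrics are gathered in TransportSearchAction and held
// by the UsageService, so a plausible sketch of the helper (the two accessor
// names below are assumptions, not taken verbatim from the patch) is:
private CCSTelemetrySnapshot getTelemetrySnapshot(String nodeName) {
    var usage = cluster(LOCAL_CLUSTER).getInstance(UsageService.class, nodeName);
    return usage.getCcsUsageHolder().getCCSTelemetrySnapshot();
}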
+ searchRequest.setCcsMinimizeRoundtrips(true); + + TimeValue searchTimeout = new TimeValue(100, TimeUnit.MILLISECONDS); + // query builder that will sleep for the specified amount of time in the query phase + SlowRunningQueryBuilder slowRunningQueryBuilder = new SlowRunningQueryBuilder(searchTimeout.millis() * 5, remoteIndex); + SearchSourceBuilder sourceBuilder = new SearchSourceBuilder().query(slowRunningQueryBuilder).timeout(searchTimeout); + searchRequest.source(sourceBuilder); + + CCSTelemetrySnapshot telemetry = getTelemetryFromSearch(searchRequest); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(1L)); + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(1L)); + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(1)); + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(0L)); + assertThat(perCluster.get(REMOTE1).getSkippedCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(0L)); + assertThat(perCluster.get(REMOTE2), equalTo(null)); + } + + @SkipOverride(aliases = { REMOTE1 }) + public void testRemoteTimesOutFailure() throws Exception { + Map testClusterInfo = setupClusters(); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(REMOTE1 + ":" + remoteIndex); + + TimeValue searchTimeout = new TimeValue(100, TimeUnit.MILLISECONDS); + // query builder that will sleep for the specified amount of time in the query phase + SlowRunningQueryBuilder slowRunningQueryBuilder = new SlowRunningQueryBuilder(searchTimeout.millis() * 5, remoteIndex); + SearchSourceBuilder sourceBuilder = new SearchSourceBuilder().query(slowRunningQueryBuilder).timeout(searchTimeout); + searchRequest.source(sourceBuilder); + + CCSTelemetrySnapshot telemetry = getTelemetryFromFailedSearch(searchRequest); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(0L)); + // Failure is not skipping + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(0L)); + // Still count the remote that failed + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(1L)); + assertThat(telemetry.getTook().count(), equalTo(0L)); + Map expectedFailure = Map.of(Result.TIMEOUT.getName(), 1L); + assertThat(telemetry.getFailureReasons(), equalTo(expectedFailure)); + // No per-cluster data on total failure + assertThat(telemetry.getByRemoteCluster().size(), equalTo(0)); + } + + /** + * Search when all the remotes failed and not skipped + */ + @SkipOverride(aliases = { REMOTE1, REMOTE2 }) + public void testFailedAllRemotesSearch() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SearchRequest searchRequest = makeSearchRequest(localIndex, "*:" + remoteIndex); + // throw Exception on all shards of remoteIndex, but not against localIndex + ThrowingQueryBuilder queryBuilder = new ThrowingQueryBuilder( + randomLong(), + new IllegalStateException("index corrupted"), + remoteIndex + ); + searchRequest.source(new SearchSourceBuilder().query(queryBuilder).size(10)); + + CCSTelemetrySnapshot telemetry = getTelemetryFromFailedSearch(searchRequest); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(0L)); + // Failure is not 
skipping + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(0L)); + // Still count the remote that failed + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(2L)); + assertThat(telemetry.getTook().count(), equalTo(0L)); + Map expectedFailure = Map.of(Result.REMOTES_UNAVAILABLE.getName(), 1L); + assertThat(telemetry.getFailureReasons(), equalTo(expectedFailure)); + // No per-cluster data on total failure + assertThat(telemetry.getByRemoteCluster().size(), equalTo(0)); + } + + /** + * Test that we're still counting remote search even if remote cluster has no such index + */ + public void testRemoteHasNoIndex() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + + CCSTelemetrySnapshot telemetry = getTelemetryFromSearch(localIndex, REMOTE1 + ":" + "no_such_index*"); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(2)); + assertThat(perCluster.get(REMOTE1).getCount(), equalTo(1L)); + assertThat(perCluster.get(REMOTE1).getTook().count(), equalTo(1L)); + assertThat(perCluster.get(REMOTE2), equalTo(null)); + } + + /** + * Test that we're still counting remote search even if remote cluster has no such index + */ + @SkipOverride(aliases = { REMOTE1 }) + public void testRemoteHasNoIndexFailure() throws Exception { + SearchRequest searchRequest = makeSearchRequest(REMOTE1 + ":no_such_index"); + CCSTelemetrySnapshot telemetry = getTelemetryFromFailedSearch(searchRequest); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(0L)); + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(0)); + Map expectedFailure = Map.of(Result.NOT_FOUND.getName(), 1L); + assertThat(telemetry.getFailureReasons(), equalTo(expectedFailure)); + } + + public void testPITSearch() throws ExecutionException, InterruptedException { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + OpenPointInTimeRequest openPITRequest = new OpenPointInTimeRequest(localIndex, "*:" + remoteIndex).keepAlive( + TimeValue.timeValueMinutes(5) + ); + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + var client = cluster(LOCAL_CLUSTER).client(nodeName); + BytesReference pitID = client.execute(TransportOpenPointInTimeAction.TYPE, openPITRequest).actionGet().getPointInTimeId(); + SearchRequest searchRequest = new SearchRequest().source( + new SearchSourceBuilder().pointInTimeBuilder(new PointInTimeBuilder(pitID).setKeepAlive(TimeValue.timeValueMinutes(5))) + .sort("@timestamp") + .size(10) + ); + searchRequest.setCcsMinimizeRoundtrips(randomBoolean()); + + assertResponse(client.search(searchRequest), Assert::assertNotNull); + // do it again + assertResponse(client.search(searchRequest), Assert::assertNotNull); + client.execute(TransportClosePointInTimeAction.TYPE, new ClosePointInTimeRequest(pitID)).actionGet(); + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + + assertThat(telemetry.getTotalCount(), equalTo(2L)); + assertThat(telemetry.getSuccessCount(), equalTo(2L)); + } + + private CCSTelemetrySnapshot getTelemetrySnapshot(String nodeName) { + var usage = cluster(LOCAL_CLUSTER).getInstance(UsageService.class, nodeName); + return 
usage.getCcsUsageHolder().getCCSTelemetrySnapshot(); + } + + private Map setupClusters() { + String localIndex = "demo"; + int numShardsLocal = randomIntBetween(2, 10); + Settings localSettings = indexSettings(numShardsLocal, randomIntBetween(0, 1)).build(); + assertAcked( + client(LOCAL_CLUSTER).admin() + .indices() + .prepareCreate(localIndex) + .setSettings(localSettings) + .setMapping("@timestamp", "type=date", "f", "type=text") + ); + indexDocs(client(LOCAL_CLUSTER), localIndex); + + String remoteIndex = "prod"; + int numShardsRemote = randomIntBetween(2, 10); + for (String clusterAlias : remoteClusterAlias()) { + final InternalTestCluster remoteCluster = cluster(clusterAlias); + remoteCluster.ensureAtLeastNumDataNodes(randomIntBetween(1, 3)); + assertAcked( + client(clusterAlias).admin() + .indices() + .prepareCreate(remoteIndex) + .setSettings(indexSettings(numShardsRemote, randomIntBetween(0, 1))) + .setMapping("@timestamp", "type=date", "f", "type=text") + ); + assertFalse( + client(clusterAlias).admin() + .cluster() + .prepareHealth(remoteIndex) + .setWaitForYellowStatus() + .setTimeout(TimeValue.timeValueSeconds(10)) + .get() + .isTimedOut() + ); + indexDocs(client(clusterAlias), remoteIndex); + } + + Map clusterInfo = new HashMap<>(); + clusterInfo.put("local.index", localIndex); + clusterInfo.put("remote.index", remoteIndex); + return clusterInfo; + } + + private int indexDocs(Client client, String index) { + int numDocs = between(5, 20); + for (int i = 0; i < numDocs; i++) { + client.prepareIndex(index).setSource("f", "v", "@timestamp", randomNonNegativeLong()).get(); + } + client.admin().indices().prepareRefresh(index).get(); + return numDocs; + } + + /** + * Annotation to mark specific cluster in a test as not to be skipped when unavailable + */ + @Retention(RetentionPolicy.RUNTIME) + @Target(ElementType.METHOD) + @interface SkipOverride { + String[] aliases(); + } + + /** + * Test rule to process skip annotations + */ + static class SkipUnavailableRule implements TestRule { + private final Map skipMap; + + SkipUnavailableRule(String... clusterAliases) { + this.skipMap = Arrays.stream(clusterAliases).collect(Collectors.toMap(Function.identity(), alias -> true)); + } + + public Map getMap() { + return skipMap; + } + + @Override + public Statement apply(Statement base, Description description) { + // Check for annotation named "SkipOverride" and set the overrides accordingly + var aliases = description.getAnnotation(SkipOverride.class); + if (aliases != null) { + for (String alias : aliases.aliases()) { + skipMap.put(alias, false); + } + } + return base; + } + + } +} diff --git a/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshot.java b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshot.java new file mode 100644 index 0000000000000..fe1da86dd54c7 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshot.java @@ -0,0 +1,404 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.action.admin.cluster.stats; + +import org.elasticsearch.action.admin.cluster.stats.LongMetric.LongMetricValue; +import org.elasticsearch.action.search.SearchResponse; +import org.elasticsearch.common.Strings; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; +import org.elasticsearch.common.io.stream.Writeable; +import org.elasticsearch.transport.RemoteClusterAware; +import org.elasticsearch.xcontent.ToXContentFragment; +import org.elasticsearch.xcontent.XContentBuilder; + +import java.io.IOException; +import java.util.Collections; +import java.util.HashMap; +import java.util.Map; +import java.util.Objects; + +/** + * Holds a snapshot of the CCS telemetry statistics from {@link CCSUsageTelemetry}. + * Used to hold the stats for a single node that's part of a {@link ClusterStatsNodeResponse}, as well as to + * accumulate stats for the entire cluster and return them as part of the {@link ClusterStatsResponse}. + *
+ * Theory of operation: + * - The snapshot is created on each particular node with the stats for the node, and is sent to the coordinating node + * - Coordinating node creates an empty snapshot and merges all the node snapshots into it using add() + *
+ * The snapshot contains {@link LongMetricValue}s for latencies, which currently contain full histograms (since you can't + * produce p90 from a set of node p90s, you need the full histogram for that). To avoid excessive copying (histogram weighs several KB), + * the snapshot is designed to be mutable, so that you can add multiple snapshots to it without copying the histograms all the time. + * It is not the intent to mutate the snapshot objects otherwise. + *
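+ * An illustrative sketch of that merge flow on the coordinating node (variable names here are hypothetical):
+ *
+ * CCSTelemetrySnapshot total = new CCSTelemetrySnapshot(); // empty, mutable accumulator
+ * for (CCSTelemetrySnapshot nodeSnapshot : nodeSnapshots) {
+ * total.add(nodeSnapshot); // merges counters and histograms into this instance
+ * }
+ *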
+ */ +public final class CCSTelemetrySnapshot implements Writeable, ToXContentFragment { + public static final String CCS_TELEMETRY_FIELD_NAME = "_search"; + private long totalCount; + private long successCount; + private final Map failureReasons; + + /** + * Latency metrics, overall. + */ + private final LongMetricValue took; + /** + * Latency metrics with minimize_roundtrips=true + */ + private final LongMetricValue tookMrtTrue; + /** + * Latency metrics with minimize_roundtrips=false + */ + private final LongMetricValue tookMrtFalse; + private long remotesPerSearchMax; + private double remotesPerSearchAvg; + private long skippedRemotes; + + private final Map featureCounts; + + private final Map clientCounts; + private final Map byRemoteCluster; + + /** + * Creates a new stats instance with the provided info. + */ + public CCSTelemetrySnapshot( + long totalCount, + long successCount, + Map failureReasons, + LongMetricValue took, + LongMetricValue tookMrtTrue, + LongMetricValue tookMrtFalse, + long remotesPerSearchMax, + double remotesPerSearchAvg, + long skippedRemotes, + Map featureCounts, + Map clientCounts, + Map byRemoteCluster + ) { + this.totalCount = totalCount; + this.successCount = successCount; + this.failureReasons = failureReasons; + this.took = took; + this.tookMrtTrue = tookMrtTrue; + this.tookMrtFalse = tookMrtFalse; + this.remotesPerSearchMax = remotesPerSearchMax; + this.remotesPerSearchAvg = remotesPerSearchAvg; + this.skippedRemotes = skippedRemotes; + this.featureCounts = featureCounts; + this.clientCounts = clientCounts; + this.byRemoteCluster = byRemoteCluster; + } + + /** + * Creates a new empty stats instance, that will get additional stats added through {@link #add(CCSTelemetrySnapshot)} + */ + public CCSTelemetrySnapshot() { + // Note this produces modifiable maps, so other snapshots can be merged into it + failureReasons = new HashMap<>(); + featureCounts = new HashMap<>(); + clientCounts = new HashMap<>(); + byRemoteCluster = new HashMap<>(); + took = new LongMetricValue(); + tookMrtTrue = new LongMetricValue(); + tookMrtFalse = new LongMetricValue(); + } + + public CCSTelemetrySnapshot(StreamInput in) throws IOException { + this.totalCount = in.readVLong(); + this.successCount = in.readVLong(); + this.failureReasons = in.readMap(StreamInput::readLong); + this.took = LongMetricValue.fromStream(in); + this.tookMrtTrue = LongMetricValue.fromStream(in); + this.tookMrtFalse = LongMetricValue.fromStream(in); + this.remotesPerSearchMax = in.readVLong(); + this.remotesPerSearchAvg = in.readDouble(); + this.skippedRemotes = in.readVLong(); + this.featureCounts = in.readMap(StreamInput::readLong); + this.clientCounts = in.readMap(StreamInput::readLong); + this.byRemoteCluster = in.readMap(PerClusterCCSTelemetry::new); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + out.writeVLong(totalCount); + out.writeVLong(successCount); + out.writeMap(failureReasons, StreamOutput::writeLong); + took.writeTo(out); + tookMrtTrue.writeTo(out); + tookMrtFalse.writeTo(out); + out.writeVLong(remotesPerSearchMax); + out.writeDouble(remotesPerSearchAvg); + out.writeVLong(skippedRemotes); + out.writeMap(featureCounts, StreamOutput::writeLong); + out.writeMap(clientCounts, StreamOutput::writeLong); + out.writeMap(byRemoteCluster, StreamOutput::writeWriteable); + } + + public long getTotalCount() { + return totalCount; + } + + public long getSuccessCount() { + return successCount; + } + + public Map getFailureReasons() { + return 
Collections.unmodifiableMap(failureReasons); + } + + public LongMetricValue getTook() { + return took; + } + + public LongMetricValue getTookMrtTrue() { + return tookMrtTrue; + } + + public LongMetricValue getTookMrtFalse() { + return tookMrtFalse; + } + + public long getRemotesPerSearchMax() { + return remotesPerSearchMax; + } + + public double getRemotesPerSearchAvg() { + return remotesPerSearchAvg; + } + + public long getSearchCountWithSkippedRemotes() { + return skippedRemotes; + } + + public Map getFeatureCounts() { + return Collections.unmodifiableMap(featureCounts); + } + + public Map getClientCounts() { + return Collections.unmodifiableMap(clientCounts); + } + + public Map getByRemoteCluster() { + return Collections.unmodifiableMap(byRemoteCluster); + } + + public static class PerClusterCCSTelemetry implements Writeable, ToXContentFragment { + private long count; + private long skippedCount; + private final LongMetricValue took; + + public PerClusterCCSTelemetry() { + took = new LongMetricValue(); + } + + public PerClusterCCSTelemetry(long count, long skippedCount, LongMetricValue took) { + this.took = took; + this.skippedCount = skippedCount; + this.count = count; + } + + public PerClusterCCSTelemetry(PerClusterCCSTelemetry other) { + this.count = other.count; + this.skippedCount = other.skippedCount; + this.took = new LongMetricValue(other.took); + } + + public PerClusterCCSTelemetry(StreamInput in) throws IOException { + this.count = in.readVLong(); + this.skippedCount = in.readVLong(); + this.took = LongMetricValue.fromStream(in); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + out.writeVLong(count); + out.writeVLong(skippedCount); + took.writeTo(out); + } + + public PerClusterCCSTelemetry add(PerClusterCCSTelemetry v) { + count += v.count; + skippedCount += v.skippedCount; + took.add(v.took); + return this; + } + + @Override + public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException { + builder.startObject(); + builder.field("total", count); + builder.field("skipped", skippedCount); + publishLatency(builder, "took", took); + builder.endObject(); + return builder; + } + + public long getCount() { + return count; + } + + public long getSkippedCount() { + return skippedCount; + } + + public LongMetricValue getTook() { + return took; + } + + @Override + public boolean equals(Object o) { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + PerClusterCCSTelemetry that = (PerClusterCCSTelemetry) o; + return count == that.count && skippedCount == that.skippedCount && Objects.equals(took, that.took); + } + + @Override + public int hashCode() { + return Objects.hash(count, skippedCount, took); + } + } + + /** + * Add the provided stats to the ones held by the current instance, effectively merging the two. + * @param stats the other stats object to add to this one + */ + public void add(CCSTelemetrySnapshot stats) { + // This should be called in ClusterStatsResponse ctor only, so we don't need to worry about concurrency + if (stats.totalCount == 0) { + // Just ignore the empty stats. + // This could happen if the node is brand new or if the stats are not available, e.g. because it runs an old version. 
+ return;
+ }
+ long oldCount = totalCount;
+ totalCount += stats.totalCount;
+ successCount += stats.successCount;
+ skippedRemotes += stats.skippedRemotes;
+ stats.failureReasons.forEach((k, v) -> failureReasons.merge(k, v, Long::sum));
+ stats.featureCounts.forEach((k, v) -> featureCounts.merge(k, v, Long::sum));
+ stats.clientCounts.forEach((k, v) -> clientCounts.merge(k, v, Long::sum));
+ took.add(stats.took);
+ tookMrtTrue.add(stats.tookMrtTrue);
+ tookMrtFalse.add(stats.tookMrtFalse);
+ remotesPerSearchMax = Math.max(remotesPerSearchMax, stats.remotesPerSearchMax);
+ if (totalCount > 0 && oldCount > 0) {
+ // Weighted average
+ remotesPerSearchAvg = (remotesPerSearchAvg * oldCount + stats.remotesPerSearchAvg * stats.totalCount) / totalCount;
+ } else {
+ // If we didn't have any old value, we just take the new one
+ remotesPerSearchAvg = stats.remotesPerSearchAvg;
+ }
+ // we copy the object here since we'll be modifying it later on subsequent adds
+ // TODO: this may be sub-optimal, as we'll be copying histograms when adding the first snapshot to an empty container,
+ // which we could probably have avoided.
+ stats.byRemoteCluster.forEach((r, v) -> byRemoteCluster.merge(r, new PerClusterCCSTelemetry(v), PerClusterCCSTelemetry::add));
+ }
+
+ /**
+ * Publishes the latency statistics to the provided {@link XContentBuilder}.
+ * Example:
+ * "took": {
+ * "max": 345032,
+ * "avg": 1620,
+ * "p90": 2570
+ * }
+ */
+ public static void publishLatency(XContentBuilder builder, String name, LongMetricValue took) throws IOException {
+ builder.startObject(name);
+ {
+ builder.field("max", took.max());
+ builder.field("avg", took.avg());
+ builder.field("p90", took.p90());
+ }
+ builder.endObject();
+ }
+
+ @Override
+ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+ builder.startObject(CCS_TELEMETRY_FIELD_NAME);
+ {
+ builder.field("total", totalCount);
+ builder.field("success", successCount);
+ builder.field("skipped", skippedRemotes);
+ publishLatency(builder, "took", took);
+ publishLatency(builder, "took_mrt_true", tookMrtTrue);
+ publishLatency(builder, "took_mrt_false", tookMrtFalse);
+ builder.field("remotes_per_search_max", remotesPerSearchMax);
+ builder.field("remotes_per_search_avg", remotesPerSearchAvg);
+ builder.field("failure_reasons", failureReasons);
+ builder.field("features", featureCounts);
+ builder.field("clients", clientCounts);
+ builder.startObject("clusters");
+ {
+ for (var entry : byRemoteCluster.entrySet()) {
+ String remoteName = entry.getKey();
+ if (RemoteClusterAware.LOCAL_CLUSTER_GROUP_KEY.equals(remoteName)) {
+ remoteName = SearchResponse.LOCAL_CLUSTER_NAME_REPRESENTATION;
+ }
+ builder.field(remoteName, entry.getValue());
+ }
+ }
+ builder.endObject();
+ }
+ builder.endObject();
+ return builder;
+ }
+
+ @Override
+ public boolean equals(Object o) {
+ if (this == o) {
+ return true;
+ }
+ if (o == null || getClass() != o.getClass()) {
+ return false;
+ }
+ CCSTelemetrySnapshot that = (CCSTelemetrySnapshot) o;
+ return totalCount == that.totalCount
+ && successCount == that.successCount
+ && skippedRemotes == that.skippedRemotes
+ && Objects.equals(failureReasons, that.failureReasons)
+ && Objects.equals(took, that.took)
+ && Objects.equals(tookMrtTrue, that.tookMrtTrue)
+ && Objects.equals(tookMrtFalse, that.tookMrtFalse)
+ && Objects.equals(remotesPerSearchMax, that.remotesPerSearchMax)
+ && Objects.equals(remotesPerSearchAvg, that.remotesPerSearchAvg)
+ && Objects.equals(featureCounts, that.featureCounts)
+
&& Objects.equals(clientCounts, that.clientCounts) + && Objects.equals(byRemoteCluster, that.byRemoteCluster); + } + + @Override + public int hashCode() { + return Objects.hash( + totalCount, + successCount, + failureReasons, + took, + tookMrtTrue, + tookMrtFalse, + remotesPerSearchMax, + remotesPerSearchAvg, + skippedRemotes, + featureCounts, + clientCounts, + byRemoteCluster + ); + } + + @Override + public String toString() { + return Strings.toString(this, true, true); + } +} diff --git a/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsage.java b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsage.java new file mode 100644 index 0000000000000..b2d75ac8f61f3 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsage.java @@ -0,0 +1,246 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.action.admin.cluster.stats; + +import org.elasticsearch.ElasticsearchSecurityException; +import org.elasticsearch.ExceptionsHelper; +import org.elasticsearch.ResourceNotFoundException; +import org.elasticsearch.action.ShardOperationFailedException; +import org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.Result; +import org.elasticsearch.action.search.SearchPhaseExecutionException; +import org.elasticsearch.action.search.ShardSearchFailure; +import org.elasticsearch.action.search.TransportSearchAction; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.search.SearchShardTarget; +import org.elasticsearch.search.query.SearchTimeoutException; +import org.elasticsearch.tasks.TaskCancelledException; +import org.elasticsearch.transport.ConnectTransportException; +import org.elasticsearch.transport.NoSeedNodeLeftException; +import org.elasticsearch.transport.NoSuchRemoteClusterException; + +import java.util.Arrays; +import java.util.HashMap; +import java.util.HashSet; +import java.util.Map; +import java.util.Set; + +import static org.elasticsearch.transport.RemoteClusterAware.LOCAL_CLUSTER_GROUP_KEY; + +/** + * This is a container for telemetry data from an individual cross-cluster search for _search or _async_search (or + * other search endpoints that use the {@link TransportSearchAction} such as _msearch). 
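+ *
+ * An illustrative sketch of how a search might populate it via the builder (tookMillis is a hypothetical variable):
+ *
+ * CCSUsage usage = new CCSUsage.Builder()
+ * .setRemotesCount(2)
+ * .setClient("kibana")
+ * .took(tookMillis)
+ * .build();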
+ */
+public class CCSUsage {
+ private final long took;
+ private final Result status;
+ private final Set features;
+ private final int remotesCount;
+
+ private final String client;
+
+ private final Set skippedRemotes;
+ private final Map perClusterUsage;
+
+ public static class Builder {
+ private long took;
+ private final Set features;
+ private Result status = Result.SUCCESS;
+ private int remotesCount;
+ private String client;
+ private final Set skippedRemotes;
+ private final Map perClusterUsage;
+
+ public Builder() {
+ features = new HashSet<>();
+ skippedRemotes = new HashSet<>();
+ perClusterUsage = new HashMap<>();
+ }
+
+ public Builder took(long took) {
+ this.took = took;
+ return this;
+ }
+
+ public Builder setFailure(Result failureType) {
+ this.status = failureType;
+ return this;
+ }
+
+ public Builder setFailure(Exception e) {
+ return setFailure(getFailureType(e));
+ }
+
+ public Builder setFeature(String feature) {
+ this.features.add(feature);
+ return this;
+ }
+
+ public Builder setClient(String client) {
+ this.client = client;
+ return this;
+ }
+
+ public Builder skippedRemote(String remote) {
+ this.skippedRemotes.add(remote);
+ return this;
+ }
+
+ public Builder perClusterUsage(String remote, TimeValue took) {
+ this.perClusterUsage.put(remote, new PerClusterUsage(took));
+ return this;
+ }
+
+ public CCSUsage build() {
+ return new CCSUsage(took, status, remotesCount, skippedRemotes, features, client, perClusterUsage);
+ }
+
+ public Builder setRemotesCount(int remotesCount) {
+ this.remotesCount = remotesCount;
+ return this;
+ }
+
+ public int getRemotesCount() {
+ return remotesCount;
+ }
+
+ /**
+ * Get failure type as {@link Result} from the search failure exception.
+ */
+ public static Result getFailureType(Exception e) {
+ var unwrapped = ExceptionsHelper.unwrapCause(e);
+ if (unwrapped instanceof Exception) {
+ e = (Exception) unwrapped;
+ }
+ if (isRemoteUnavailable(e)) {
+ return Result.REMOTES_UNAVAILABLE;
+ }
+ if (ExceptionsHelper.unwrap(e, ResourceNotFoundException.class) != null) {
+ return Result.NOT_FOUND;
+ }
+ if (e instanceof TaskCancelledException || (ExceptionsHelper.unwrap(e, TaskCancelledException.class) != null)) {
+ return Result.CANCELED;
+ }
+ if (ExceptionsHelper.unwrap(e, SearchTimeoutException.class) != null) {
+ return Result.TIMEOUT;
+ }
+ if (ExceptionsHelper.unwrap(e, ElasticsearchSecurityException.class) != null) {
+ return Result.SECURITY;
+ }
+ if (ExceptionsHelper.unwrapCorruption(e) != null) {
+ return Result.CORRUPTION;
+ }
+ // This is a last-resort check: if we still don't know the reason but all shard failures are remote,
+ // we assume the remote is somehow at fault.
+ if (e instanceof SearchPhaseExecutionException spe) {
+ // If this is a failure that happened because of remote failures only
+ var groupedFails = ExceptionsHelper.groupBy(spe.shardFailures());
+ if (Arrays.stream(groupedFails).allMatch(Builder::isRemoteFailure)) {
+ return Result.REMOTES_UNAVAILABLE;
+ }
+ }
+ // OK, we don't know what happened
+ return Result.UNKNOWN;
+ }
+
+ /**
+ * Is this failure exception because the remote was unavailable?
+ * See also: TransportResolveClusterAction#notConnectedError
+ */
+ static boolean isRemoteUnavailable(Exception e) {
+ if (ExceptionsHelper.unwrap(
+ e,
+ ConnectTransportException.class,
+ NoSuchRemoteClusterException.class,
+ NoSeedNodeLeftException.class
+ ) != null) {
+ return true;
+ }
+ Throwable ill = ExceptionsHelper.unwrap(e, IllegalStateException.class, IllegalArgumentException.class);
+ if (ill != null && (ill.getMessage().contains("Unable to open any connections") || ill.getMessage().contains("unknown host"))) {
+ return true;
+ }
+ // OK, this doesn't look like any of the known remote exceptions
+ return false;
+ }
+
+ /**
+ * Is this failure coming from a remote cluster?
+ */
+ static boolean isRemoteFailure(ShardOperationFailedException failure) {
+ if (failure instanceof ShardSearchFailure shardFailure) {
+ SearchShardTarget shard = shardFailure.shard();
+ return shard != null && shard.getClusterAlias() != null && LOCAL_CLUSTER_GROUP_KEY.equals(shard.getClusterAlias()) == false;
+ }
+ return false;
+ }
+ }
+
+ private CCSUsage(
+ long took,
+ Result status,
+ int remotesCount,
+ Set skippedRemotes,
+ Set features,
+ String client,
+ Map perClusterUsage
+ ) {
+ this.status = status;
+ this.remotesCount = remotesCount;
+ this.features = features;
+ this.client = client;
+ this.took = took;
+ this.skippedRemotes = skippedRemotes;
+ this.perClusterUsage = perClusterUsage;
+ }
+
+ public Map getPerClusterUsage() {
+ return perClusterUsage;
+ }
+
+ public Result getStatus() {
+ return status;
+ }
+
+ public Set getFeatures() {
+ return features;
+ }
+
+ public long getRemotesCount() {
+ return remotesCount;
+ }
+
+ public String getClient() {
+ return client;
+ }
+
+ public long getTook() {
+ return took;
+ }
+
+ public Set getSkippedRemotes() {
+ return skippedRemotes;
+ }
+
+ public static class PerClusterUsage {
+
+ // if MRT=true, the took time on the remote cluster; otherwise the overall took time
+ private long took;
+
+ public PerClusterUsage(TimeValue took) {
+ if (took != null) {
+ this.took = took.millis();
+ }
+ }
+
+ public long getTook() {
+ return took;
+ }
+ }
+
+}
diff --git a/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetry.java b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetry.java
new file mode 100644
index 0000000000000..60766bd4068e3
--- /dev/null
+++ b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetry.java
@@ -0,0 +1,246 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0 and the Server Side Public License, v 1; you may not use this file except
+ * in compliance with, at your election, the Elastic License 2.0 or the Server
+ * Side Public License, v 1.
+ */
+
+package org.elasticsearch.action.admin.cluster.stats;
+
+import org.elasticsearch.common.util.Maps;
+
+import java.util.Collections;
+import java.util.Map;
+import java.util.Set;
+import java.util.concurrent.ConcurrentHashMap;
+import java.util.concurrent.atomic.LongAdder;
+
+/**
+ * Service holding accumulated CCS search usage statistics. Individual cross-cluster searches will pass
+ * CCSUsage data here to have it collated and aggregated. Snapshots of the current CCS Telemetry Usage
+ * can be obtained by getting {@link CCSTelemetrySnapshot} objects.
+ *
+ * Theory of operation: + * Each search creates a {@link CCSUsage.Builder}, which can be updated during the progress of the search request, + * and then it instantiates a {@link CCSUsage} object when the request is finished. + * That object is passed to {@link #updateUsage(CCSUsage)} on the request processing end (whether successful or not). + * The {@link #updateUsage(CCSUsage)} method will then update the internal counters and metrics. + *
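+ * A condensed sketch of that life cycle (illustrative only; remotes, tookMillis and ccsUsageTelemetry are hypothetical names):
+ *
+ * CCSUsage.Builder builder = new CCSUsage.Builder().setRemotesCount(remotes);
+ * // ... the search runs; features, skipped remotes and per-cluster took times get recorded on the builder ...
+ * ccsUsageTelemetry.updateUsage(builder.took(tookMillis).build());
+ *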
+ * When we need to return the current state of the telemetry, we can call {@link #getCCSTelemetrySnapshot()} which produces + * a snapshot of the current state of the telemetry as {@link CCSTelemetrySnapshot}. These snapshots are additive so + * when collecting the snapshots from multiple nodes, an empty snapshot is created and then all the node's snapshots are added + * to it to obtain the summary telemetry. + */ +public class CCSUsageTelemetry { + + /** + * Result of the request execution. + * Either "success" or a failure reason. + */ + public enum Result { + SUCCESS("success"), + REMOTES_UNAVAILABLE("remotes_unavailable"), + CANCELED("canceled"), + NOT_FOUND("not_found"), + TIMEOUT("timeout"), + CORRUPTION("corruption"), + SECURITY("security"), + // May be helpful if there's a lot of other reasons, and it may be hard to calculate the unknowns for some clients. + UNKNOWN("other"); + + private final String name; + + Result(String name) { + this.name = name; + } + + public String getName() { + return name; + } + } + + // Not enum because we won't mind other places adding their own features + public static final String MRT_FEATURE = "mrt_on"; + public static final String ASYNC_FEATURE = "async"; + public static final String WILDCARD_FEATURE = "wildcards"; + + // The list of known Elastic clients. May be incomplete. + public static final Set KNOWN_CLIENTS = Set.of( + "kibana", + "cloud", + "logstash", + "beats", + "fleet", + "ml", + "security", + "observability", + "enterprise-search", + "elasticsearch", + "connectors", + "connectors-cli" + ); + + private final LongAdder totalCount; + private final LongAdder successCount; + private final Map failureReasons; + + /** + * Latency metrics overall + */ + private final LongMetric took; + /** + * Latency metrics with minimize_roundtrips=true + */ + private final LongMetric tookMrtTrue; + /** + * Latency metrics with minimize_roundtrips=false + */ + private final LongMetric tookMrtFalse; + private final LongMetric remotesPerSearch; + private final LongAdder skippedRemotes; + + private final Map featureCounts; + + private final Map clientCounts; + private final Map byRemoteCluster; + + public CCSUsageTelemetry() { + this.byRemoteCluster = new ConcurrentHashMap<>(); + totalCount = new LongAdder(); + successCount = new LongAdder(); + failureReasons = new ConcurrentHashMap<>(); + took = new LongMetric(); + tookMrtTrue = new LongMetric(); + tookMrtFalse = new LongMetric(); + remotesPerSearch = new LongMetric(); + skippedRemotes = new LongAdder(); + featureCounts = new ConcurrentHashMap<>(); + clientCounts = new ConcurrentHashMap<>(); + } + + public void updateUsage(CCSUsage ccsUsage) { + assert ccsUsage.getRemotesCount() > 0 : "Expected at least one remote cluster in CCSUsage"; + // TODO: fork this to a background thread? + doUpdate(ccsUsage); + } + + // This is not synchronized, instead we ensure that every metric in the class is thread-safe. 
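+ // (LongAdder counters, ConcurrentHashMap-backed maps and the ConcurrentHistogram inside LongMetric each
+ // tolerate concurrent updates, so racing searches can record into them without a shared lock.)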
+ private void doUpdate(CCSUsage ccsUsage) {
+ totalCount.increment();
+ long searchTook = ccsUsage.getTook();
+ if (isSuccess(ccsUsage)) {
+ successCount.increment();
+ took.record(searchTook);
+ if (isMRT(ccsUsage)) {
+ tookMrtTrue.record(searchTook);
+ } else {
+ tookMrtFalse.record(searchTook);
+ }
+ ccsUsage.getPerClusterUsage().forEach((r, u) -> byRemoteCluster.computeIfAbsent(r, PerClusterCCSTelemetry::new).update(u));
+ } else {
+ failureReasons.computeIfAbsent(ccsUsage.getStatus(), k -> new LongAdder()).increment();
+ }
+
+ remotesPerSearch.record(ccsUsage.getRemotesCount());
+ if (ccsUsage.getSkippedRemotes().isEmpty() == false) {
+ skippedRemotes.increment();
+ ccsUsage.getSkippedRemotes().forEach(remote -> byRemoteCluster.computeIfAbsent(remote, PerClusterCCSTelemetry::new).skipped());
+ }
+ ccsUsage.getFeatures().forEach(f -> featureCounts.computeIfAbsent(f, k -> new LongAdder()).increment());
+ String client = ccsUsage.getClient();
+ if (client != null && KNOWN_CLIENTS.contains(client)) {
+ // We count only known clients for now
+ clientCounts.computeIfAbsent(ccsUsage.getClient(), k -> new LongAdder()).increment();
+ }
+ }
+
+ private boolean isMRT(CCSUsage ccsUsage) {
+ return ccsUsage.getFeatures().contains(MRT_FEATURE);
+ }
+
+ private boolean isSuccess(CCSUsage ccsUsage) {
+ return ccsUsage.getStatus() == Result.SUCCESS;
+ }
+
+ public Map getTelemetryByCluster() {
+ return byRemoteCluster;
+ }
+
+ /**
+ * Telemetry of each remote involved in cross cluster searches
+ */
+ public static class PerClusterCCSTelemetry {
+ private final String clusterAlias;
+ // The number of successful (not skipped) requests to this cluster.
+ private final LongAdder count;
+ private final LongAdder skippedCount;
+ // This is only over the successful requests, skipped ones do not count here.
+ private final LongMetric took; + + PerClusterCCSTelemetry(String clusterAlias) { + this.clusterAlias = clusterAlias; + this.count = new LongAdder(); + took = new LongMetric(); + this.skippedCount = new LongAdder(); + } + + void update(CCSUsage.PerClusterUsage remoteUsage) { + count.increment(); + took.record(remoteUsage.getTook()); + } + + void skipped() { + skippedCount.increment(); + } + + public long getCount() { + return count.longValue(); + } + + @Override + public String toString() { + return "PerClusterCCSTelemetry{" + + "clusterAlias='" + + clusterAlias + + '\'' + + ", count=" + + count + + ", latency=" + + took.toString() + + '}'; + } + + public long getSkippedCount() { + return skippedCount.longValue(); + } + + public CCSTelemetrySnapshot.PerClusterCCSTelemetry getSnapshot() { + return new CCSTelemetrySnapshot.PerClusterCCSTelemetry(count.longValue(), skippedCount.longValue(), took.getValue()); + } + + } + + public CCSTelemetrySnapshot getCCSTelemetrySnapshot() { + Map reasonsMap = Maps.newMapWithExpectedSize(failureReasons.size()); + failureReasons.forEach((k, v) -> reasonsMap.put(k.getName(), v.longValue())); + + LongMetric.LongMetricValue remotes = remotesPerSearch.getValue(); + + // Maps returned here are unmodifiable, but the empty ctor produces modifiable maps + return new CCSTelemetrySnapshot( + totalCount.longValue(), + successCount.longValue(), + Collections.unmodifiableMap(reasonsMap), + took.getValue(), + tookMrtTrue.getValue(), + tookMrtFalse.getValue(), + remotes.max(), + remotes.avg(), + skippedRemotes.longValue(), + Collections.unmodifiableMap(Maps.transformValues(featureCounts, LongAdder::longValue)), + Collections.unmodifiableMap(Maps.transformValues(clientCounts, LongAdder::longValue)), + Collections.unmodifiableMap(Maps.transformValues(byRemoteCluster, PerClusterCCSTelemetry::getSnapshot)) + ); + } +} diff --git a/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/LongMetric.java b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/LongMetric.java new file mode 100644 index 0000000000000..f3bb936b108c0 --- /dev/null +++ b/server/src/main/java/org/elasticsearch/action/admin/cluster/stats/LongMetric.java @@ -0,0 +1,126 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.action.admin.cluster.stats; + +import org.HdrHistogram.ConcurrentHistogram; +import org.HdrHistogram.Histogram; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; +import org.elasticsearch.common.io.stream.Writeable; + +import java.io.IOException; +import java.nio.ByteBuffer; +import java.util.Objects; +import java.util.zip.DataFormatException; + +/** + * Metric class that accepts longs and provides count, average, max and percentiles. + * Abstracts out the details of how exactly the values are stored and calculated. + * {@link LongMetricValue} is a snapshot of the current state of the metric. 
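+ *
+ * A minimal usage sketch (illustrative):
+ * LongMetric latency = new LongMetric();
+ * latency.record(42); // thread-safe; backed by a ConcurrentHistogram
+ * LongMetricValue snapshot = latency.getValue(); // point-in-time copy exposing count()/max()/avg()/p90()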
+ */
+public class LongMetric {
+ private final Histogram values;
+ private static final int SIGNIFICANT_DIGITS = 2;
+
+ LongMetric() {
+ values = new ConcurrentHistogram(SIGNIFICANT_DIGITS);
+ }
+
+ void record(long v) {
+ values.recordValue(v);
+ }
+
+ LongMetricValue getValue() {
+ return new LongMetricValue(values);
+ }
+
+ /**
+ * Snapshot of {@link LongMetric} value that provides the current state of the metric.
+ * Can be added with another {@link LongMetricValue} object.
+ */
+ public static final class LongMetricValue implements Writeable {
+ // We have to carry the full histogram around since we might need to calculate aggregate percentiles
+ // after collecting individual stats from the nodes, and we can't do that without having the full histogram.
+ // This costs about 2K per metric, which was deemed acceptable.
+ private final Histogram values;
+
+ public LongMetricValue(Histogram values) {
+ // Copy here since we don't want the snapshot value to change if somebody updates the original one
+ this.values = values.copy();
+ }
+
+ public LongMetricValue(LongMetricValue v) {
+ this.values = v.values.copy();
+ }
+
+ LongMetricValue() {
+ this.values = new Histogram(SIGNIFICANT_DIGITS);
+ }
+
+ public void add(LongMetricValue v) {
+ this.values.add(v.values);
+ }
+
+ public static LongMetricValue fromStream(StreamInput in) throws IOException {
+ byte[] b = in.readByteArray();
+ ByteBuffer bb = ByteBuffer.wrap(b);
+ try {
+ // TODO: not sure what a good value for minBarForHighestToLowestValueRatio is here
+ Histogram dh = Histogram.decodeFromCompressedByteBuffer(bb, 1);
+ return new LongMetricValue(dh);
+ } catch (DataFormatException e) {
+ throw new IOException(e);
+ }
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ ByteBuffer b = ByteBuffer.allocate(values.getNeededByteBufferCapacity());
+ values.encodeIntoCompressedByteBuffer(b);
+ int size = b.position();
+ out.writeVInt(size);
+ out.writeBytes(b.array(), 0, size);
+ }
+
+ public long count() {
+ return values.getTotalCount();
+ }
+
+ public long max() {
+ return values.getMaxValue();
+ }
+
+ public long avg() {
+ return (long) Math.ceil(values.getMean());
+ }
+
+ public long p90() {
+ return values.getValueAtPercentile(90);
+ }
+
+ @Override
+ public boolean equals(Object obj) {
+ if (obj == this) return true;
+ if (obj == null || obj.getClass() != this.getClass()) return false;
+ var that = (LongMetricValue) obj;
+ return this.values.equals(that.values);
+ }
+
+ @Override
+ public int hashCode() {
+ return Objects.hash(values);
+ }
+
+ @Override
+ public String toString() {
+ return "LongMetricValue[count=" + count() + ", " + "max=" + max() + ", " + "avg=" + avg() + "]";
+ }
+
+ }
+}
diff --git a/server/src/main/java/org/elasticsearch/action/search/SearchResponse.java b/server/src/main/java/org/elasticsearch/action/search/SearchResponse.java
index 45cb118691082..8d70e2dd6bb66 100644
--- a/server/src/main/java/org/elasticsearch/action/search/SearchResponse.java
+++ b/server/src/main/java/org/elasticsearch/action/search/SearchResponse.java
@@ -47,6 +47,7 @@
 import java.util.Locale;
 import java.util.Map;
 import java.util.Objects;
+import java.util.Set;
 import java.util.function.BiFunction;
 import java.util.function.Predicate;
 import java.util.function.Supplier;
@@ -701,6 +702,13 @@ public Cluster getCluster(String clusterAlias) {
 return clusterInfo.get(clusterAlias);
 }
 
+ /**
+ * @return collection of cluster aliases in the search response (including "(local)" if it was searched).
+ */ + public Set getClusterAliases() { + return clusterInfo.keySet(); + } + /** * Utility to swap a Cluster object. Guidelines for the remapping function: *
    @@ -803,6 +811,7 @@ public boolean hasClusterObjects() { public boolean hasRemoteClusters() { return total > 1 || clusterInfo.keySet().stream().anyMatch(alias -> alias != RemoteClusterAware.LOCAL_CLUSTER_GROUP_KEY); } + } /** diff --git a/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java b/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java index 11e767df9c010..6e1645c1ed711 100644 --- a/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java +++ b/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java @@ -23,6 +23,8 @@ import org.elasticsearch.action.admin.cluster.shards.ClusterSearchShardsRequest; import org.elasticsearch.action.admin.cluster.shards.ClusterSearchShardsResponse; import org.elasticsearch.action.admin.cluster.shards.TransportClusterSearchShardsAction; +import org.elasticsearch.action.admin.cluster.stats.CCSUsage; +import org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry; import org.elasticsearch.action.support.ActionFilters; import org.elasticsearch.action.support.HandledTransportAction; import org.elasticsearch.action.support.IndicesOptions; @@ -46,6 +48,7 @@ import org.elasticsearch.common.io.stream.NamedWriteableRegistry; import org.elasticsearch.common.logging.DeprecationCategory; import org.elasticsearch.common.logging.DeprecationLogger; +import org.elasticsearch.common.regex.Regex; import org.elasticsearch.common.settings.Setting; import org.elasticsearch.common.settings.Setting.Property; import org.elasticsearch.common.util.ArrayUtils; @@ -84,6 +87,7 @@ import org.elasticsearch.transport.Transport; import org.elasticsearch.transport.TransportRequestOptions; import org.elasticsearch.transport.TransportService; +import org.elasticsearch.usage.UsageService; import org.elasticsearch.xcontent.ToXContent; import org.elasticsearch.xcontent.XContentFactory; @@ -156,6 +160,7 @@ public class TransportSearchAction extends HandledTransportAction buildPerIndexOriginalIndices( @@ -305,43 +312,7 @@ public long buildTookInMillis() { @Override protected void doExecute(Task task, SearchRequest searchRequest, ActionListener listener) { - ActionListener loggingAndMetrics = new ActionListener<>() { - @Override - public void onResponse(SearchResponse searchResponse) { - try { - searchResponseMetrics.recordTookTime(searchResponse.getTookInMillis()); - SearchResponseMetrics.ResponseCountTotalStatus responseCountTotalStatus = - SearchResponseMetrics.ResponseCountTotalStatus.SUCCESS; - if (searchResponse.getShardFailures() != null && searchResponse.getShardFailures().length > 0) { - // Deduplicate failures by exception message and index - ShardOperationFailedException[] groupedFailures = ExceptionsHelper.groupBy(searchResponse.getShardFailures()); - for (ShardOperationFailedException f : groupedFailures) { - boolean causeHas500Status = false; - if (f.getCause() != null) { - causeHas500Status = ExceptionsHelper.status(f.getCause()).getStatus() >= 500; - } - if ((f.status().getStatus() >= 500 || causeHas500Status) - && ExceptionsHelper.isNodeOrShardUnavailableTypeException(f.getCause()) == false) { - logger.warn("TransportSearchAction shard failure (partial results response)", f); - responseCountTotalStatus = SearchResponseMetrics.ResponseCountTotalStatus.PARTIAL_FAILURE; - } - } - } - listener.onResponse(searchResponse); - // increment after the delegated onResponse to ensure we don't - // record both a success and a failure if there is an exception - 
searchResponseMetrics.incrementResponseCount(responseCountTotalStatus); - } catch (Exception e) { - onFailure(e); - } - } - - @Override - public void onFailure(Exception e) { - searchResponseMetrics.incrementResponseCount(SearchResponseMetrics.ResponseCountTotalStatus.FAILURE); - listener.onFailure(e); - } - }; + ActionListener loggingAndMetrics = new SearchResponseActionListener((SearchTask) task, listener); executeRequest((SearchTask) task, searchRequest, loggingAndMetrics, AsyncSearchActionProvider::new); } @@ -396,8 +367,32 @@ void executeRequest( searchPhaseProvider.apply(delegate) ); } else { + if ((listener instanceof TelemetryListener tl) && CCS_TELEMETRY_FEATURE_FLAG.isEnabled()) { + tl.setRemotes(resolvedIndices.getRemoteClusterIndices().size()); + if (isAsyncSearchTask(task)) { + tl.setFeature(CCSUsageTelemetry.ASYNC_FEATURE); + } + String client = task.getHeader(Task.X_ELASTIC_PRODUCT_ORIGIN_HTTP_HEADER); + if (client != null) { + tl.setClient(client); + } + // Check if any of the index patterns are wildcard patterns + var localIndices = resolvedIndices.getLocalIndices(); + if (localIndices != null && Arrays.stream(localIndices.indices()).anyMatch(Regex::isSimpleMatchPattern)) { + tl.setFeature(CCSUsageTelemetry.WILDCARD_FEATURE); + } + if (resolvedIndices.getRemoteClusterIndices() + .values() + .stream() + .anyMatch(indices -> Arrays.stream(indices.indices()).anyMatch(Regex::isSimpleMatchPattern))) { + tl.setFeature(CCSUsageTelemetry.WILDCARD_FEATURE); + } + } final TaskId parentTaskId = task.taskInfo(clusterService.localNode().getId(), false).taskId(); if (shouldMinimizeRoundtrips(rewritten)) { + if ((listener instanceof TelemetryListener tl) && CCS_TELEMETRY_FEATURE_FLAG.isEnabled()) { + tl.setFeature(CCSUsageTelemetry.MRT_FEATURE); + } final AggregationReduceContext.Builder aggregationReduceContextBuilder = rewritten.source() != null && rewritten.source().aggregations() != null ? 
searchService.aggReduceContextBuilder(task::isCancelled, rewritten.source().aggregations())
@@ -805,27 +800,26 @@ static void collectSearchShards(
 for (Map.Entry entry : remoteIndicesByCluster.entrySet()) {
 final String clusterAlias = entry.getKey();
 boolean skipUnavailable = remoteClusterService.isSkipUnavailable(clusterAlias);
- TransportSearchAction.CCSActionListener> singleListener =
- new TransportSearchAction.CCSActionListener<>(
- clusterAlias,
- skipUnavailable,
- responsesCountDown,
- exceptions,
- clusters,
- listener
- ) {
- @Override
- void innerOnResponse(SearchShardsResponse searchShardsResponse) {
- assert ThreadPool.assertCurrentThreadPool(ThreadPool.Names.SEARCH_COORDINATION);
- ccsClusterInfoUpdate(searchShardsResponse, clusters, clusterAlias, timeProvider);
- searchShardsResponses.put(clusterAlias, searchShardsResponse);
- }
+ CCSActionListener> singleListener = new CCSActionListener<>(
+ clusterAlias,
+ skipUnavailable,
+ responsesCountDown,
+ exceptions,
+ clusters,
+ listener
+ ) {
+ @Override
+ void innerOnResponse(SearchShardsResponse searchShardsResponse) {
+ assert ThreadPool.assertCurrentThreadPool(ThreadPool.Names.SEARCH_COORDINATION);
+ ccsClusterInfoUpdate(searchShardsResponse, clusters, clusterAlias, timeProvider);
+ searchShardsResponses.put(clusterAlias, searchShardsResponse);
+ }
- @Override
- Map createFinalResponse() {
- return searchShardsResponses;
- }
- };
+ @Override
+ Map createFinalResponse() {
+ return searchShardsResponses;
+ }
+ };
 remoteClusterService.maybeEnsureConnectedAndGetConnection(
 clusterAlias,
 skipUnavailable == false,
@@ -1520,6 +1514,34 @@ public SearchPhase newSearchPhase(
 }
 }
 
+ /**
+ * TransportSearchAction cannot access async-search code, so it can't check whether the Task
+ * is an instance of AsyncSearchTask, so this roundabout method is used
+ * @param searchTask SearchTask to analyze
+ * @return true if this is an async search task; false if a synchronous search task
+ */
+ private boolean isAsyncSearchTask(SearchTask searchTask) {
+ assert assertAsyncSearchTaskListener(searchTask) : "AsyncSearchTask SearchProgressListener is not one of the expected types";
+ // AsyncSearchTask will not return SearchProgressListener.NOOP, since it uses its own progress listener
+ // which delegates to CCSSingleCoordinatorSearchProgressListener when minimizing roundtrips.
+ // Only synchronous SearchTask uses SearchProgressListener.NOOP or CCSSingleCoordinatorSearchProgressListener directly + return searchTask.getProgressListener() != SearchProgressListener.NOOP + && searchTask.getProgressListener() instanceof CCSSingleCoordinatorSearchProgressListener == false; + } + + /** + * @param searchTask SearchTask to analyze + * @return true if AsyncSearchTask still uses its own special listener, not one of the two that synchronous SearchTask uses + */ + private boolean assertAsyncSearchTaskListener(SearchTask searchTask) { + if (searchTask.getClass().getSimpleName().contains("AsyncSearchTask")) { + SearchProgressListener progressListener = searchTask.getProgressListener(); + return progressListener != SearchProgressListener.NOOP + && progressListener instanceof CCSSingleCoordinatorSearchProgressListener == false; + } + return true; + } + private static void validateAndResolveWaitForCheckpoint( ClusterState clusterState, IndexNameExpressionResolver resolver, @@ -1824,4 +1846,112 @@ List getLocalShardsIterator( // the returned list must support in-place sorting, so this is the most memory efficient we can do here return Arrays.asList(list); } + + private interface TelemetryListener { + void setRemotes(int count); + + void setFeature(String feature); + + void setClient(String client); + } + + private class SearchResponseActionListener implements ActionListener, TelemetryListener { + private final SearchTask task; + private final ActionListener listener; + private final CCSUsage.Builder usageBuilder; + + SearchResponseActionListener(SearchTask task, ActionListener listener) { + this.task = task; + this.listener = listener; + usageBuilder = new CCSUsage.Builder(); + } + + /** + * Should we collect telemetry for this search? + */ + private boolean collectTelemetry() { + return CCS_TELEMETRY_FEATURE_FLAG.isEnabled() && usageBuilder.getRemotesCount() > 0; + } + + public void setRemotes(int count) { + usageBuilder.setRemotesCount(count); + } + + @Override + public void setFeature(String feature) { + usageBuilder.setFeature(feature); + } + + @Override + public void setClient(String client) { + usageBuilder.setClient(client); + } + + @Override + public void onResponse(SearchResponse searchResponse) { + try { + searchResponseMetrics.recordTookTime(searchResponse.getTookInMillis()); + SearchResponseMetrics.ResponseCountTotalStatus responseCountTotalStatus = + SearchResponseMetrics.ResponseCountTotalStatus.SUCCESS; + if (searchResponse.getShardFailures() != null && searchResponse.getShardFailures().length > 0) { + // Deduplicate failures by exception message and index + ShardOperationFailedException[] groupedFailures = ExceptionsHelper.groupBy(searchResponse.getShardFailures()); + for (ShardOperationFailedException f : groupedFailures) { + boolean causeHas500Status = false; + if (f.getCause() != null) { + causeHas500Status = ExceptionsHelper.status(f.getCause()).getStatus() >= 500; + } + if ((f.status().getStatus() >= 500 || causeHas500Status) + && ExceptionsHelper.isNodeOrShardUnavailableTypeException(f.getCause()) == false) { + logger.warn("TransportSearchAction shard failure (partial results response)", f); + responseCountTotalStatus = SearchResponseMetrics.ResponseCountTotalStatus.PARTIAL_FAILURE; + } + } + } + searchResponseMetrics.incrementResponseCount(responseCountTotalStatus); + + if (collectTelemetry()) { + extractCCSTelemetry(searchResponse); + recordTelemetry(); + } + } catch (Exception e) { + onFailure(e); + return; + } + // This is last because we want to collect 
telemetry before returning the response.
+ listener.onResponse(searchResponse);
+ }
+
+ @Override
+ public void onFailure(Exception e) {
+ searchResponseMetrics.incrementResponseCount(SearchResponseMetrics.ResponseCountTotalStatus.FAILURE);
+ if (collectTelemetry()) {
+ usageBuilder.setFailure(e);
+ recordTelemetry();
+ }
+ listener.onFailure(e);
+ }
+
+ private void recordTelemetry() {
+ usageService.getCcsUsageHolder().updateUsage(usageBuilder.build());
+ }
+
+ /**
+ * Extract telemetry data from the search response.
+ * @param searchResponse The final response from the search.
+ */
+ private void extractCCSTelemetry(SearchResponse searchResponse) {
+ usageBuilder.took(searchResponse.getTookInMillis());
+ for (String clusterAlias : searchResponse.getClusters().getClusterAliases()) {
+ SearchResponse.Cluster cluster = searchResponse.getClusters().getCluster(clusterAlias);
+ if (cluster.getStatus() == SearchResponse.Cluster.Status.SKIPPED) {
+ usageBuilder.skippedRemote(clusterAlias);
+ } else {
+ usageBuilder.perClusterUsage(clusterAlias, cluster.getTook());
+ }
+ }
+
+ }
+
+ }
}
diff --git a/server/src/main/java/org/elasticsearch/usage/UsageService.java b/server/src/main/java/org/elasticsearch/usage/UsageService.java
index e11b343c7055a..573332060f55d 100644
--- a/server/src/main/java/org/elasticsearch/usage/UsageService.java
+++ b/server/src/main/java/org/elasticsearch/usage/UsageService.java
@@ -9,6 +9,7 @@
 package org.elasticsearch.usage;
 
 import org.elasticsearch.action.admin.cluster.node.usage.NodeUsage;
+import org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry;
 import org.elasticsearch.rest.BaseRestHandler;
 
 import java.util.HashMap;
@@ -23,10 +24,12 @@ public class UsageService {
 
 private final Map handlers;
 private final SearchUsageHolder searchUsageHolder;
+ private final CCSUsageTelemetry ccsUsageHolder;
 
 public UsageService() {
 this.handlers = new HashMap<>();
 this.searchUsageHolder = new SearchUsageHolder();
+ this.ccsUsageHolder = new CCSUsageTelemetry();
 }
 
 /**
@@ -81,4 +84,8 @@ public Map getRestUsageStats() {
 public SearchUsageHolder getSearchUsageHolder() {
 return searchUsageHolder;
 }
+
+ public CCSUsageTelemetry getCcsUsageHolder() {
+ return ccsUsageHolder;
+ }
 }
diff --git a/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/ApproximateMatcher.java b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/ApproximateMatcher.java
new file mode 100644
index 0000000000000..3ceda1c7f4651
--- /dev/null
+++ b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/ApproximateMatcher.java
@@ -0,0 +1,46 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0 and the Server Side Public License, v 1; you may not use this file except
+ * in compliance with, at your election, the Elastic License 2.0 or the Server
+ * Side Public License, v 1.
+ */
+
+package org.elasticsearch.action.admin.cluster.stats;
+
+import org.hamcrest.Description;
+import org.hamcrest.TypeSafeMatcher;
+
+/**
+ * Matches a value that is within a given range (currently 1%) of an expected value.
+ *
+ * We need this because histograms do not store exact values, but only value ranges.
+ * Since we have 2 significant digits, the value should be within 1% of the expected value.
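+ * For example, closeTo(1000L) accepts any value in the inclusive range [990, 1010].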
+ */
+public class ApproximateMatcher extends TypeSafeMatcher<Long> {
+    public static final double ACCURACY = 0.01;
+    private final long expectedValue;
+
+    public ApproximateMatcher(long expectedValue) {
+        this.expectedValue = expectedValue;
+    }
+
+    @Override
+    protected boolean matchesSafely(Long actualValue) {
+        double lowerBound = Math.floor(expectedValue * (1.00 - ACCURACY));
+        double upperBound = Math.ceil(expectedValue * (1.00 + ACCURACY));
+        return actualValue >= lowerBound && actualValue <= upperBound;
+    }
+
+    @Override
+    public void describeTo(Description description) {
+        description.appendText("a long value within 1% of ").appendValue(expectedValue);
+    }
+
+    /**
+     * Matches a value that is within a given range (currently 1%) of an expected value.
+     */
+    public static ApproximateMatcher closeTo(long expectedValue) {
+        return new ApproximateMatcher(expectedValue);
+    }
+}
diff --git a/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java
new file mode 100644
index 0000000000000..9f08934503b69
--- /dev/null
+++ b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSTelemetrySnapshotTests.java
@@ -0,0 +1,324 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0 and the Server Side Public License, v 1; you may not use this file except
+ * in compliance with, at your election, the Elastic License 2.0 or the Server
+ * Side Public License, v 1.
+ */
+
+package org.elasticsearch.action.admin.cluster.stats;
+
+import org.elasticsearch.action.admin.cluster.stats.CCSTelemetrySnapshot.PerClusterCCSTelemetry;
+import org.elasticsearch.action.admin.cluster.stats.LongMetric.LongMetricValue;
+import org.elasticsearch.common.io.stream.Writeable;
+import org.elasticsearch.core.Tuple;
+import org.elasticsearch.test.AbstractWireSerializingTestCase;
+
+import java.io.IOException;
+import java.io.InputStream;
+import java.nio.charset.StandardCharsets;
+import java.util.HashMap;
+import java.util.Map;
+import java.util.TreeMap;
+
+import static org.hamcrest.Matchers.closeTo;
+import static org.hamcrest.Matchers.equalTo;
+
+public class CCSTelemetrySnapshotTests extends AbstractWireSerializingTestCase<CCSTelemetrySnapshot> {
+
+    private LongMetricValue randomLongMetricValue() {
+        LongMetric v = new LongMetric();
+        for (int i = 0; i < randomIntBetween(1, 10); i++) {
+            v.record(randomIntBetween(0, 1_000_000));
+        }
+        return v.getValue();
+    }
+
+    private PerClusterCCSTelemetry randomPerClusterCCSTelemetry() {
+        return new PerClusterCCSTelemetry(randomLongBetween(0, 1_000_000), randomLongBetween(0, 1_000_000), randomLongMetricValue());
+    }
+
+    @Override
+    protected CCSTelemetrySnapshot createTestInstance() {
+        if (randomBoolean()) {
+            return new CCSTelemetrySnapshot();
+        } else {
+            return randomCCSTelemetrySnapshot();
+        }
+    }
+
+    private CCSTelemetrySnapshot randomCCSTelemetrySnapshot() {
+        return new CCSTelemetrySnapshot(
+            randomLongBetween(0, 1_000_000),
+            randomLongBetween(0, 1_000_000),
+            Map.of(),
+            randomLongMetricValue(),
+            randomLongMetricValue(),
+            randomLongMetricValue(),
+            randomLongBetween(0, 1_000_000),
+            randomDoubleBetween(0.0, 100.0, false),
+            randomLongBetween(0, 1_000_000),
+            Map.of(),
+            Map.of(),
+            randomMap(1, 10, () -> new Tuple<>(randomAlphaOfLengthBetween(5, 10), randomPerClusterCCSTelemetry()))
+        );
+    }
+
+    @Override
+    protected Writeable.Reader<CCSTelemetrySnapshot> 
instanceReader() { + return CCSTelemetrySnapshot::new; + } + + @Override + protected CCSTelemetrySnapshot mutateInstance(CCSTelemetrySnapshot instance) throws IOException { + // create a copy of CCSTelemetrySnapshot by extracting each field and mutating it + long totalCount = instance.getTotalCount(); + long successCount = instance.getSuccessCount(); + var failureReasons = instance.getFailureReasons(); + LongMetricValue took = instance.getTook(); + LongMetricValue tookMrtTrue = instance.getTookMrtTrue(); + LongMetricValue tookMrtFalse = instance.getTookMrtFalse(); + long skippedRemotes = instance.getSearchCountWithSkippedRemotes(); + long remotesPerSearchMax = instance.getRemotesPerSearchMax(); + double remotesPerSearchAvg = instance.getRemotesPerSearchAvg(); + var featureCounts = instance.getFeatureCounts(); + var clientCounts = instance.getClientCounts(); + var perClusterCCSTelemetries = instance.getByRemoteCluster(); + + // Mutate values + int i = randomInt(11); + switch (i) { + case 0: + totalCount += randomNonNegativeLong(); + break; + case 1: + successCount += randomNonNegativeLong(); + break; + case 2: + failureReasons = new HashMap<>(failureReasons); + if (failureReasons.isEmpty() || randomBoolean()) { + failureReasons.put(randomAlphaOfLengthBetween(5, 10), randomNonNegativeLong()); + } else { + // modify random element of the map + String key = randomFrom(failureReasons.keySet()); + failureReasons.put(key, randomNonNegativeLong()); + } + break; + case 3: + took = randomLongMetricValue(); + break; + case 4: + tookMrtTrue = randomLongMetricValue(); + break; + case 5: + tookMrtFalse = randomLongMetricValue(); + break; + case 6: + skippedRemotes += randomNonNegativeLong(); + break; + case 7: + remotesPerSearchMax += randomNonNegativeLong(); + break; + case 8: + remotesPerSearchAvg = randomDoubleBetween(0.0, 100.0, false); + break; + case 9: + featureCounts = new HashMap<>(featureCounts); + if (featureCounts.isEmpty() || randomBoolean()) { + featureCounts.put(randomAlphaOfLengthBetween(5, 10), randomNonNegativeLong()); + } else { + // modify random element of the map + String key = randomFrom(featureCounts.keySet()); + featureCounts.put(key, randomNonNegativeLong()); + } + break; + case 10: + clientCounts = new HashMap<>(clientCounts); + if (clientCounts.isEmpty() || randomBoolean()) { + clientCounts.put(randomAlphaOfLengthBetween(5, 10), randomNonNegativeLong()); + } else { + // modify random element of the map + String key = randomFrom(clientCounts.keySet()); + clientCounts.put(key, randomNonNegativeLong()); + } + break; + case 11: + perClusterCCSTelemetries = new HashMap<>(perClusterCCSTelemetries); + if (perClusterCCSTelemetries.isEmpty() || randomBoolean()) { + perClusterCCSTelemetries.put(randomAlphaOfLengthBetween(5, 10), randomPerClusterCCSTelemetry()); + } else { + // modify random element of the map + String key = randomFrom(perClusterCCSTelemetries.keySet()); + perClusterCCSTelemetries.put(key, randomPerClusterCCSTelemetry()); + } + break; + } + // Return new instance + return new CCSTelemetrySnapshot( + totalCount, + successCount, + failureReasons, + took, + tookMrtTrue, + tookMrtFalse, + remotesPerSearchMax, + remotesPerSearchAvg, + skippedRemotes, + featureCounts, + clientCounts, + perClusterCCSTelemetries + ); + } + + public void testAdd() { + CCSTelemetrySnapshot empty = new CCSTelemetrySnapshot(); + CCSTelemetrySnapshot full = randomCCSTelemetrySnapshot(); + empty.add(full); + assertThat(empty, equalTo(full)); + // Add again + empty.add(full); + 
assertThat(empty.getTotalCount(), equalTo(full.getTotalCount() * 2)); + assertThat(empty.getSuccessCount(), equalTo(full.getSuccessCount() * 2)); + // check that each element of the map is doubled + empty.getFailureReasons().forEach((k, v) -> assertThat(v, equalTo(full.getFailureReasons().get(k) * 2))); + assertThat(empty.getTook().count(), equalTo(full.getTook().count() * 2)); + assertThat(empty.getTookMrtTrue().count(), equalTo(full.getTookMrtTrue().count() * 2)); + assertThat(empty.getTookMrtFalse().count(), equalTo(full.getTookMrtFalse().count() * 2)); + assertThat(empty.getSearchCountWithSkippedRemotes(), equalTo(full.getSearchCountWithSkippedRemotes() * 2)); + assertThat(empty.getRemotesPerSearchMax(), equalTo(full.getRemotesPerSearchMax())); + assertThat(empty.getRemotesPerSearchAvg(), closeTo(full.getRemotesPerSearchAvg(), 0.01)); + empty.getFeatureCounts().forEach((k, v) -> assertThat(v, equalTo(full.getFeatureCounts().get(k) * 2))); + empty.getClientCounts().forEach((k, v) -> assertThat(v, equalTo(full.getClientCounts().get(k) * 2))); + empty.getByRemoteCluster().forEach((k, v) -> { + assertThat(v.getCount(), equalTo(full.getByRemoteCluster().get(k).getCount() * 2)); + assertThat(v.getSkippedCount(), equalTo(full.getByRemoteCluster().get(k).getSkippedCount() * 2)); + assertThat(v.getTook().count(), equalTo(full.getByRemoteCluster().get(k).getTook().count() * 2)); + }); + } + + public void testAddTwo() { + CCSTelemetrySnapshot empty = new CCSTelemetrySnapshot(); + CCSTelemetrySnapshot full = randomCCSTelemetrySnapshot(); + CCSTelemetrySnapshot full2 = randomCCSTelemetrySnapshot(); + + empty.add(full); + empty.add(full2); + assertThat(empty.getTotalCount(), equalTo(full.getTotalCount() + full2.getTotalCount())); + assertThat(empty.getSuccessCount(), equalTo(full.getSuccessCount() + full2.getSuccessCount())); + empty.getFailureReasons() + .forEach( + (k, v) -> assertThat( + v, + equalTo(full.getFailureReasons().getOrDefault(k, 0L) + full2.getFailureReasons().getOrDefault(k, 0L)) + ) + ); + assertThat(empty.getTook().count(), equalTo(full.getTook().count() + full2.getTook().count())); + assertThat(empty.getTookMrtTrue().count(), equalTo(full.getTookMrtTrue().count() + full2.getTookMrtTrue().count())); + assertThat(empty.getTookMrtFalse().count(), equalTo(full.getTookMrtFalse().count() + full2.getTookMrtFalse().count())); + assertThat( + empty.getSearchCountWithSkippedRemotes(), + equalTo(full.getSearchCountWithSkippedRemotes() + full2.getSearchCountWithSkippedRemotes()) + ); + assertThat(empty.getRemotesPerSearchMax(), equalTo(Math.max(full.getRemotesPerSearchMax(), full2.getRemotesPerSearchMax()))); + double expectedAvg = (full.getRemotesPerSearchAvg() * full.getTotalCount() + full2.getRemotesPerSearchAvg() * full2.getTotalCount()) + / empty.getTotalCount(); + assertThat(empty.getRemotesPerSearchAvg(), closeTo(expectedAvg, 0.01)); + empty.getFeatureCounts() + .forEach( + (k, v) -> assertThat(v, equalTo(full.getFeatureCounts().getOrDefault(k, 0L) + full2.getFeatureCounts().getOrDefault(k, 0L))) + ); + empty.getClientCounts() + .forEach( + (k, v) -> assertThat(v, equalTo(full.getClientCounts().getOrDefault(k, 0L) + full2.getClientCounts().getOrDefault(k, 0L))) + ); + PerClusterCCSTelemetry zeroDummy = new PerClusterCCSTelemetry(); + empty.getByRemoteCluster().forEach((k, v) -> { + assertThat( + v.getCount(), + equalTo( + full.getByRemoteCluster().getOrDefault(k, zeroDummy).getCount() + full2.getByRemoteCluster() + .getOrDefault(k, zeroDummy) + .getCount() + ) + ); + assertThat( + 
v.getSkippedCount(), + equalTo( + full.getByRemoteCluster().getOrDefault(k, zeroDummy).getSkippedCount() + full2.getByRemoteCluster() + .getOrDefault(k, zeroDummy) + .getSkippedCount() + ) + ); + assertThat( + v.getTook().count(), + equalTo( + full.getByRemoteCluster().getOrDefault(k, zeroDummy).getTook().count() + full2.getByRemoteCluster() + .getOrDefault(k, zeroDummy) + .getTook() + .count() + ) + ); + }); + } + + private LongMetricValue manyValuesHistogram(long startingWith) { + LongMetric metric = new LongMetric(); + // Produce 100 values from startingWith to 2 * startingWith with equal intervals + // We need to space values relative to initial value, otherwise the histogram would put them all in one bucket + for (long i = startingWith; i < 2 * startingWith; i += startingWith / 100) { + metric.record(i); + } + return metric.getValue(); + } + + public void testToXContent() throws IOException { + long totalCount = 10; + long successCount = 20; + // Using TreeMap's here to ensure consistent ordering in the JSON output + var failureReasons = new TreeMap<>(Map.of("reason1", 1L, "reason2", 2L, "unknown", 3L)); + LongMetricValue took = manyValuesHistogram(1000); + LongMetricValue tookMrtTrue = manyValuesHistogram(5000); + LongMetricValue tookMrtFalse = manyValuesHistogram(10000); + long skippedRemotes = 5; + long remotesPerSearchMax = 6; + double remotesPerSearchAvg = 7.89; + var featureCounts = new TreeMap<>(Map.of("async", 10L, "mrt", 20L, "wildcard", 30L)); + var clientCounts = new TreeMap<>(Map.of("kibana", 40L, "other", 500L)); + var perClusterCCSTelemetries = new TreeMap<>( + Map.of( + "", + new PerClusterCCSTelemetry(12, 0, manyValuesHistogram(2000)), + "remote1", + new PerClusterCCSTelemetry(100, 22, manyValuesHistogram(2000)), + "remote2", + new PerClusterCCSTelemetry(300, 42, manyValuesHistogram(500000)) + ) + ); + + var snapshot = new CCSTelemetrySnapshot( + totalCount, + successCount, + failureReasons, + took, + tookMrtTrue, + tookMrtFalse, + remotesPerSearchMax, + remotesPerSearchAvg, + skippedRemotes, + featureCounts, + clientCounts, + perClusterCCSTelemetries + ); + String expected = readJSONFromResource("telemetry_test.json"); + assertEquals(expected, snapshot.toString()); + } + + private String readJSONFromResource(String fileName) throws IOException { + try (InputStream inputStream = getClass().getResourceAsStream("/org/elasticsearch/action/admin/cluster/stats/" + fileName)) { + if (inputStream == null) { + throw new IOException("Resource not found: " + fileName); + } + return new String(inputStream.readAllBytes(), StandardCharsets.UTF_8); + } + } +} diff --git a/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetryTests.java b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetryTests.java new file mode 100644 index 0000000000000..bd36f89f38e4d --- /dev/null +++ b/server/src/test/java/org/elasticsearch/action/admin/cluster/stats/CCSUsageTelemetryTests.java @@ -0,0 +1,342 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. 
+ */ + +package org.elasticsearch.action.admin.cluster.stats; + +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.test.ESTestCase; + +import static org.elasticsearch.action.admin.cluster.stats.ApproximateMatcher.closeTo; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.ASYNC_FEATURE; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.KNOWN_CLIENTS; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.MRT_FEATURE; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.Result.CANCELED; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.WILDCARD_FEATURE; +import static org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.greaterThan; + +public class CCSUsageTelemetryTests extends ESTestCase { + + public void testSuccessfulSearchResults() { + CCSUsageTelemetry ccsUsageHolder = new CCSUsageTelemetry(); + + long expectedAsyncCount = 0L; + long expectedMinRTCount = 0L; + long expectedSearchesWithSkippedRemotes = 0L; + long took1 = 0L; + long took1Remote1 = 0L; + + // first search + { + boolean minimizeRoundTrips = randomBoolean(); + boolean async = randomBoolean(); + took1 = randomLongBetween(5, 10000); + boolean skippedRemote = randomBoolean(); + expectedSearchesWithSkippedRemotes = skippedRemote ? 1 : 0; + expectedAsyncCount = async ? 1 : 0; + expectedMinRTCount = minimizeRoundTrips ? 1 : 0; + + // per cluster telemetry + long tookLocal = randomLongBetween(2, 8000); + took1Remote1 = randomLongBetween(2, 8000); + + CCSUsage.Builder builder = new CCSUsage.Builder(); + builder.took(took1).setRemotesCount(1); + if (async) { + builder.setFeature(ASYNC_FEATURE); + } + if (minimizeRoundTrips) { + builder.setFeature(MRT_FEATURE); + } + if (skippedRemote) { + builder.skippedRemote("remote1"); + } + builder.perClusterUsage("(local)", new TimeValue(tookLocal)); + builder.perClusterUsage("remote1", new TimeValue(took1Remote1)); + + CCSUsage ccsUsage = builder.build(); + ccsUsageHolder.updateUsage(ccsUsage); + + CCSTelemetrySnapshot snapshot = ccsUsageHolder.getCCSTelemetrySnapshot(); + + assertThat(snapshot.getTotalCount(), equalTo(1L)); + assertThat(snapshot.getSuccessCount(), equalTo(1L)); + assertThat(snapshot.getFeatureCounts().getOrDefault(ASYNC_FEATURE, 0L), equalTo(expectedAsyncCount)); + assertThat(snapshot.getFeatureCounts().getOrDefault(MRT_FEATURE, 0L), equalTo(expectedMinRTCount)); + assertThat(snapshot.getSearchCountWithSkippedRemotes(), equalTo(expectedSearchesWithSkippedRemotes)); + assertThat(snapshot.getTook().avg(), greaterThan(0L)); + // Expect it to be within 1% of the actual value + assertThat(snapshot.getTook().avg(), closeTo(took1)); + assertThat(snapshot.getTook().max(), closeTo(took1)); + if (minimizeRoundTrips) { + assertThat(snapshot.getTookMrtTrue().count(), equalTo(1L)); + assertThat(snapshot.getTookMrtTrue().avg(), greaterThan(0L)); + assertThat(snapshot.getTookMrtTrue().avg(), closeTo(took1)); + assertThat(snapshot.getTookMrtFalse().count(), equalTo(0L)); + assertThat(snapshot.getTookMrtFalse().max(), equalTo(0L)); + } else { + assertThat(snapshot.getTookMrtFalse().count(), equalTo(1L)); + assertThat(snapshot.getTookMrtFalse().avg(), greaterThan(0L)); + assertThat(snapshot.getTookMrtFalse().avg(), closeTo(took1)); + assertThat(snapshot.getTookMrtTrue().count(), equalTo(0L)); + assertThat(snapshot.getTookMrtTrue().max(), equalTo(0L)); + } + // We currently don't count unknown clients + 
assertThat(snapshot.getClientCounts().size(), equalTo(0)); + + // per cluster telemetry asserts + + var telemetryByCluster = snapshot.getByRemoteCluster(); + assertThat(telemetryByCluster.size(), equalTo(2)); + var localClusterTelemetry = telemetryByCluster.get("(local)"); + assertNotNull(localClusterTelemetry); + assertThat(localClusterTelemetry.getCount(), equalTo(1L)); + assertThat(localClusterTelemetry.getSkippedCount(), equalTo(0L)); + assertThat(localClusterTelemetry.getTook().count(), equalTo(1L)); + assertThat(localClusterTelemetry.getTook().avg(), greaterThan(0L)); + assertThat(localClusterTelemetry.getTook().avg(), closeTo(tookLocal)); + // assertThat(localClusterTelemetry.getTook().max(), greaterThanOrEqualTo(tookLocal)); + + var remote1ClusterTelemetry = telemetryByCluster.get("remote1"); + assertNotNull(remote1ClusterTelemetry); + assertThat(remote1ClusterTelemetry.getCount(), equalTo(1L)); + assertThat(remote1ClusterTelemetry.getSkippedCount(), equalTo(expectedSearchesWithSkippedRemotes)); + assertThat(remote1ClusterTelemetry.getTook().avg(), greaterThan(0L)); + assertThat(remote1ClusterTelemetry.getTook().count(), equalTo(1L)); + assertThat(remote1ClusterTelemetry.getTook().avg(), greaterThan(0L)); + assertThat(remote1ClusterTelemetry.getTook().avg(), closeTo(took1Remote1)); + // assertThat(remote1ClusterTelemetry.getTook().max(), greaterThanOrEqualTo(took1Remote1)); + } + + // second search + { + boolean minimizeRoundTrips = randomBoolean(); + boolean async = randomBoolean(); + expectedAsyncCount += async ? 1 : 0; + expectedMinRTCount += minimizeRoundTrips ? 1 : 0; + long took2 = randomLongBetween(5, 10000); + boolean skippedRemote = randomBoolean(); + expectedSearchesWithSkippedRemotes += skippedRemote ? 1 : 0; + long took2Remote1 = randomLongBetween(2, 8000); + + CCSUsage.Builder builder = new CCSUsage.Builder(); + builder.took(took2).setRemotesCount(1).setClient("kibana"); + if (async) { + builder.setFeature(ASYNC_FEATURE); + } + if (minimizeRoundTrips) { + builder.setFeature(MRT_FEATURE); + } + if (skippedRemote) { + builder.skippedRemote("remote1"); + } + builder.perClusterUsage("remote1", new TimeValue(took2Remote1)); + + CCSUsage ccsUsage = builder.build(); + ccsUsageHolder.updateUsage(ccsUsage); + + CCSTelemetrySnapshot snapshot = ccsUsageHolder.getCCSTelemetrySnapshot(); + + assertThat(snapshot.getTotalCount(), equalTo(2L)); + assertThat(snapshot.getSuccessCount(), equalTo(2L)); + assertThat(snapshot.getFeatureCounts().getOrDefault(ASYNC_FEATURE, 0L), equalTo(expectedAsyncCount)); + assertThat(snapshot.getFeatureCounts().getOrDefault(MRT_FEATURE, 0L), equalTo(expectedMinRTCount)); + assertThat(snapshot.getSearchCountWithSkippedRemotes(), equalTo(expectedSearchesWithSkippedRemotes)); + assertThat(snapshot.getTook().avg(), greaterThan(0L)); + assertThat(snapshot.getTook().avg(), closeTo((took1 + took2) / 2)); + // assertThat(snapshot.getTook().max(), greaterThanOrEqualTo(Math.max(took1, took2))); + + // Counting only known clients + assertThat(snapshot.getClientCounts().get("kibana"), equalTo(1L)); + assertThat(snapshot.getClientCounts().size(), equalTo(1)); + + // per cluster telemetry asserts + + var telemetryByCluster = snapshot.getByRemoteCluster(); + assertThat(telemetryByCluster.size(), equalTo(2)); + var localClusterTelemetry = telemetryByCluster.get("(local)"); + assertNotNull(localClusterTelemetry); + assertThat(localClusterTelemetry.getCount(), equalTo(1L)); + assertThat(localClusterTelemetry.getSkippedCount(), equalTo(0L)); + 
assertThat(localClusterTelemetry.getTook().count(), equalTo(1L)); + + var remote1ClusterTelemetry = telemetryByCluster.get("remote1"); + assertNotNull(remote1ClusterTelemetry); + assertThat(remote1ClusterTelemetry.getCount(), equalTo(2L)); + assertThat(remote1ClusterTelemetry.getSkippedCount(), equalTo(expectedSearchesWithSkippedRemotes)); + assertThat(remote1ClusterTelemetry.getTook().avg(), greaterThan(0L)); + assertThat(remote1ClusterTelemetry.getTook().count(), equalTo(2L)); + assertThat(remote1ClusterTelemetry.getTook().avg(), greaterThan(0L)); + assertThat(remote1ClusterTelemetry.getTook().avg(), closeTo((took1Remote1 + took2Remote1) / 2)); + // assertThat(remote1ClusterTelemetry.getTook().max(), greaterThanOrEqualTo(Math.max(took1Remote1, took2Remote1))); + } + } + + public void testClientsLimit() { + CCSUsageTelemetry ccsUsageHolder = new CCSUsageTelemetry(); + // Add known clients + for (String knownClient : KNOWN_CLIENTS) { + CCSUsage.Builder builder = new CCSUsage.Builder(); + builder.took(randomLongBetween(5, 10000)).setRemotesCount(1).setClient(knownClient); + CCSUsage ccsUsage = builder.build(); + ccsUsageHolder.updateUsage(ccsUsage); + } + var counts = ccsUsageHolder.getCCSTelemetrySnapshot().getClientCounts(); + for (String knownClient : KNOWN_CLIENTS) { + assertThat(counts.get(knownClient), equalTo(1L)); + } + // Check that knowns are counted + for (String knownClient : KNOWN_CLIENTS) { + CCSUsage.Builder builder = new CCSUsage.Builder(); + builder.took(randomLongBetween(5, 10000)).setRemotesCount(1).setClient(knownClient); + CCSUsage ccsUsage = builder.build(); + ccsUsageHolder.updateUsage(ccsUsage); + } + counts = ccsUsageHolder.getCCSTelemetrySnapshot().getClientCounts(); + for (String knownClient : KNOWN_CLIENTS) { + assertThat(counts.get(knownClient), equalTo(2L)); + } + // Check that new clients are not counted + CCSUsage.Builder builder = new CCSUsage.Builder(); + String randomClient = randomAlphaOfLength(10); + builder.took(randomLongBetween(5, 10000)).setRemotesCount(1).setClient(randomClient); + CCSUsage ccsUsage = builder.build(); + ccsUsageHolder.updateUsage(ccsUsage); + counts = ccsUsageHolder.getCCSTelemetrySnapshot().getClientCounts(); + assertThat(counts.get(randomClient), equalTo(null)); + } + + public void testFailures() { + CCSUsageTelemetry ccsUsageHolder = new CCSUsageTelemetry(); + + // first search + { + boolean skippedRemote = randomBoolean(); + boolean minimizeRoundTrips = randomBoolean(); + boolean async = randomBoolean(); + + CCSUsage.Builder builder = new CCSUsage.Builder(); + builder.setRemotesCount(1).took(10L); + if (skippedRemote) { + builder.skippedRemote("remote1"); + } + builder.perClusterUsage("(local)", new TimeValue(1)); + builder.perClusterUsage("remote1", new TimeValue(2)); + builder.setFailure(CANCELED); + if (async) { + builder.setFeature(ASYNC_FEATURE); + } + if (minimizeRoundTrips) { + builder.setFeature(MRT_FEATURE); + } + + CCSUsage ccsUsage = builder.build(); + ccsUsageHolder.updateUsage(ccsUsage); + + CCSTelemetrySnapshot snapshot = ccsUsageHolder.getCCSTelemetrySnapshot(); + + assertThat(snapshot.getTotalCount(), equalTo(1L)); + assertThat(snapshot.getSuccessCount(), equalTo(0L)); + assertThat(snapshot.getSearchCountWithSkippedRemotes(), equalTo(skippedRemote ? 
1L : 0L));
+            assertThat(snapshot.getTook().count(), equalTo(0L));
+            assertThat(snapshot.getFailureReasons().size(), equalTo(1));
+            assertThat(snapshot.getFailureReasons().get(CANCELED.getName()), equalTo(1L));
+            // still counting features on failure
+            assertThat(snapshot.getFeatureCounts().getOrDefault(ASYNC_FEATURE, 0L), equalTo(async ? 1L : 0L));
+            assertThat(snapshot.getFeatureCounts().getOrDefault(MRT_FEATURE, 0L), equalTo(minimizeRoundTrips ? 1L : 0L));
+        }
+
+        // second search
+        {
+            CCSUsage.Builder builder = new CCSUsage.Builder();
+            boolean skippedRemote = randomBoolean();
+            builder.setRemotesCount(1).took(10L).setClient("kibana");
+            if (skippedRemote) {
+                builder.skippedRemote("remote1");
+            }
+            builder.setFailure(CANCELED);
+            CCSUsage ccsUsage = builder.build();
+
+            ccsUsageHolder.updateUsage(ccsUsage);
+
+            CCSTelemetrySnapshot snapshot = ccsUsageHolder.getCCSTelemetrySnapshot();
+
+            assertThat(snapshot.getTotalCount(), equalTo(2L));
+            assertThat(snapshot.getSuccessCount(), equalTo(0L));
+            assertThat(snapshot.getTook().count(), equalTo(0L));
+            assertThat(snapshot.getFailureReasons().size(), equalTo(1));
+            assertThat(snapshot.getFailureReasons().get(CANCELED.getName()), equalTo(2L));
+            assertThat(snapshot.getClientCounts().get("kibana"), equalTo(1L));
+        }
+    }
+
+    public void testConcurrentUpdates() throws InterruptedException {
+        CCSUsageTelemetry ccsUsageHolder = new CCSUsageTelemetry();
+        CCSUsageTelemetry expectedHolder = new CCSUsageTelemetry();
+        int numSearches = randomIntBetween(1000, 5000);
+        int numThreads = randomIntBetween(10, 20);
+        Thread[] threads = new Thread[numThreads];
+        CCSUsage[] ccsUsages = new CCSUsage[numSearches];
+
+        // Make random usage objects
+        for (int i = 0; i < numSearches; i++) {
+            CCSUsage.Builder builder = new CCSUsage.Builder();
+            builder.took(randomLongBetween(5, 10000)).setRemotesCount(randomIntBetween(1, 10));
+            if (randomBoolean()) {
+                builder.setFeature(ASYNC_FEATURE);
+            }
+            if (randomBoolean()) {
+                builder.setFeature(WILDCARD_FEATURE);
+            }
+            if (randomBoolean()) {
+                builder.setFeature(MRT_FEATURE);
+            }
+            if (randomBoolean()) {
+                builder.setClient("kibana");
+            }
+            if (randomInt(20) == 7) {
+                // roughly 5% of requests will fail
+                builder.setFailure(randomFrom(CCSUsageTelemetry.Result.values()));
+                ccsUsages[i] = builder.build();
+                continue;
+            }
+            builder.perClusterUsage("", new TimeValue(randomLongBetween(1, 10000)));
+            if (randomBoolean()) {
+                builder.skippedRemote("remote1");
+            } else {
+                builder.perClusterUsage("remote1", new TimeValue(randomLongBetween(1, 10000)));
+            }
+            builder.perClusterUsage(randomFrom("remote2", "remote3", "remote4"), new TimeValue(randomLongBetween(1, 10000)));
+            ccsUsages[i] = builder.build();
+        }
+
+        // Add each of the search objects to the telemetry holder in a different thread
+        for (int i = 0; i < numThreads; i++) {
+            final int threadNo = i;
+            threads[i] = new Thread(() -> {
+                for (int j = threadNo; j < numSearches; j += numThreads) {
+                    ccsUsageHolder.updateUsage(ccsUsages[j]);
+                }
+            });
+            threads[i].start();
+        }
+
+        for (int i = 0; i < numThreads; i++) {
+            threads[i].join();
+        }
+
+        // Add the same search objects to the expected holder in a single thread
+        for (int i = 0; i < numSearches; i++) {
+            expectedHolder.updateUsage(ccsUsages[i]);
+        }
+
+        CCSTelemetrySnapshot snapshot = ccsUsageHolder.getCCSTelemetrySnapshot();
+        CCSTelemetrySnapshot expectedSnapshot = expectedHolder.getCCSTelemetrySnapshot();
+        assertThat(snapshot, equalTo(expectedSnapshot));
+    }
+}
diff --git 
a/server/src/test/java/org/elasticsearch/action/search/TransportSearchActionTests.java b/server/src/test/java/org/elasticsearch/action/search/TransportSearchActionTests.java index 487d8c6f3a7ee..f68e5f06bcf08 100644 --- a/server/src/test/java/org/elasticsearch/action/search/TransportSearchActionTests.java +++ b/server/src/test/java/org/elasticsearch/action/search/TransportSearchActionTests.java @@ -99,6 +99,7 @@ import org.elasticsearch.transport.TransportRequest; import org.elasticsearch.transport.TransportRequestOptions; import org.elasticsearch.transport.TransportService; +import org.elasticsearch.usage.UsageService; import java.io.IOException; import java.util.ArrayList; @@ -1765,7 +1766,8 @@ protected void doWriteTo(StreamOutput out) throws IOException { null, new SearchTransportAPMMetrics(TelemetryProvider.NOOP.getMeterRegistry()), new SearchResponseMetrics(TelemetryProvider.NOOP.getMeterRegistry()), - client + client, + new UsageService() ); CountDownLatch latch = new CountDownLatch(1); diff --git a/server/src/test/java/org/elasticsearch/snapshots/SnapshotResiliencyTests.java b/server/src/test/java/org/elasticsearch/snapshots/SnapshotResiliencyTests.java index c6086a8259fbb..f5e69a65a6d06 100644 --- a/server/src/test/java/org/elasticsearch/snapshots/SnapshotResiliencyTests.java +++ b/server/src/test/java/org/elasticsearch/snapshots/SnapshotResiliencyTests.java @@ -196,6 +196,7 @@ import org.elasticsearch.transport.TransportRequest; import org.elasticsearch.transport.TransportRequestHandler; import org.elasticsearch.transport.TransportService; +import org.elasticsearch.usage.UsageService; import org.elasticsearch.xcontent.NamedXContentRegistry; import org.junit.After; import org.junit.Before; @@ -2059,6 +2060,8 @@ private final class TestClusterNode { private final BigArrays bigArrays; + private final UsageService usageService; + private Coordinator coordinator; TestClusterNode(DiscoveryNode node, TransportInterceptorFactory transportInterceptorFactory) throws IOException { @@ -2069,6 +2072,7 @@ private final class TestClusterNode { masterService = new FakeThreadPoolMasterService(node.getName(), threadPool, deterministicTaskQueue::scheduleNow); final Settings settings = environment.settings(); client = new NodeClient(settings, threadPool); + this.usageService = new UsageService(); final ClusterSettings clusterSettings = new ClusterSettings(settings, ClusterSettings.BUILT_IN_CLUSTER_SETTINGS); clusterService = new ClusterService( settings, @@ -2486,7 +2490,8 @@ public RecyclerBytesStreamOutput newNetworkBytesStream() { EmptySystemIndices.INSTANCE.getExecutorSelector(), new SearchTransportAPMMetrics(TelemetryProvider.NOOP.getMeterRegistry()), new SearchResponseMetrics(TelemetryProvider.NOOP.getMeterRegistry()), - client + client, + usageService ) ); actions.put( diff --git a/server/src/test/resources/org/elasticsearch/action/admin/cluster/stats/telemetry_test.json b/server/src/test/resources/org/elasticsearch/action/admin/cluster/stats/telemetry_test.json new file mode 100644 index 0000000000000..fe9c77cb2a183 --- /dev/null +++ b/server/src/test/resources/org/elasticsearch/action/admin/cluster/stats/telemetry_test.json @@ -0,0 +1,67 @@ +{ + "_search" : { + "total" : 10, + "success" : 20, + "skipped" : 5, + "took" : { + "max" : 1991, + "avg" : 1496, + "p90" : 1895 + }, + "took_mrt_true" : { + "max" : 9983, + "avg" : 7476, + "p90" : 9471 + }, + "took_mrt_false" : { + "max" : 19967, + "avg" : 14952, + "p90" : 18943 + }, + "remotes_per_search_max" : 6, + "remotes_per_search_avg" : 7.89, + 
"failure_reasons" : { + "reason1" : 1, + "reason2" : 2, + "unknown" : 3 + }, + "features" : { + "async" : 10, + "mrt" : 20, + "wildcard" : 30 + }, + "clients" : { + "kibana" : 40, + "other" : 500 + }, + "clusters" : { + "(local)" : { + "total" : 12, + "skipped" : 0, + "took" : { + "max" : 3983, + "avg" : 2992, + "p90" : 3791 + } + }, + "remote1" : { + "total" : 100, + "skipped" : 22, + "took" : { + "max" : 3983, + "avg" : 2992, + "p90" : 3791 + } + }, + "remote2" : { + "total" : 300, + "skipped" : 42, + "took" : { + "max" : 995327, + "avg" : 747531, + "p90" : 946175 + } + } + } + } +} \ No newline at end of file diff --git a/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java b/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java new file mode 100644 index 0000000000000..ac0b26cb4f4cd --- /dev/null +++ b/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java @@ -0,0 +1,370 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. + */ + +package org.elasticsearch.xpack.search; + +import org.elasticsearch.action.ActionFuture; +import org.elasticsearch.action.admin.cluster.node.tasks.cancel.CancelTasksRequest; +import org.elasticsearch.action.admin.cluster.node.tasks.list.ListTasksResponse; +import org.elasticsearch.action.admin.cluster.stats.CCSTelemetrySnapshot; +import org.elasticsearch.action.search.TransportSearchAction; +import org.elasticsearch.client.internal.Client; +import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.core.TimeValue; +import org.elasticsearch.index.query.MatchAllQueryBuilder; +import org.elasticsearch.plugins.Plugin; +import org.elasticsearch.search.builder.SearchSourceBuilder; +import org.elasticsearch.tasks.CancellableTask; +import org.elasticsearch.tasks.TaskInfo; +import org.elasticsearch.test.AbstractMultiClustersTestCase; +import org.elasticsearch.test.InternalTestCluster; +import org.elasticsearch.transport.TransportService; +import org.elasticsearch.usage.UsageService; +import org.elasticsearch.xpack.async.AsyncResultsIndexPlugin; +import org.elasticsearch.xpack.core.LocalStateCompositeXPackPlugin; +import org.elasticsearch.xpack.core.async.GetAsyncResultRequest; +import org.elasticsearch.xpack.core.search.action.AsyncSearchResponse; +import org.elasticsearch.xpack.core.search.action.GetAsyncSearchAction; +import org.elasticsearch.xpack.core.search.action.SubmitAsyncSearchAction; +import org.elasticsearch.xpack.core.search.action.SubmitAsyncSearchRequest; +import org.hamcrest.Matchers; +import org.junit.Before; + +import java.util.Arrays; +import java.util.Collection; +import java.util.HashMap; +import java.util.List; +import java.util.Map; +import java.util.concurrent.atomic.AtomicReference; +import java.util.stream.Collectors; +import java.util.stream.Stream; + +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.ASYNC_FEATURE; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.MRT_FEATURE; +import static org.elasticsearch.action.admin.cluster.stats.CCSUsageTelemetry.Result.CANCELED; +import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertAcked; +import static 
org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.greaterThan; + +public class CCSUsageTelemetryAsyncSearchIT extends AbstractMultiClustersTestCase { + private static final String REMOTE1 = "cluster-a"; + private static final String REMOTE2 = "cluster-b"; + + @Override + protected boolean reuseClusters() { + return false; + } + + @Override + protected Collection remoteClusterAlias() { + return List.of(REMOTE1, REMOTE2); + } + + @Override + protected Map skipUnavailableForRemoteClusters() { + return Map.of(REMOTE1, true, REMOTE2, true); + } + + @Override + protected Collection> nodePlugins(String clusterAlias) { + List> plugs = Arrays.asList( + CrossClusterAsyncSearchIT.SearchListenerPlugin.class, + AsyncSearch.class, + AsyncResultsIndexPlugin.class, + LocalStateCompositeXPackPlugin.class, + CrossClusterAsyncSearchIT.TestQueryBuilderPlugin.class + ); + return Stream.concat(super.nodePlugins(clusterAlias).stream(), plugs.stream()).collect(Collectors.toList()); + } + + @Before + public void resetSearchListenerPlugin() { + CrossClusterAsyncSearchIT.SearchListenerPlugin.reset(); + } + + private SubmitAsyncSearchRequest makeSearchRequest(String... indices) { + CrossClusterAsyncSearchIT.SearchListenerPlugin.blockQueryPhase(); + + SubmitAsyncSearchRequest request = new SubmitAsyncSearchRequest(indices); + request.setCcsMinimizeRoundtrips(randomBoolean()); + request.setWaitForCompletionTimeout(TimeValue.timeValueMillis(1)); + request.setKeepOnCompletion(true); + request.getSearchRequest().allowPartialSearchResults(false); + request.getSearchRequest().source(new SearchSourceBuilder().query(new MatchAllQueryBuilder()).size(10)); + if (randomBoolean()) { + request.setBatchedReduceSize(randomIntBetween(2, 256)); + } + + return request; + } + + /** + * Run async search request and get telemetry from it + */ + private CCSTelemetrySnapshot getTelemetryFromSearch(SubmitAsyncSearchRequest searchRequest) throws Exception { + // We want to send search to a specific node (we don't care which one) so that we could + // collect the CCS telemetry from it later + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + final AsyncSearchResponse response = cluster(LOCAL_CLUSTER).client(nodeName) + .execute(SubmitAsyncSearchAction.INSTANCE, searchRequest) + .get(); + // We don't care here too much about the response, we just want to trigger the telemetry collection. + // So we check it's not null and leave the rest to other tests. 
+ final String responseId; + try { + assertNotNull(response.getSearchResponse()); + responseId = response.getId(); + } finally { + response.decRef(); + } + waitForSearchTasksToFinish(); + final AsyncSearchResponse finishedResponse = cluster(LOCAL_CLUSTER).client(nodeName) + .execute(GetAsyncSearchAction.INSTANCE, new GetAsyncResultRequest(responseId)) + .get(); + try { + assertNotNull(finishedResponse.getSearchResponse()); + } finally { + finishedResponse.decRef(); + } + return getTelemetrySnapshot(nodeName); + + } + + private void waitForSearchTasksToFinish() throws Exception { + assertBusy(() -> { + ListTasksResponse listTasksResponse = client(LOCAL_CLUSTER).admin() + .cluster() + .prepareListTasks() + .setActions(TransportSearchAction.TYPE.name()) + .get(); + List tasks = listTasksResponse.getTasks(); + assertThat(tasks.size(), equalTo(0)); + + for (String clusterAlias : remoteClusterAlias()) { + ListTasksResponse remoteTasksResponse = client(clusterAlias).admin() + .cluster() + .prepareListTasks() + .setActions(TransportSearchAction.TYPE.name()) + .get(); + List remoteTasks = remoteTasksResponse.getTasks(); + assertThat(remoteTasks.size(), equalTo(0)); + } + }); + + assertBusy(() -> { + for (String clusterAlias : remoteClusterAlias()) { + final Iterable transportServices = cluster(clusterAlias).getInstances(TransportService.class); + for (TransportService transportService : transportServices) { + assertThat(transportService.getTaskManager().getBannedTaskIds(), Matchers.empty()); + } + } + }); + } + + /** + * Create search request for indices and get telemetry from it + */ + private CCSTelemetrySnapshot getTelemetryFromSearch(String... indices) throws Exception { + return getTelemetryFromSearch(makeSearchRequest(indices)); + } + + /** + * Async search on all remotes + */ + public void testAllRemotesSearch() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SubmitAsyncSearchRequest searchRequest = makeSearchRequest(localIndex, "*:" + remoteIndex); + boolean minimizeRoundtrips = TransportSearchAction.shouldMinimizeRoundtrips(searchRequest.getSearchRequest()); + CrossClusterAsyncSearchIT.SearchListenerPlugin.negate(); + + CCSTelemetrySnapshot telemetry = getTelemetryFromSearch(searchRequest); + + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(1L)); + assertThat(telemetry.getFailureReasons().size(), equalTo(0)); + assertThat(telemetry.getTook().count(), equalTo(1L)); + assertThat(telemetry.getTookMrtTrue().count(), equalTo(minimizeRoundtrips ? 1L : 0L)); + assertThat(telemetry.getTookMrtFalse().count(), equalTo(minimizeRoundtrips ? 
0L : 1L)); + assertThat(telemetry.getRemotesPerSearchAvg(), equalTo(2.0)); + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(2L)); + assertThat(telemetry.getSearchCountWithSkippedRemotes(), equalTo(0L)); + assertThat(telemetry.getFeatureCounts().get(ASYNC_FEATURE), equalTo(1L)); + if (minimizeRoundtrips) { + assertThat(telemetry.getFeatureCounts().get(MRT_FEATURE), equalTo(1L)); + } else { + assertThat(telemetry.getFeatureCounts().get(MRT_FEATURE), equalTo(null)); + } + var perCluster = telemetry.getByRemoteCluster(); + assertThat(perCluster.size(), equalTo(3)); + for (String clusterAlias : remoteClusterAlias()) { + var clusterTelemetry = perCluster.get(clusterAlias); + assertThat(clusterTelemetry.getCount(), equalTo(1L)); + assertThat(clusterTelemetry.getSkippedCount(), equalTo(0L)); + assertThat(clusterTelemetry.getTook().count(), equalTo(1L)); + } + } + + /** + * Search that is cancelled + */ + public void testCancelledSearch() throws Exception { + Map testClusterInfo = setupClusters(); + String localIndex = (String) testClusterInfo.get("local.index"); + String remoteIndex = (String) testClusterInfo.get("remote.index"); + + SubmitAsyncSearchRequest searchRequest = makeSearchRequest(localIndex, REMOTE1 + ":" + remoteIndex); + CrossClusterAsyncSearchIT.SearchListenerPlugin.blockQueryPhase(); + + String nodeName = cluster(LOCAL_CLUSTER).getRandomNodeName(); + final AsyncSearchResponse response = cluster(LOCAL_CLUSTER).client(nodeName) + .execute(SubmitAsyncSearchAction.INSTANCE, searchRequest) + .get(); + try { + assertNotNull(response.getSearchResponse()); + } finally { + response.decRef(); + assertTrue(response.isRunning()); + } + CrossClusterAsyncSearchIT.SearchListenerPlugin.waitSearchStarted(); + + ActionFuture cancelFuture; + try { + ListTasksResponse listTasksResponse = client(LOCAL_CLUSTER).admin() + .cluster() + .prepareListTasks() + .setActions(TransportSearchAction.TYPE.name()) + .get(); + List tasks = listTasksResponse.getTasks(); + assertThat(tasks.size(), equalTo(1)); + final TaskInfo rootTask = tasks.get(0); + + AtomicReference> remoteClusterSearchTasks = new AtomicReference<>(); + assertBusy(() -> { + List remoteSearchTasks = client(REMOTE1).admin() + .cluster() + .prepareListTasks() + .get() + .getTasks() + .stream() + .filter(t -> t.action().contains(TransportSearchAction.TYPE.name())) + .collect(Collectors.toList()); + assertThat(remoteSearchTasks.size(), greaterThan(0)); + remoteClusterSearchTasks.set(remoteSearchTasks); + }); + + for (TaskInfo taskInfo : remoteClusterSearchTasks.get()) { + assertFalse("taskInfo on remote cluster should not be cancelled yet: " + taskInfo, taskInfo.cancelled()); + } + + final CancelTasksRequest cancelRequest = new CancelTasksRequest().setTargetTaskId(rootTask.taskId()); + cancelRequest.setWaitForCompletion(randomBoolean()); + cancelFuture = client().admin().cluster().cancelTasks(cancelRequest); + assertBusy(() -> { + final Iterable transportServices = cluster(REMOTE1).getInstances(TransportService.class); + for (TransportService transportService : transportServices) { + Collection cancellableTasks = transportService.getTaskManager().getCancellableTasks().values(); + for (CancellableTask cancellableTask : cancellableTasks) { + if (cancellableTask.getAction().contains(TransportSearchAction.TYPE.name())) { + assertTrue(cancellableTask.getDescription(), cancellableTask.isCancelled()); + } + } + } + }); + + List remoteSearchTasksAfterCancellation = client(REMOTE1).admin() + .cluster() + .prepareListTasks() + .get() + .getTasks() + 
.stream() + .filter(t -> t.action().contains(TransportSearchAction.TYPE.name())) + .toList(); + for (TaskInfo taskInfo : remoteSearchTasksAfterCancellation) { + assertTrue(taskInfo.description(), taskInfo.cancelled()); + } + } finally { + CrossClusterAsyncSearchIT.SearchListenerPlugin.allowQueryPhase(); + } + + assertBusy(() -> assertTrue(cancelFuture.isDone())); + waitForSearchTasksToFinish(); + + CCSTelemetrySnapshot telemetry = getTelemetrySnapshot(nodeName); + assertThat(telemetry.getTotalCount(), equalTo(1L)); + assertThat(telemetry.getSuccessCount(), equalTo(0L)); + assertThat(telemetry.getFailureReasons().size(), equalTo(1)); + assertThat(telemetry.getFailureReasons().get(CANCELED.getName()), equalTo(1L)); + assertThat(telemetry.getTook().count(), equalTo(0L)); + assertThat(telemetry.getRemotesPerSearchAvg(), equalTo(1.0)); + assertThat(telemetry.getRemotesPerSearchMax(), equalTo(1L)); + // Still counts as async search + assertThat(telemetry.getFeatureCounts().get(ASYNC_FEATURE), equalTo(1L)); + } + + private CCSTelemetrySnapshot getTelemetrySnapshot(String nodeName) { + var usage = cluster(LOCAL_CLUSTER).getInstance(UsageService.class, nodeName); + return usage.getCcsUsageHolder().getCCSTelemetrySnapshot(); + } + + private Map setupClusters() { + String localIndex = "demo"; + int numShardsLocal = randomIntBetween(2, 10); + Settings localSettings = indexSettings(numShardsLocal, randomIntBetween(0, 1)).build(); + assertAcked( + client(LOCAL_CLUSTER).admin() + .indices() + .prepareCreate(localIndex) + .setSettings(localSettings) + .setMapping("@timestamp", "type=date", "f", "type=text") + ); + indexDocs(client(LOCAL_CLUSTER), localIndex); + + String remoteIndex = "prod"; + int numShardsRemote = randomIntBetween(2, 10); + for (String clusterAlias : remoteClusterAlias()) { + final InternalTestCluster remoteCluster = cluster(clusterAlias); + remoteCluster.ensureAtLeastNumDataNodes(randomIntBetween(1, 3)); + assertAcked( + client(clusterAlias).admin() + .indices() + .prepareCreate(remoteIndex) + .setSettings(indexSettings(numShardsRemote, randomIntBetween(0, 1))) + .setMapping("@timestamp", "type=date", "f", "type=text") + ); + assertFalse( + client(clusterAlias).admin() + .cluster() + .prepareHealth(remoteIndex) + .setWaitForYellowStatus() + .setTimeout(TimeValue.timeValueSeconds(10)) + .get() + .isTimedOut() + ); + indexDocs(client(clusterAlias), remoteIndex); + } + + Map clusterInfo = new HashMap<>(); + clusterInfo.put("local.num_shards", numShardsLocal); + clusterInfo.put("local.index", localIndex); + clusterInfo.put("remote.num_shards", numShardsRemote); + clusterInfo.put("remote.index", remoteIndex); + clusterInfo.put("remote.skip_unavailable", true); + return clusterInfo; + } + + private int indexDocs(Client client, String index) { + int numDocs = between(5, 20); + for (int i = 0; i < numDocs; i++) { + client.prepareIndex(index).setSource("f", "v", "@timestamp", randomNonNegativeLong()).get(); + } + client.admin().indices().prepareRefresh(index).get(); + return numDocs; + } +} From 0fe220a075f4594cedf248e1ec1fe8acaefef165 Mon Sep 17 00:00:00 2001 From: Oleksandr Kolomiiets Date: Wed, 28 Aug 2024 12:59:46 -0700 Subject: [PATCH 017/144] Hide new test behind a feature (#112301) --- muted-tests.yml | 3 --- .../rest-api-spec/test/indices.create/20_synthetic_source.yml | 4 ++-- .../java/org/elasticsearch/index/mapper/MapperFeatures.java | 3 ++- .../org/elasticsearch/index/mapper/SourceFieldMapper.java | 3 +++ 4 files changed, 7 insertions(+), 6 deletions(-) diff --git a/muted-tests.yml 
b/muted-tests.yml index 6498413e33cf5..602a377ce5c9f 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -160,9 +160,6 @@ tests: - class: org.elasticsearch.xpack.ml.integration.MlJobIT method: testDeleteJobAsync issue: https://github.com/elastic/elasticsearch/issues/112212 -- class: org.elasticsearch.backwards.MixedClusterClientYamlTestSuiteIT - method: test {p0=indices.create/20_synthetic_source/stored field under object with store_array_source} - issue: https://github.com/elastic/elasticsearch/issues/112264 - class: org.elasticsearch.search.query.ScriptScoreQueryTests method: testScriptTermStatsAvailable issue: https://github.com/elastic/elasticsearch/issues/112278 diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/indices.create/20_synthetic_source.yml b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/indices.create/20_synthetic_source.yml index a696f3b2b3224..fa08efe402b43 100644 --- a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/indices.create/20_synthetic_source.yml +++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/indices.create/20_synthetic_source.yml @@ -1342,8 +1342,8 @@ subobjects auto: # 112156 stored field under object with store_array_source: - requires: - cluster_features: ["mapper.track_ignored_source"] - reason: requires tracking ignored source + cluster_features: ["mapper.source.synthetic_source_stored_fields_advance_fix"] + reason: requires bug fix to be implemented - do: indices.create: diff --git a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java index 7810fcdc64773..6dce9d6c7b86e 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java @@ -32,7 +32,8 @@ public Set getFeatures() { IndexModeFieldMapper.QUERYING_INDEX_MODE, NodeMappingStats.SEGMENT_LEVEL_FIELDS_STATS, BooleanFieldMapper.BOOLEAN_DIMENSION, - ObjectMapper.SUBOBJECTS_AUTO + ObjectMapper.SUBOBJECTS_AUTO, + SourceFieldMapper.SYNTHETIC_SOURCE_STORED_FIELDS_ADVANCE_FIX ); } } diff --git a/server/src/main/java/org/elasticsearch/index/mapper/SourceFieldMapper.java b/server/src/main/java/org/elasticsearch/index/mapper/SourceFieldMapper.java index 908108bce31da..8d34d3188a388 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/SourceFieldMapper.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/SourceFieldMapper.java @@ -38,6 +38,9 @@ public class SourceFieldMapper extends MetadataFieldMapper { public static final NodeFeature SYNTHETIC_SOURCE_FALLBACK = new NodeFeature("mapper.source.synthetic_source_fallback"); + public static final NodeFeature SYNTHETIC_SOURCE_STORED_FIELDS_ADVANCE_FIX = new NodeFeature( + "mapper.source.synthetic_source_stored_fields_advance_fix" + ); public static final String NAME = "_source"; public static final String RECOVERY_SOURCE_NAME = "_recovery_source"; From 8f6697e6da28653abc3e123f7dc8c935ef9e2ac8 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Thu, 29 Aug 2024 06:10:26 +1000 Subject: [PATCH 018/144] Mute org.elasticsearch.search.retriever.rankdoc.RankDocsSortBuilderTests testEqualsAndHashcode #112312 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 602a377ce5c9f..231b3e044379a 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -166,6 +166,9 @@ tests: - class: 
org.elasticsearch.search.query.ScriptScoreQueryTests method: testScriptTermStatsNotAvailable issue: https://github.com/elastic/elasticsearch/issues/112290 +- class: org.elasticsearch.search.retriever.rankdoc.RankDocsSortBuilderTests + method: testEqualsAndHashcode + issue: https://github.com/elastic/elasticsearch/issues/112312 # Examples: # From a8fbc10fe10257c1616325cdf0c6c5add6d7c53a Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Thu, 29 Aug 2024 06:20:29 +1000 Subject: [PATCH 019/144] Mute org.elasticsearch.blobcache.shared.SharedBlobCacheServiceTests testGetMultiThreaded #112314 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 231b3e044379a..7feefa1255f48 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -169,6 +169,9 @@ tests: - class: org.elasticsearch.search.retriever.rankdoc.RankDocsSortBuilderTests method: testEqualsAndHashcode issue: https://github.com/elastic/elasticsearch/issues/112312 +- class: org.elasticsearch.blobcache.shared.SharedBlobCacheServiceTests + method: testGetMultiThreaded + issue: https://github.com/elastic/elasticsearch/issues/112314 # Examples: # From 9bf5f61fbb98e5fad6fbf4a2f9945131b67d8046 Mon Sep 17 00:00:00 2001 From: Lee Hinman Date: Wed, 28 Aug 2024 14:48:25 -0600 Subject: [PATCH 020/144] Mute SharedBlobCacheServiceTests.testGetMultiThreaded (#112315) Relates to https://github.com/elastic/elasticsearch/issues/112305 --- .../blobcache/shared/SharedBlobCacheServiceTests.java | 1 + 1 file changed, 1 insertion(+) diff --git a/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java b/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java index d7e8ad19382e5..0f3804baef42b 100644 --- a/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java +++ b/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java @@ -444,6 +444,7 @@ public void testMassiveDecay() throws IOException { * Exercise SharedBlobCacheService#get in multiple threads to trigger any assertion errors. 
     * @throws IOException
      */
+    @AwaitsFix(bugUrl = "https://github.com/elastic/elasticsearch/issues/112305")
     public void testGetMultiThreaded() throws IOException {
         final int threads = between(2, 10);
         final int regionCount = between(1, 20);

From 56a1ae5c14a4f7ee48837d4216f08895051f6fdb Mon Sep 17 00:00:00 2001
From: Lee Hinman
Date: Wed, 28 Aug 2024 15:02:13 -0600
Subject: [PATCH 021/144] Mute ThreadContextTests.testDropWarningsExceedingMaxSettings (#112316)

Relates to https://github.com/elastic/elasticsearch/issues/112256

---
 .../elasticsearch/common/util/concurrent/ThreadContextTests.java | 1 +
 1 file changed, 1 insertion(+)

diff --git a/server/src/test/java/org/elasticsearch/common/util/concurrent/ThreadContextTests.java b/server/src/test/java/org/elasticsearch/common/util/concurrent/ThreadContextTests.java
index 88e3125655df0..568fa3e36c769 100644
--- a/server/src/test/java/org/elasticsearch/common/util/concurrent/ThreadContextTests.java
+++ b/server/src/test/java/org/elasticsearch/common/util/concurrent/ThreadContextTests.java
@@ -638,6 +638,7 @@ public void testResponseHeaders() {
         }
     }
 
+    @AwaitsFix(bugUrl = "https://github.com/elastic/elasticsearch/issues/112256")
     public void testDropWarningsExceedingMaxSettings() {
         Settings settings = Settings.builder()
             .put(HttpTransportSettings.SETTING_HTTP_MAX_WARNING_HEADER_COUNT.getKey(), 1)

From 889e641d9c58283e02791acfeb714f670e990402 Mon Sep 17 00:00:00 2001
From: Armin Braun
Date: Wed, 28 Aug 2024 23:30:57 +0200
Subject: [PATCH 022/144] Fix DLS over Runtime Fields (#112260)

There is a DLS query referencing a runtime field loaded from _source;
when we create the collector manager we retrieve numDocs, which triggers
going through all segments and executing the script for each document.
StoredFieldSourceProvider relies on leaf ordinals to build an array, but
those ordinals are not populated when computing numDocs via
BaseCompositeReader, because that goes through the subreader contexts
and not the top-level context leaves (a subtle difference that bites us
there).
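To make the subtlety concrete, here is a minimal editor's sketch
(illustrative only, not code from this change; the class and method
names are invented for the example) of how the same segment can surface
as two distinct LeafReaderContext objects once a composite reader wraps
another composite reader, which is why an ord-indexed array sized from
one context tree can be wrong for the other, and why the fix below keys
the per-segment cache by ctx.id() instead:

    import java.io.IOException;
    import org.apache.lucene.index.DirectoryReader;
    import org.apache.lucene.index.LeafReaderContext;
    import org.apache.lucene.index.MultiReader;
    import org.apache.lucene.store.Directory;

    class LeafContextSketch {
        // Sketch only; assumes plain Lucene readers over an already-built index.
        static void demo(Directory directory) throws IOException {
            DirectoryReader inner = DirectoryReader.open(directory);
            try (MultiReader outer = new MultiReader(inner)) { // composite wrapping a composite
                LeafReaderContext viaOuter = outer.leaves().get(0); // context built for the outer tree
                LeafReaderContext viaInner = inner.leaves().get(0); // inner tree, same segment
                assert viaOuter.reader() == viaInner.reader();      // same underlying segment reader
                assert viaOuter != viaInner;                        // but distinct contexts: parent (and
                                                                    // possibly ord) differ between trees
            }
        }
    }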
Fixes #111637
---
 docs/changelog/112260.yaml | 6 +++
 .../lookup/StoredFieldSourceProvider.java | 37 ++++-----
 .../DocumentLevelSecurityRandomTests.java | 46 +++++++++++++++++--
 3 files changed, 59 insertions(+), 30 deletions(-)
 create mode 100644 docs/changelog/112260.yaml

diff --git a/docs/changelog/112260.yaml b/docs/changelog/112260.yaml
new file mode 100644
index 0000000000000..3f5642188a367
--- /dev/null
+++ b/docs/changelog/112260.yaml
@@ -0,0 +1,6 @@
+pr: 112260
+summary: Fix DLS over Runtime Fields
+area: "Authorization"
+type: bug
+issues:
+  - 111637
diff --git a/server/src/main/java/org/elasticsearch/search/lookup/StoredFieldSourceProvider.java b/server/src/main/java/org/elasticsearch/search/lookup/StoredFieldSourceProvider.java
index 7516ab93f75a5..6f38669edf716 100644
--- a/server/src/main/java/org/elasticsearch/search/lookup/StoredFieldSourceProvider.java
+++ b/server/src/main/java/org/elasticsearch/search/lookup/StoredFieldSourceProvider.java
@@ -8,12 +8,13 @@
 
 package org.elasticsearch.search.lookup;
 
-import org.apache.lucene.index.IndexReaderContext;
 import org.apache.lucene.index.LeafReaderContext;
+import org.elasticsearch.common.util.concurrent.ConcurrentCollections;
 import org.elasticsearch.index.fieldvisitor.LeafStoredFieldLoader;
 import org.elasticsearch.index.fieldvisitor.StoredFieldLoader;
 
 import java.io.IOException;
+import java.util.Map;
 
 // NB This is written under the assumption that individual segments are accessed by a single
 // thread, even if separate segments may be searched concurrently. If we ever implement
@@ -21,7 +22,7 @@ class StoredFieldSourceProvider implements SourceProvider {
 
     private final StoredFieldLoader storedFieldLoader;
-    private volatile LeafStoredFieldSourceProvider[] leaves;
+    private final Map<Object, LeafStoredFieldSourceProvider> leaves = ConcurrentCollections.newConcurrentMap();
 
     StoredFieldSourceProvider(StoredFieldLoader storedFieldLoader) {
         this.storedFieldLoader = storedFieldLoader;
@@ -29,32 +30,14 @@ class StoredFieldSourceProvider implements SourceProvider {
 
     @Override
     public Source getSource(LeafReaderContext ctx, int doc) throws IOException {
-        LeafStoredFieldSourceProvider[] leaves = getLeavesUnderLock(findParentContext(ctx));
-        if (leaves[ctx.ord] == null) {
-            // individual segments are currently only accessed on one thread so there's no need
- leaves[ctx.ord] = new LeafStoredFieldSourceProvider(storedFieldLoader.getLoader(ctx, null)); + final Object id = ctx.id(); + var provider = leaves.get(id); + if (provider == null) { + provider = new LeafStoredFieldSourceProvider(storedFieldLoader.getLoader(ctx, null)); + var existing = leaves.put(id, provider); + assert existing == null : "unexpected source provider [" + existing + "]"; } - return leaves[ctx.ord].getSource(doc); - } - - private static IndexReaderContext findParentContext(LeafReaderContext ctx) { - if (ctx.parent != null) { - return ctx.parent; - } - assert ctx.isTopLevel; - return ctx; - } - - private LeafStoredFieldSourceProvider[] getLeavesUnderLock(IndexReaderContext parentCtx) { - if (leaves == null) { - synchronized (this) { - if (leaves == null) { - leaves = new LeafStoredFieldSourceProvider[parentCtx.leaves().size()]; - } - } - } - return leaves; + return provider.getSource(doc); } private static class LeafStoredFieldSourceProvider { diff --git a/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java b/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java index 73897fc38633a..fb74631970813 100644 --- a/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java +++ b/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java @@ -13,13 +13,16 @@ import org.elasticsearch.index.query.QueryBuilders; import org.elasticsearch.test.SecurityIntegTestCase; import org.elasticsearch.test.SecuritySettingsSourceField; +import org.elasticsearch.xcontent.XContentFactory; import org.elasticsearch.xpack.core.XPackSettings; +import org.junit.BeforeClass; import java.util.ArrayList; import java.util.Collections; import java.util.List; import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertAcked; +import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertHitCount; import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertResponse; import static org.elasticsearch.xpack.core.security.authc.support.UsernamePasswordToken.BASIC_AUTH_HEADER; import static org.elasticsearch.xpack.core.security.authc.support.UsernamePasswordToken.basicAuthHeaderValue; @@ -29,9 +32,12 @@ public class DocumentLevelSecurityRandomTests extends SecurityIntegTestCase { protected static final SecureString USERS_PASSWD = SecuritySettingsSourceField.TEST_PASSWORD_SECURE_STRING; - // can't add a second test method, because each test run creates a new instance of this class and that will will result - // in a new random value: - private final int numberOfRoles = scaledRandomIntBetween(3, 99); + private static volatile int numberOfRoles; + + @BeforeClass + public static void setupRoleCount() throws Exception { + numberOfRoles = scaledRandomIntBetween(3, 99); + } @Override protected String configUsers() { @@ -119,4 +125,38 @@ public void testDuelWithAliasFilters() throws Exception { } } + public void testWithRuntimeFields() throws Exception { + assertAcked( + indicesAdmin().prepareCreate("test") + .setMapping( + XContentFactory.jsonBuilder() + .startObject() + .startObject("runtime") + .startObject("field1") + .field("type", "keyword") + .endObject() + .endObject() + .startObject("properties") + .startObject("field2") + .field("type", "keyword") + .endObject() + .endObject() + .endObject() + ) + ); + List requests = 
new ArrayList<>(47);
+        for (int i = 1; i <= 42; i++) {
+            requests.add(prepareIndex("test").setSource("field1", "value1", "field2", "foo" + i));
+        }
+        for (int i = 42; i <= 57; i++) {
+            requests.add(prepareIndex("test").setSource("field1", "value2", "field2", "foo" + i));
+        }
+        indexRandom(true, requests);
+        assertHitCount(
+            client().filterWithHeader(Collections.singletonMap(BASIC_AUTH_HEADER, basicAuthHeaderValue("user1", USERS_PASSWD)))
+                .prepareSearch("test"),
+            42L
+        );
+    }
+
 }

From 80f602f44b171236c26f2db1e7e84d12e1b9cb04 Mon Sep 17 00:00:00 2001
From: Lee Hinman
Date: Wed, 28 Aug 2024 16:42:21 -0600
Subject: [PATCH 023/144] Fix typo in rest-api-spec capabilities documentation
 (#112304)

---
 .../yamlRestTest/resources/rest-api-spec/test/README.asciidoc | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/README.asciidoc b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/README.asciidoc
index 5716afdd205c0..0ddac662e73ef 100644
--- a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/README.asciidoc
+++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/README.asciidoc
@@ -138,7 +138,7 @@ other test runners to skip tests if they do not support the capabilities API yet
       path: /_api
       parameters: [param1, param2]
       capabilities: [cap1, cap2]
-      test_runner_feature: [capabilities]
+      test_runner_features: [capabilities]
       reason: Capability required to run test
   - do: ... test definitions ...

From 98fe686da4c5cb82d4b03719977be428dc7934e7 Mon Sep 17 00:00:00 2001
From: Nhat Nguyen
Date: Wed, 28 Aug 2024 15:59:12 -0700
Subject: [PATCH 024/144] Upgrade xcontent to Jackson 2.17.2 (#112320)

Avoid FasterXML/jackson-core#1256

---
 docs/changelog/112320.yaml       |  5 +++++
 gradle/verification-metadata.xml | 20 ++++++++++++++++++++
 libs/x-content/impl/build.gradle |  2 +-
 3 files changed, 26 insertions(+), 1 deletion(-)
 create mode 100644 docs/changelog/112320.yaml

diff --git a/docs/changelog/112320.yaml b/docs/changelog/112320.yaml
new file mode 100644
index 0000000000000..d35a08dfa4e91
--- /dev/null
+++ b/docs/changelog/112320.yaml
@@ -0,0 +1,5 @@
+pr: 112320
+summary: Upgrade xcontent to Jackson 2.17.2
+area: Infra/Core
+type: upgrade
+issues: []

diff --git a/gradle/verification-metadata.xml b/gradle/verification-metadata.xml
index fd514103449c1..a27e2083a0849 100644
--- a/gradle/verification-metadata.xml
+++ b/gradle/verification-metadata.xml
@@ -311,6 +311,11 @@
+ [five-line <component> entry for a Jackson 2.17.2 artifact; XML markup and sha256 checksum not recoverable]
@@ -346,6 +351,11 @@
+ [five-line <component> entry for a Jackson 2.17.2 artifact; XML markup and sha256 checksum not recoverable]
@@ -361,6 +371,11 @@
+ [five-line <component> entry for a Jackson 2.17.2 artifact; XML markup and sha256 checksum not recoverable]
@@ -381,6 +396,11 @@
+ [five-line <component> entry for a Jackson 2.17.2 artifact; XML markup and sha256 checksum not recoverable]

diff --git a/libs/x-content/impl/build.gradle b/libs/x-content/impl/build.gradle
index 829b75524baeb..6cf278e826d4c 100644
--- a/libs/x-content/impl/build.gradle
+++ b/libs/x-content/impl/build.gradle
@@ -12,7 +12,7 @@ base {
   archivesName = "x-content-impl"
 }

-String jacksonVersion = "2.17.0"
+String jacksonVersion = "2.17.2"

 dependencies {
   compileOnly project(':libs:elasticsearch-core')

From b2d400ccf17b6e04012e3c667baa94626e199728 Mon Sep 17 00:00:00 2001
From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com>
Date: Thu, 29 Aug 2024 14:29:25 +1000
Subject: [PATCH 025/144] Mute
 org.elasticsearch.search.retriever.RankDocRetrieverBuilderIT
 testRankDocsRetrieverWithCollapse #112254

---
 muted-tests.yml | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/muted-tests.yml b/muted-tests.yml
index 7feefa1255f48..ec2a846f71c44 100644
--- a/muted-tests.yml
+++ b/muted-tests.yml
@@ -172,6 +172,9 @@ tests:
- class:
org.elasticsearch.blobcache.shared.SharedBlobCacheServiceTests method: testGetMultiThreaded issue: https://github.com/elastic/elasticsearch/issues/112314 +- class: org.elasticsearch.search.retriever.RankDocRetrieverBuilderIT + method: testRankDocsRetrieverWithCollapse + issue: https://github.com/elastic/elasticsearch/issues/112254 # Examples: # From 633f5f9fe37618e1a998e397cdb006db4af55610 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Thu, 29 Aug 2024 14:41:59 +1000 Subject: [PATCH 026/144] Mute org.elasticsearch.search.ccs.CCSUsageTelemetryIT org.elasticsearch.search.ccs.CCSUsageTelemetryIT #112324 --- muted-tests.yml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index ec2a846f71c44..71a3479201783 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -175,6 +175,8 @@ tests: - class: org.elasticsearch.search.retriever.RankDocRetrieverBuilderIT method: testRankDocsRetrieverWithCollapse issue: https://github.com/elastic/elasticsearch/issues/112254 +- class: org.elasticsearch.search.ccs.CCSUsageTelemetryIT + issue: https://github.com/elastic/elasticsearch/issues/112324 # Examples: # From 9344f173d32231f1c47e5ef994bffa27b61da876 Mon Sep 17 00:00:00 2001 From: David Turner Date: Thu, 29 Aug 2024 05:54:13 +0100 Subject: [PATCH 027/144] Add general read/write optional support (#112276) Today `StreamOutput#writeOptionalWriteable` allows to write a possibly-null value that implements `Writeable` and therefore carries its own serialization, but sometimes we want to write an optional value and provide a custom `Writer` too. This commit adds `StreamOutput#writeOptional` and a corresponding `StreamInput#readOptional` to support this. --- .../action/bulk/BulkItemRequest.java | 10 +++--- .../action/bulk/BulkItemResponse.java | 32 +++++++------------ .../action/bulk/BulkShardRequest.java | 9 +----- .../action/bulk/BulkShardResponse.java | 2 +- .../common/io/stream/StreamInput.java | 15 +++++++++ .../common/io/stream/StreamOutput.java | 21 ++++++++++++ .../bucket/range/InternalBinaryRange.java | 14 +++----- .../common/io/stream/AbstractStreamTests.java | 11 +++++++ .../core/rollup/job/RollupJobStatus.java | 9 +++--- .../actions/execute/ExecuteWatchRequest.java | 18 +++-------- 10 files changed, 77 insertions(+), 64 deletions(-) diff --git a/server/src/main/java/org/elasticsearch/action/bulk/BulkItemRequest.java b/server/src/main/java/org/elasticsearch/action/bulk/BulkItemRequest.java index 425461d1f4ba1..7c1304f92eefd 100644 --- a/server/src/main/java/org/elasticsearch/action/bulk/BulkItemRequest.java +++ b/server/src/main/java/org/elasticsearch/action/bulk/BulkItemRequest.java @@ -101,11 +101,11 @@ public void writeTo(StreamOutput out) throws IOException { out.writeOptionalWriteable(primaryResponse); } - public void writeThin(StreamOutput out) throws IOException { - out.writeVInt(id); - DocWriteRequest.writeDocumentRequestThin(out, request); - out.writeOptionalWriteable(primaryResponse == null ? 
null : primaryResponse::writeThin); - } + public static final Writer THIN_WRITER = (out, item) -> { + out.writeVInt(item.id); + DocWriteRequest.writeDocumentRequestThin(out, item.request); + out.writeOptional(BulkItemResponse.THIN_WRITER, item.primaryResponse); + }; @Override public long ramBytesUsed() { diff --git a/server/src/main/java/org/elasticsearch/action/bulk/BulkItemResponse.java b/server/src/main/java/org/elasticsearch/action/bulk/BulkItemResponse.java index 151e8795d0f82..d3e550eaf05b3 100644 --- a/server/src/main/java/org/elasticsearch/action/bulk/BulkItemResponse.java +++ b/server/src/main/java/org/elasticsearch/action/bulk/BulkItemResponse.java @@ -264,7 +264,7 @@ public String toString() { id = in.readVInt(); opType = OpType.fromId(in.readByte()); response = readResponse(shardId, in); - failure = in.readBoolean() ? new Failure(in) : null; + failure = in.readOptionalWriteable(Failure::new); assertConsistent(); } @@ -272,7 +272,7 @@ public String toString() { id = in.readVInt(); opType = OpType.fromId(in.readByte()); response = readResponse(in); - failure = in.readBoolean() ? new Failure(in) : null; + failure = in.readOptionalWriteable(Failure::new); assertConsistent(); } @@ -384,31 +384,21 @@ public void writeTo(StreamOutput out) throws IOException { writeResponseType(out); response.writeTo(out); } - if (failure == null) { - out.writeBoolean(false); - } else { - out.writeBoolean(true); - failure.writeTo(out); - } + out.writeOptionalWriteable(failure); } - public void writeThin(StreamOutput out) throws IOException { - out.writeVInt(id); - out.writeByte(opType.getId()); + public static final Writer THIN_WRITER = (out, item) -> { + out.writeVInt(item.id); + out.writeByte(item.opType.getId()); - if (response == null) { + if (item.response == null) { out.writeByte((byte) 2); } else { - writeResponseType(out); - response.writeThin(out); + item.writeResponseType(out); + item.response.writeThin(out); } - if (failure == null) { - out.writeBoolean(false); - } else { - out.writeBoolean(true); - failure.writeTo(out); - } - } + out.writeOptionalWriteable(item.failure); + }; private void writeResponseType(StreamOutput out) throws IOException { if (response instanceof SimulateIndexResponse) { diff --git a/server/src/main/java/org/elasticsearch/action/bulk/BulkShardRequest.java b/server/src/main/java/org/elasticsearch/action/bulk/BulkShardRequest.java index 0d2942e688382..f7860c47d8b73 100644 --- a/server/src/main/java/org/elasticsearch/action/bulk/BulkShardRequest.java +++ b/server/src/main/java/org/elasticsearch/action/bulk/BulkShardRequest.java @@ -130,14 +130,7 @@ public void writeTo(StreamOutput out) throws IOException { throw new IllegalStateException("Inference metadata should have been consumed before writing to the stream"); } super.writeTo(out); - out.writeArray((o, item) -> { - if (item != null) { - o.writeBoolean(true); - item.writeThin(o); - } else { - o.writeBoolean(false); - } - }, items); + out.writeArray((o, item) -> o.writeOptional(BulkItemRequest.THIN_WRITER, item), items); if (out.getTransportVersion().onOrAfter(TransportVersions.SIMULATE_VALIDATES_MAPPINGS)) { out.writeBoolean(isSimulated); } diff --git a/server/src/main/java/org/elasticsearch/action/bulk/BulkShardResponse.java b/server/src/main/java/org/elasticsearch/action/bulk/BulkShardResponse.java index 3eeb96546c9b0..eb1bb0468c9bb 100644 --- a/server/src/main/java/org/elasticsearch/action/bulk/BulkShardResponse.java +++ b/server/src/main/java/org/elasticsearch/action/bulk/BulkShardResponse.java @@ -56,6 +56,6 @@ 
public void setForcedRefresh(boolean forcedRefresh) { public void writeTo(StreamOutput out) throws IOException { super.writeTo(out); shardId.writeTo(out); - out.writeArray((o, item) -> item.writeThin(o), responses); + out.writeArray(BulkItemResponse.THIN_WRITER, responses); } } diff --git a/server/src/main/java/org/elasticsearch/common/io/stream/StreamInput.java b/server/src/main/java/org/elasticsearch/common/io/stream/StreamInput.java index ec0edb2d07e5a..497028ef37c69 100644 --- a/server/src/main/java/org/elasticsearch/common/io/stream/StreamInput.java +++ b/server/src/main/java/org/elasticsearch/common/io/stream/StreamInput.java @@ -1095,8 +1095,23 @@ public T[] readOptionalArray(Writeable.Reader reader, IntFunction ar return readBoolean() ? readArray(reader, arraySupplier) : null; } + /** + * Reads a possibly-null value using the given {@link org.elasticsearch.common.io.stream.Writeable.Reader}. + * + * @see StreamOutput#writeOptionalWriteable + */ + // just an alias for readOptional() since we don't actually care whether T extends Writeable @Nullable public T readOptionalWriteable(Writeable.Reader reader) throws IOException { + return readOptional(reader); + } + + /** + * Reads a possibly-null value using the given {@link org.elasticsearch.common.io.stream.Writeable.Reader}. + * + * @see StreamOutput#writeOptional + */ + public T readOptional(Writeable.Reader reader) throws IOException { if (readBoolean()) { T t = reader.read(this); if (t == null) { diff --git a/server/src/main/java/org/elasticsearch/common/io/stream/StreamOutput.java b/server/src/main/java/org/elasticsearch/common/io/stream/StreamOutput.java index c65ae2e3463d4..5780885473b00 100644 --- a/server/src/main/java/org/elasticsearch/common/io/stream/StreamOutput.java +++ b/server/src/main/java/org/elasticsearch/common/io/stream/StreamOutput.java @@ -1015,6 +1015,12 @@ public void writeOptionalArray(@Nullable T[] array) throws writeOptionalArray(StreamOutput::writeWriteable, array); } + /** + * Writes a boolean value indicating whether the given object is {@code null}, followed by the object's serialization if it is not + * {@code null}. + * + * @see StreamInput#readOptionalWriteable + */ public void writeOptionalWriteable(@Nullable Writeable writeable) throws IOException { if (writeable != null) { writeBoolean(true); @@ -1024,6 +1030,21 @@ public void writeOptionalWriteable(@Nullable Writeable writeable) throws IOExcep } } + /** + * Writes a boolean value indicating whether the given object is {@code null}, followed by the object's serialization if it is not + * {@code null}. 
+ * + * @see StreamInput#readOptional + */ + public void writeOptional(Writer writer, @Nullable T maybeItem) throws IOException { + if (maybeItem != null) { + writeBoolean(true); + writer.write(this, maybeItem); + } else { + writeBoolean(false); + } + } + /** * This method allow to use a method reference when writing collection elements such as * {@code out.writeMap(map, StreamOutput::writeString, StreamOutput::writeWriteable)} diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/range/InternalBinaryRange.java b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/range/InternalBinaryRange.java index 2b5bcd9931f6e..528c37de7a4a8 100644 --- a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/range/InternalBinaryRange.java +++ b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/range/InternalBinaryRange.java @@ -72,8 +72,8 @@ private static Bucket createFromStream(StreamInput in, DocValueFormat format, bo String key = in.getTransportVersion().equals(TransportVersions.V_8_0_0) ? in.readString() : in.getTransportVersion().onOrAfter(TransportVersions.V_7_17_1) ? in.readOptionalString() : in.readString(); - BytesRef from = in.readBoolean() ? in.readBytesRef() : null; - BytesRef to = in.readBoolean() ? in.readBytesRef() : null; + BytesRef from = in.readOptional(StreamInput::readBytesRef); + BytesRef to = in.readOptional(StreamInput::readBytesRef); long docCount = in.readLong(); InternalAggregations aggregations = InternalAggregations.readFrom(in); @@ -89,14 +89,8 @@ public void writeTo(StreamOutput out) throws IOException { } else { out.writeString(key == null ? generateKey(from, to, format) : key); } - out.writeBoolean(from != null); - if (from != null) { - out.writeBytesRef(from); - } - out.writeBoolean(to != null); - if (to != null) { - out.writeBytesRef(to); - } + out.writeOptional(StreamOutput::writeBytesRef, from); + out.writeOptional(StreamOutput::writeBytesRef, to); out.writeLong(docCount); aggregations.writeTo(out); } diff --git a/server/src/test/java/org/elasticsearch/common/io/stream/AbstractStreamTests.java b/server/src/test/java/org/elasticsearch/common/io/stream/AbstractStreamTests.java index b1104a72400ea..ae686afcbb296 100644 --- a/server/src/test/java/org/elasticsearch/common/io/stream/AbstractStreamTests.java +++ b/server/src/test/java/org/elasticsearch/common/io/stream/AbstractStreamTests.java @@ -761,6 +761,17 @@ public void checkZonedDateTimeSerialization(TransportVersion tv) throws IOExcept } } + public void testOptional() throws IOException { + try (var output = new BytesStreamOutput()) { + output.writeOptional(StreamOutput::writeString, "not-null"); + output.writeOptional(StreamOutput::writeString, null); + + final var input = getStreamInput(output.bytes()); + assertEquals("not-null", input.readOptional(StreamInput::readString)); + assertNull(input.readOptional(StreamInput::readString)); + } + } + private void assertSerialization( CheckedConsumer outputAssertions, CheckedConsumer inputAssertions, diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/rollup/job/RollupJobStatus.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/rollup/job/RollupJobStatus.java index 1ba625a507a46..f7ad1f65628b2 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/rollup/job/RollupJobStatus.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/rollup/job/RollupJobStatus.java @@ -74,7 +74,7 @@ public RollupJobStatus(IndexerState state, @Nullable 
Map positio public RollupJobStatus(StreamInput in) throws IOException { state = IndexerState.fromStream(in); - currentPosition = in.readBoolean() ? new TreeMap<>(in.readGenericMap()) : null; + currentPosition = in.readOptional(CURRENT_POSITION_READER); if (in.getTransportVersion().before(TransportVersions.V_8_0_0)) { // 7.x nodes serialize `upgradedDocumentID` flag. We don't need it anymore, but // we need to pull it off the stream @@ -83,6 +83,8 @@ public RollupJobStatus(StreamInput in) throws IOException { } } + private static final Reader> CURRENT_POSITION_READER = in -> new TreeMap<>(in.readGenericMap()); + public IndexerState getIndexerState() { return state; } @@ -118,10 +120,7 @@ public String getWriteableName() { @Override public void writeTo(StreamOutput out) throws IOException { state.writeTo(out); - out.writeBoolean(currentPosition != null); - if (currentPosition != null) { - out.writeGenericMap(currentPosition); - } + out.writeOptional(StreamOutput::writeGenericMap, currentPosition); if (out.getTransportVersion().before(TransportVersions.V_8_0_0)) { // 7.x nodes expect a boolean `upgradedDocumentID` flag. We don't have it anymore, // but we need to tell them we are upgraded in case there is a mixed cluster diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/watcher/transport/actions/execute/ExecuteWatchRequest.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/watcher/transport/actions/execute/ExecuteWatchRequest.java index 681b004dd1d28..2f2617f956ed9 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/watcher/transport/actions/execute/ExecuteWatchRequest.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/watcher/transport/actions/execute/ExecuteWatchRequest.java @@ -59,12 +59,8 @@ public ExecuteWatchRequest(StreamInput in) throws IOException { id = in.readOptionalString(); ignoreCondition = in.readBoolean(); recordExecution = in.readBoolean(); - if (in.readBoolean()) { - alternativeInput = in.readGenericMap(); - } - if (in.readBoolean()) { - triggerData = in.readGenericMap(); - } + alternativeInput = in.readOptional(StreamInput::readGenericMap); + triggerData = in.readOptional(StreamInput::readGenericMap); long actionModesCount = in.readLong(); actionModes = new HashMap<>(); for (int i = 0; i < actionModesCount; i++) { @@ -83,14 +79,8 @@ public void writeTo(StreamOutput out) throws IOException { out.writeOptionalString(id); out.writeBoolean(ignoreCondition); out.writeBoolean(recordExecution); - out.writeBoolean(alternativeInput != null); - if (alternativeInput != null) { - out.writeGenericMap(alternativeInput); - } - out.writeBoolean(triggerData != null); - if (triggerData != null) { - out.writeGenericMap(triggerData); - } + out.writeOptional(StreamOutput::writeGenericMap, alternativeInput); + out.writeOptional(StreamOutput::writeGenericMap, triggerData); out.writeLong(actionModes.size()); for (Map.Entry entry : actionModes.entrySet()) { out.writeString(entry.getKey()); From 59a42ed41b72ea92e62e4522b83d9f9f48955203 Mon Sep 17 00:00:00 2001 From: David Turner Date: Thu, 29 Aug 2024 06:03:13 +0100 Subject: [PATCH 028/144] Include network disconnect info in troubleshooting docs (#112323) A misplaced `//end::` tag meant that the docs added in #112271 are only included in the page on fault detection and not the equivalent troubleshooting docs. This commit fixes the problem. 
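For readers unfamiliar with the mechanism: the troubleshooting page reuses this section through asciidoc tagged regions, so only the lines between the opening and closing markers are pulled in. A minimal sketch of how the pairing works (the include path here is illustrative, not the repository's exact line):

    // In fault-detection.asciidoc, everything between the markers is shared:
    // tag::troubleshooting[]
    ...diagnosis steps, including the new network-disconnection guidance...
    // end::troubleshooting[]

    // The troubleshooting page then includes just that region:
    include::fault-detection.asciidoc[tag=troubleshooting]

Moving `//end::troubleshooting[]` below the final paragraph is therefore enough to make the whole section appear in both places.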
--- docs/reference/modules/discovery/fault-detection.asciidoc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/reference/modules/discovery/fault-detection.asciidoc b/docs/reference/modules/discovery/fault-detection.asciidoc index 89c8a78eccbc6..d12985b70597c 100644 --- a/docs/reference/modules/discovery/fault-detection.asciidoc +++ b/docs/reference/modules/discovery/fault-detection.asciidoc @@ -300,7 +300,6 @@ To reconstruct the output, base64-decode the data and decompress it using ---- cat shardlock.log | sed -e 's/.*://' | base64 --decode | gzip --decompress ---- -//end::troubleshooting[] [discrete] ===== Diagnosing other network disconnections @@ -345,3 +344,4 @@ packet capture simultaneously from the nodes at both ends of an unstable connection and analyse it alongside the {es} logs from those nodes to determine if traffic between the nodes is being disrupted by another device on the network. +//end::troubleshooting[] From aa67bdb5ca8abebcee8a50ebb58e6160d134230c Mon Sep 17 00:00:00 2001 From: Andrei Stefan Date: Thu, 29 Aug 2024 09:53:09 +0300 Subject: [PATCH 029/144] ES|QL: EsqlAsyncSecurityIT workaround for lazy .async-search indexing (#112287) --- muted-tests.yml | 3 -- .../xpack/esql/EsqlAsyncSecurityIT.java | 30 ++++++++++++++----- 2 files changed, 22 insertions(+), 11 deletions(-) diff --git a/muted-tests.yml b/muted-tests.yml index 71a3479201783..508403ee6238c 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -137,9 +137,6 @@ tests: - class: org.elasticsearch.xpack.ml.integration.MlJobIT method: testDeleteJobAfterMissingIndex issue: https://github.com/elastic/elasticsearch/issues/112088 -- class: org.elasticsearch.xpack.esql.EsqlAsyncSecurityIT - method: testLimitedPrivilege - issue: https://github.com/elastic/elasticsearch/issues/112110 - class: org.elasticsearch.xpack.esql.qa.mixed.MixedClusterEsqlSpecIT method: test {stats.ByTwoCalculatedSecondOverwrites SYNC} issue: https://github.com/elastic/elasticsearch/issues/112117 diff --git a/x-pack/plugin/esql/qa/security/src/javaRestTest/java/org/elasticsearch/xpack/esql/EsqlAsyncSecurityIT.java b/x-pack/plugin/esql/qa/security/src/javaRestTest/java/org/elasticsearch/xpack/esql/EsqlAsyncSecurityIT.java index 0806e41186395..f2633dfffb0fe 100644 --- a/x-pack/plugin/esql/qa/security/src/javaRestTest/java/org/elasticsearch/xpack/esql/EsqlAsyncSecurityIT.java +++ b/x-pack/plugin/esql/qa/security/src/javaRestTest/java/org/elasticsearch/xpack/esql/EsqlAsyncSecurityIT.java @@ -67,7 +67,7 @@ public void testUnauthorizedIndices() throws IOException { var getResponse = runAsyncGet("user1", id); // sanity assertOK(getResponse); ResponseException error; - error = expectThrows(ResponseException.class, () -> runAsyncGet("user2", id)); + error = expectThrows(ResponseException.class, () -> runAsyncGet("user2", id, true)); // resource not found exception if the authenticated user is not the creator of the original task assertThat(error.getResponse().getStatusLine().getStatusCode(), equalTo(404)); @@ -85,7 +85,7 @@ public void testUnauthorizedIndices() throws IOException { var getResponse = runAsyncGet("user2", id); // sanity assertOK(getResponse); ResponseException error; - error = expectThrows(ResponseException.class, () -> runAsyncGet("user1", id)); + error = expectThrows(ResponseException.class, () -> runAsyncGet("user1", id, true)); assertThat(error.getResponse().getStatusLine().getStatusCode(), equalTo(404)); error = expectThrows(ResponseException.class, () -> runAsyncDelete("user1", id)); @@ -117,6 +117,10 @@ private 
Response runAsync(String user, String command) throws IOException { } private Response runAsyncGet(String user, String id) throws IOException { + return runAsyncGet(user, id, false); + } + + private Response runAsyncGet(String user, String id, boolean isAsyncIdNotFound_Expected) throws IOException { int tries = 0; while (tries < 10) { // Sometimes we get 404s fetching the task status. @@ -129,22 +133,32 @@ private Response runAsyncGet(String user, String id) throws IOException { logResponse(response); return response; } catch (ResponseException e) { - if (e.getResponse().getStatusLine().getStatusCode() == 404 - && EntityUtils.toString(e.getResponse().getEntity()).contains("no such index [.async-search]")) { - /* - * Work around https://github.com/elastic/elasticsearch/issues/110304 - the .async-search - * index may not exist when we try the fetch, but it should exist on next attempt. - */ + var statusCode = e.getResponse().getStatusLine().getStatusCode(); + var message = EntityUtils.toString(e.getResponse().getEntity()); + + if (statusCode == 404 && message.contains("no such index [.async-search]")) { + // Work around https://github.com/elastic/elasticsearch/issues/110304 - the .async-search + // index may not exist when we try the fetch, but it should exist on next attempt. logger.warn("async-search index does not exist", e); try { Thread.sleep(1000); } catch (InterruptedException ex) { throw new RuntimeException(ex); } + } else if (statusCode == 404 && false == isAsyncIdNotFound_Expected && message.contains("resource_not_found_exception")) { + // Work around for https://github.com/elastic/elasticsearch/issues/112110 + // The async id is not indexed quickly enough in .async-search index for us to retrieve it. + logger.warn("async id not found", e); + try { + Thread.sleep(500); + } catch (InterruptedException ex) { + throw new RuntimeException(ex); + } } else { throw e; } tries++; + logger.warn("retry [" + tries + "] for GET /_query/async/" + id); } } throw new IllegalStateException("couldn't find task status"); From b9dea69b5ca5b34600d1fc51badc3a9b163107b2 Mon Sep 17 00:00:00 2001 From: weizijun Date: Thu, 29 Aug 2024 15:17:27 +0800 Subject: [PATCH 030/144] [Inference API] Add Docs for AlibabaCloud AI Search Support for the Inference API (#112273) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: István Zoltán Szabó --- docs/changelog/112273.yaml | 5 + .../inference/inference-apis.asciidoc | 1 + .../inference/put-inference.asciidoc | 1 + .../service-alibabacloud-ai-search.asciidoc | 184 ++++++++++++++++++ .../semantic-search-inference.asciidoc | 1 + .../infer-api-ingest-pipeline-widget.asciidoc | 17 ++ .../infer-api-ingest-pipeline.asciidoc | 26 +++ .../infer-api-mapping-widget.asciidoc | 17 ++ .../inference-api/infer-api-mapping.asciidoc | 32 +++ .../infer-api-reindex-widget.asciidoc | 17 ++ .../inference-api/infer-api-reindex.asciidoc | 23 +++ .../infer-api-requirements-widget.asciidoc | 17 ++ .../infer-api-requirements.asciidoc | 6 + .../infer-api-search-widget.asciidoc | 17 ++ .../inference-api/infer-api-search.asciidoc | 65 +++++++ .../infer-api-task-widget.asciidoc | 17 ++ .../inference-api/infer-api-task.asciidoc | 29 +++ 17 files changed, 475 insertions(+) create mode 100644 docs/changelog/112273.yaml create mode 100644 docs/reference/inference/service-alibabacloud-ai-search.asciidoc diff --git a/docs/changelog/112273.yaml b/docs/changelog/112273.yaml new file mode 100644 index 0000000000000..3182a1884a145 --- /dev/null +++ 
b/docs/changelog/112273.yaml
@@ -0,0 +1,5 @@
+pr: 111181
+summary: "[Inference API] Add Docs for AlibabaCloud AI Search Support for the Inference API"
+area: Machine Learning
+type: enhancement
+issues: [ ]

diff --git a/docs/reference/inference/inference-apis.asciidoc b/docs/reference/inference/inference-apis.asciidoc
index 33db148755d8e..8fdf8aecc2ae5 100644
--- a/docs/reference/inference/inference-apis.asciidoc
+++ b/docs/reference/inference/inference-apis.asciidoc
@@ -39,6 +39,7 @@ include::delete-inference.asciidoc[]
 include::get-inference.asciidoc[]
 include::post-inference.asciidoc[]
 include::put-inference.asciidoc[]
+include::service-alibabacloud-ai-search.asciidoc[]
 include::service-amazon-bedrock.asciidoc[]
 include::service-anthropic.asciidoc[]
 include::service-azure-ai-studio.asciidoc[]

diff --git a/docs/reference/inference/put-inference.asciidoc b/docs/reference/inference/put-inference.asciidoc
index 57485e0720cca..ba26a563541fc 100644
--- a/docs/reference/inference/put-inference.asciidoc
+++ b/docs/reference/inference/put-inference.asciidoc
@@ -39,6 +39,7 @@ The create {infer} API enables you to create an {infer} endpoint and configure a
 The following services are available through the {infer} API, click the links to review the configuration details of the services:

+* <<infer-service-alibabacloud-ai-search,AlibabaCloud AI Search>>
 * <<infer-service-amazon-bedrock,Amazon Bedrock>>
 * <<infer-service-anthropic,Anthropic>>
 * <<infer-service-azure-ai-studio,Azure AI Studio>>

diff --git a/docs/reference/inference/service-alibabacloud-ai-search.asciidoc b/docs/reference/inference/service-alibabacloud-ai-search.asciidoc
new file mode 100644
index 0000000000000..df5220573d9e4
--- /dev/null
+++ b/docs/reference/inference/service-alibabacloud-ai-search.asciidoc
@@ -0,0 +1,184 @@
+[[infer-service-alibabacloud-ai-search]]
+=== AlibabaCloud AI Search {infer} service
+
+Creates an {infer} endpoint to perform an {infer} task with the `alibabacloud-ai-search` service.
+
+[discrete]
+[[infer-service-alibabacloud-ai-search-api-request]]
+==== {api-request-title}
+
+`PUT /_inference/<task_type>/<inference_id>`
+
+[discrete]
+[[infer-service-alibabacloud-ai-search-api-path-params]]
+==== {api-path-parms-title}
+
+`<inference_id>`::
+(Required, string)
+include::inference-shared.asciidoc[tag=inference-id]
+
+`<task_type>`::
+(Required, string)
+include::inference-shared.asciidoc[tag=task-type]
++
+--
+Available task types:
+
+* `text_embedding`,
+* `sparse_embedding`.
+* `rerank`.
+--
+
+[discrete]
+[[infer-service-alibabacloud-ai-search-api-request-body]]
+==== {api-request-body-title}
+
+`service`::
+(Required, string) The type of service supported for the specified task type.
+In this case,
+`alibabacloud-ai-search`.
+
+`service_settings`::
+(Required, object)
+include::inference-shared.asciidoc[tag=service-settings]
++
+--
+These settings are specific to the `alibabacloud-ai-search` service.
+--
+
+`api_key`:::
+(Required, string)
+A valid API key for the AlibabaCloud AI Search API.
+
+`service_id`:::
+(Required, string)
+The name of the model service to use for the {infer} task.
++
+--
+Available service_ids for the `text_embedding` task:
+
+* `ops-text-embedding-001`
+* `ops-text-embedding-zh-001`
+* `ops-text-embedding-en-001`
+* `ops-text-embedding-002`
+
+For the supported `text_embedding` service_ids, refer to the https://help.aliyun.com/zh/open-search/search-platform/developer-reference/text-embedding-api-details[documentation].
+
+Available service_id for the `sparse_embedding` task:
+
+* `ops-text-sparse-embedding-001`
+
+For the supported `sparse_embedding` service_id, refer to the https://help.aliyun.com/zh/open-search/search-platform/developer-reference/text-sparse-embedding-api-details[documentation].
+ +Available service_id for the `rerank` task is: + +* `ops-bge-reranker-larger` + +For the supported `rerank` service_id, refer to the https://help.aliyun.com/zh/open-search/search-platform/developer-reference/ranker-api-details[documentation]. +-- + +`host`::: +(Required, string) +The name of the host address used for the {infer} task. You can find the host address at https://opensearch.console.aliyun.com/cn-shanghai/rag/api-key[ the API keys section] of the documentation. + +`workspace`::: +(Required, string) +The name of the workspace used for the {infer} task. + +`rate_limit`::: +(Optional, object) +By default, the `alibabacloud-ai-search` service sets the number of requests allowed per minute to `1000`. +This helps to minimize the number of rate limit errors returned from AlibabaCloud AI Search. +To modify this, set the `requests_per_minute` setting of this object in your service settings: ++ +-- +include::inference-shared.asciidoc[tag=request-per-minute-example] +-- + + +`task_settings`:: +(Optional, object) +include::inference-shared.asciidoc[tag=task-settings] ++ +.`task_settings` for the `text_embedding` task type +[%collapsible%closed] +===== +`input_type`::: +(Optional, string) +Specifies the type of input passed to the model. +Valid values are: +* `ingest`: for storing document embeddings in a vector database. +* `search`: for storing embeddings of search queries run against a vector database to find relevant documents. +===== ++ +.`task_settings` for the `sparse_embedding` task type +[%collapsible%closed] +===== +`input_type`::: +(Optional, string) +Specifies the type of input passed to the model. +Valid values are: +* `ingest`: for storing document embeddings in a vector database. +* `search`: for storing embeddings of search queries run against a vector database to find relevant documents. + +`return_token`::: +(Optional, boolean) +If `true`, the token name will be returned in the response. Defaults to `false` which means only the token ID will be returned in the response. +===== + +[discrete] +[[inference-example-alibabacloud-ai-search]] +==== AlibabaCloud AI Search service examples + +The following example shows how to create an {infer} endpoint called `alibabacloud_ai_search_embeddings` to perform a `text_embedding` task type. + +[source,console] +------------------------------------------------------------ +PUT _inference/text_embedding/alibabacloud_ai_search_embeddings +{ + "service": "alibabacloud-ai-search", + "service_settings": { + "api_key": "", + "service_id": "ops-text-embedding-001", + "host": "default-j01.platform-cn-shanghai.opensearch.aliyuncs.com", + "workspace": "default" + } +} +------------------------------------------------------------ +// TEST[skip:TBD] + +The following example shows how to create an {infer} endpoint called +`alibabacloud_ai_search_sparse` to perform a `sparse_embedding` task type. + +[source,console] +------------------------------------------------------------ +PUT _inference/sparse_embedding/alibabacloud_ai_search_sparse +{ + "service": "alibabacloud-ai-search", + "service_settings": { + "api_key": "", + "service_id": "ops-text-sparse-embedding-001", + "host": "default-j01.platform-cn-shanghai.opensearch.aliyuncs.com", + "workspace": "default" + } +} +------------------------------------------------------------ +// TEST[skip:TBD] + +The next example shows how to create an {infer} endpoint called +`alibabacloud_ai_search_rerank` to perform a `rerank` task type. 
+ +[source,console] +------------------------------------------------------------ +PUT _inference/rerank/alibabacloud_ai_search_rerank +{ + "service": "alibabacloud-ai-search", + "service_settings": { + "api_key": "", + "service_id": "ops-bge-reranker-larger", + "host": "default-j01.platform-cn-shanghai.opensearch.aliyuncs.com", + "workspace": "default" + } +} +------------------------------------------------------------ +// TEST[skip:TBD] diff --git a/docs/reference/search/search-your-data/semantic-search-inference.asciidoc b/docs/reference/search/search-your-data/semantic-search-inference.asciidoc index f74bc65e31bf0..719aeb070fc7c 100644 --- a/docs/reference/search/search-your-data/semantic-search-inference.asciidoc +++ b/docs/reference/search/search-your-data/semantic-search-inference.asciidoc @@ -17,6 +17,7 @@ Azure based examples use models available through https://ai.azure.com/explore/m or https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models[Azure OpenAI]. Mistral examples use the `mistral-embed` model from https://docs.mistral.ai/getting-started/models/[the Mistral API]. Amazon Bedrock examples use the `amazon.titan-embed-text-v1` model from https://docs.aws.amazon.com/bedrock/latest/userguide/model-ids.html[the Amazon Bedrock base models]. +AlibabaCloud AI Search examples use the `ops-text-embedding-zh-001` model from https://help.aliyun.com/zh/open-search/search-platform/developer-reference/text-embedding-api-details[the AlibabaCloud AI Search base models]. Click the name of the service you want to use on any of the widgets below to review the corresponding instructions. diff --git a/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc index 997dbbe8a20e6..3a686e27cf580 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc @@ -49,6 +49,12 @@ id="infer-api-ingest-amazon-bedrock"> Amazon Bedrock +
+<button role="tab"
+        aria-selected="false"
+        aria-controls="infer-api-ingest-alibabacloud-ai-search-tab"
+        id="infer-api-ingest-alibabacloud-ai-search">
+  AlibabaCloud AI Search
+</button>
    diff --git a/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline.asciidoc index 6adf3d2ebbf46..6678b60fabc40 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline.asciidoc @@ -216,3 +216,29 @@ PUT _ingest/pipeline/amazon_bedrock_embeddings and the `output_field` that will contain the {infer} results. // end::amazon-bedrock[] + +// tag::alibabacloud-ai-search[] + +[source,console] +-------------------------------------------------- +PUT _ingest/pipeline/alibabacloud_ai_search_embeddings +{ + "processors": [ + { + "inference": { + "model_id": "alibabacloud_ai_search_embeddings", <1> + "input_output": { <2> + "input_field": "content", + "output_field": "content_embedding" + } + } + } + ] +} +-------------------------------------------------- +<1> The name of the inference endpoint you created by using the +<>, it's referred to as `inference_id` in that step. +<2> Configuration object that defines the `input_field` for the {infer} process +and the `output_field` that will contain the {infer} results. + +// end::alibabacloud-ai-search[] diff --git a/docs/reference/tab-widgets/inference-api/infer-api-mapping-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-mapping-widget.asciidoc index 4e3a453a7bbea..66b790bdd57a5 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-mapping-widget.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-mapping-widget.asciidoc @@ -49,6 +49,12 @@ id="infer-api-mapping-amazon-bedrock"> Amazon Bedrock +
+<button role="tab"
+        aria-selected="false"
+        aria-controls="infer-api-mapping-alibabacloud-ai-search-tab"
+        id="infer-api-mapping-alibabacloud-ai-search">
+  AlibabaCloud AI Search
+</button>
    diff --git a/docs/reference/tab-widgets/inference-api/infer-api-mapping.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-mapping.asciidoc index abeeb87f03e75..c86538ceb9c87 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-mapping.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-mapping.asciidoc @@ -270,3 +270,35 @@ the {infer} pipeline configuration in the next step. <6> The field type which is text in this example. // end::amazon-bedrock[] + +// tag::alibabacloud-ai-search[] + +[source,console] +-------------------------------------------------- +PUT alibabacloud-ai-search-embeddings +{ + "mappings": { + "properties": { + "content_embedding": { <1> + "type": "dense_vector", <2> + "dims": 1024, <3> + "element_type": "float" + }, + "content": { <4> + "type": "text" <5> + } + } + } +} +-------------------------------------------------- +<1> The name of the field to contain the generated tokens. It must be referenced +in the {infer} pipeline configuration in the next step. +<2> The field to contain the tokens is a `dense_vector` field. +<3> The output dimensions of the model. This value may be different depending on the underlying model used. +See the https://help.aliyun.com/zh/open-search/search-platform/developer-reference/text-embedding-api-details[AlibabaCloud AI Search embedding model] documentation. +<4> The name of the field from which to create the dense vector representation. +In this example, the name of the field is `content`. It must be referenced in +the {infer} pipeline configuration in the next step. +<5> The field type which is text in this example. + +// end::alibabacloud-ai-search[] diff --git a/docs/reference/tab-widgets/inference-api/infer-api-reindex-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-reindex-widget.asciidoc index 45cb9fc51b9f1..86f52fee2063c 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-reindex-widget.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-reindex-widget.asciidoc @@ -49,6 +49,12 @@ id="infer-api-reindex-amazon-bedrock"> Amazon Bedrock +
+<button role="tab"
+        aria-selected="false"
+        aria-controls="infer-api-reindex-alibabacloud-ai-search-tab"
+        id="infer-api-reindex-alibabacloud-ai-search">
+  AlibabaCloud AI Search
+</button>
    diff --git a/docs/reference/tab-widgets/inference-api/infer-api-reindex.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-reindex.asciidoc index d961ec8bd39bd..25d4023c650c0 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-reindex.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-reindex.asciidoc @@ -200,3 +200,26 @@ number makes the update of the reindexing process quicker which enables you to follow the progress closely and detect errors early. // end::amazon-bedrock[] + +// tag::alibabacloud-ai-search[] + +[source,console] +---- +POST _reindex?wait_for_completion=false +{ + "source": { + "index": "test-data", + "size": 50 <1> + }, + "dest": { + "index": "alibabacloud-ai-search-embeddings", + "pipeline": "alibabacloud_ai_search_embeddings" + } +} +---- +// TEST[skip:TBD] +<1> The default batch size for reindexing is 1000. Reducing `size` to a smaller +number makes the update of the reindexing process quicker which enables you to +follow the progress closely and detect errors early. + +// end::alibabacloud-ai-search[] diff --git a/docs/reference/tab-widgets/inference-api/infer-api-requirements-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-requirements-widget.asciidoc index c867b39b88e3b..fb686a2d8be12 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-requirements-widget.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-requirements-widget.asciidoc @@ -49,6 +49,12 @@ id="infer-api-requirements-amazon-bedrock"> Amazon Bedrock +
+<button role="tab"
+        aria-selected="false"
+        aria-controls="infer-api-requirements-alibabacloud-ai-search-tab"
+        id="infer-api-requirements-alibabacloud-ai-search">
+  AlibabaCloud AI Search
+</button>
    diff --git a/docs/reference/tab-widgets/inference-api/infer-api-requirements.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-requirements.asciidoc index 603cd85a8f93d..c9e7ca8b80ba6 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-requirements.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-requirements.asciidoc @@ -52,3 +52,9 @@ You can apply for access to Azure OpenAI by completing the form at https://aka.m * A pair of access and secret keys used to access Amazon Bedrock // end::amazon-bedrock[] + +// tag::alibabacloud-ai-search[] +* An AlibabaCloud Account with https://console.aliyun.com[AlibabaCloud] access +* An API key generated for your account from the https://opensearch.console.aliyun.com/cn-shanghai/rag/api-key[API keys section] + +// end::alibabacloud-ai-search[] diff --git a/docs/reference/tab-widgets/inference-api/infer-api-search-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-search-widget.asciidoc index fa4a11c59a158..996148d80a4bd 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-search-widget.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-search-widget.asciidoc @@ -49,6 +49,12 @@ id="infer-api-search-amazon-bedrock"> Amazon Bedrock +
+<button role="tab"
+        aria-selected="false"
+        aria-controls="infer-api-search-alibabacloud-ai-search-tab"
+        id="infer-api-search-alibabacloud-ai-search">
+  AlibabaCloud AI Search
+</button>
    diff --git a/docs/reference/tab-widgets/inference-api/infer-api-search.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-search.asciidoc index f23ed1dfef05d..fe1f58b6bd1a9 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-search.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-search.asciidoc @@ -531,3 +531,68 @@ query from the `amazon-bedrock-embeddings` index sorted by their proximity to th // NOTCONSOLE // end::amazon-bedrock[] + +// tag::alibabacloud-ai-search[] + +[source,console] +-------------------------------------------------- +GET alibabacloud-ai-search-embeddings/_search +{ + "knn": { + "field": "content_embedding", + "query_vector_builder": { + "text_embedding": { + "model_id": "alibabacloud_ai_search_embeddings", + "model_text": "Calculate fuel cost" + } + }, + "k": 10, + "num_candidates": 100 + }, + "_source": [ + "id", + "content" + ] +} +-------------------------------------------------- +// TEST[skip:TBD] + +As a result, you receive the top 10 documents that are closest in meaning to the +query from the `alibabacloud-ai-search-embeddings` index sorted by their proximity to the query: + +[source,consol-result] +-------------------------------------------------- +"hits": [ + { + "_index": "alibabacloud-ai-search-embeddings", + "_id": "DDd5OowBHxQKHyc3TDSC", + "_score": 0.83704096, + "_source": { + "id": 862114, + "body": "How to calculate fuel cost for a road trip. By Tara Baukus Mello • Bankrate.com. Dear Driving for Dollars, My family is considering taking a long road trip to finish off the end of the summer, but I'm a little worried about gas prices and our overall fuel cost.It doesn't seem easy to calculate since we'll be traveling through many states and we are considering several routes.y family is considering taking a long road trip to finish off the end of the summer, but I'm a little worried about gas prices and our overall fuel cost. It doesn't seem easy to calculate since we'll be traveling through many states and we are considering several routes." + } + }, + { + "_index": "alibabacloud-ai-search-embeddings", + "_id": "ajd5OowBHxQKHyc3TDSC", + "_score": 0.8345704, + "_source": { + "id": 820622, + "body": "Home Heating Calculator. Typically, approximately 50% of the energy consumed in a home annually is for space heating. When deciding on a heating system, many factors will come into play: cost of fuel, installation cost, convenience and life style are all important.This calculator can help you estimate the cost of fuel for different heating appliances.hen deciding on a heating system, many factors will come into play: cost of fuel, installation cost, convenience and life style are all important. This calculator can help you estimate the cost of fuel for different heating appliances." + } + }, + { + "_index": "alibabacloud-ai-search-embeddings", + "_id": "Djd5OowBHxQKHyc3TDSC", + "_score": 0.8327426, + "_source": { + "id": 8202683, + "body": "Fuel is another important cost. This cost will depend on your boat, how far you travel, and how fast you travel. A 33-foot sailboat traveling at 7 knots should be able to travel 300 miles on 50 gallons of diesel fuel.If you are paying $4 per gallon, the trip would cost you $200.Most boats have much larger gas tanks than cars.uel is another important cost. This cost will depend on your boat, how far you travel, and how fast you travel. A 33-foot sailboat traveling at 7 knots should be able to travel 300 miles on 50 gallons of diesel fuel." + } + }, + (...) 
+ ] +-------------------------------------------------- +// NOTCONSOLE + +// end::alibabacloud-ai-search[] diff --git a/docs/reference/tab-widgets/inference-api/infer-api-task-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-task-widget.asciidoc index f12be341d866d..1dfa6077553fe 100644 --- a/docs/reference/tab-widgets/inference-api/infer-api-task-widget.asciidoc +++ b/docs/reference/tab-widgets/inference-api/infer-api-task-widget.asciidoc @@ -49,6 +49,12 @@ id="infer-api-task-amazon-bedrock"> Amazon Bedrock +
+<button role="tab"
+        aria-selected="false"
+        aria-controls="infer-api-task-alibabacloud-ai-search-tab"
+        id="infer-api-task-alibabacloud-ai-search">
+  AlibabaCloud AI Search
+</button>
diff --git a/docs/reference/tab-widgets/inference-api/infer-api-task.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-task.asciidoc
index b186b2c58ccc5..2b4aa1a200102 100644
--- a/docs/reference/tab-widgets/inference-api/infer-api-task.asciidoc
+++ b/docs/reference/tab-widgets/inference-api/infer-api-task.asciidoc
@@ -223,3 +223,32 @@ PUT _inference/text_embedding/amazon_bedrock_embeddings <1>
<6> The model ID or ARN of the model to use.

// end::amazon-bedrock[]
+
+// tag::alibabacloud-ai-search[]
+
+[source,console]
+------------------------------------------------------------
+PUT _inference/text_embedding/alibabacloud_ai_search_embeddings <1>
+{
+  "service": "alibabacloud-ai-search",
+  "service_settings": {
+    "api_key": "<api_key>", <2>
+    "service_id": "<service_id>", <3>
+    "host": "<host>", <4>
+    "workspace": "<workspace>" <5>
+  }
+}
+------------------------------------------------------------
+// TEST[skip:TBD]
+<1> The task type is `text_embedding` in the path and the `inference_id` which is the unique identifier of the {infer} endpoint is `alibabacloud_ai_search_embeddings`.
+<2> The API key for accessing the AlibabaCloud AI Search API. You can find your API keys in
+your AlibabaCloud account under the
+https://opensearch.console.aliyun.com/cn-shanghai/rag/api-key[API keys section]. You need to provide
+your API key only once. The <<get-inference-api>> does not return your API
+key.
+<3> The AlibabaCloud AI Search embeddings model name, for example `ops-text-embedding-zh-001`.
+<4> The name of your AlibabaCloud AI Search host address.
+<5> The name of your AlibabaCloud AI Search workspace.
+
+// end::alibabacloud-ai-search[]
+

From 569184871bc0006ba55c20bcbc4500e98e853aea Mon Sep 17 00:00:00 2001
From: Chris Hegarty <62058229+ChrisHegarty@users.noreply.github.com>
Date: Thu, 29 Aug 2024 08:23:34 +0100
Subject: [PATCH 031/144] Add UpdateForV10 annotation (#112281)

In preparation for the next major release of Elasticsearch, this commit
adds the UpdateForV10 annotation.

---
 .../org/elasticsearch/core/UpdateForV10.java | 23 +++++++++++++++
 1 file changed, 23 insertions(+)
 create mode 100644 libs/core/src/main/java/org/elasticsearch/core/UpdateForV10.java

diff --git a/libs/core/src/main/java/org/elasticsearch/core/UpdateForV10.java b/libs/core/src/main/java/org/elasticsearch/core/UpdateForV10.java
new file mode 100644
index 0000000000000..0fe816bd3721d
--- /dev/null
+++ b/libs/core/src/main/java/org/elasticsearch/core/UpdateForV10.java
@@ -0,0 +1,23 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0 and the Server Side Public License, v 1; you may not use this file except
+ * in compliance with, at your election, the Elastic License 2.0 or the Server
+ * Side Public License, v 1.
+ */ + +package org.elasticsearch.core; + +import java.lang.annotation.ElementType; +import java.lang.annotation.Retention; +import java.lang.annotation.RetentionPolicy; +import java.lang.annotation.Target; + +/** + * Annotation to identify a block of code (a whole class, a method, or a field) that needs to be reviewed (for cleanup, remove or change) + * before releasing 10.0 + */ +@Retention(RetentionPolicy.SOURCE) +@Target({ ElementType.LOCAL_VARIABLE, ElementType.CONSTRUCTOR, ElementType.FIELD, ElementType.METHOD, ElementType.TYPE }) +public @interface UpdateForV10 { +} From 727f1e72c6d930ad763ca307f622eadbbdfff112 Mon Sep 17 00:00:00 2001 From: Dominique Clarke Date: Thu, 29 Aug 2024 03:46:44 -0400 Subject: [PATCH 032/144] [Observability] add .slo-observability.* index privileges to built in editor and viewer roles (#111984) Today, the `editor` and `viewer` roles do not contain the appropriate index privileges for SLO users. This PR updates the index privileges to include the `.slo-observability.*` indices. --------- Co-authored-by: Slobodan Adamovic --- .../authz/store/ReservedRolesStore.java | 9 ++++ .../authz/store/ReservedRolesStoreTests.java | 42 +++++++++++++++++++ 2 files changed, 51 insertions(+) diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStore.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStore.java index 4f3d7a245fc8f..74434adf61fbb 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStore.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStore.java @@ -868,6 +868,11 @@ private static RoleDescriptor buildViewerRoleDescriptor() { .indices("/~(([.]|ilm-history-).*)/") .privileges("read", "view_index_metadata") .build(), + // Observability + RoleDescriptor.IndicesPrivileges.builder() + .indices(".slo-observability.*") + .privileges("read", "view_index_metadata") + .build(), // Security RoleDescriptor.IndicesPrivileges.builder() .indices(ReservedRolesStore.ALERTS_LEGACY_INDEX, ReservedRolesStore.LISTS_INDEX, ReservedRolesStore.LISTS_ITEMS_INDEX) @@ -915,6 +920,10 @@ private static RoleDescriptor buildEditorRoleDescriptor() { .indices("observability-annotations") .privileges("read", "view_index_metadata", "write") .build(), + RoleDescriptor.IndicesPrivileges.builder() + .indices(".slo-observability.*") + .privileges("read", "view_index_metadata", "write", "manage") + .build(), // Security RoleDescriptor.IndicesPrivileges.builder() .indices(ReservedRolesStore.ALERTS_LEGACY_INDEX, ReservedRolesStore.LISTS_INDEX, ReservedRolesStore.LISTS_ITEMS_INDEX) diff --git a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStoreTests.java b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStoreTests.java index f0676f35ae316..0cdf7de63ca99 100644 --- a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStoreTests.java +++ b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/authz/store/ReservedRolesStoreTests.java @@ -28,6 +28,7 @@ import org.elasticsearch.action.admin.indices.get.GetIndexAction; import org.elasticsearch.action.admin.indices.mapping.get.GetFieldMappingsAction; import org.elasticsearch.action.admin.indices.mapping.get.GetMappingsAction; +import 
org.elasticsearch.action.admin.indices.mapping.put.TransportAutoPutMappingAction; import org.elasticsearch.action.admin.indices.mapping.put.TransportPutMappingAction; import org.elasticsearch.action.admin.indices.recovery.RecoveryAction; import org.elasticsearch.action.admin.indices.resolve.ResolveIndexAction; @@ -3662,6 +3663,9 @@ public void testPredefinedViewerRole() { assertOnlyReadAllowed(role, ".profiling-" + randomIntBetween(0, 5)); assertOnlyReadAllowed(role, randomAlphaOfLength(5)); + assertOnlyReadAllowed(role, ".slo-observability." + randomIntBetween(0, 5)); + assertViewIndexMetadata(role, ".slo-observability." + randomIntBetween(0, 5)); + assertNoAccessAllowed(role, TestRestrictedIndices.SAMPLE_RESTRICTED_NAMES); assertNoAccessAllowed(role, "." + randomAlphaOfLengthBetween(6, 10)); assertNoAccessAllowed(role, "ilm-history-" + randomIntBetween(0, 5)); @@ -3740,6 +3744,9 @@ public void testPredefinedEditorRole() { assertReadWriteDocsAndMaintenanceButNotDeleteIndexAllowed(role, ".preview.alerts-" + randomIntBetween(0, 5)); assertReadWriteDocsAndMaintenanceButNotDeleteIndexAllowed(role, ".internal.preview.alerts-" + randomIntBetween(0, 5)); + assertViewIndexMetadata(role, ".slo-observability." + randomIntBetween(0, 5)); + assertReadWriteAndManage(role, ".slo-observability." + randomIntBetween(0, 5)); + assertNoAccessAllowed(role, TestRestrictedIndices.SAMPLE_RESTRICTED_NAMES); assertNoAccessAllowed(role, "." + randomAlphaOfLengthBetween(6, 10)); assertNoAccessAllowed(role, "ilm-history-" + randomIntBetween(0, 5)); @@ -3865,6 +3872,41 @@ private void assertReadWriteDocsButNotDeleteIndexAllowed(Role role, String index role.indices().allowedIndicesMatcher(TransportDeleteIndexAction.TYPE.name()).test(mockIndexAbstraction(index)), is(false) ); + + assertThat(role.indices().allowedIndicesMatcher(TransportSearchAction.TYPE.name()).test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher(TransportGetAction.TYPE.name()).test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher(TransportIndexAction.NAME).test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher(TransportUpdateAction.NAME).test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher(TransportDeleteAction.NAME).test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher(TransportBulkAction.NAME).test(mockIndexAbstraction(index)), is(true)); + } + + private void assertReadWriteAndManage(Role role, String index) { + assertThat( + role.indices().allowedIndicesMatcher(TransportDeleteIndexAction.TYPE.name()).test(mockIndexAbstraction(index)), + is(true) + ); + assertThat( + role.indices().allowedIndicesMatcher(TransportFieldCapabilitiesAction.NAME + "*").test(mockIndexAbstraction(index)), + is(true) + ); + assertThat( + role.indices().allowedIndicesMatcher(TransportCreateIndexAction.TYPE.name()).test(mockIndexAbstraction(index)), + is(true) + ); + assertThat( + role.indices().allowedIndicesMatcher(TransportUpdateSettingsAction.TYPE.name()).test(mockIndexAbstraction(index)), + is(true) + ); + assertThat(role.indices().allowedIndicesMatcher(GetRollupIndexCapsAction.NAME + "*").test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher("indices:admin/*").test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher("indices:monitor/*").test(mockIndexAbstraction(index)), is(true)); + 
assertThat( + role.indices().allowedIndicesMatcher(TransportAutoPutMappingAction.TYPE.name()).test(mockIndexAbstraction(index)), + is(true) + ); + assertThat(role.indices().allowedIndicesMatcher(AutoCreateAction.NAME).test(mockIndexAbstraction(index)), is(true)); + assertThat(role.indices().allowedIndicesMatcher(TransportSearchAction.TYPE.name()).test(mockIndexAbstraction(index)), is(true)); assertThat(role.indices().allowedIndicesMatcher(TransportGetAction.TYPE.name()).test(mockIndexAbstraction(index)), is(true)); assertThat(role.indices().allowedIndicesMatcher(TransportIndexAction.NAME).test(mockIndexAbstraction(index)), is(true)); From 55ed03fddfa8c77c354a2db2910593b40d2be890 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Christoph=20B=C3=BCscher?= Date: Wed, 28 Aug 2024 19:21:00 +0200 Subject: [PATCH 033/144] Remove Scorable#docID implementations This method was removed in https://github.com/apache/lucene/pull/12407 so we also need to remove it in implementations of Scorable. --- .../painless/ScriptedMetricAggContextsTests.java | 5 ----- .../join/aggregations/ParentJoinAggregator.java | 5 ----- .../aggregations/bucket/nested/NestedAggregator.java | 7 ------- .../bucket/sampler/BestDocsDeferringCollector.java | 8 -------- .../search/aggregations/MultiBucketCollectorTests.java | 10 ++-------- .../search/query/QueryPhaseCollectorTests.java | 10 ---------- .../search/sort/BucketedSortForFloatsTests.java | 6 ------ 7 files changed, 2 insertions(+), 49 deletions(-) diff --git a/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java b/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java index 2d3f09fc7243a..8eae139eb8226 100644 --- a/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java +++ b/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java @@ -73,11 +73,6 @@ public void testMapBasic() throws IOException { Map state = new HashMap<>(); Scorable scorer = new Scorable() { - @Override - public int docID() { - return 0; - } - @Override public float score() { return 0.5f; diff --git a/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java b/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java index 9c6a788ea2f77..ed4dcf2072b8d 100644 --- a/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java +++ b/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java @@ -133,11 +133,6 @@ protected void prepareSubAggs(long[] ordsToCollect) throws IOException { public float score() { return 1f; } - - @Override - public int docID() { - return childDocsIter.docID(); - } }); final Bits liveDocs = ctx.reader().getLiveDocs(); diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java index 39dfd6e4aac3a..28e010f541a74 100644 --- a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java +++ b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java @@ -206,19 +206,12 @@ void processBufferedChildBuckets() throws IOException { } private static class CachedScorable extends Scorable { - int doc; float score; @Override public final float score() { return score; } - - 
@Override - public int docID() { - return doc; - } - } } diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java index 1344604a8d39c..c72c4b29a478f 100644 --- a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java +++ b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java @@ -213,7 +213,6 @@ class PerSegmentCollects extends Scorable { private final AggregationExecutionContext aggCtx; int maxDocId = Integer.MIN_VALUE; private float currentScore; - private int currentDocId = -1; private Scorable currentScorer; PerSegmentCollects(AggregationExecutionContext aggCtx) throws IOException { @@ -248,7 +247,6 @@ public void replayRelatedMatches(List sd) throws IOException { leafCollector.setScorer(this); currentScore = 0; - currentDocId = -1; if (maxDocId < 0) { return; } @@ -258,7 +256,6 @@ public void replayRelatedMatches(List sd) throws IOException { int rebased = scoreDoc.doc - aggCtx.getLeafReaderContext().docBase; if ((rebased >= 0) && (rebased <= maxDocId)) { currentScore = scoreDoc.score; - currentDocId = rebased; // We stored the bucket ID in Lucene's shardIndex property // for convenience. leafCollector.collect(rebased, scoreDoc.shardIndex); @@ -275,11 +272,6 @@ public float score() throws IOException { return currentScore; } - @Override - public int docID() { - return currentDocId; - } - public void collect(int docId, long parentBucket) throws IOException { perBucketSamples = bigArrays.grow(perBucketSamples, parentBucket + 1); PerParentBucketSamples sampler = perBucketSamples.get((int) parentBucket); diff --git a/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java b/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java index cfb9c4bb83249..ff4ad059559fc 100644 --- a/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java +++ b/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java @@ -32,14 +32,8 @@ import static org.hamcrest.Matchers.equalTo; public class MultiBucketCollectorTests extends ESTestCase { - private static class ScoreAndDoc extends Scorable { + private static class Score extends Scorable { float score; - int doc = -1; - - @Override - public int docID() { - return doc; - } @Override public float score() { @@ -246,7 +240,7 @@ public void testSetScorerAfterCollectionTerminated() throws IOException { collector1 = new TerminateAfterBucketCollector(collector1, 1); collector2 = new TerminateAfterBucketCollector(collector2, 2); - Scorable scorer = new ScoreAndDoc(); + Scorable scorer = new Score(); List collectors = Arrays.asList(collector1, collector2); Collections.shuffle(collectors, random()); diff --git a/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java b/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java index f222e697488d2..dbfd9d83ee887 100644 --- a/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java +++ b/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java @@ -1138,11 +1138,6 @@ public void testSetScorerAfterCollectionTerminated() throws IOException { public float score() { return 0; } - - @Override - public int docID() { - return 0; - } }; 
QueryPhaseCollector queryPhaseCollector = new QueryPhaseCollector( @@ -1472,11 +1467,6 @@ public float score() throws IOException { return 0; } - @Override - public int docID() { - return 0; - } - @Override public void setMinCompetitiveScore(float minScore) { setMinCompetitiveScoreCalled = true; diff --git a/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java b/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java index 0f088d2948fcb..7f136a097e24a 100644 --- a/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java +++ b/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java @@ -120,18 +120,12 @@ public void testScorer() throws IOException { } private class MockScorable extends Scorable { - private int doc; private float score; @Override public float score() throws IOException { return score; } - - @Override - public int docID() { - return doc; - } } /** From 5e455db10ecbb1a31cad58ecb1120a66fc50079f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Christoph=20B=C3=BCscher?= Date: Thu, 29 Aug 2024 10:04:27 +0200 Subject: [PATCH 034/144] Revert "Remove Scorable#docID implementations" This reverts commit 55ed03fddfa8c77c354a2db2910593b40d2be890. --- .../painless/ScriptedMetricAggContextsTests.java | 5 +++++ .../join/aggregations/ParentJoinAggregator.java | 5 +++++ .../aggregations/bucket/nested/NestedAggregator.java | 7 +++++++ .../bucket/sampler/BestDocsDeferringCollector.java | 8 ++++++++ .../search/aggregations/MultiBucketCollectorTests.java | 10 ++++++++-- .../search/query/QueryPhaseCollectorTests.java | 10 ++++++++++ .../search/sort/BucketedSortForFloatsTests.java | 6 ++++++ 7 files changed, 49 insertions(+), 2 deletions(-) diff --git a/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java b/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java index 8eae139eb8226..2d3f09fc7243a 100644 --- a/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java +++ b/modules/lang-painless/src/test/java/org/elasticsearch/painless/ScriptedMetricAggContextsTests.java @@ -73,6 +73,11 @@ public void testMapBasic() throws IOException { Map state = new HashMap<>(); Scorable scorer = new Scorable() { + @Override + public int docID() { + return 0; + } + @Override public float score() { return 0.5f; diff --git a/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java b/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java index ed4dcf2072b8d..9c6a788ea2f77 100644 --- a/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java +++ b/modules/parent-join/src/main/java/org/elasticsearch/join/aggregations/ParentJoinAggregator.java @@ -133,6 +133,11 @@ protected void prepareSubAggs(long[] ordsToCollect) throws IOException { public float score() { return 1f; } + + @Override + public int docID() { + return childDocsIter.docID(); + } }); final Bits liveDocs = ctx.reader().getLiveDocs(); diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java index 28e010f541a74..39dfd6e4aac3a 100644 --- a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java +++ 
b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/nested/NestedAggregator.java @@ -206,12 +206,19 @@ void processBufferedChildBuckets() throws IOException { } private static class CachedScorable extends Scorable { + int doc; float score; @Override public final float score() { return score; } + + @Override + public int docID() { + return doc; + } + } } diff --git a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java index c72c4b29a478f..1344604a8d39c 100644 --- a/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java +++ b/server/src/main/java/org/elasticsearch/search/aggregations/bucket/sampler/BestDocsDeferringCollector.java @@ -213,6 +213,7 @@ class PerSegmentCollects extends Scorable { private final AggregationExecutionContext aggCtx; int maxDocId = Integer.MIN_VALUE; private float currentScore; + private int currentDocId = -1; private Scorable currentScorer; PerSegmentCollects(AggregationExecutionContext aggCtx) throws IOException { @@ -247,6 +248,7 @@ public void replayRelatedMatches(List sd) throws IOException { leafCollector.setScorer(this); currentScore = 0; + currentDocId = -1; if (maxDocId < 0) { return; } @@ -256,6 +258,7 @@ public void replayRelatedMatches(List sd) throws IOException { int rebased = scoreDoc.doc - aggCtx.getLeafReaderContext().docBase; if ((rebased >= 0) && (rebased <= maxDocId)) { currentScore = scoreDoc.score; + currentDocId = rebased; // We stored the bucket ID in Lucene's shardIndex property // for convenience. leafCollector.collect(rebased, scoreDoc.shardIndex); @@ -272,6 +275,11 @@ public float score() throws IOException { return currentScore; } + @Override + public int docID() { + return currentDocId; + } + public void collect(int docId, long parentBucket) throws IOException { perBucketSamples = bigArrays.grow(perBucketSamples, parentBucket + 1); PerParentBucketSamples sampler = perBucketSamples.get((int) parentBucket); diff --git a/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java b/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java index ff4ad059559fc..cfb9c4bb83249 100644 --- a/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java +++ b/server/src/test/java/org/elasticsearch/search/aggregations/MultiBucketCollectorTests.java @@ -32,8 +32,14 @@ import static org.hamcrest.Matchers.equalTo; public class MultiBucketCollectorTests extends ESTestCase { - private static class Score extends Scorable { + private static class ScoreAndDoc extends Scorable { float score; + int doc = -1; + + @Override + public int docID() { + return doc; + } @Override public float score() { @@ -240,7 +246,7 @@ public void testSetScorerAfterCollectionTerminated() throws IOException { collector1 = new TerminateAfterBucketCollector(collector1, 1); collector2 = new TerminateAfterBucketCollector(collector2, 2); - Scorable scorer = new Score(); + Scorable scorer = new ScoreAndDoc(); List collectors = Arrays.asList(collector1, collector2); Collections.shuffle(collectors, random()); diff --git a/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java b/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java index dbfd9d83ee887..f222e697488d2 100644 --- 
a/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java +++ b/server/src/test/java/org/elasticsearch/search/query/QueryPhaseCollectorTests.java @@ -1138,6 +1138,11 @@ public void testSetScorerAfterCollectionTerminated() throws IOException { public float score() { return 0; } + + @Override + public int docID() { + return 0; + } }; QueryPhaseCollector queryPhaseCollector = new QueryPhaseCollector( @@ -1467,6 +1472,11 @@ public float score() throws IOException { return 0; } + @Override + public int docID() { + return 0; + } + @Override public void setMinCompetitiveScore(float minScore) { setMinCompetitiveScoreCalled = true; diff --git a/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java b/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java index 7f136a097e24a..0f088d2948fcb 100644 --- a/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java +++ b/server/src/test/java/org/elasticsearch/search/sort/BucketedSortForFloatsTests.java @@ -120,12 +120,18 @@ public void testScorer() throws IOException { } private class MockScorable extends Scorable { + private int doc; private float score; @Override public float score() throws IOException { return score; } + + @Override + public int docID() { + return doc; + } } /** From aa57a1553e3371158c23faed7a5f7c5833a6e18d Mon Sep 17 00:00:00 2001 From: Liam Thompson <32779855+leemthompo@users.noreply.github.com> Date: Thu, 29 Aug 2024 09:13:30 +0100 Subject: [PATCH 035/144] [DOCS] Rewrite "What is Elasticsearch?" (Part 1) (#112213) --- docs/reference/intro.asciidoc | 132 ++++++++++-------- .../search-your-data/near-real-time.asciidoc | 2 +- 2 files changed, 72 insertions(+), 62 deletions(-) diff --git a/docs/reference/intro.asciidoc b/docs/reference/intro.asciidoc index 3fc23b44994a7..cd9c126e7b1fd 100644 --- a/docs/reference/intro.asciidoc +++ b/docs/reference/intro.asciidoc @@ -1,42 +1,70 @@ [[elasticsearch-intro]] == What is {es}? -_**You know, for search (and analysis)**_ - -{es} is the distributed search and analytics engine at the heart of -the {stack}. {ls} and {beats} facilitate collecting, aggregating, and -enriching your data and storing it in {es}. {kib} enables you to -interactively explore, visualize, and share insights into your data and manage -and monitor the stack. {es} is where the indexing, search, and analysis -magic happens. - -{es} provides near real-time search and analytics for all types of data. Whether you -have structured or unstructured text, numerical data, or geospatial data, -{es} can efficiently store and index it in a way that supports fast searches. -You can go far beyond simple data retrieval and aggregate information to discover -trends and patterns in your data. And as your data and query volume grows, the -distributed nature of {es} enables your deployment to grow seamlessly right -along with it. 
- -While not _every_ problem is a search problem, {es} offers speed and flexibility -to handle data in a wide variety of use cases: - -* Add a search box to an app or website -* Store and analyze logs, metrics, and security event data -* Use machine learning to automatically model the behavior of your data in real - time -* Use {es} as a vector database to create, store, and search vector embeddings -* Automate business workflows using {es} as a storage engine -* Manage, integrate, and analyze spatial information using {es} as a geographic - information system (GIS) -* Store and process genetic data using {es} as a bioinformatics research tool - -We’re continually amazed by the novel ways people use search. But whether -your use case is similar to one of these, or you're using {es} to tackle a new -problem, the way you work with your data, documents, and indices in {es} is -the same. + +{es-repo}[{es}] is a distributed search and analytics engine, scalable data store, and vector database built on Apache Lucene. +It's optimized for speed and relevance on production-scale workloads. +Use {es} to search, index, store, and analyze data of all shapes and sizes in near real time. + +[TIP] +==== +{es} has a lot of features. Explore the full list on the https://www.elastic.co/elasticsearch/features[product webpage^]. +==== + +{es} is the heart of the {estc-welcome-current}/stack-components.html[Elastic Stack] and powers the Elastic https://www.elastic.co/enterprise-search[Search], https://www.elastic.co/observability[Observability] and https://www.elastic.co/security[Security] solutions. + +{es} is used for a wide and growing range of use cases. Here are a few examples: + +* *Monitor log and event data*. Store logs, metrics, and event data for observability and security information and event management (SIEM). +* *Build search applications*. Add search capabilities to apps or websites, or build enterprise search engines over your organization's internal data sources. +* *Vector database*. Store and search vectorized data, and create vector embeddings with built-in and third-party natural language processing (NLP) models. +* *Retrieval augmented generation (RAG)*. Use {es} as a retrieval engine to augment Generative AI models. +* *Application and security monitoring*. Monitor and analyze application performance and security data effectively. +* *Machine learning*. Use {ml} to automatically model the behavior of your data in real-time. + +This is just a sample of search, observability, and security use cases enabled by {es}. +Refer to our https://www.elastic.co/customers/success-stories[customer success stories] for concrete examples across a range of industries. +// Link to demos, search labs chatbots + +[discrete] +[[elasticsearch-intro-elastic-stack]] +.What is the Elastic Stack? +******************************* +{es} is the core component of the Elastic Stack, a suite of products for collecting, storing, searching, and visualizing data. +https://www.elastic.co/guide/en/starting-with-the-elasticsearch-platform-and-its-solutions/current/stack-components.html[Learn more about the Elastic Stack]. +******************************* +// TODO: Remove once we've moved Stack Overview to a subpage? + +[discrete] +[[elasticsearch-intro-deploy]] +=== Deployment options + +To use {es}, you need a running instance of the {es} service. +You can deploy {es} in various ways: + +* <>. Get started quickly with a minimal local Docker setup. +* {cloud}/ec-getting-started-trial.html[*Elastic Cloud*]. 
{es} is available as part of our hosted Elastic Stack offering, deployed in the cloud with your provider of choice. Sign up for a https://cloud.elastic.co/registration[14 day free trial]. +* {serverless-docs}/general/sign-up-trial[*Elastic Cloud Serverless* (technical preview)]. Create serverless projects for autoscaled and fully managed {es} deployments. Sign up for a https://cloud.elastic.co/serverless-registration[14 day free trial]. + +**Advanced deployment options** + +* <>. Install, configure, and run {es} on your own premises. +* {ece-ref}/Elastic-Cloud-Enterprise-overview.html[*Elastic Cloud Enterprise*]. Deploy Elastic Cloud on public or private clouds, virtual machines, or your own premises. +* {eck-ref}/k8s-overview.html[*Elastic Cloud on Kubernetes*]. Deploy Elastic Cloud on Kubernetes. + +[discrete] +[[elasticsearch-next-steps]] +=== Learn more + +Here are some resources to help you get started: + +* <>. A beginner's guide to deploying your first {es} instance, indexing data, and running queries. +* https://elastic.co/webinars/getting-started-elasticsearch[Webinar: Introduction to {es}]. Register for our live webinars to learn directly from {es} experts. +* https://www.elastic.co/search-labs[Elastic Search Labs]. Tutorials and blogs that explore AI-powered search using the latest {es} features. +** Follow our tutorial https://www.elastic.co/search-labs/tutorials/search-tutorial/welcome[to build a hybrid search solution in Python]. +** Check out the https://github.com/elastic/elasticsearch-labs?tab=readme-ov-file#elasticsearch-examples--apps[`elasticsearch-labs` repository] for a range of Python notebooks and apps for various use cases. [[documents-indices]] -=== Data in: documents and indices +=== Documents and indices {es} is a distributed document store. Instead of storing information as rows of columnar data, {es} stores complex data structures that have been serialized @@ -65,8 +93,7 @@ behavior makes it easy to index and explore your data--just start indexing documents and {es} will detect and map booleans, floating point and integer values, dates, and strings to the appropriate {es} data types. -Ultimately, however, you know more about your data and how you want to use it -than {es} can. You can define rules to control dynamic mapping and explicitly +You can define rules to control dynamic mapping and explicitly define mappings to take full control of how fields are stored and indexed. Defining your own mappings enables you to: @@ -89,7 +116,7 @@ used at search time. When you query a full-text field, the query text undergoes the same analysis before the terms are looked up in the index. [[search-analyze]] -=== Information out: search and analyze +=== Search and analyze While you can use {es} as a document store and retrieve documents and their metadata, the real power comes from being able to easily access the full suite @@ -160,27 +187,8 @@ size 70 needles, you’re displaying a count of the size 70 needles that match your users' search criteria--for example, all size 70 _non-stick embroidery_ needles. -[discrete] -[[more-features]] -===== But wait, there’s more - -Want to automate the analysis of your time series data? You can use -{ml-docs}/ml-ad-overview.html[machine learning] features to create accurate -baselines of normal behavior in your data and identify anomalous patterns. 
With -machine learning, you can detect: - -* Anomalies related to temporal deviations in values, counts, or frequencies -* Statistical rarity -* Unusual behaviors for a member of a population - -And the best part? You can do this without having to specify algorithms, models, -or other data science-related configurations. - [[scalability]] -=== Scalability and resilience: clusters, nodes, and shards -++++ -Scalability and resilience -++++ +=== Scalability and resilience {es} is built to be always available and to scale with your needs. It does this by being distributed by nature. You can add servers (nodes) to a cluster to @@ -209,7 +217,7 @@ interrupting indexing or query operations. [discrete] [[it-depends]] -==== It depends... +==== Shard size and number of shards There are a number of performance considerations and trade offs with respect to shard size and the number of primary shards configured for an index. The more @@ -237,7 +245,7 @@ testing with your own data and queries]. [discrete] [[disaster-ccr]] -==== In case of disaster +==== Disaster recovery A cluster's nodes need good, reliable connections to each other. To provide better connections, you typically co-locate the nodes in the same data center or @@ -257,7 +265,7 @@ secondary clusters are read-only followers. [discrete] [[admin]] -==== Care and feeding +==== Security, management, and monitoring As with any enterprise system, you need tools to secure, manage, and monitor your {es} clusters. Security, monitoring, and administrative features @@ -265,3 +273,5 @@ that are integrated into {es} enable you to use {kibana-ref}/introduction.html[{ as a control center for managing a cluster. Features like <> and <> help you intelligently manage your data over time. + +Refer to <> for more information. \ No newline at end of file diff --git a/docs/reference/search/search-your-data/near-real-time.asciidoc b/docs/reference/search/search-your-data/near-real-time.asciidoc index 46a996c237c38..47618ecd9fd7a 100644 --- a/docs/reference/search/search-your-data/near-real-time.asciidoc +++ b/docs/reference/search/search-your-data/near-real-time.asciidoc @@ -2,7 +2,7 @@ [[near-real-time]] === Near real-time search -The overview of <> indicates that when a document is stored in {es}, it is indexed and fully searchable in _near real-time_--within 1 second. What defines near real-time search? +When a document is stored in {es}, it is indexed and fully searchable in _near real-time_--within 1 second. What defines near real-time search? Lucene, the Java libraries on which {es} is based, introduced the concept of per-segment search. A _segment_ is similar to an inverted index, but the word _index_ in Lucene means "a collection of segments plus a commit point". After a commit, a new segment is added to the commit point and the buffer is cleared. 
From 320ccbc24748809feecc42df1f7bab6c4d6fd4cc Mon Sep 17 00:00:00 2001 From: Kostas Krikellas <131142368+kkrik-es@users.noreply.github.com> Date: Thu, 29 Aug 2024 11:25:04 +0300 Subject: [PATCH 036/144] Reduce load for stress test to avoid oom (#112331) Fixes #112326 --- .../logsdb/datageneration/DataGeneratorTests.java | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java b/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java index db3b81891e87e..4a4ffca0f37aa 100644 --- a/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java +++ b/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java @@ -113,13 +113,13 @@ protected Collection getPlugins() { } public void testDataGeneratorStressTest() throws IOException { - // Let's generate 1000000 fields to test an extreme case (2 levels of objects + 1 leaf level with 100 fields per object). + // Let's generate 125000 fields to test an extreme case (2 levels of objects + 1 leaf level with 50 fields per object). var testChildFieldGenerator = new DataSourceResponse.ChildFieldGenerator() { private int generatedFields = 0; @Override public int generateChildFieldCount() { - return 100; + return 50; } @Override From 2c29a3ae0a6e743c2df72df5895e90aa56dd2683 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Istv=C3=A1n=20Zolt=C3=A1n=20Szab=C3=B3?= Date: Thu, 29 Aug 2024 12:43:10 +0200 Subject: [PATCH 037/144] [DOCS] Highlights auto-chunking in intro of semantic text. (#111836) --- docs/reference/mapping/types/semantic-text.asciidoc | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/reference/mapping/types/semantic-text.asciidoc b/docs/reference/mapping/types/semantic-text.asciidoc index 522a0c54c8aad..a006f288dc66d 100644 --- a/docs/reference/mapping/types/semantic-text.asciidoc +++ b/docs/reference/mapping/types/semantic-text.asciidoc @@ -7,8 +7,8 @@ beta[] -The `semantic_text` field type automatically generates embeddings for text -content using an inference endpoint. +The `semantic_text` field type automatically generates embeddings for text content using an inference endpoint. +Long passages are <> to smaller sections to enable the processing of larger corpuses of text. The `semantic_text` field type specifies an inference endpoint identifier that will be used to generate embeddings. You can create the inference endpoint by using the <>. From 35fe3a9c47500ab21735f7c40f7184fb7d724f9c Mon Sep 17 00:00:00 2001 From: weizijun Date: Thu, 29 Aug 2024 19:46:58 +0800 Subject: [PATCH 038/144] Minor inference docs fixes (#112332) --- .../inference/service-alibabacloud-ai-search.asciidoc | 2 +- docs/reference/inference/service-amazon-bedrock.asciidoc | 8 -------- 2 files changed, 1 insertion(+), 9 deletions(-) diff --git a/docs/reference/inference/service-alibabacloud-ai-search.asciidoc b/docs/reference/inference/service-alibabacloud-ai-search.asciidoc index df5220573d9e4..23a3d532635ac 100644 --- a/docs/reference/inference/service-alibabacloud-ai-search.asciidoc +++ b/docs/reference/inference/service-alibabacloud-ai-search.asciidoc @@ -25,7 +25,7 @@ include::inference-shared.asciidoc[tag=task-type] Available task types: * `text_embedding`, -* `sparse_embedding`. +* `sparse_embedding`,
-- diff --git a/docs/reference/inference/service-amazon-bedrock.asciidoc b/docs/reference/inference/service-amazon-bedrock.asciidoc index 4ffa368613a0e..dbffd5c26fbcc 100644 --- a/docs/reference/inference/service-amazon-bedrock.asciidoc +++ b/docs/reference/inference/service-amazon-bedrock.asciidoc @@ -122,14 +122,6 @@ Only available for `anthropic`, `cohere`, and `mistral` providers. Alternative to `temperature`. Limits samples to the top-K most likely words, balancing coherence and variability. Should not be used if `temperature` is specified. -===== -+ -.`task_settings` for the `text_embedding` task type -[%collapsible%closed] -===== - -There are no `task_settings` available for the `text_embedding` task type. - ===== [discrete] From b4c8fa362dc88d9d1220c7466ec2c0219a258433 Mon Sep 17 00:00:00 2001 From: Bogdan Pintea Date: Thu, 29 Aug 2024 13:50:24 +0200 Subject: [PATCH 039/144] Reenable 26_aggs_bucket EsqlClientYamlIT (#112343) Reenable 26_aggs_bucket EsqlClientYamlIT, fixed in #111897. Fixes #111901, fixes #111902. --- muted-tests.yml | 6 ------ 1 file changed, 6 deletions(-) diff --git a/muted-tests.yml b/muted-tests.yml index 508403ee6238c..e4c2f62d2617f 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -122,12 +122,6 @@ tests: - class: org.elasticsearch.xpack.restart.CoreFullClusterRestartIT method: testSnapshotRestore {cluster=UPGRADED} issue: https://github.com/elastic/elasticsearch/issues/111799 -- class: org.elasticsearch.xpack.esql.qa.mixed.EsqlClientYamlIT - method: "test {p0=esql/26_aggs_bucket/friendlier BUCKET interval hourly: #110916}" - issue: https://github.com/elastic/elasticsearch/issues/111901 -- class: org.elasticsearch.xpack.esql.qa.mixed.EsqlClientYamlIT - method: "test {p0=esql/26_aggs_bucket/friendlier BUCKET interval: monthly #110916}" - issue: https://github.com/elastic/elasticsearch/issues/111902 - class: org.elasticsearch.xpack.esql.qa.mixed.FieldExtractorIT method: testScaledFloat issue: https://github.com/elastic/elasticsearch/issues/112003 From a97b0e226e3d7ea5e27eb565ae05d01ca22b06a9 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aur=C3=A9lien=20FOUCRET?= Date: Thu, 29 Aug 2024 13:59:16 +0200 Subject: [PATCH 040/144] Fix test failures in ScriptScoreQueryTests (#112334) --- muted-tests.yml | 6 ------ .../elasticsearch/search/query/ScriptScoreQueryTests.java | 2 +- 2 files changed, 1 insertion(+), 7 deletions(-) diff --git a/muted-tests.yml b/muted-tests.yml index e4c2f62d2617f..e80a39040a4ef 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -151,12 +151,6 @@ tests: - class: org.elasticsearch.xpack.ml.integration.MlJobIT method: testDeleteJobAsync issue: https://github.com/elastic/elasticsearch/issues/112212 -- class: org.elasticsearch.search.query.ScriptScoreQueryTests - method: testScriptTermStatsAvailable - issue: https://github.com/elastic/elasticsearch/issues/112278 -- class: org.elasticsearch.search.query.ScriptScoreQueryTests - method: testScriptTermStatsNotAvailable - issue: https://github.com/elastic/elasticsearch/issues/112290 - class: org.elasticsearch.search.retriever.rankdoc.RankDocsSortBuilderTests method: testEqualsAndHashcode issue: https://github.com/elastic/elasticsearch/issues/112312 diff --git a/server/src/test/java/org/elasticsearch/search/query/ScriptScoreQueryTests.java b/server/src/test/java/org/elasticsearch/search/query/ScriptScoreQueryTests.java index d6b1da9f76b42..177968b9a1326 100644 --- a/server/src/test/java/org/elasticsearch/search/query/ScriptScoreQueryTests.java +++ 
b/server/src/test/java/org/elasticsearch/search/query/ScriptScoreQueryTests.java @@ -72,7 +72,7 @@ public void initSearcher() throws IOException { w.commit(); reader = DirectoryReader.open(w); searcher = newSearcher(reader); - leafReaderContext = reader.leaves().get(0); + leafReaderContext = searcher.getTopReaderContext().leaves().get(0); } @After From a69f8e19ed4513d552b24a655f45b38098336b26 Mon Sep 17 00:00:00 2001 From: Albert Zaharovits Date: Thu, 29 Aug 2024 15:09:28 +0300 Subject: [PATCH 041/144] Avoid redundant cluster state build (#112340) Avoid redundant cluster state build when creating index --- .../cluster/metadata/MetadataCreateIndexService.java | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java index b5ee0ebd7e387..b1a19d99dcb19 100644 --- a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java +++ b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java @@ -1249,11 +1249,10 @@ static ClusterState clusterStateCreateIndex( ClusterBlocks.Builder blocks = createClusterBlocksBuilder(currentState, indexName, clusterBlocks); blocks.updateBlocks(indexMetadata); - ClusterState updatedState = ClusterState.builder(currentState).blocks(blocks).metadata(newMetadata).build(); + RoutingTable.Builder routingTableBuilder = RoutingTable.builder(shardRoutingRoleStrategy, currentState.routingTable()) + .addAsNew(newMetadata.index(indexName)); - RoutingTable.Builder routingTableBuilder = RoutingTable.builder(shardRoutingRoleStrategy, updatedState.routingTable()) - .addAsNew(updatedState.metadata().index(indexName)); - return ClusterState.builder(updatedState).routingTable(routingTableBuilder.build()).build(); + return ClusterState.builder(currentState).blocks(blocks).metadata(newMetadata).routingTable(routingTableBuilder).build(); } static IndexMetadata buildIndexMetadata( From cefe358b4197332aca6b4d15d440851033134d61 Mon Sep 17 00:00:00 2001 From: Armin Braun Date: Thu, 29 Aug 2024 14:15:29 +0200 Subject: [PATCH 042/144] Fix DLS using runtime fields and synthetic source (#112341) Somewhat of a tortured test, but this applies the same fix from #112260 to synthetic source, which was running into the same bug as a stored field source.
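In essence, the change below stops indexing the per-segment loader cache by `ctx.ord`, which is only meaningful relative to one top-level reader context (and DLS can present the same leaves under a differently wrapped reader), and instead keys it on the leaf's identity object. A simplified sketch of the resulting pattern, condensed from the diff that follows rather than the verbatim code:

[source,java]
----
// One loader per leaf, keyed on LeafReaderContext#id(), which identifies the
// leaf itself rather than its position within a particular top-level reader.
private final Map<Object, SyntheticSourceLeafLoader> leaves = ConcurrentCollections.newConcurrentMap();

public Source getSource(LeafReaderContext ctx, int doc) throws IOException {
    var loader = leaves.get(ctx.id());
    if (loader == null) {
        // Per the class's threading assumption, an individual leaf is
        // populated by a single thread, so a plain get/put suffices here.
        loader = new SyntheticSourceLeafLoader(ctx);
        leaves.put(ctx.id(), loader);
    }
    return loader.getSource(doc);
}
----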
--- docs/changelog/112341.yaml | 5 +++ .../lookup/SyntheticSourceProvider.java | 36 +++++------------- .../DocumentLevelSecurityRandomTests.java | 38 ++++++++++++++++++- 3 files changed, 52 insertions(+), 27 deletions(-) create mode 100644 docs/changelog/112341.yaml diff --git a/docs/changelog/112341.yaml b/docs/changelog/112341.yaml new file mode 100644 index 0000000000000..8f44b53ad9998 --- /dev/null +++ b/docs/changelog/112341.yaml @@ -0,0 +1,5 @@ +pr: 112341 +summary: Fix DLS using runtime fields and synthetic source +area: Authorization +type: bug +issues: [] diff --git a/server/src/main/java/org/elasticsearch/search/lookup/SyntheticSourceProvider.java b/server/src/main/java/org/elasticsearch/search/lookup/SyntheticSourceProvider.java index bccfc22dc7e95..a4549f0814a06 100644 --- a/server/src/main/java/org/elasticsearch/search/lookup/SyntheticSourceProvider.java +++ b/server/src/main/java/org/elasticsearch/search/lookup/SyntheticSourceProvider.java @@ -8,13 +8,14 @@ package org.elasticsearch.search.lookup; -import org.apache.lucene.index.IndexReaderContext; import org.apache.lucene.index.LeafReaderContext; +import org.elasticsearch.common.util.concurrent.ConcurrentCollections; import org.elasticsearch.index.fieldvisitor.LeafStoredFieldLoader; import org.elasticsearch.index.fieldvisitor.StoredFieldLoader; import org.elasticsearch.index.mapper.SourceLoader; import java.io.IOException; +import java.util.Map; // NB This is written under the assumption that individual segments are accessed by a single // thread, even if separate segments may be searched concurrently. If we ever implement @@ -22,7 +23,7 @@ class SyntheticSourceProvider implements SourceProvider { private final SourceLoader sourceLoader; - private volatile SyntheticSourceLeafLoader[] leafLoaders; + private final Map leaves = ConcurrentCollections.newConcurrentMap(); SyntheticSourceProvider(SourceLoader sourceLoader) { this.sourceLoader = sourceLoader; @@ -30,31 +31,14 @@ class SyntheticSourceProvider implements SourceProvider { @Override public Source getSource(LeafReaderContext ctx, int doc) throws IOException { - maybeInit(ctx); - if (leafLoaders[ctx.ord] == null) { - // individual segments are currently only accessed on one thread so there's no need - // for locking here. 
- leafLoaders[ctx.ord] = new SyntheticSourceLeafLoader(ctx); + final Object id = ctx.id(); + var provider = leaves.get(id); + if (provider == null) { + provider = new SyntheticSourceLeafLoader(ctx); + var existing = leaves.put(id, provider); + assert existing == null : "unexpected source provider [" + existing + "]"; } - return leafLoaders[ctx.ord].getSource(doc); - } - - private void maybeInit(LeafReaderContext ctx) { - if (leafLoaders == null) { - synchronized (this) { - if (leafLoaders == null) { - leafLoaders = new SyntheticSourceLeafLoader[findParentContext(ctx).leaves().size()]; - } - } - } - } - - private IndexReaderContext findParentContext(LeafReaderContext ctx) { - if (ctx.parent != null) { - return ctx.parent; - } - assert ctx.isTopLevel; - return ctx; + return provider.getSource(doc); } private class SyntheticSourceLeafLoader { diff --git a/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java b/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java index fb74631970813..1bf7d89347755 100644 --- a/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java +++ b/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/integration/DocumentLevelSecurityRandomTests.java @@ -144,6 +144,43 @@ public void testWithRuntimeFields() throws Exception { .endObject() ) ); + doTestWithRuntimeFieldsInTestIndex(); + } + + public void testWithRuntimeFieldsAndSyntheticSource() throws Exception { + assertAcked( + indicesAdmin().prepareCreate("test") + .setMapping( + XContentFactory.jsonBuilder() + .startObject() + .startObject("_source") + .field("mode", "synthetic") + .endObject() + .startObject("runtime") + .startObject("field1") + .field("type", "keyword") + .endObject() + .startObject("field2") + .field("type", "keyword") + .endObject() + .endObject() + .startObject("properties") + .startObject("field1") + .field("type", "text") + .field("store", true) + .endObject() + .startObject("field2") + .field("type", "text") + .field("store", true) + .endObject() + .endObject() + .endObject() + ) + ); + doTestWithRuntimeFieldsInTestIndex(); + } + + private void doTestWithRuntimeFieldsInTestIndex() { List requests = new ArrayList<>(47); for (int i = 1; i <= 42; i++) { requests.add(prepareIndex("test").setSource("field1", "value1", "field2", "foo" + i)); @@ -158,5 +195,4 @@ public void testWithRuntimeFields() throws Exception { 42L ); } - } From 9387ce335757194da1986722a98f95338a45a873 Mon Sep 17 00:00:00 2001 From: David Turner Date: Thu, 29 Aug 2024 13:16:37 +0100 Subject: [PATCH 043/144] Deduplicate unstable-cluster troubleshooting docs (#112333) We duplicated these docs in order to avoid breaking older links, but this makes it confusing and hard to link to the right copy of the information. This commit removes the duplication by replacing the docs at the old locations with stubs that link to the new locations. 
--- .../discovery/fault-detection.asciidoc | 295 +--------------- .../troubleshooting-unstable-cluster.asciidoc | 314 +++++++++++++++++- .../common/reference-docs-links.json | 4 +- 3 files changed, 321 insertions(+), 292 deletions(-) diff --git a/docs/reference/modules/discovery/fault-detection.asciidoc b/docs/reference/modules/discovery/fault-detection.asciidoc index d12985b70597c..21f4ae2317e6a 100644 --- a/docs/reference/modules/discovery/fault-detection.asciidoc +++ b/docs/reference/modules/discovery/fault-detection.asciidoc @@ -35,313 +35,30 @@ starting from the beginning of the cluster state update. Refer to [[cluster-fault-detection-troubleshooting]] ==== Troubleshooting an unstable cluster -//tag::troubleshooting[] -Normally, a node will only leave a cluster if deliberately shut down. If a node -leaves the cluster unexpectedly, it's important to address the cause. A cluster -in which nodes leave unexpectedly is unstable and can create several issues. -For instance: -* The cluster health may be yellow or red. - -* Some shards will be initializing and other shards may be failing. - -* Search, indexing, and monitoring operations may fail and report exceptions in -logs. - -* The `.security` index may be unavailable, blocking access to the cluster. - -* The master may appear busy due to frequent cluster state updates. - -To troubleshoot a cluster in this state, first ensure the cluster has a -<>. Next, focus on the nodes -unexpectedly leaving the cluster ahead of all other issues. It will not be -possible to solve other issues until the cluster has a stable master node and -stable node membership. - -Diagnostics and statistics are usually not useful in an unstable cluster. These -tools only offer a view of the state of the cluster at a single point in time. -Instead, look at the cluster logs to see the pattern of behaviour over time. -Focus particularly on logs from the elected master. When a node leaves the -cluster, logs for the elected master include a message like this (with line -breaks added to make it easier to read): - -[source,text] ----- -[2022-03-21T11:02:35,513][INFO ][o.e.c.c.NodeLeftExecutor] [instance-0000000000] - node-left: [{instance-0000000004}{bfcMDTiDRkietFb9v_di7w}{aNlyORLASam1ammv2DzYXA}{172.27.47.21}{172.27.47.21:19054}{m}] - with reason [disconnected] ----- - -This message says that the `NodeLeftExecutor` on the elected master -(`instance-0000000000`) processed a `node-left` task, identifying the node that -was removed and the reason for its removal. When the node joins the cluster -again, logs for the elected master will include a message like this (with line -breaks added to make it easier to read): - -[source,text] ----- -[2022-03-21T11:02:59,892][INFO ][o.e.c.c.NodeJoinExecutor] [instance-0000000000] - node-join: [{instance-0000000004}{bfcMDTiDRkietFb9v_di7w}{UNw_RuazQCSBskWZV8ID_w}{172.27.47.21}{172.27.47.21:19054}{m}] - with reason [joining after restart, removed [24s] ago with reason [disconnected]] ----- - -This message says that the `NodeJoinExecutor` on the elected master -(`instance-0000000000`) processed a `node-join` task, identifying the node that -was added to the cluster and the reason for the task. 
- -Other nodes may log similar messages, but report fewer details: - -[source,text] ----- -[2020-01-29T11:02:36,985][INFO ][o.e.c.s.ClusterApplierService] - [instance-0000000001] removed { - {instance-0000000004}{bfcMDTiDRkietFb9v_di7w}{aNlyORLASam1ammv2DzYXA}{172.27.47.21}{172.27.47.21:19054}{m} - {tiebreaker-0000000003}{UNw_RuazQCSBskWZV8ID_w}{bltyVOQ-RNu20OQfTHSLtA}{172.27.161.154}{172.27.161.154:19251}{mv} - }, term: 14, version: 1653415, reason: Publication{term=14, version=1653415} ----- - -These messages are not especially useful for troubleshooting, so focus on the -ones from the `NodeLeftExecutor` and `NodeJoinExecutor` which are only emitted -on the elected master and which contain more details. If you don't see the -messages from the `NodeLeftExecutor` and `NodeJoinExecutor`, check that: - -* You're looking at the logs for the elected master node. - -* The logs cover the correct time period. - -* Logging is enabled at `INFO` level. - -Nodes will also log a message containing `master node changed` whenever they -start or stop following the elected master. You can use these messages to -determine each node's view of the state of the master over time. - -If a node restarts, it will leave the cluster and then join the cluster again. -When it rejoins, the `NodeJoinExecutor` will log that it processed a -`node-join` task indicating that the node is `joining after restart`. If a node -is unexpectedly restarting, look at the node's logs to see why it is shutting -down. - -The <> API on the affected node will also provide some useful -information about the situation. - -If the node did not restart then you should look at the reason for its -departure more closely. Each reason has different troubleshooting steps, -described below. There are three possible reasons: - -* `disconnected`: The connection from the master node to the removed node was -closed. - -* `lagging`: The master published a cluster state update, but the removed node -did not apply it within the permitted timeout. By default, this timeout is 2 -minutes. Refer to <> for information about the -settings which control this mechanism. - -* `followers check retry count exceeded`: The master sent a number of -consecutive health checks to the removed node. These checks were rejected or -timed out. By default, each health check times out after 10 seconds and {es} -removes the node removed after three consecutively failed health checks. Refer -to <> for information about the settings which -control this mechanism. +See <>. [discrete] ===== Diagnosing `disconnected` nodes -Nodes typically leave the cluster with reason `disconnected` when they shut -down, but if they rejoin the cluster without restarting then there is some -other problem. - -{es} is designed to run on a fairly reliable network. It opens a number of TCP -connections between nodes and expects these connections to remain open -<>. If a connection is closed then {es} will -try and reconnect, so the occasional blip may fail some in-flight operations -but should otherwise have limited impact on the cluster. In contrast, -repeatedly-dropped connections will severely affect its operation. - -The connections from the elected master node to every other node in the cluster -are particularly important. The elected master never spontaneously closes its -outbound connections to other nodes. Similarly, once an inbound connection is -fully established, a node never spontaneously it unless the node is shutting -down. 
- -If you see a node unexpectedly leave the cluster with the `disconnected` -reason, something other than {es} likely caused the connection to close. A -common cause is a misconfigured firewall with an improper timeout or another -policy that's <>. It could also -be caused by general connectivity issues, such as packet loss due to faulty -hardware or network congestion. If you're an advanced user, configure the -following loggers to get more detailed information about network exceptions: - -[source,yaml] ----- -logger.org.elasticsearch.transport.TcpTransport: DEBUG -logger.org.elasticsearch.xpack.core.security.transport.netty4.SecurityNetty4Transport: DEBUG ----- - -If these logs do not show enough information to diagnose the problem, obtain a -packet capture simultaneously from the nodes at both ends of an unstable -connection and analyse it alongside the {es} logs from those nodes to determine -if traffic between the nodes is being disrupted by another device on the -network. +See <>. [discrete] ===== Diagnosing `lagging` nodes -{es} needs every node to process cluster state updates reasonably quickly. If a -node takes too long to process a cluster state update, it can be harmful to the -cluster. The master will remove these nodes with the `lagging` reason. Refer to -<> for information about the settings which control -this mechanism. - -Lagging is typically caused by performance issues on the removed node. However, -a node may also lag due to severe network delays. To rule out network delays, -ensure that `net.ipv4.tcp_retries2` is <>. Log messages that contain `warn threshold` may provide more -information about the root cause. - -If you're an advanced user, you can get more detailed information about what -the node was doing when it was removed by configuring the following logger: - -[source,yaml] ----- -logger.org.elasticsearch.cluster.coordination.LagDetector: DEBUG ----- - -When this logger is enabled, {es} will attempt to run the -<> API on the faulty node and report the results in -the logs on the elected master. The results are compressed, encoded, and split -into chunks to avoid truncation: - -[source,text] ----- -[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 1]: H4sIAAAAAAAA/x... -[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 2]: p7x3w1hmOQVtuV... -[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 3]: v7uTboMGDbyOy+... -[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 4]: 4tse0RnPnLeDNN... -[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] (gzip compressed, base64-encoded, and split into 4 parts on preceding log lines) ----- - -To reconstruct the output, base64-decode the data and decompress it using -`gzip`. For instance, on Unix-like systems: - -[source,sh] ----- -cat lagdetector.log | sed -e 's/.*://' | base64 --decode | gzip --decompress ----- +See <>. 
[discrete] ===== Diagnosing `follower check retry count exceeded` nodes -Nodes sometimes leave the cluster with reason `follower check retry count -exceeded` when they shut down, but if they rejoin the cluster without -restarting then there is some other problem. - -{es} needs every node to respond to network messages successfully and -reasonably quickly. If a node rejects requests or does not respond at all then -it can be harmful to the cluster. If enough consecutive checks fail then the -master will remove the node with reason `follower check retry count exceeded` -and will indicate in the `node-left` message how many of the consecutive -unsuccessful checks failed and how many of them timed out. Refer to -<> for information about the settings which control -this mechanism. - -Timeouts and failures may be due to network delays or performance problems on -the affected nodes. Ensure that `net.ipv4.tcp_retries2` is -<> to eliminate network delays as -a possible cause for this kind of instability. Log messages containing -`warn threshold` may give further clues about the cause of the instability. - -If the last check failed with an exception then the exception is reported, and -typically indicates the problem that needs to be addressed. If any of the -checks timed out then narrow down the problem as follows. - -include::../../troubleshooting/network-timeouts.asciidoc[tag=troubleshooting-network-timeouts-gc-vm] - -include::../../troubleshooting/network-timeouts.asciidoc[tag=troubleshooting-network-timeouts-packet-capture-fault-detection] - -include::../../troubleshooting/network-timeouts.asciidoc[tag=troubleshooting-network-timeouts-threads] - -By default the follower checks will time out after 30s, so if node departures -are unpredictable then capture stack dumps every 15s to be sure that at least -one stack dump was taken at the right time. +See <>. [discrete] ===== Diagnosing `ShardLockObtainFailedException` failures -If a node leaves and rejoins the cluster then {es} will usually shut down and -re-initialize its shards. If the shards do not shut down quickly enough then -{es} may fail to re-initialize them due to a `ShardLockObtainFailedException`. - -To gather more information about the reason for shards shutting down slowly, -configure the following logger: - -[source,yaml] ----- -logger.org.elasticsearch.env.NodeEnvironment: DEBUG ----- - -When this logger is enabled, {es} will attempt to run the -<> API whenever it encounters a -`ShardLockObtainFailedException`. The results are compressed, encoded, and -split into chunks to avoid truncation: - -[source,text] ----- -[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 1]: H4sIAAAAAAAA/x... -[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 2]: p7x3w1hmOQVtuV... -[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 3]: v7uTboMGDbyOy+... -[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 4]: 4tse0RnPnLeDNN... -[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] (gzip compressed, base64-encoded, and split into 4 parts on preceding log lines) ----- - -To reconstruct the output, base64-decode the data and decompress it using -`gzip`. 
For instance, on Unix-like systems: - -[source,sh] ----- -cat shardlock.log | sed -e 's/.*://' | base64 --decode | gzip --decompress ----- +See <>. [discrete] ===== Diagnosing other network disconnections -{es} is designed to run on a fairly reliable network. It opens a number of TCP -connections between nodes and expects these connections to remain open -<>. If a connection is closed then {es} will -try and reconnect, so the occasional blip may fail some in-flight operations -but should otherwise have limited impact on the cluster. In contrast, -repeatedly-dropped connections will severely affect its operation. - -{es} nodes will only actively close an outbound connection to another node if -the other node leaves the cluster. See -<> for further information about -identifying and troubleshooting this situation. If an outbound connection -closes for some other reason, nodes will log a message such as the following: - -[source,text] ----- -[INFO ][o.e.t.ClusterConnectionManager] [node-1] transport connection to [{node-2}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] closed by remote ----- - -Similarly, once an inbound connection is fully established, a node never -spontaneously closes it unless the node is shutting down. - -Therefore if you see a node report that a connection to another node closed -unexpectedly, something other than {es} likely caused the connection to close. -A common cause is a misconfigured firewall with an improper timeout or another -policy that's <>. It could also -be caused by general connectivity issues, such as packet loss due to faulty -hardware or network congestion. If you're an advanced user, configure the -following loggers to get more detailed information about network exceptions: - -[source,yaml] ----- -logger.org.elasticsearch.transport.TcpTransport: DEBUG -logger.org.elasticsearch.xpack.core.security.transport.netty4.SecurityNetty4Transport: DEBUG ----- - -If these logs do not show enough information to diagnose the problem, obtain a -packet capture simultaneously from the nodes at both ends of an unstable -connection and analyse it alongside the {es} logs from those nodes to determine -if traffic between the nodes is being disrupted by another device on the -network. -//end::troubleshooting[] +See <>. diff --git a/docs/reference/troubleshooting/troubleshooting-unstable-cluster.asciidoc b/docs/reference/troubleshooting/troubleshooting-unstable-cluster.asciidoc index 387ebcdcd43c0..cbb35f7731034 100644 --- a/docs/reference/troubleshooting/troubleshooting-unstable-cluster.asciidoc +++ b/docs/reference/troubleshooting/troubleshooting-unstable-cluster.asciidoc @@ -1,4 +1,316 @@ [[troubleshooting-unstable-cluster]] == Troubleshooting an unstable cluster -include::../modules/discovery/fault-detection.asciidoc[tag=troubleshooting,leveloffset=-2] \ No newline at end of file +Normally, a node will only leave a cluster if deliberately shut down. If a node +leaves the cluster unexpectedly, it's important to address the cause. A cluster +in which nodes leave unexpectedly is unstable and can create several issues. +For instance: + +* The cluster health may be yellow or red. + +* Some shards will be initializing and other shards may be failing. + +* Search, indexing, and monitoring operations may fail and report exceptions in +logs. + +* The `.security` index may be unavailable, blocking access to the cluster. + +* The master may appear busy due to frequent cluster state updates. + +To troubleshoot a cluster in this state, first ensure the cluster has a +<>. 
Next, focus on the nodes +unexpectedly leaving the cluster ahead of all other issues. It will not be +possible to solve other issues until the cluster has a stable master node and +stable node membership. + +Diagnostics and statistics are usually not useful in an unstable cluster. These +tools only offer a view of the state of the cluster at a single point in time. +Instead, look at the cluster logs to see the pattern of behaviour over time. +Focus particularly on logs from the elected master. When a node leaves the +cluster, logs for the elected master include a message like this (with line +breaks added to make it easier to read): + +[source,text] +---- +[2022-03-21T11:02:35,513][INFO ][o.e.c.c.NodeLeftExecutor] [instance-0000000000] + node-left: [{instance-0000000004}{bfcMDTiDRkietFb9v_di7w}{aNlyORLASam1ammv2DzYXA}{172.27.47.21}{172.27.47.21:19054}{m}] + with reason [disconnected] +---- + +This message says that the `NodeLeftExecutor` on the elected master +(`instance-0000000000`) processed a `node-left` task, identifying the node that +was removed and the reason for its removal. When the node joins the cluster +again, logs for the elected master will include a message like this (with line +breaks added to make it easier to read): + +[source,text] +---- +[2022-03-21T11:02:59,892][INFO ][o.e.c.c.NodeJoinExecutor] [instance-0000000000] + node-join: [{instance-0000000004}{bfcMDTiDRkietFb9v_di7w}{UNw_RuazQCSBskWZV8ID_w}{172.27.47.21}{172.27.47.21:19054}{m}] + with reason [joining after restart, removed [24s] ago with reason [disconnected]] +---- + +This message says that the `NodeJoinExecutor` on the elected master +(`instance-0000000000`) processed a `node-join` task, identifying the node that +was added to the cluster and the reason for the task. + +Other nodes may log similar messages, but report fewer details: + +[source,text] +---- +[2020-01-29T11:02:36,985][INFO ][o.e.c.s.ClusterApplierService] + [instance-0000000001] removed { + {instance-0000000004}{bfcMDTiDRkietFb9v_di7w}{aNlyORLASam1ammv2DzYXA}{172.27.47.21}{172.27.47.21:19054}{m} + {tiebreaker-0000000003}{UNw_RuazQCSBskWZV8ID_w}{bltyVOQ-RNu20OQfTHSLtA}{172.27.161.154}{172.27.161.154:19251}{mv} + }, term: 14, version: 1653415, reason: Publication{term=14, version=1653415} +---- + +These messages are not especially useful for troubleshooting, so focus on the +ones from the `NodeLeftExecutor` and `NodeJoinExecutor` which are only emitted +on the elected master and which contain more details. If you don't see the +messages from the `NodeLeftExecutor` and `NodeJoinExecutor`, check that: + +* You're looking at the logs for the elected master node. + +* The logs cover the correct time period. + +* Logging is enabled at `INFO` level. + +Nodes will also log a message containing `master node changed` whenever they +start or stop following the elected master. You can use these messages to +determine each node's view of the state of the master over time. + +If a node restarts, it will leave the cluster and then join the cluster again. +When it rejoins, the `NodeJoinExecutor` will log that it processed a +`node-join` task indicating that the node is `joining after restart`. If a node +is unexpectedly restarting, look at the node's logs to see why it is shutting +down. + +The <> API on the affected node will also provide some useful +information about the situation. + +If the node did not restart then you should look at the reason for its +departure more closely. Each reason has different troubleshooting steps, +described below. 
There are three possible reasons: + +* `disconnected`: The connection from the master node to the removed node was +closed. + +* `lagging`: The master published a cluster state update, but the removed node +did not apply it within the permitted timeout. By default, this timeout is 2 +minutes. Refer to <> for information about the +settings which control this mechanism. + +* `followers check retry count exceeded`: The master sent a number of +consecutive health checks to the removed node. These checks were rejected or +timed out. By default, each health check times out after 10 seconds and {es} +removes the node after three consecutively failed health checks. Refer +to <> for information about the settings which +control this mechanism. + +[discrete] +[[troubleshooting-unstable-cluster-disconnected]] +=== Diagnosing `disconnected` nodes + +Nodes typically leave the cluster with reason `disconnected` when they shut +down, but if they rejoin the cluster without restarting then there is some +other problem. + +{es} is designed to run on a fairly reliable network. It opens a number of TCP +connections between nodes and expects these connections to remain open +<>. If a connection is closed then {es} will +try and reconnect, so the occasional blip may fail some in-flight operations +but should otherwise have limited impact on the cluster. In contrast, +repeatedly-dropped connections will severely affect its operation. + +The connections from the elected master node to every other node in the cluster +are particularly important. The elected master never spontaneously closes its +outbound connections to other nodes. Similarly, once an inbound connection is +fully established, a node never spontaneously closes it unless the node is +shutting down. + +If you see a node unexpectedly leave the cluster with the `disconnected` +reason, something other than {es} likely caused the connection to close. A +common cause is a misconfigured firewall with an improper timeout or another +policy that's <>. It could also +be caused by general connectivity issues, such as packet loss due to faulty +hardware or network congestion. If you're an advanced user, configure the +following loggers to get more detailed information about network exceptions: + +[source,yaml] +---- +logger.org.elasticsearch.transport.TcpTransport: DEBUG +logger.org.elasticsearch.xpack.core.security.transport.netty4.SecurityNetty4Transport: DEBUG +---- + +If these logs do not show enough information to diagnose the problem, obtain a +packet capture simultaneously from the nodes at both ends of an unstable +connection and analyse it alongside the {es} logs from those nodes to determine +if traffic between the nodes is being disrupted by another device on the +network. + +[discrete] +[[troubleshooting-unstable-cluster-lagging]] +=== Diagnosing `lagging` nodes + +{es} needs every node to process cluster state updates reasonably quickly. If a +node takes too long to process a cluster state update, it can be harmful to the +cluster. The master will remove these nodes with the `lagging` reason. Refer to +<> for information about the settings which control +this mechanism. + +Lagging is typically caused by performance issues on the removed node. However, +a node may also lag due to severe network delays. To rule out network delays, +ensure that `net.ipv4.tcp_retries2` is <>. Log messages that contain `warn threshold` may provide more +information about the root cause.
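+ +For example, on a Linux host you can inspect and adjust this kernel setting with `sysctl`. The following is a minimal sketch rather than official guidance, and the value shown is illustrative; use the value recommended by the linked configuration advice: + +[source,sh] +---- +# show the current TCP retransmission setting +sysctl net.ipv4.tcp_retries2 +# lower it on the running system (illustrative value) +sysctl -w net.ipv4.tcp_retries2=5 +# persist the change across reboots +echo 'net.ipv4.tcp_retries2=5' >> /etc/sysctl.conf +----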
+ +If you're an advanced user, you can get more detailed information about what +the node was doing when it was removed by configuring the following logger: + +[source,yaml] +---- +logger.org.elasticsearch.cluster.coordination.LagDetector: DEBUG +---- + +When this logger is enabled, {es} will attempt to run the +<> API on the faulty node and report the results in +the logs on the elected master. The results are compressed, encoded, and split +into chunks to avoid truncation: + +[source,text] +---- +[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 1]: H4sIAAAAAAAA/x... +[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 2]: p7x3w1hmOQVtuV... +[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 3]: v7uTboMGDbyOy+... +[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] [part 4]: 4tse0RnPnLeDNN... +[DEBUG][o.e.c.c.LagDetector ] [master] hot threads from node [{node}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] lagging at version [183619] despite commit of cluster state version [183620] (gzip compressed, base64-encoded, and split into 4 parts on preceding log lines) +---- + +To reconstruct the output, base64-decode the data and decompress it using +`gzip`. For instance, on Unix-like systems: + +[source,sh] +---- +cat lagdetector.log | sed -e 's/.*://' | base64 --decode | gzip --decompress +---- + +[discrete] +[[troubleshooting-unstable-cluster-follower-check]] +=== Diagnosing `follower check retry count exceeded` nodes + +Nodes sometimes leave the cluster with reason `follower check retry count +exceeded` when they shut down, but if they rejoin the cluster without +restarting then there is some other problem. + +{es} needs every node to respond to network messages successfully and +reasonably quickly. If a node rejects requests or does not respond at all then +it can be harmful to the cluster. If enough consecutive checks fail then the +master will remove the node with reason `follower check retry count exceeded` +and will indicate in the `node-left` message how many of the consecutive +unsuccessful checks failed and how many of them timed out. Refer to +<> for information about the settings which control +this mechanism. + +Timeouts and failures may be due to network delays or performance problems on +the affected nodes. Ensure that `net.ipv4.tcp_retries2` is +<> to eliminate network delays as +a possible cause for this kind of instability. Log messages containing +`warn threshold` may give further clues about the cause of the instability. + +If the last check failed with an exception then the exception is reported, and +typically indicates the problem that needs to be addressed. If any of the +checks timed out then narrow down the problem as follows. 
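+ +One way to do this is to capture stack dumps from the affected node on a repeating schedule, so that at least one dump lands while a check is in flight. This is a minimal sketch, not an {es} tool: it assumes a Unix-like system, that `jstack` from the node's JDK is on the `PATH`, and that the hypothetical variable `ES_PID` holds the {es} process id: + +[source,sh] +---- +# take a stack dump of the Elasticsearch JVM every 15 seconds +# (ES_PID is assumed to hold the process id; adjust to your setup) +while true; do jstack "$ES_PID" > "stackdump-$(date +%s).txt"; sleep 15; done +---- + +The reasoning behind the 15 second interval is explained below.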
+ +include::network-timeouts.asciidoc[tag=troubleshooting-network-timeouts-gc-vm] + +include::network-timeouts.asciidoc[tag=troubleshooting-network-timeouts-packet-capture-fault-detection] + +include::network-timeouts.asciidoc[tag=troubleshooting-network-timeouts-threads] + +By default the follower checks will time out after 30s, so if node departures +are unpredictable then capture stack dumps every 15s to be sure that at least +one stack dump was taken at the right time. + +[discrete] +[[troubleshooting-unstable-cluster-shardlockobtainfailedexception]] +=== Diagnosing `ShardLockObtainFailedException` failures + +If a node leaves and rejoins the cluster then {es} will usually shut down and +re-initialize its shards. If the shards do not shut down quickly enough then +{es} may fail to re-initialize them due to a `ShardLockObtainFailedException`. + +To gather more information about the reason for shards shutting down slowly, +configure the following logger: + +[source,yaml] +---- +logger.org.elasticsearch.env.NodeEnvironment: DEBUG +---- + +When this logger is enabled, {es} will attempt to run the +<> API whenever it encounters a +`ShardLockObtainFailedException`. The results are compressed, encoded, and +split into chunks to avoid truncation: + +[source,text] +---- +[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 1]: H4sIAAAAAAAA/x... +[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 2]: p7x3w1hmOQVtuV... +[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 3]: v7uTboMGDbyOy+... +[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] [part 4]: 4tse0RnPnLeDNN... +[DEBUG][o.e.e.NodeEnvironment ] [master] hot threads while failing to obtain shard lock for [index][0] (gzip compressed, base64-encoded, and split into 4 parts on preceding log lines) +---- + +To reconstruct the output, base64-decode the data and decompress it using +`gzip`. For instance, on Unix-like systems: + +[source,sh] +---- +cat shardlock.log | sed -e 's/.*://' | base64 --decode | gzip --decompress +---- + +[discrete] +[[troubleshooting-unstable-cluster-network]] +=== Diagnosing other network disconnections + +{es} is designed to run on a fairly reliable network. It opens a number of TCP +connections between nodes and expects these connections to remain open +<>. If a connection is closed then {es} will +try and reconnect, so the occasional blip may fail some in-flight operations +but should otherwise have limited impact on the cluster. In contrast, +repeatedly-dropped connections will severely affect its operation. + +{es} nodes will only actively close an outbound connection to another node if +the other node leaves the cluster. See +<> for further information about +identifying and troubleshooting this situation. If an outbound connection +closes for some other reason, nodes will log a message such as the following: + +[source,text] +---- +[INFO ][o.e.t.ClusterConnectionManager] [node-1] transport connection to [{node-2}{g3cCUaMDQJmQ2ZLtjr-3dg}{10.0.0.1:9300}] closed by remote +---- + +Similarly, once an inbound connection is fully established, a node never +spontaneously closes it unless the node is shutting down. + +Therefore if you see a node report that a connection to another node closed +unexpectedly, something other than {es} likely caused the connection to close. 
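+ +To locate these close events quickly, you can search the server logs on each node for the connection manager messages shown above. This is a minimal sketch that assumes the default JSON log layout under the node's `logs` directory; adjust the file pattern if your logging is customized: + +[source,sh] +---- +# find transport connection close events in the server logs +# (*_server.json is the default server log file name pattern) +grep 'ClusterConnectionManager' logs/*_server.json +----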
A common cause is a misconfigured firewall with an improper timeout or another +policy that's <>. It could also +be caused by general connectivity issues, such as packet loss due to faulty +hardware or network congestion. If you're an advanced user, configure the +following loggers to get more detailed information about network exceptions: + +[source,yaml] +---- +logger.org.elasticsearch.transport.TcpTransport: DEBUG +logger.org.elasticsearch.xpack.core.security.transport.netty4.SecurityNetty4Transport: DEBUG +---- + +If these logs do not show enough information to diagnose the problem, obtain a +packet capture simultaneously from the nodes at both ends of an unstable +connection and analyse it alongside the {es} logs from those nodes to determine +if traffic between the nodes is being disrupted by another device on the +network. diff --git a/server/src/main/resources/org/elasticsearch/common/reference-docs-links.json b/server/src/main/resources/org/elasticsearch/common/reference-docs-links.json index 3eb8939c22a65..cc0bc5e2257c8 100644 --- a/server/src/main/resources/org/elasticsearch/common/reference-docs-links.json +++ b/server/src/main/resources/org/elasticsearch/common/reference-docs-links.json @@ -2,8 +2,8 @@ "INITIAL_MASTER_NODES": "important-settings.html#initial_master_nodes", "DISCOVERY_TROUBLESHOOTING": "discovery-troubleshooting.html", "UNSTABLE_CLUSTER_TROUBLESHOOTING": "troubleshooting-unstable-cluster.html", - "LAGGING_NODE_TROUBLESHOOTING": "troubleshooting-unstable-cluster.html#_diagnosing_lagging_nodes_2", - "SHARD_LOCK_TROUBLESHOOTING": "troubleshooting-unstable-cluster.html#_diagnosing_shardlockobtainfailedexception_failures_2", + "LAGGING_NODE_TROUBLESHOOTING": "troubleshooting-unstable-cluster.html#troubleshooting-unstable-cluster-lagging", + "SHARD_LOCK_TROUBLESHOOTING": "troubleshooting-unstable-cluster.html#troubleshooting-unstable-cluster-shardlockobtainfailedexception", "CONCURRENT_REPOSITORY_WRITERS": "diagnosing-corrupted-repositories.html", "ARCHIVE_INDICES": "archive-indices.html", "HTTP_TRACER": "modules-network.html#http-rest-request-tracer", From 5ac4d8c71e06880624a9a91bfec4ae310d9cab2f Mon Sep 17 00:00:00 2001 From: Craig Taverner Date: Thu, 29 Aug 2024 14:48:15 +0200 Subject: [PATCH 044/144] Fix union-types where one index is missing the field (#111932) * Fix union-types where one index is missing the field When none of the indexes has the field, a validation error is correctly thrown, and when all indexes have the field, union-types works as normal. But when some indexes have the field and some do not, we were getting an internal error. We treat this case similarly to when some documents are missing the field, in which case `null` values are produced. So now a multi-index query where some indexes are missing the field will produce nulls for the documents coming from those indexes.
* Update docs/changelog/111932.yaml * Added capability for this fix (missing-field) --- docs/changelog/111932.yaml | 6 ++ .../xpack/esql/CsvTestsDataLoader.java | 6 ++ .../mapping-missing_ip_sample_data.json | 13 ++++ .../main/resources/missing_ip_sample_data.csv | 8 +++ .../src/main/resources/union_types.csv-spec | 68 +++++++++++++++++++ .../xpack/esql/action/EsqlCapabilities.java | 5 ++ .../planner/EsPhysicalOperationProviders.java | 4 +- 7 files changed, 109 insertions(+), 1 deletion(-) create mode 100644 docs/changelog/111932.yaml create mode 100644 x-pack/plugin/esql/qa/testFixtures/src/main/resources/mapping-missing_ip_sample_data.json create mode 100644 x-pack/plugin/esql/qa/testFixtures/src/main/resources/missing_ip_sample_data.csv diff --git a/docs/changelog/111932.yaml b/docs/changelog/111932.yaml new file mode 100644 index 0000000000000..ce840ecebcff0 --- /dev/null +++ b/docs/changelog/111932.yaml @@ -0,0 +1,6 @@ +pr: 111932 +summary: Fix union-types where one index is missing the field +area: ES|QL +type: bug +issues: + - 111912 diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/java/org/elasticsearch/xpack/esql/CsvTestsDataLoader.java b/x-pack/plugin/esql/qa/testFixtures/src/main/java/org/elasticsearch/xpack/esql/CsvTestsDataLoader.java index b20e3bb0d5409..9ee22113a4244 100644 --- a/x-pack/plugin/esql/qa/testFixtures/src/main/java/org/elasticsearch/xpack/esql/CsvTestsDataLoader.java +++ b/x-pack/plugin/esql/qa/testFixtures/src/main/java/org/elasticsearch/xpack/esql/CsvTestsDataLoader.java @@ -68,6 +68,11 @@ public class CsvTestsDataLoader { "mapping-sample_data_ts_long.json", "sample_data_ts_long.csv" ); + private static final TestsDataset MISSING_IP_SAMPLE_DATA = new TestsDataset( + "missing_ip_sample_data", + "mapping-missing_ip_sample_data.json", + "missing_ip_sample_data.csv" + ); private static final TestsDataset CLIENT_IPS = new TestsDataset("clientips", "mapping-clientips.json", "clientips.csv"); private static final TestsDataset CLIENT_CIDR = new TestsDataset("client_cidr", "mapping-client_cidr.json", "client_cidr.csv"); private static final TestsDataset AGES = new TestsDataset("ages", "mapping-ages.json", "ages.csv"); @@ -112,6 +117,7 @@ public class CsvTestsDataLoader { Map.entry(ALERTS.indexName, ALERTS), Map.entry(SAMPLE_DATA_STR.indexName, SAMPLE_DATA_STR), Map.entry(SAMPLE_DATA_TS_LONG.indexName, SAMPLE_DATA_TS_LONG), + Map.entry(MISSING_IP_SAMPLE_DATA.indexName, MISSING_IP_SAMPLE_DATA), Map.entry(CLIENT_IPS.indexName, CLIENT_IPS), Map.entry(CLIENT_CIDR.indexName, CLIENT_CIDR), Map.entry(AGES.indexName, AGES), diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/mapping-missing_ip_sample_data.json b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/mapping-missing_ip_sample_data.json new file mode 100644 index 0000000000000..6f3796dd7715d --- /dev/null +++ b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/mapping-missing_ip_sample_data.json @@ -0,0 +1,13 @@ +{ + "properties": { + "@timestamp": { + "type": "date" + }, + "event_duration": { + "type": "long" + }, + "message": { + "type": "keyword" + } + } +} diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/missing_ip_sample_data.csv b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/missing_ip_sample_data.csv new file mode 100644 index 0000000000000..e8e9ddcaee83b --- /dev/null +++ b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/missing_ip_sample_data.csv @@ -0,0 +1,8 @@ +@timestamp:date,event_duration:long,message:keyword 
+2023-10-23T13:55:01.543Z,1756467,Connected to 10.1.0.1 +2023-10-23T13:53:55.832Z,5033755,Connection error +2023-10-23T13:52:55.015Z,8268153,Connection error +2023-10-23T13:51:54.732Z,725448,Connection error +2023-10-23T13:33:34.937Z,1232382,Disconnected +2023-10-23T12:27:28.948Z,2764889,Connected to 10.1.0.2 +2023-10-23T12:15:03.360Z,3450233,Connected to 10.1.0.3 diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/union_types.csv-spec b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/union_types.csv-spec index 6819727be0131..c6a2d47a78dc9 100644 --- a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/union_types.csv-spec +++ b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/union_types.csv-spec @@ -405,6 +405,74 @@ count:long | message:keyword 2 | Connected to 10.1.0.3 ; +multiIndexMissingIpToString +required_capability: union_types +required_capability: union_types_missing_field + +FROM sample_data, sample_data_str, missing_ip_sample_data METADATA _index +| EVAL client_ip = TO_STRING(client_ip) +| KEEP _index, @timestamp, client_ip, event_duration, message +| SORT _index ASC, @timestamp DESC +; + +_index:keyword | @timestamp:date | client_ip:keyword | event_duration:long | message:keyword +missing_ip_sample_data | 2023-10-23T13:55:01.543Z | null | 1756467 | Connected to 10.1.0.1 +missing_ip_sample_data | 2023-10-23T13:53:55.832Z | null | 5033755 | Connection error +missing_ip_sample_data | 2023-10-23T13:52:55.015Z | null | 8268153 | Connection error +missing_ip_sample_data | 2023-10-23T13:51:54.732Z | null | 725448 | Connection error +missing_ip_sample_data | 2023-10-23T13:33:34.937Z | null | 1232382 | Disconnected +missing_ip_sample_data | 2023-10-23T12:27:28.948Z | null | 2764889 | Connected to 10.1.0.2 +missing_ip_sample_data | 2023-10-23T12:15:03.360Z | null | 3450233 | Connected to 10.1.0.3 +sample_data | 2023-10-23T13:55:01.543Z | 172.21.3.15 | 1756467 | Connected to 10.1.0.1 +sample_data | 2023-10-23T13:53:55.832Z | 172.21.3.15 | 5033755 | Connection error +sample_data | 2023-10-23T13:52:55.015Z | 172.21.3.15 | 8268153 | Connection error +sample_data | 2023-10-23T13:51:54.732Z | 172.21.3.15 | 725448 | Connection error +sample_data | 2023-10-23T13:33:34.937Z | 172.21.0.5 | 1232382 | Disconnected +sample_data | 2023-10-23T12:27:28.948Z | 172.21.2.113 | 2764889 | Connected to 10.1.0.2 +sample_data | 2023-10-23T12:15:03.360Z | 172.21.2.162 | 3450233 | Connected to 10.1.0.3 +sample_data_str | 2023-10-23T13:55:01.543Z | 172.21.3.15 | 1756467 | Connected to 10.1.0.1 +sample_data_str | 2023-10-23T13:53:55.832Z | 172.21.3.15 | 5033755 | Connection error +sample_data_str | 2023-10-23T13:52:55.015Z | 172.21.3.15 | 8268153 | Connection error +sample_data_str | 2023-10-23T13:51:54.732Z | 172.21.3.15 | 725448 | Connection error +sample_data_str | 2023-10-23T13:33:34.937Z | 172.21.0.5 | 1232382 | Disconnected +sample_data_str | 2023-10-23T12:27:28.948Z | 172.21.2.113 | 2764889 | Connected to 10.1.0.2 +sample_data_str | 2023-10-23T12:15:03.360Z | 172.21.2.162 | 3450233 | Connected to 10.1.0.3 +; + +multiIndexMissingIpToIp +required_capability: union_types +required_capability: union_types_missing_field + +FROM sample_data, sample_data_str, missing_ip_sample_data METADATA _index +| EVAL client_ip = TO_IP(client_ip) +| KEEP _index, @timestamp, client_ip, event_duration, message +| SORT _index ASC, @timestamp DESC +; + +_index:keyword | @timestamp:date | client_ip:ip | event_duration:long | message:keyword +missing_ip_sample_data | 2023-10-23T13:55:01.543Z | null | 
1756467 | Connected to 10.1.0.1 +missing_ip_sample_data | 2023-10-23T13:53:55.832Z | null | 5033755 | Connection error +missing_ip_sample_data | 2023-10-23T13:52:55.015Z | null | 8268153 | Connection error +missing_ip_sample_data | 2023-10-23T13:51:54.732Z | null | 725448 | Connection error +missing_ip_sample_data | 2023-10-23T13:33:34.937Z | null | 1232382 | Disconnected +missing_ip_sample_data | 2023-10-23T12:27:28.948Z | null | 2764889 | Connected to 10.1.0.2 +missing_ip_sample_data | 2023-10-23T12:15:03.360Z | null | 3450233 | Connected to 10.1.0.3 +sample_data | 2023-10-23T13:55:01.543Z | 172.21.3.15 | 1756467 | Connected to 10.1.0.1 +sample_data | 2023-10-23T13:53:55.832Z | 172.21.3.15 | 5033755 | Connection error +sample_data | 2023-10-23T13:52:55.015Z | 172.21.3.15 | 8268153 | Connection error +sample_data | 2023-10-23T13:51:54.732Z | 172.21.3.15 | 725448 | Connection error +sample_data | 2023-10-23T13:33:34.937Z | 172.21.0.5 | 1232382 | Disconnected +sample_data | 2023-10-23T12:27:28.948Z | 172.21.2.113 | 2764889 | Connected to 10.1.0.2 +sample_data | 2023-10-23T12:15:03.360Z | 172.21.2.162 | 3450233 | Connected to 10.1.0.3 +sample_data_str | 2023-10-23T13:55:01.543Z | 172.21.3.15 | 1756467 | Connected to 10.1.0.1 +sample_data_str | 2023-10-23T13:53:55.832Z | 172.21.3.15 | 5033755 | Connection error +sample_data_str | 2023-10-23T13:52:55.015Z | 172.21.3.15 | 8268153 | Connection error +sample_data_str | 2023-10-23T13:51:54.732Z | 172.21.3.15 | 725448 | Connection error +sample_data_str | 2023-10-23T13:33:34.937Z | 172.21.0.5 | 1232382 | Disconnected +sample_data_str | 2023-10-23T12:27:28.948Z | 172.21.2.113 | 2764889 | Connected to 10.1.0.2 +sample_data_str | 2023-10-23T12:15:03.360Z | 172.21.2.162 | 3450233 | Connected to 10.1.0.3 +; + multiIndexTsLong required_capability: union_types required_capability: metadata_fields diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java index 81b2ba71b8808..120323ebeb7a6 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/action/EsqlCapabilities.java @@ -183,6 +183,11 @@ public enum Cap { */ UNION_TYPES_FIX_RENAME_RESOLUTION, + /** + * Fix for union-types when some indexes are missing the required field. Done in #111932. + */ + UNION_TYPES_MISSING_FIELD, + /** * Fix a parsing issue where numbers below Long.MIN_VALUE threw an exception instead of parsing as doubles. * see Parsing large numbers is inconsistent #104323 diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/EsPhysicalOperationProviders.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/EsPhysicalOperationProviders.java index 8fddb7407a02a..04be731484267 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/EsPhysicalOperationProviders.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/EsPhysicalOperationProviders.java @@ -138,7 +138,9 @@ private BlockLoader getBlockLoaderFor( if (unionTypes != null) { String indexName = shardContext.ctx.index().getName(); Expression conversion = unionTypes.getConversionExpressionForIndex(indexName); - return new TypeConvertingBlockLoader(blockLoader, (AbstractConvertFunction) conversion); + return conversion == null + ? 
BlockLoader.CONSTANT_NULLS + : new TypeConvertingBlockLoader(blockLoader, (AbstractConvertFunction) conversion); } return blockLoader; } From 5c200afb9e3a02400cfdf45c4469c30bd1417223 Mon Sep 17 00:00:00 2001 From: "Mark J. Hoy" Date: Thu, 29 Aug 2024 09:12:03 -0400 Subject: [PATCH 045/144] [ML] Adds Explain Functionality to LTR Rescoring (#112155) --- .../integration/LearningToRankRescorerIT.java | 433 ++++++++++-------- .../inference/ltr/LearningToRankRescorer.java | 55 ++- 2 files changed, 303 insertions(+), 185 deletions(-) diff --git a/x-pack/plugin/ml/qa/single-node-tests/src/javaRestTest/java/org/elasticsearch/xpack/ml/integration/LearningToRankRescorerIT.java b/x-pack/plugin/ml/qa/single-node-tests/src/javaRestTest/java/org/elasticsearch/xpack/ml/integration/LearningToRankRescorerIT.java index b2a0b60aed7ba..4a703117c6551 100644 --- a/x-pack/plugin/ml/qa/single-node-tests/src/javaRestTest/java/org/elasticsearch/xpack/ml/integration/LearningToRankRescorerIT.java +++ b/x-pack/plugin/ml/qa/single-node-tests/src/javaRestTest/java/org/elasticsearch/xpack/ml/integration/LearningToRankRescorerIT.java @@ -16,7 +16,9 @@ import org.junit.Before; import java.io.IOException; +import java.util.ArrayList; import java.util.List; +import java.util.Map; import static org.hamcrest.Matchers.containsString; import static org.hamcrest.Matchers.equalTo; @@ -28,189 +30,11 @@ public class LearningToRankRescorerIT extends InferenceTestCase { @Before public void setupModelAndData() throws IOException { - putRegressionModel(MODEL_ID, """ - { - "description": "super complex model for tests", - "inference_config": { - "learning_to_rank": { - "feature_extractors": [ - { - "query_extractor": { - "feature_name": "cost", - "query": {"script_score": {"query": {"match_all":{}}, "script": {"source": "return doc['cost'].value;"}}} - } - }, - { - "query_extractor": { - "feature_name": "type_tv", - "query": {"constant_score": {"filter": {"term": { "product": "TV" }}, "boost": 1.0}} - } - }, - { - "query_extractor": { - "feature_name": "type_vcr", - "query": {"constant_score": {"filter": {"term": { "product": "VCR" }}, "boost": 1.0}} - } - }, - { - "query_extractor": { - "feature_name": "type_laptop", - "query": {"constant_score": {"filter": {"term": { "product": "Laptop" }}, "boost": 1.0}} - } - }, - { - "query_extractor": { - "feature_name": "two", - "query": { "script_score": { "query": { "match_all": {} }, "script": { "source": "return 2.0;" } } } - } - }, - { - "query_extractor": { - "feature_name": "product_bm25", - "query": { "term": { "product": "{{keyword}}" } } - } - } - ] - } - }, - "definition": { - "trained_model": { - "ensemble": { - "feature_names": ["cost", "type_tv", "type_vcr", "type_laptop", "two", "product_bm25"], - "target_type": "regression", - "trained_models": [ - { - "tree": { - "feature_names": [ - "cost" - ], - "tree_structure": [ - { - "node_index": 0, - "split_feature": 0, - "split_gain": 12, - "threshold": 400, - "decision_type": "lte", - "default_left": true, - "left_child": 1, - "right_child": 2 - }, - { - "node_index": 1, - "leaf_value": 5.0 - }, - { - "node_index": 2, - "leaf_value": 2.0 - } - ], - "target_type": "regression" - } - }, - { - "tree": { - "feature_names": [ - "type_tv" - ], - "tree_structure": [ - { - "node_index": 0, - "split_feature": 0, - "split_gain": 12, - "threshold": 1, - "decision_type": "lt", - "default_left": true, - "left_child": 1, - "right_child": 2 - }, - { - "node_index": 1, - "leaf_value": 1.0 - }, - { - "node_index": 2, - "leaf_value": 12.0 - } - ], - 
"target_type": "regression" - } - }, - { - "tree": { - "feature_names": [ - "two" - ], - "tree_structure": [ - { - "node_index": 0, - "split_feature": 0, - "split_gain": 12, - "threshold": 1, - "decision_type": "lt", - "default_left": true, - "left_child": 1, - "right_child": 2 - }, - { - "node_index": 1, - "leaf_value": 1.0 - }, - { - "node_index": 2, - "leaf_value": 2.0 - } - ], - "target_type": "regression" - } - }, - { - "tree": { - "feature_names": [ - "product_bm25" - ], - "tree_structure": [ - { - "node_index": 0, - "split_feature": 0, - "split_gain": 12, - "threshold": 1, - "decision_type": "lt", - "default_left": true, - "left_child": 1, - "right_child": 2 - }, - { - "node_index": 1, - "leaf_value": 1.0 - }, - { - "node_index": 2, - "leaf_value": 4.0 - } - ], - "target_type": "regression" - } - } - ] - } - } - } - } - """); - createIndex(INDEX_NAME, Settings.EMPTY, """ - "properties":{ - "product":{"type": "keyword"}, - "cost":{"type": "integer"} - }"""); - indexData("{ \"product\": \"TV\", \"cost\": 300}"); - indexData("{ \"product\": \"TV\", \"cost\": 400}"); - indexData("{ \"product\": \"TV\", \"cost\": 600}"); - indexData("{ \"product\": \"VCR\", \"cost\": 15}"); - indexData("{ \"product\": \"VCR\", \"cost\": 350}"); - indexData("{ \"product\": \"VCR\", \"cost\": 580}"); - indexData("{ \"product\": \"Laptop\", \"cost\": 100}"); - indexData("{ \"product\": \"Laptop\", \"cost\": 300}"); - indexData("{ \"product\": \"Laptop\", \"cost\": 500}"); + putRegressionModel(MODEL_ID, testRegressionModel); + createIndex(INDEX_NAME, Settings.EMPTY, testIndexDefinition); + for (String testDataItem : testIndexData) { + indexData(testDataItem); + } adminClient().performRequest(new Request("POST", INDEX_NAME + "/_refresh")); } @@ -249,6 +73,19 @@ public void testLearningToRankRescore() throws Exception { assertHitScores(client().performRequest(request), List.of(9.0, 9.0, 6.0)); } + public void testLearningToRankRescoreWithExplain() throws Exception { + Request request = new Request("GET", "store/_search?size=3&explain=true&error_trace"); + request.setJsonEntity(""" + { + "rescore": { + "window_size": 10, + "learning_to_rank": { "model_id": "ltr-model" } + } + }"""); + var response = client().performRequest(request); + assertExplainExtractedFeatures(response, List.of("type_tv", "cost", "two")); + } + public void testLearningToRankRescoreSmallWindow() throws Exception { Request request = new Request("GET", "store/_search?size=5"); request.setJsonEntity(""" @@ -336,4 +173,234 @@ private void indexData(String data) throws IOException { private static void assertHitScores(Response response, List expectedScores) throws IOException { assertThat((List) XContentMapValues.extractValue("hits.hits._score", responseAsMap(response)), equalTo(expectedScores)); } + + @SuppressWarnings("unchecked") + private static void assertExplainExtractedFeatures(Response response, List expectedFeatures) throws IOException { + var explainValues = (ArrayList>) XContentMapValues.extractValue( + "hits.hits._explanation", + responseAsMap(response) + ); + + assertThat(explainValues.size(), equalTo(3)); + for (Map hit : explainValues) { + assertThat(hit.get("description"), equalTo("rescored using LTR model ltr-model")); + + var queryDetails = (ArrayList>) hit.get("details"); + assertThat(queryDetails.size(), equalTo(2)); + + assertThat(queryDetails.get(0).get("description"), equalTo("first pass query score")); + assertThat(queryDetails.get(1).get("description"), equalTo("extracted features")); + + var featureDetails = new 
ArrayList<>((ArrayList>) queryDetails.get(1).get("details")); + assertThat(featureDetails.size(), equalTo(3)); + + var missingKeys = new ArrayList(); + for (String expectedFeature : expectedFeatures) { + var expectedDescription = Strings.format("feature value for [%s]", expectedFeature); + + var wasFound = false; + for (Map detailItem : featureDetails) { + if (detailItem.get("description").equals(expectedDescription)) { + featureDetails.remove(detailItem); + wasFound = true; + break; + } + } + + if (wasFound == false) { + missingKeys.add(expectedFeature); + } + } + + assertThat(Strings.format("Could not find features: [%s]", String.join(", ", missingKeys)), featureDetails.size(), equalTo(0)); + } + } + + private static String testIndexDefinition = """ + "properties":{ + "product":{"type": "keyword"}, + "cost":{"type": "integer"} + }"""; + + private static List testIndexData = List.of( + "{ \"product\": \"TV\", \"cost\": 300}", + "{ \"product\": \"TV\", \"cost\": 400}", + "{ \"product\": \"TV\", \"cost\": 600}", + "{ \"product\": \"VCR\", \"cost\": 15}", + "{ \"product\": \"VCR\", \"cost\": 350}", + "{ \"product\": \"VCR\", \"cost\": 580}", + "{ \"product\": \"Laptop\", \"cost\": 100}", + "{ \"product\": \"Laptop\", \"cost\": 300}", + "{ \"product\": \"Laptop\", \"cost\": 500}" + ); + + private static String testRegressionModel = """ + { + "description": "super complex model for tests", + "inference_config": { + "learning_to_rank": { + "feature_extractors": [ + { + "query_extractor": { + "feature_name": "cost", + "query": {"script_score": {"query": {"match_all":{}}, "script": {"source": "return doc['cost'].value;"}}} + } + }, + { + "query_extractor": { + "feature_name": "type_tv", + "query": {"constant_score": {"filter": {"term": { "product": "TV" }}, "boost": 1.0}} + } + }, + { + "query_extractor": { + "feature_name": "type_vcr", + "query": {"constant_score": {"filter": {"term": { "product": "VCR" }}, "boost": 1.0}} + } + }, + { + "query_extractor": { + "feature_name": "type_laptop", + "query": {"constant_score": {"filter": {"term": { "product": "Laptop" }}, "boost": 1.0}} + } + }, + { + "query_extractor": { + "feature_name": "two", + "query": { "script_score": { "query": { "match_all": {} }, "script": { "source": "return 2.0;" } } } + } + }, + { + "query_extractor": { + "feature_name": "product_bm25", + "query": { "term": { "product": "{{keyword}}" } } + } + } + ] + } + }, + "definition": { + "trained_model": { + "ensemble": { + "feature_names": ["cost", "type_tv", "type_vcr", "type_laptop", "two", "product_bm25"], + "target_type": "regression", + "trained_models": [ + { + "tree": { + "feature_names": [ + "cost" + ], + "tree_structure": [ + { + "node_index": 0, + "split_feature": 0, + "split_gain": 12, + "threshold": 400, + "decision_type": "lte", + "default_left": true, + "left_child": 1, + "right_child": 2 + }, + { + "node_index": 1, + "leaf_value": 5.0 + }, + { + "node_index": 2, + "leaf_value": 2.0 + } + ], + "target_type": "regression" + } + }, + { + "tree": { + "feature_names": [ + "type_tv" + ], + "tree_structure": [ + { + "node_index": 0, + "split_feature": 0, + "split_gain": 12, + "threshold": 1, + "decision_type": "lt", + "default_left": true, + "left_child": 1, + "right_child": 2 + }, + { + "node_index": 1, + "leaf_value": 1.0 + }, + { + "node_index": 2, + "leaf_value": 12.0 + } + ], + "target_type": "regression" + } + }, + { + "tree": { + "feature_names": [ + "two" + ], + "tree_structure": [ + { + "node_index": 0, + "split_feature": 0, + "split_gain": 12, + "threshold": 1, + 
"decision_type": "lt", + "default_left": true, + "left_child": 1, + "right_child": 2 + }, + { + "node_index": 1, + "leaf_value": 1.0 + }, + { + "node_index": 2, + "leaf_value": 2.0 + } + ], + "target_type": "regression" + } + }, + { + "tree": { + "feature_names": [ + "product_bm25" + ], + "tree_structure": [ + { + "node_index": 0, + "split_feature": 0, + "split_gain": 12, + "threshold": 1, + "decision_type": "lt", + "default_left": true, + "left_child": 1, + "right_child": 2 + }, + { + "node_index": 1, + "leaf_value": 1.0 + }, + { + "node_index": 2, + "leaf_value": 4.0 + } + ], + "target_type": "regression" + } + } + ] + } + } + } + } + """; } diff --git a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ltr/LearningToRankRescorer.java b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ltr/LearningToRankRescorer.java index 8a310ba2719f2..70d0b980bb3bf 100644 --- a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ltr/LearningToRankRescorer.java +++ b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/ltr/LearningToRankRescorer.java @@ -28,6 +28,7 @@ import java.util.Comparator; import java.util.List; import java.util.Map; +import java.util.Objects; import java.util.Set; import static java.util.stream.Collectors.toUnmodifiableSet; @@ -129,8 +130,58 @@ public TopDocs rescore(TopDocs topDocs, IndexSearcher searcher, RescoreContext r @Override public Explanation explain(int topLevelDocId, IndexSearcher searcher, RescoreContext rescoreContext, Explanation sourceExplanation) throws IOException { - // TODO: Call infer again but with individual feature importance values and explaining the model (which features are used, etc.) - return null; + if (sourceExplanation == null) { + return Explanation.noMatch("no match found"); + } + + LearningToRankRescorerContext ltrContext = (LearningToRankRescorerContext) rescoreContext; + LocalModel localModelDefinition = ltrContext.regressionModelDefinition; + + if (localModelDefinition == null) { + throw new IllegalStateException("local model reference is null, missing rewriteAndFetch before rescore phase?"); + } + + List leaves = ltrContext.executionContext.searcher().getIndexReader().leaves(); + + int endDoc = 0; + int readerUpto = -1; + LeafReaderContext currentSegment = null; + + while (topLevelDocId >= endDoc) { + readerUpto++; + currentSegment = leaves.get(readerUpto); + endDoc = currentSegment.docBase + currentSegment.reader().maxDoc(); + } + + assert currentSegment != null : "Unexpected null segment"; + + int targetDoc = topLevelDocId - currentSegment.docBase; + + List featureExtractors = ltrContext.buildFeatureExtractors(searcher); + int featureSize = featureExtractors.stream().mapToInt(fe -> fe.featureNames().size()).sum(); + + Map features = Maps.newMapWithExpectedSize(featureSize); + + for (FeatureExtractor featureExtractor : featureExtractors) { + featureExtractor.setNextReader(currentSegment); + featureExtractor.addFeatures(features, targetDoc); + } + + // Predicting the value + var ltrScore = ((Number) localModelDefinition.inferLtr(features, ltrContext.learningToRankConfig).predictedValue()).floatValue(); + + List featureExplanations = new ArrayList<>(); + for (String featureName : features.keySet()) { + Number featureValue = Objects.requireNonNullElse((Number) features.get(featureName), 0); + featureExplanations.add(Explanation.match(featureValue, "feature value for [" + featureName + "]")); + } + + return Explanation.match( + ltrScore, + "rescored using LTR model " + 
ltrContext.regressionModelDefinition.getModelId(), + Explanation.match(sourceExplanation.getValue(), "first pass query score", sourceExplanation), + Explanation.match(0f, "extracted features", featureExplanations) + ); } /** Returns a new {@link TopDocs} with the topN from the incoming one, or the same TopDocs if the number of hits is already <= From e36b5551ab418860e9db84cdaa96dc2e0df30d6b Mon Sep 17 00:00:00 2001 From: Nik Everett Date: Thu, 29 Aug 2024 09:44:15 -0400 Subject: [PATCH 046/144] ESQL: Method to convert BooleanBlock to a "mask" (#112253) This adds a method, `BooleanBlock#toMask` to convert `BooleanBlock`s into a "mask" for use with `keepMask`. --- .../compute/data/BooleanArrayBlock.java | 21 ++++++ .../compute/data/BooleanBigArrayBlock.java | 21 ++++++ .../compute/data/BooleanBlock.java | 7 ++ .../compute/data/BooleanVectorBlock.java | 6 ++ .../compute/data/ConstantNullBlock.java | 5 ++ .../elasticsearch/compute/data/ToMask.java | 22 +++++++ .../compute/data/X-ArrayBlock.java.st | 22 +++++++ .../compute/data/X-BigArrayBlock.java.st | 23 +++++++ .../compute/data/X-Block.java.st | 10 ++- .../compute/data/X-Vector.java.st | 2 +- .../compute/data/X-VectorBlock.java.st | 9 ++- .../compute/data/BasicBlockTests.java | 41 +++++++++++- .../data/BigArrayBlockBuilderTests.java | 66 +++++++++++++++++++ .../compute/data/BigArrayVectorTests.java | 6 ++ .../compute/data/BlockMultiValuedTests.java | 49 ++++++++++++++ 15 files changed, 306 insertions(+), 4 deletions(-) create mode 100644 x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ToMask.java diff --git a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanArrayBlock.java b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanArrayBlock.java index 14f6c9591ed10..3d600bec1bd65 100644 --- a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanArrayBlock.java +++ b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanArrayBlock.java @@ -85,6 +85,27 @@ public BooleanVector asVector() { return null; } + @Override + public ToMask toMask() { + if (getPositionCount() == 0) { + return new ToMask(blockFactory().newConstantBooleanVector(false, 0), false); + } + try (BooleanVector.FixedBuilder builder = blockFactory().newBooleanVectorFixedBuilder(getPositionCount())) { + boolean hasMv = false; + for (int p = 0; p < getPositionCount(); p++) { + builder.appendBoolean(switch (getValueCount(p)) { + case 0 -> false; + case 1 -> getBoolean(getFirstValueIndex(p)); + default -> { + hasMv = true; + yield false; + } + }); + } + return new ToMask(builder.build(), hasMv); + } + } + @Override public boolean getBoolean(int valueIndex) { return vector.getBoolean(valueIndex); diff --git a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBigArrayBlock.java b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBigArrayBlock.java index 5342728af4fee..f353512eb93b7 100644 --- a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBigArrayBlock.java +++ b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBigArrayBlock.java @@ -86,6 +86,27 @@ public BooleanVector asVector() { return null; } + @Override + public ToMask toMask() { + if (getPositionCount() == 0) { + return new ToMask(blockFactory().newConstantBooleanVector(false, 0), false); + } + try 
(BooleanVector.FixedBuilder builder = blockFactory().newBooleanVectorFixedBuilder(getPositionCount())) { + boolean hasMv = false; + for (int p = 0; p < getPositionCount(); p++) { + builder.appendBoolean(switch (getValueCount(p)) { + case 0 -> false; + case 1 -> getBoolean(getFirstValueIndex(p)); + default -> { + hasMv = true; + yield false; + } + }); + } + return new ToMask(builder.build(), hasMv); + } + } + @Override public boolean getBoolean(int valueIndex) { return vector.getBoolean(valueIndex); diff --git a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBlock.java b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBlock.java index 566b8fbed445c..5d2d6c97a11f1 100644 --- a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBlock.java +++ b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanBlock.java @@ -37,6 +37,13 @@ public sealed interface BooleanBlock extends Block permits BooleanArrayBlock, Bo @Override BooleanVector asVector(); + /** + * Convert this to a {@link BooleanVector "mask"} that's appropriate for + * passing to {@link #keepMask}. Null and multivalued positions will be + * converted to {@code false}. + */ + ToMask toMask(); + @Override BooleanBlock filter(int... positions); diff --git a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanVectorBlock.java b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanVectorBlock.java index ca2fc58bf0bb5..1544cc3355cd0 100644 --- a/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanVectorBlock.java +++ b/x-pack/plugin/esql/compute/src/main/generated-src/org/elasticsearch/compute/data/BooleanVectorBlock.java @@ -31,6 +31,12 @@ public BooleanVector asVector() { return vector; } + @Override + public ToMask toMask() { + vector.incRef(); + return new ToMask(vector, false); + } + @Override public boolean getBoolean(int valueIndex) { return vector.getBoolean(valueIndex); diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ConstantNullBlock.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ConstantNullBlock.java index fc4cdc1d41f46..3d61613ba70e9 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ConstantNullBlock.java +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ConstantNullBlock.java @@ -48,6 +48,11 @@ public OrdinalBytesRefBlock asOrdinals() { return null; } + @Override + public ToMask toMask() { + return new ToMask(blockFactory.newConstantBooleanVector(false, positionCount), false); + } + @Override public boolean isNull(int position) { return true; diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ToMask.java b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ToMask.java new file mode 100644 index 0000000000000..5b71679048e21 --- /dev/null +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/ToMask.java @@ -0,0 +1,22 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.compute.data; + +import org.elasticsearch.core.Releasable; + +/** + * Result from calling {@link BooleanBlock#toMask}. {@link #close closing} this will + * close the contained {@link #mask()}. If you want to keep a reference to it then you'll + * have to {@link Block#incRef()} it. + */ +public record ToMask(BooleanVector mask, boolean hadMultivaluedFields) implements Releasable { + @Override + public void close() { + mask.close(); + } +} diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-ArrayBlock.java.st b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-ArrayBlock.java.st index 750de95e7b8d7..e855e6d6296d8 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-ArrayBlock.java.st +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-ArrayBlock.java.st @@ -101,6 +101,28 @@ $if(BytesRef)$ public OrdinalBytesRefBlock asOrdinals() { return null; } + +$elseif(boolean)$ + @Override + public ToMask toMask() { + if (getPositionCount() == 0) { + return new ToMask(blockFactory().newConstantBooleanVector(false, 0), false); + } + try (BooleanVector.FixedBuilder builder = blockFactory().newBooleanVectorFixedBuilder(getPositionCount())) { + boolean hasMv = false; + for (int p = 0; p < getPositionCount(); p++) { + builder.appendBoolean(switch (getValueCount(p)) { + case 0 -> false; + case 1 -> getBoolean(getFirstValueIndex(p)); + default -> { + hasMv = true; + yield false; + } + }); + } + return new ToMask(builder.build(), hasMv); + } + } $endif$ @Override diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-BigArrayBlock.java.st b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-BigArrayBlock.java.st index bf9e6fec18726..23632bf41349c 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-BigArrayBlock.java.st +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-BigArrayBlock.java.st @@ -86,6 +86,29 @@ public final class $Type$BigArrayBlock extends AbstractArrayBlock implements $Ty return null; } +$if(boolean)$ + @Override + public ToMask toMask() { + if (getPositionCount() == 0) { + return new ToMask(blockFactory().newConstantBooleanVector(false, 0), false); + } + try (BooleanVector.FixedBuilder builder = blockFactory().newBooleanVectorFixedBuilder(getPositionCount())) { + boolean hasMv = false; + for (int p = 0; p < getPositionCount(); p++) { + builder.appendBoolean(switch (getValueCount(p)) { + case 0 -> false; + case 1 -> getBoolean(getFirstValueIndex(p)); + default -> { + hasMv = true; + yield false; + } + }); + } + return new ToMask(builder.build(), hasMv); + } + } +$endif$ + @Override public $type$ get$Type$(int valueIndex) { return vector.get$Type$(valueIndex); diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Block.java.st b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Block.java.st index da0769af2d185..67e4ac4bb334f 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Block.java.st +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Block.java.st @@ -63,8 +63,16 @@ $if(BytesRef)$ * returns null. Callers must not release the returned block as no extra reference is retained by this method. 
*/ OrdinalBytesRefBlock asOrdinals(); -$endif$ +$elseif(boolean)$ + /** + * Convert this to a {@link BooleanVector "mask"} that's appropriate for + * passing to {@link #keepMask}. Null and multivalued positions will be + * converted to {@code false}. + */ + ToMask toMask(); + +$endif$ @Override $Type$Block filter(int... positions); diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Vector.java.st b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Vector.java.st index 09f11f3504393..e19c1788cdb6b 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Vector.java.st +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-Vector.java.st @@ -51,8 +51,8 @@ $if(BytesRef)$ * returns null. Callers must not release the returned vector as no extra reference is retained by this method. */ OrdinalBytesRefVector asOrdinals(); -$endif$ +$endif$ @Override $Type$Vector filter(int... positions); diff --git a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-VectorBlock.java.st b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-VectorBlock.java.st index eec75f62f22f8..d4c6859e64b2a 100644 --- a/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-VectorBlock.java.st +++ b/x-pack/plugin/esql/compute/src/main/java/org/elasticsearch/compute/data/X-VectorBlock.java.st @@ -44,8 +44,15 @@ $if(BytesRef)$ return null; } } -$endif$ +$elseif(boolean)$ + @Override + public ToMask toMask() { + vector.incRef(); + return new ToMask(vector, false); + } + +$endif$ @Override $if(BytesRef)$ public BytesRef getBytesRef(int valueIndex, BytesRef dest) { diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BasicBlockTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BasicBlockTests.java index e8401048af011..ad372da47d6b8 100644 --- a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BasicBlockTests.java +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BasicBlockTests.java @@ -800,6 +800,12 @@ public void testBooleanBlock() { } assertLookup(block, positions(blockFactory, positionCount + 1000), singletonList(null)); assertEmptyLookup(blockFactory, block); + try (ToMask mask = block.toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(false)); + for (int p = 0; p < positionCount; p++) { + assertThat(mask.mask().getBoolean(p), equalTo(p % 10 == 0)); + } + } try (BooleanBlock.Builder blockBuilder = blockFactory.newBooleanBlockBuilder(1)) { BooleanBlock copy = blockBuilder.copyFrom(block, 0, block.getPositionCount()).build(); @@ -826,6 +832,7 @@ public void testBooleanBlock() { IntStream.range(0, positionCount).mapToObj(ii -> randomBoolean()).forEach(vectorBuilder::appendBoolean); BooleanVector vector = vectorBuilder.build(); assertSingleValueDenseBlock(vector.asBlock()); + assertToMask(vector); releaseAndAssertBreaker(vector.asBlock()); } } @@ -1358,6 +1365,19 @@ void assertNullValues( assertTrue(block.isNull(randomNullPosition)); assertFalse(block.isNull(randomNonNullPosition)); releaseAndAssertBreaker(block); + if (block instanceof BooleanBlock bb) { + try (ToMask mask = bb.toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(false)); + for (int p = 0; p < positionCount; p++) { + assertThat(mask.mask().getBoolean(p), equalTo(nullsMask.get(p) == false && p % 10 == 0)); + } + } + } + } + + void 
assertZeroPositionsAndRelease(BooleanBlock block) { + assertToMaskZeroPositions(block); + assertZeroPositionsAndRelease((Block) block); } void assertZeroPositionsAndRelease(Block block) { @@ -1366,6 +1386,11 @@ void assertZeroPositionsAndRelease(Block block) { releaseAndAssertBreaker(block); } + void assertZeroPositionsAndRelease(BooleanVector vector) { + assertToMask(vector); + assertZeroPositionsAndRelease((Vector) vector); + } + void assertZeroPositionsAndRelease(Vector vector) { assertThat(vector.getPositionCount(), is(0)); assertKeepMaskEmpty(vector); @@ -1386,6 +1411,20 @@ static void assertKeepMaskEmpty(Vector vector) { } } + static void assertToMaskZeroPositions(BooleanBlock block) { + try (ToMask mask = block.toMask()) { + assertThat(mask.mask().getPositionCount(), equalTo(0)); + assertThat(mask.hadMultivaluedFields(), equalTo(false)); + } + } + + static void assertToMask(BooleanVector vector) { + try (ToMask mask = vector.asBlock().toMask()) { + assertThat(mask.mask(), sameInstance(vector)); + assertThat(mask.hadMultivaluedFields(), equalTo(false)); + } + } + void releaseAndAssertBreaker(Block... blocks) { assertThat(breaker.getUsed(), greaterThan(0L)); Page[] pages = Arrays.stream(blocks).map(Page::new).toArray(Page[]::new); @@ -1836,7 +1875,7 @@ static void assertKeepMask(Block block) { /** * Build a random valid "mask" of single valued boolean fields that. */ - private static BooleanVector randomMask(int positions) { + static BooleanVector randomMask(int positions) { try (BooleanVector.Builder builder = TestBlockFactory.getNonBreakingInstance().newBooleanVectorFixedBuilder(positions)) { for (int i = 0; i < positions; i++) { builder.appendBoolean(randomBoolean()); diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayBlockBuilderTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayBlockBuilderTests.java index df32dcaddd927..34d591cd87d84 100644 --- a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayBlockBuilderTests.java +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayBlockBuilderTests.java @@ -164,6 +164,12 @@ public void testBooleanVector() throws IOException { assertThat(block.getBoolean(i), equalTo(elements[i])); } assertKeepMask(block); + try (ToMask mask = block.toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(false)); + for (int p = 0; p < elements.length; p++) { + assertThat(mask.mask().getBoolean(p), equalTo(elements[p])); + } + } try (var copy = serializeDeserializeBlock(block)) { assertThat(copy, instanceOf(BooleanVectorBlock.class)); assertThat(block.asVector(), instanceOf(BooleanArrayVector.class)); @@ -224,6 +230,12 @@ public void testBooleanBlock() throws IOException { assertThat(block.getBoolean(i), equalTo(elements[i])); } assertKeepMask(block); + try (ToMask mask = block.toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(true)); + for (int p = 0; p < elements.length; p++) { + assertThat(mask.mask().getBoolean(p), equalTo(false)); + } + } try (var copy = serializeDeserializeBlock(block)) { assertThat(copy, instanceOf(BooleanArrayBlock.class)); assertNull(copy.asVector()); @@ -253,6 +265,12 @@ public void testBooleanBlock() throws IOException { assertThat(block.getBoolean(i), equalTo(elements[i])); } assertKeepMask(block); + try (ToMask mask = block.toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(true)); + for (int p = 0; p < elements.length; p++) { + 
assertThat(mask.mask().getBoolean(p), equalTo(false)); + } + } try (var copy = serializeDeserializeBlock(block)) { assertThat(copy, instanceOf(BooleanBigArrayBlock.class)); assertNull(block.asVector()); @@ -266,4 +284,52 @@ public void testBooleanBlock() throws IOException { } assertThat(blockFactory.breaker().getUsed(), equalTo(0L)); } + + /** + * Tests a block with one value being multivalued and the rest are single valued. + */ + public void testBooleanBlockOneMv() { + int mvCount = between(2, 10); + int positionCount = randomIntBetween(1000, 5000); + blockFactory = new BlockFactory(blockFactory.breaker(), blockFactory.bigArrays(), ByteSizeValue.ofBytes(1)); + try (var builder = blockFactory.newBooleanBlockBuilder(between(1, mvCount + positionCount))) { + boolean[] elements = new boolean[positionCount + mvCount]; + builder.beginPositionEntry(); + for (int i = 0; i < mvCount; i++) { + elements[i] = randomBoolean(); + builder.appendBoolean(elements[i]); + } + builder.endPositionEntry(); + for (int p = 1; p < positionCount; p++) { + elements[mvCount + p] = randomBoolean(); + builder.appendBoolean(elements[mvCount + p]); + } + try (var block = builder.build()) { + assertThat(block, instanceOf(BooleanBigArrayBlock.class)); + assertNull(block.asVector()); + assertThat(block.getPositionCount(), equalTo(positionCount)); + assertThat(block.getValueCount(0), equalTo(mvCount)); + for (int i = 0; i < mvCount; i++) { + assertThat(block.getBoolean(block.getFirstValueIndex(0) + i), equalTo(elements[i])); + } + for (int p = 1; p < positionCount; p++) { + assertThat(block.getValueCount(p), equalTo(1)); + assertThat(block.getBoolean(block.getFirstValueIndex(p)), equalTo(elements[mvCount + p])); + } + assertKeepMask(block); + try (ToMask mask = block.toMask()) { + /* + * NOTE: this test is customized to the layout above where we don't make + * any fields with 0 values. 
+ */ + assertThat(mask.hadMultivaluedFields(), equalTo(true)); + assertThat(mask.mask().getBoolean(0), equalTo(false)); + for (int p = 1; p < positionCount; p++) { + assertThat(mask.mask().getBoolean(p), equalTo(elements[mvCount + p])); + } + } + } + } + assertThat(blockFactory.breaker().getUsed(), equalTo(0L)); + } } diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayVectorTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayVectorTests.java index af4c643a90625..aab8b86f9b795 100644 --- a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayVectorTests.java +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BigArrayVectorTests.java @@ -72,6 +72,12 @@ public void testBoolean() throws IOException { assertEmptyLookup(blockFactory, vector.asBlock()); assertSerialization(block); assertThat(vector.toString(), containsString("BooleanBigArrayVector[positions=" + positionCount)); + try (ToMask mask = block.toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(false)); + for (int p = 0; p < values.length; p++) { + assertThat(mask.mask().getBoolean(p), equalTo(values[p])); + } + } } } diff --git a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BlockMultiValuedTests.java b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BlockMultiValuedTests.java index c5e130726844d..e37b2638b56f7 100644 --- a/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BlockMultiValuedTests.java +++ b/x-pack/plugin/esql/compute/src/test/java/org/elasticsearch/compute/data/BlockMultiValuedTests.java @@ -31,6 +31,7 @@ import static org.hamcrest.Matchers.equalTo; import static org.hamcrest.Matchers.greaterThanOrEqualTo; +import static org.hamcrest.Matchers.nullValue; public class BlockMultiValuedTests extends ESTestCase { @ParametersFactory @@ -122,6 +123,54 @@ public void testLookupFromSingleManyPages() { assertLookup(ByteSizeValue.ofBytes(1), between(1, 32), p -> 1); } + public void testToMask() { + if (elementType != ElementType.BOOLEAN) { + return; + } + int positionCount = randomIntBetween(1, 16 * 1024); + var b = BasicBlockTests.randomBlock(blockFactory(), elementType, positionCount, nullAllowed, 2, 10, 0, 0); + try (ToMask mask = ((BooleanBlock) b.block()).toMask()) { + assertThat(mask.hadMultivaluedFields(), equalTo(true)); + for (int p = 0; p < b.values().size(); p++) { + List v = b.values().get(p); + if (v == null) { + assertThat(mask.mask().getBoolean(p), equalTo(false)); + continue; + } + if (v.size() != 1) { + assertThat(mask.mask().getBoolean(p), equalTo(false)); + continue; + } + assertThat(mask.mask().getBoolean(p), equalTo(v.get(0))); + } + } finally { + b.block().close(); + } + } + + public void testMask() { + int positionCount = randomIntBetween(1, 16 * 1024); + var b = BasicBlockTests.randomBlock(blockFactory(), elementType, positionCount, nullAllowed, 0, 10, 0, 0); + try ( + BooleanVector mask = BasicBlockTests.randomMask(b.values().size() + between(0, 1000)); + Block masked = b.block().keepMask(mask) + ) { + for (int p = 0; p < b.values().size(); p++) { + List inputValues = b.values().get(p); + List valuesAtPosition = BasicBlockTests.valuesAtPositions(masked, p, p + 1).get(0); + if (inputValues == null || mask.getBoolean(p) == false) { + assertThat(masked.isNull(p), equalTo(true)); + assertThat(valuesAtPosition, nullValue()); + continue; + } + assertThat(masked.isNull(p), equalTo(false)); + 
assertThat(valuesAtPosition, equalTo(inputValues)); + } + } finally { + b.block().close(); + } + } + private void assertFiltered(boolean all, boolean shuffled) { int positionCount = randomIntBetween(1, 16 * 1024); var b = BasicBlockTests.randomBlock(blockFactory(), elementType, positionCount, nullAllowed, 0, 10, 0, 0); From 68b211e025f2222704e50b2f6b6890dbf8f94515 Mon Sep 17 00:00:00 2001 From: Salvatore Campagna <93581129+salvatore-campagna@users.noreply.github.com> Date: Thu, 29 Aug 2024 16:01:56 +0200 Subject: [PATCH 047/144] Store original source for keywords using a normalizer (#112151) Using a normalizer for a keyword field might result in not being able to reconstruct the original source when using synthetic source. Here if synthetic source is enabled and a normalizer is configured we store the original value in a stored field which is later used at document reconstruction time to reconstruct the field value as it was in the original document. We use the same fallback solution we use in other places like `ignore_malformed`. --- docs/changelog/112151.yaml | 5 ++ .../test/mget/90_synthetic_source.yml | 88 +++++++++++++++++++ .../index/mapper/KeywordFieldMapper.java | 19 ++-- .../index/mapper/MapperFeatures.java | 1 + .../KeywordFieldSyntheticSourceSupport.java | 9 +- 5 files changed, 105 insertions(+), 17 deletions(-) create mode 100644 docs/changelog/112151.yaml diff --git a/docs/changelog/112151.yaml b/docs/changelog/112151.yaml new file mode 100644 index 0000000000000..f5cbfd8da07c2 --- /dev/null +++ b/docs/changelog/112151.yaml @@ -0,0 +1,5 @@ +pr: 112151 +summary: Store original source for keywords using a normalizer +area: Logs +type: enhancement +issues: [] diff --git a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/mget/90_synthetic_source.yml b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/mget/90_synthetic_source.yml index 2935c0c1c41b5..ff17a92ed0fcc 100644 --- a/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/mget/90_synthetic_source.yml +++ b/rest-api-spec/src/yamlRestTest/resources/rest-api-spec/test/mget/90_synthetic_source.yml @@ -46,6 +46,94 @@ keyword: docs.1._source: kwd: bar +--- +keyword with normalizer: + - requires: + cluster_features: [ "mapper.keyword_normalizer_synthetic_source" ] + reason: support for normalizer on keyword fields + - do: + indices.create: + index: test-keyword-with-normalizer + body: + settings: + analysis: + normalizer: + lowercase: + type: custom + filter: + - lowercase + mappings: + _source: + mode: synthetic + properties: + keyword: + type: keyword + normalizer: lowercase + keyword_with_ignore_above: + type: keyword + normalizer: lowercase + ignore_above: 10 + keyword_without_doc_values: + type: keyword + normalizer: lowercase + doc_values: false + + - do: + index: + index: test-keyword-with-normalizer + id: 1 + body: + keyword: "the Quick Brown Fox jumps over the lazy Dog" + keyword_with_ignore_above: "the Quick Brown Fox jumps over the lazy Dog" + keyword_without_doc_values: "the Quick Brown Fox jumps over the lazy Dog" + + - do: + index: + index: test-keyword-with-normalizer + id: 2 + body: + keyword: "The five BOXING wizards jump Quickly" + keyword_with_ignore_above: "The five BOXING wizards jump Quickly" + keyword_without_doc_values: "The five BOXING wizards jump Quickly" + + - do: + index: + index: test-keyword-with-normalizer + id: 3 + body: + keyword: [ "May the FORCE be with You!", "Do or Do Not, There is no Try" ] + keyword_with_ignore_above: [ "May the FORCE be with You!", "Do or Do Not, 
There is no Try" ] + keyword_without_doc_values: [ "May the FORCE be with You!", "Do or Do Not, There is no Try" ] + + - do: + mget: + index: test-keyword-with-normalizer + body: + ids: [ 1, 2, 3 ] + - match: { docs.0._index: "test-keyword-with-normalizer" } + - match: { docs.0._id: "1" } + - match: + docs.0._source: + keyword: "the Quick Brown Fox jumps over the lazy Dog" + keyword_with_ignore_above: "the Quick Brown Fox jumps over the lazy Dog" + keyword_without_doc_values: "the Quick Brown Fox jumps over the lazy Dog" + + - match: { docs.1._index: "test-keyword-with-normalizer" } + - match: { docs.1._id: "2" } + - match: + docs.1._source: + keyword: "The five BOXING wizards jump Quickly" + keyword_with_ignore_above: "The five BOXING wizards jump Quickly" + keyword_without_doc_values: "The five BOXING wizards jump Quickly" + + - match: { docs.2._index: "test-keyword-with-normalizer" } + - match: { docs.2._id: "3" } + - match: + docs.2._source: + keyword: [ "May the FORCE be with You!", "Do or Do Not, There is no Try" ] + keyword_with_ignore_above: [ "May the FORCE be with You!", "Do or Do Not, There is no Try" ] + keyword_without_doc_values: [ "May the FORCE be with You!", "Do or Do Not, There is no Try" ] + --- stored text: - requires: diff --git a/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java b/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java index 9645b4397df4f..d130f37c3e8eb 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/KeywordFieldMapper.java @@ -89,6 +89,7 @@ public final class KeywordFieldMapper extends FieldMapper { public static final String CONTENT_TYPE = "keyword"; static final NodeFeature KEYWORD_DIMENSION_IGNORE_ABOVE = new NodeFeature("mapper.keyword_dimension_ignore_above"); + static final NodeFeature KEYWORD_NORMALIZER_SYNTHETIC_SOURCE = new NodeFeature("mapper.keyword_normalizer_synthetic_source"); public static class Defaults { public static final FieldType FIELD_TYPE; @@ -856,7 +857,7 @@ public boolean hasNormalizer() { private final Script script; private final ScriptCompiler scriptCompiler; private final IndexVersion indexCreatedVersion; - private final boolean storeIgnored; + private final boolean isSyntheticSource; private final IndexAnalyzers indexAnalyzers; @@ -866,7 +867,7 @@ private KeywordFieldMapper( KeywordFieldType mappedFieldType, MultiFields multiFields, CopyTo copyTo, - boolean storeIgnored, + boolean isSyntheticSource, Builder builder ) { super(simpleName, mappedFieldType, multiFields, copyTo, builder.script.get() != null, builder.onScriptError.getValue()); @@ -881,7 +882,7 @@ private KeywordFieldMapper( this.indexAnalyzers = builder.indexAnalyzers; this.scriptCompiler = builder.scriptCompiler; this.indexCreatedVersion = builder.indexCreatedVersion; - this.storeIgnored = storeIgnored; + this.isSyntheticSource = isSyntheticSource; } @Override @@ -916,7 +917,7 @@ private void indexValue(DocumentParserContext context, String value) { if (value.length() > fieldType().ignoreAbove()) { context.addIgnoredField(fullPath()); - if (storeIgnored) { + if (isSyntheticSource) { // Save a copy of the field so synthetic source can load it context.doc().add(new StoredField(originalName(), new BytesRef(value))); } @@ -1026,6 +1027,11 @@ private String originalName() { @Override protected SyntheticSourceMode syntheticSourceMode() { + if (hasNormalizer()) { + // NOTE: no matter if we have doc values or not we use a 
stored field to reconstruct the original value + // whose doc values would be altered by the normalizer + return SyntheticSourceMode.FALLBACK; + } if (fieldType.stored() || hasDocValues) { return SyntheticSourceMode.NATIVE; } @@ -1047,11 +1053,6 @@ public SourceLoader.SyntheticFieldLoader syntheticFieldLoader(String simpleName) "field [" + fullPath() + "] of type [" + typeName() + "] doesn't support synthetic source because it declares copy_to" ); } - if (hasNormalizer()) { - throw new IllegalArgumentException( - "field [" + fullPath() + "] of type [" + typeName() + "] doesn't support synthetic source because it declares a normalizer" - ); - } if (syntheticSourceMode() != SyntheticSourceMode.NATIVE) { return super.syntheticFieldLoader(); diff --git a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java index 6dce9d6c7b86e..63bbef061c61f 100644 --- a/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java +++ b/server/src/main/java/org/elasticsearch/index/mapper/MapperFeatures.java @@ -33,6 +33,7 @@ public Set getFeatures() { NodeMappingStats.SEGMENT_LEVEL_FIELDS_STATS, BooleanFieldMapper.BOOLEAN_DIMENSION, ObjectMapper.SUBOBJECTS_AUTO, + KeywordFieldMapper.KEYWORD_NORMALIZER_SYNTHETIC_SOURCE, SourceFieldMapper.SYNTHETIC_SOURCE_STORED_FIELDS_ADVANCE_FIX ); } diff --git a/test/framework/src/main/java/org/elasticsearch/index/mapper/KeywordFieldSyntheticSourceSupport.java b/test/framework/src/main/java/org/elasticsearch/index/mapper/KeywordFieldSyntheticSourceSupport.java index 6abe923851318..2f452161b10ca 100644 --- a/test/framework/src/main/java/org/elasticsearch/index/mapper/KeywordFieldSyntheticSourceSupport.java +++ b/test/framework/src/main/java/org/elasticsearch/index/mapper/KeywordFieldSyntheticSourceSupport.java @@ -21,8 +21,6 @@ import java.util.stream.Collectors; import java.util.stream.Stream; -import static org.hamcrest.Matchers.equalTo; - public class KeywordFieldSyntheticSourceSupport implements MapperTestCase.SyntheticSourceSupport { private final Integer ignoreAbove; private final boolean allIgnored; @@ -128,11 +126,6 @@ private void mapping(XContentBuilder b) throws IOException { @Override public List invalidExample() throws IOException { - return List.of( - new MapperTestCase.SyntheticSourceInvalidExample( - equalTo("field [field] of type [keyword] doesn't support synthetic source because it declares a normalizer"), - b -> b.field("type", "keyword").field("normalizer", "lowercase") - ) - ); + return List.of(); } } From 1be4f65da2ac35d971626353b8a076aa75a7b693 Mon Sep 17 00:00:00 2001 From: David Turner Date: Thu, 29 Aug 2024 15:20:03 +0100 Subject: [PATCH 048/144] Add constants for UUID lengths (#112353) Our UUID strings have fixed lengths (depending on the type of UUID). Sometimes we might want code to rely on knowing these lengths rather than doing some other string manipulations to look for a boundary. This commit exposes constants for these things. 
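For reviewers, a minimal sketch of the length arithmetic, assuming nothing beyond
unpadded URL-safe base64 (it mirrors the getUnpaddedBase64StringLength helper this
patch adds to UUIDTests; the standalone method below is illustrative only):

    // Unpadded base64 emits 4 chars per 3-byte group, rounding the tail up.
    static int unpaddedBase64StringLength(int sizeInBytes) {
        return (int) Math.ceil(sizeInBytes * 4.0 / 3.0);
    }
    // unpaddedBase64StringLength(15) == 20, the new TIME_BASED_UUID_STRING_LENGTH
    // unpaddedBase64StringLength(16) == 22, the new RANDOM_BASED_UUID_STRING_LENGTH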
--- .../common/RandomBasedUUIDGenerator.java | 4 +- .../common/TimeBasedUUIDGenerator.java | 4 +- .../java/org/elasticsearch/common/UUIDs.java | 40 +++++++++++++++---- .../org/elasticsearch/common/UUIDTests.java | 16 ++++++++ .../blobstore/RepositoryFileType.java | 5 ++- 5 files changed, 57 insertions(+), 12 deletions(-) diff --git a/server/src/main/java/org/elasticsearch/common/RandomBasedUUIDGenerator.java b/server/src/main/java/org/elasticsearch/common/RandomBasedUUIDGenerator.java index e731cf3bc58be..58c23ab9aa398 100644 --- a/server/src/main/java/org/elasticsearch/common/RandomBasedUUIDGenerator.java +++ b/server/src/main/java/org/elasticsearch/common/RandomBasedUUIDGenerator.java @@ -56,8 +56,10 @@ public static String getBase64UUID(Random random) { return Base64.getUrlEncoder().withoutPadding().encodeToString(getUUIDBytes(random)); } + static final int SIZE_IN_BYTES = 16; + private static byte[] getUUIDBytes(Random random) { - final byte[] randomBytes = new byte[16]; + final byte[] randomBytes = new byte[SIZE_IN_BYTES]; random.nextBytes(randomBytes); /* Set the version to version 4 (see http://www.ietf.org/rfc/rfc4122.txt) * The randomly or pseudo-randomly generated version. diff --git a/server/src/main/java/org/elasticsearch/common/TimeBasedUUIDGenerator.java b/server/src/main/java/org/elasticsearch/common/TimeBasedUUIDGenerator.java index f7f7f520fec90..d66b0f579ce3e 100644 --- a/server/src/main/java/org/elasticsearch/common/TimeBasedUUIDGenerator.java +++ b/server/src/main/java/org/elasticsearch/common/TimeBasedUUIDGenerator.java @@ -47,6 +47,8 @@ protected byte[] macAddress() { return SECURE_MUNGED_ADDRESS; } + static final int SIZE_IN_BYTES = 15; + @Override public String getBase64UUID() { final int sequenceId = sequenceNumber.incrementAndGet() & 0xffffff; @@ -61,7 +63,7 @@ public String getBase64UUID() { sequenceId == 0 ? (lastTimestamp, currentTimeMillis) -> Math.max(lastTimestamp, currentTimeMillis) + 1 : Math::max ); - final byte[] uuidBytes = new byte[15]; + final byte[] uuidBytes = new byte[SIZE_IN_BYTES]; int i = 0; // We have auto-generated ids, which are usually used for append-only workloads. diff --git a/server/src/main/java/org/elasticsearch/common/UUIDs.java b/server/src/main/java/org/elasticsearch/common/UUIDs.java index 43a232e82510e..ebc0978f38d49 100644 --- a/server/src/main/java/org/elasticsearch/common/UUIDs.java +++ b/server/src/main/java/org/elasticsearch/common/UUIDs.java @@ -17,26 +17,50 @@ public class UUIDs { private static final RandomBasedUUIDGenerator RANDOM_UUID_GENERATOR = new RandomBasedUUIDGenerator(); private static final UUIDGenerator TIME_UUID_GENERATOR = new TimeBasedUUIDGenerator(); - /** Generates a time-based UUID (similar to Flake IDs), which is preferred when generating an ID to be indexed into a Lucene index as - * primary key. The id is opaque and the implementation is free to change at any time! */ + /** + * The length of a UUID string generated by {@link #base64UUID}. + */ + // A 15-byte time-based UUID is base64-encoded as 5 3-byte chunks (each becoming 4 chars after encoding). + public static final int TIME_BASED_UUID_STRING_LENGTH = 20; + + /** + * Generates a time-based UUID (similar to Flake IDs), which is preferred when generating an ID to be indexed into a Lucene index as + * primary key. The id is opaque and the implementation is free to change at any time! + * The resulting string has length {@link #TIME_BASED_UUID_STRING_LENGTH}. 
+ */ public static String base64UUID() { return TIME_UUID_GENERATOR.getBase64UUID(); } - /** Returns a Base64 encoded version of a Version 4.0 compatible UUID as defined here: http://www.ietf.org/rfc/rfc4122.txt, using the - * provided {@code Random} instance */ + /** + * The length of a UUID string generated by {@link #randomBase64UUID} and {@link #randomBase64UUIDSecureString}. + */ + // A 16-byte v4 UUID is base64-encoded as 5 3-byte chunks (each becoming 4 chars after encoding) plus another byte (becomes 2 chars). + public static final int RANDOM_BASED_UUID_STRING_LENGTH = 22; + + /** + * Returns a Base64 encoded string representing a RFC4122 version 4 UUID, using the + * provided {@code Random} instance. + * The resulting string has length {@link #RANDOM_BASED_UUID_STRING_LENGTH}. + */ public static String randomBase64UUID(Random random) { return RandomBasedUUIDGenerator.getBase64UUID(random); } - /** Returns a Base64 encoded version of a Version 4.0 compatible UUID as defined here: http://www.ietf.org/rfc/rfc4122.txt, using a - * private {@code SecureRandom} instance */ + /** + * Returns a Base64 encoded string representing a RFC4122 version 4 UUID, using a + * private {@code SecureRandom} instance. + * The resulting string has length {@link #RANDOM_BASED_UUID_STRING_LENGTH}. + */ public static String randomBase64UUID() { return RANDOM_UUID_GENERATOR.getBase64UUID(); } - /** Returns a Base64 encoded {@link SecureString} of a Version 4.0 compatible UUID as defined here: http://www.ietf.org/rfc/rfc4122.txt, - * using a private {@code SecureRandom} instance */ + /** + * Returns a Base64 encoded {@link SecureString} representing a RFC4122 version 4 + * UUID, using a private {@code SecureRandom} instance. + * The resulting string has length {@link #RANDOM_BASED_UUID_STRING_LENGTH}. 
+ */ public static SecureString randomBase64UUIDSecureString() { return RandomBasedUUIDGenerator.getBase64UUIDSecureString(); } diff --git a/server/src/test/java/org/elasticsearch/common/UUIDTests.java b/server/src/test/java/org/elasticsearch/common/UUIDTests.java index 5af036ce0648f..3229049b67b4c 100644 --- a/server/src/test/java/org/elasticsearch/common/UUIDTests.java +++ b/server/src/test/java/org/elasticsearch/common/UUIDTests.java @@ -176,4 +176,20 @@ protected byte[] macAddress() { ); return bytesPerDoc; } + + public void testStringLength() { + assertEquals(UUIDs.RANDOM_BASED_UUID_STRING_LENGTH, getUnpaddedBase64StringLength(RandomBasedUUIDGenerator.SIZE_IN_BYTES)); + assertEquals(UUIDs.RANDOM_BASED_UUID_STRING_LENGTH, UUIDs.randomBase64UUID().length()); + assertEquals(UUIDs.RANDOM_BASED_UUID_STRING_LENGTH, UUIDs.randomBase64UUID(random()).length()); + try (var secureString = UUIDs.randomBase64UUIDSecureString()) { + assertEquals(UUIDs.RANDOM_BASED_UUID_STRING_LENGTH, secureString.toString().length()); + } + + assertEquals(UUIDs.TIME_BASED_UUID_STRING_LENGTH, getUnpaddedBase64StringLength(TimeBasedUUIDGenerator.SIZE_IN_BYTES)); + assertEquals(UUIDs.TIME_BASED_UUID_STRING_LENGTH, UUIDs.base64UUID().length()); + } + + private static int getUnpaddedBase64StringLength(int sizeInBytes) { + return (int) Math.ceil(sizeInBytes * 4.0 / 3.0); + } } diff --git a/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/RepositoryFileType.java b/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/RepositoryFileType.java index 014cbcd2bcc3a..8d20cce33bbb4 100644 --- a/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/RepositoryFileType.java +++ b/test/framework/src/main/java/org/elasticsearch/repositories/blobstore/RepositoryFileType.java @@ -9,6 +9,7 @@ package org.elasticsearch.repositories.blobstore; import org.elasticsearch.common.Strings; +import org.elasticsearch.common.UUIDs; import java.nio.file.Path; import java.util.regex.Pattern; @@ -38,9 +39,9 @@ public enum RepositoryFileType { // decimal numbers .replace("NUM", "(0|[1-9][0-9]*)") // 15-byte UUIDS from TimeBasedUUIDGenerator - .replace("SHORTUUID", "[0-9a-zA-Z_-]{20}") + .replace("SHORTUUID", "[0-9a-zA-Z_-]{" + UUIDs.TIME_BASED_UUID_STRING_LENGTH + "}") // 16-byte UUIDs from RandomBasedUUIDGenerator - .replace("UUID", "[0-9a-zA-Z_-]{22}") + .replace("UUID", "[0-9a-zA-Z_-]{" + UUIDs.RANDOM_BASED_UUID_STRING_LENGTH + "}") + ")$" ); } From 9e01181f0dd9bf6ea919164f8929f0874ad6e26d Mon Sep 17 00:00:00 2001 From: Albert Zaharovits Date: Thu, 29 Aug 2024 17:33:05 +0300 Subject: [PATCH 049/144] Remove unused cluster blocks in create index (#112352) Remove unused cluster blocks in create index --- .../CreateIndexClusterStateUpdateRequest.java | 9 ------- .../metadata/MetadataCreateIndexService.java | 24 ++++--------------- .../MetadataCreateIndexServiceTests.java | 10 +------- 3 files changed, 6 insertions(+), 37 deletions(-) diff --git a/server/src/main/java/org/elasticsearch/action/admin/indices/create/CreateIndexClusterStateUpdateRequest.java b/server/src/main/java/org/elasticsearch/action/admin/indices/create/CreateIndexClusterStateUpdateRequest.java index 8a46daa45e73b..948199fbe74f4 100644 --- a/server/src/main/java/org/elasticsearch/action/admin/indices/create/CreateIndexClusterStateUpdateRequest.java +++ b/server/src/main/java/org/elasticsearch/action/admin/indices/create/CreateIndexClusterStateUpdateRequest.java @@ -12,7 +12,6 @@ import 
org.elasticsearch.action.admin.indices.shrink.ResizeType; import org.elasticsearch.action.support.ActiveShardCount; import org.elasticsearch.cluster.ack.ClusterStateUpdateRequest; -import org.elasticsearch.cluster.block.ClusterBlock; import org.elasticsearch.cluster.metadata.ComposableIndexTemplate; import org.elasticsearch.cluster.metadata.IndexMetadata; import org.elasticsearch.common.settings.Settings; @@ -43,8 +42,6 @@ public class CreateIndexClusterStateUpdateRequest extends ClusterStateUpdateRequ private final Set aliases = new HashSet<>(); - private final Set blocks = new HashSet<>(); - private ActiveShardCount waitForActiveShards = ActiveShardCount.DEFAULT; private boolean performReroute = true; @@ -125,10 +122,6 @@ public Set aliases() { return aliases; } - public Set blocks() { - return blocks; - } - public Index recoverFrom() { return recoverFrom; } @@ -229,8 +222,6 @@ public String toString() { + settings + ", aliases=" + aliases - + ", blocks=" - + blocks + ", waitForActiveShards=" + waitForActiveShards + ", systemDataStreamDescriptor=" diff --git a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java index b1a19d99dcb19..07dcb7baf0777 100644 --- a/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java +++ b/server/src/main/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexService.java @@ -25,7 +25,6 @@ import org.elasticsearch.cluster.AckedClusterStateUpdateTask; import org.elasticsearch.cluster.ClusterState; import org.elasticsearch.cluster.ClusterStateUpdateTask; -import org.elasticsearch.cluster.block.ClusterBlock; import org.elasticsearch.cluster.block.ClusterBlockLevel; import org.elasticsearch.cluster.block.ClusterBlocks; import org.elasticsearch.cluster.node.DiscoveryNodes; @@ -514,7 +513,6 @@ private ClusterState applyCreateIndexWithTemporaryService( ClusterState updated = clusterStateCreateIndex( currentState, - request.blocks(), indexMetadata, metadataTransformer, allocationService.getShardRoutingRoleStrategy() @@ -1231,7 +1229,6 @@ public static List resolveAndValidateAliases( */ static ClusterState clusterStateCreateIndex( ClusterState currentState, - Set clusterBlocks, IndexMetadata indexMetadata, BiConsumer metadataTransformer, ShardRoutingRoleStrategy shardRoutingRoleStrategy @@ -1245,14 +1242,13 @@ static ClusterState clusterStateCreateIndex( newMetadata = currentState.metadata().withAddedIndex(indexMetadata); } - String indexName = indexMetadata.getIndex().getName(); - ClusterBlocks.Builder blocks = createClusterBlocksBuilder(currentState, indexName, clusterBlocks); - blocks.updateBlocks(indexMetadata); + var blocksBuilder = ClusterBlocks.builder().blocks(currentState.blocks()); + blocksBuilder.updateBlocks(indexMetadata); - RoutingTable.Builder routingTableBuilder = RoutingTable.builder(shardRoutingRoleStrategy, currentState.routingTable()) - .addAsNew(newMetadata.index(indexName)); + var routingTableBuilder = RoutingTable.builder(shardRoutingRoleStrategy, currentState.routingTable()) + .addAsNew(newMetadata.index(indexMetadata.getIndex().getName())); - return ClusterState.builder(currentState).blocks(blocks).metadata(newMetadata).routingTable(routingTableBuilder).build(); + return ClusterState.builder(currentState).blocks(blocksBuilder).metadata(newMetadata).routingTable(routingTableBuilder).build(); } static IndexMetadata buildIndexMetadata( @@ -1325,16 +1321,6 @@ private static 
IndexMetadata.Builder createIndexMetadataBuilder( return builder; } - private static ClusterBlocks.Builder createClusterBlocksBuilder(ClusterState currentState, String index, Set blocks) { - ClusterBlocks.Builder blocksBuilder = ClusterBlocks.builder().blocks(currentState.blocks()); - if (blocks.isEmpty() == false) { - for (ClusterBlock block : blocks) { - blocksBuilder.addIndexBlock(index, block); - } - } - return blocksBuilder; - } - private static void updateIndexMappingsAndBuildSortOrder( IndexService indexService, CreateIndexClusterStateUpdateRequest request, diff --git a/server/src/test/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexServiceTests.java b/server/src/test/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexServiceTests.java index 8a487e5653627..f7d343b43b29c 100644 --- a/server/src/test/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexServiceTests.java +++ b/server/src/test/java/org/elasticsearch/cluster/metadata/MetadataCreateIndexServiceTests.java @@ -967,13 +967,7 @@ public void testClusterStateCreateIndexThrowsWriteIndexValidationException() thr assertThat( expectThrows( IllegalStateException.class, - () -> clusterStateCreateIndex( - currentClusterState, - Set.of(), - newIndex, - null, - TestShardRoutingRoleStrategies.DEFAULT_ROLE_ONLY - ) + () -> clusterStateCreateIndex(currentClusterState, newIndex, null, TestShardRoutingRoleStrategies.DEFAULT_ROLE_ONLY) ).getMessage(), startsWith("alias [alias1] has more than one write index [") ); @@ -991,7 +985,6 @@ public void testClusterStateCreateIndex() { ClusterState updatedClusterState = clusterStateCreateIndex( currentClusterState, - Set.of(INDEX_READ_ONLY_BLOCK), newIndexMetadata, null, TestShardRoutingRoleStrategies.DEFAULT_ROLE_ONLY @@ -1037,7 +1030,6 @@ public void testClusterStateCreateIndexWithMetadataTransaction() { ClusterState updatedClusterState = clusterStateCreateIndex( currentClusterState, - Set.of(INDEX_READ_ONLY_BLOCK), newIndexMetadata, metadataTransformer, TestShardRoutingRoleStrategies.DEFAULT_ROLE_ONLY From cf0e18872878cce9332722c491b5cc7749106ae4 Mon Sep 17 00:00:00 2001 From: Stanislav Malyshev Date: Thu, 29 Aug 2024 08:56:00 -0600 Subject: [PATCH 050/144] Add isAsync() to SearcTask and eliminate code for async detection from TransportSearchAction (#112311) --- .../action/search/SearchTask.java | 7 +++++ .../action/search/TransportSearchAction.java | 30 +------------------ .../xpack/search/AsyncSearchTask.java | 5 ++++ 3 files changed, 13 insertions(+), 29 deletions(-) diff --git a/server/src/main/java/org/elasticsearch/action/search/SearchTask.java b/server/src/main/java/org/elasticsearch/action/search/SearchTask.java index 3bf72313c4c21..cc5d60ad0b0c0 100644 --- a/server/src/main/java/org/elasticsearch/action/search/SearchTask.java +++ b/server/src/main/java/org/elasticsearch/action/search/SearchTask.java @@ -69,4 +69,11 @@ public Supplier getSearchResponseMergerSupplier() { public void setSearchResponseMergerSupplier(Supplier supplier) { this.searchResponseMergerSupplier = supplier; } + + /** + * Is this async search? 
+ */ + public boolean isAsync() { + return false; + } } diff --git a/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java b/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java index 6e1645c1ed711..32ee9c331295c 100644 --- a/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java +++ b/server/src/main/java/org/elasticsearch/action/search/TransportSearchAction.java @@ -369,7 +369,7 @@ void executeRequest( } else { if ((listener instanceof TelemetryListener tl) && CCS_TELEMETRY_FEATURE_FLAG.isEnabled()) { tl.setRemotes(resolvedIndices.getRemoteClusterIndices().size()); - if (isAsyncSearchTask(task)) { + if (task.isAsync()) { tl.setFeature(CCSUsageTelemetry.ASYNC_FEATURE); } String client = task.getHeader(Task.X_ELASTIC_PRODUCT_ORIGIN_HTTP_HEADER); @@ -1514,34 +1514,6 @@ public SearchPhase newSearchPhase( } } - /** - * TransportSearchAction cannot access async-search code, so can't check whether this the Task - * is an instance of AsyncSearchTask, so this roundabout method is used - * @param searchTask SearchTask to analyze - * @return true if this is an async search task; false if a synchronous search task - */ - private boolean isAsyncSearchTask(SearchTask searchTask) { - assert assertAsyncSearchTaskListener(searchTask) : "AsyncSearchTask SearchProgressListener is not one of the expected types"; - // AsyncSearchTask will not return SearchProgressListener.NOOP, since it uses its own progress listener - // which delegates to CCSSingleCoordinatorSearchProgressListener when minimizing roundtrips. - // Only synchronous SearchTask uses SearchProgressListener.NOOP or CCSSingleCoordinatorSearchProgressListener directly - return searchTask.getProgressListener() != SearchProgressListener.NOOP - && searchTask.getProgressListener() instanceof CCSSingleCoordinatorSearchProgressListener == false; - } - - /** - * @param searchTask SearchTask to analyze - * @return true if AsyncSearchTask still uses its own special listener, not one of the two that synchronous SearchTask uses - */ - private boolean assertAsyncSearchTaskListener(SearchTask searchTask) { - if (searchTask.getClass().getSimpleName().contains("AsyncSearchTask")) { - SearchProgressListener progressListener = searchTask.getProgressListener(); - return progressListener != SearchProgressListener.NOOP - && progressListener instanceof CCSSingleCoordinatorSearchProgressListener == false; - } - return true; - } - private static void validateAndResolveWaitForCheckpoint( ClusterState clusterState, IndexNameExpressionResolver resolver, diff --git a/x-pack/plugin/async-search/src/main/java/org/elasticsearch/xpack/search/AsyncSearchTask.java b/x-pack/plugin/async-search/src/main/java/org/elasticsearch/xpack/search/AsyncSearchTask.java index c0305f873327d..5068ac69e462a 100644 --- a/x-pack/plugin/async-search/src/main/java/org/elasticsearch/xpack/search/AsyncSearchTask.java +++ b/x-pack/plugin/async-search/src/main/java/org/elasticsearch/xpack/search/AsyncSearchTask.java @@ -545,4 +545,9 @@ public void onFailure(Exception exc) { executeCompletionListeners(); } } + + @Override + public boolean isAsync() { + return true; + } } From 8f526098dbfcb109b8e5b01ee436e09491169025 Mon Sep 17 00:00:00 2001 From: Armin Braun Date: Thu, 29 Aug 2024 16:57:51 +0200 Subject: [PATCH 051/144] Fix SearchServiceTests not waiting for scroll clear (#111547) We were not waiting on the response here but assume the scrolls are cleared in the following lines. 
This worked as long as the transport action wasn't forking but is broken now that we fork to generic. Fixed by just waiting. closes #111529 --- .../test/java/org/elasticsearch/search/SearchServiceTests.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/server/src/test/java/org/elasticsearch/search/SearchServiceTests.java b/server/src/test/java/org/elasticsearch/search/SearchServiceTests.java index bdddea58b713f..2617f82b09f08 100644 --- a/server/src/test/java/org/elasticsearch/search/SearchServiceTests.java +++ b/server/src/test/java/org/elasticsearch/search/SearchServiceTests.java @@ -1548,7 +1548,7 @@ public void testMaxOpenScrollContexts() throws Exception { ClearScrollRequest clearScrollRequest = new ClearScrollRequest(); clearScrollRequest.setScrollIds(clearScrollIds); - client().clearScroll(clearScrollRequest); + client().clearScroll(clearScrollRequest).get(); for (int i = 0; i < clearScrollIds.size(); i++) { client().prepareSearch("index").setSize(1).setScroll(TimeValue.timeValueMinutes(1)).get().decRef(); From e966d0d9da74cb24c97a17d174f1b65324411e2b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aur=C3=A9lien=20FOUCRET?= Date: Thu, 29 Aug 2024 17:30:16 +0200 Subject: [PATCH 052/144] Removing the feature flag mechanism for LTR. (#112358) --- .../ml/DefaultMachineLearningExtension.java | 5 ----- .../elasticsearch/xpack/ml/MachineLearning.java | 14 +++++--------- .../xpack/ml/MachineLearningExtension.java | 4 ---- .../ml/LocalStateMachineLearningAdOnly.java | 2 +- .../ml/LocalStateMachineLearningDfaOnly.java | 2 +- .../ml/LocalStateMachineLearningNlpOnly.java | 2 +- .../MachineLearningInfoTransportActionTests.java | 9 +-------- .../xpack/ml/MachineLearningTests.java | 16 ++++------------ 8 files changed, 13 insertions(+), 41 deletions(-) diff --git a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/DefaultMachineLearningExtension.java b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/DefaultMachineLearningExtension.java index 66f4797ef707c..fa94bf96c1167 100644 --- a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/DefaultMachineLearningExtension.java +++ b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/DefaultMachineLearningExtension.java @@ -51,11 +51,6 @@ public boolean isNlpEnabled() { return true; } - @Override - public boolean isLearningToRankEnabled() { - return true; - } - @Override public String[] getAnalyticsDestIndexAllowedSettings() { return ANALYTICS_DEST_INDEX_ALLOWED_SETTINGS; diff --git a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearning.java b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearning.java index c4bf92401be9d..5876836185ba3 100644 --- a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearning.java +++ b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearning.java @@ -902,7 +902,7 @@ private static void reportClashingNodeAttribute(String attrName) { @Override public List> getRescorers() { - if (enabled && machineLearningExtension.get().isLearningToRankEnabled()) { + if (enabled) { return List.of( new RescorerSpec<>( LearningToRankRescorerBuilder.NAME, @@ -1864,10 +1864,8 @@ public List getNamedXContent() { ) ); namedXContent.addAll(new CorrelationNamedContentProvider().getNamedXContentParsers()); - // LTR Combine with Inference named content provider when feature flag is removed - if (machineLearningExtension.get().isLearningToRankEnabled()) { - namedXContent.addAll(new MlLTRNamedXContentProvider().getNamedXContentParsers()); 
- } + namedXContent.addAll(new MlLTRNamedXContentProvider().getNamedXContentParsers()); + return namedXContent; } @@ -1958,10 +1956,8 @@ public List getNamedWriteables() { namedWriteables.addAll(MlAutoscalingNamedWritableProvider.getNamedWriteables()); namedWriteables.addAll(new CorrelationNamedContentProvider().getNamedWriteables()); namedWriteables.addAll(new ChangePointNamedContentProvider().getNamedWriteables()); - // LTR Combine with Inference named content provider when feature flag is removed - if (machineLearningExtension.get().isLearningToRankEnabled()) { - namedWriteables.addAll(new MlLTRNamedXContentProvider().getNamedWriteables()); - } + namedWriteables.addAll(new MlLTRNamedXContentProvider().getNamedWriteables()); + return namedWriteables; } diff --git a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearningExtension.java b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearningExtension.java index 528883439ef2f..f46652978753c 100644 --- a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearningExtension.java +++ b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/MachineLearningExtension.java @@ -25,10 +25,6 @@ default void configure(Settings settings) {} boolean isNlpEnabled(); - default boolean isLearningToRankEnabled() { - return true; - } - default boolean disableInferenceProcessCache() { return false; } diff --git a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningAdOnly.java b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningAdOnly.java index 175a035a70f7e..3ff3a4a404f97 100644 --- a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningAdOnly.java +++ b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningAdOnly.java @@ -14,6 +14,6 @@ public class LocalStateMachineLearningAdOnly extends LocalStateMachineLearning { public LocalStateMachineLearningAdOnly(final Settings settings, final Path configPath) { - super(settings, configPath, new MlTestExtensionLoader(new MlTestExtension(true, true, true, false, false, false))); + super(settings, configPath, new MlTestExtensionLoader(new MlTestExtension(true, true, true, false, false))); } } diff --git a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningDfaOnly.java b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningDfaOnly.java index f054e52dc29ec..1a72f27865d8a 100644 --- a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningDfaOnly.java +++ b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningDfaOnly.java @@ -14,6 +14,6 @@ public class LocalStateMachineLearningDfaOnly extends LocalStateMachineLearning { public LocalStateMachineLearningDfaOnly(final Settings settings, final Path configPath) { - super(settings, configPath, new MlTestExtensionLoader(new MlTestExtension(true, true, false, true, false, false))); + super(settings, configPath, new MlTestExtensionLoader(new MlTestExtension(true, true, false, true, false))); } } diff --git a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningNlpOnly.java b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningNlpOnly.java index a3d684011e932..0f11e8033b83d 100644 --- a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningNlpOnly.java +++ 
b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/LocalStateMachineLearningNlpOnly.java @@ -14,6 +14,6 @@ public class LocalStateMachineLearningNlpOnly extends LocalStateMachineLearning { public LocalStateMachineLearningNlpOnly(final Settings settings, final Path configPath) { - super(settings, configPath, new MlTestExtensionLoader(new MlTestExtension(true, true, false, false, true, false))); + super(settings, configPath, new MlTestExtensionLoader(new MlTestExtension(true, true, false, false, true))); } } diff --git a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningInfoTransportActionTests.java b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningInfoTransportActionTests.java index afa372fb94527..e5575abfeb020 100644 --- a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningInfoTransportActionTests.java +++ b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningInfoTransportActionTests.java @@ -160,14 +160,7 @@ private MachineLearningUsageTransportAction newUsageAction( licenseState, jobManagerHolder, new MachineLearningExtensionHolder( - new MachineLearningTests.MlTestExtension( - true, - true, - isAnomalyDetectionEnabled, - isDataFrameAnalyticsEnabled, - isNlpEnabled, - true - ) + new MachineLearningTests.MlTestExtension(true, true, isAnomalyDetectionEnabled, isDataFrameAnalyticsEnabled, isNlpEnabled) ) ); } diff --git a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningTests.java b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningTests.java index c35b9da7b2bd2..8a05537917abe 100644 --- a/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningTests.java +++ b/x-pack/plugin/ml/src/test/java/org/elasticsearch/xpack/ml/MachineLearningTests.java @@ -220,7 +220,7 @@ public void testNoAttributes_givenClash() throws IOException { public void testAnomalyDetectionOnly() throws IOException { Settings settings = Settings.builder().put("path.home", createTempDir()).build(); - MlTestExtensionLoader loader = new MlTestExtensionLoader(new MlTestExtension(false, false, true, false, false, false)); + MlTestExtensionLoader loader = new MlTestExtensionLoader(new MlTestExtension(false, false, true, false, false)); try (MachineLearning machineLearning = createTrialLicensedMachineLearning(settings, loader)) { List restHandlers = machineLearning.getRestHandlers(settings, null, null, null, null, null, null, null, null); assertThat(restHandlers, hasItem(instanceOf(RestMlInfoAction.class))); @@ -240,7 +240,7 @@ public void testAnomalyDetectionOnly() throws IOException { public void testDataFrameAnalyticsOnly() throws IOException { Settings settings = Settings.builder().put("path.home", createTempDir()).build(); - MlTestExtensionLoader loader = new MlTestExtensionLoader(new MlTestExtension(false, false, false, true, false, false)); + MlTestExtensionLoader loader = new MlTestExtensionLoader(new MlTestExtension(false, false, false, true, false)); try (MachineLearning machineLearning = createTrialLicensedMachineLearning(settings, loader)) { List restHandlers = machineLearning.getRestHandlers(settings, null, null, null, null, null, null, null, null); assertThat(restHandlers, hasItem(instanceOf(RestMlInfoAction.class))); @@ -260,7 +260,7 @@ public void testDataFrameAnalyticsOnly() throws IOException { public void testNlpOnly() throws IOException { Settings settings = Settings.builder().put("path.home", createTempDir()).build(); - MlTestExtensionLoader loader 
= new MlTestExtensionLoader(new MlTestExtension(false, false, false, false, true, false)); + MlTestExtensionLoader loader = new MlTestExtensionLoader(new MlTestExtension(false, false, false, false, true)); try (MachineLearning machineLearning = createTrialLicensedMachineLearning(settings, loader)) { List restHandlers = machineLearning.getRestHandlers(settings, null, null, null, null, null, null, null, null); assertThat(restHandlers, hasItem(instanceOf(RestMlInfoAction.class))); @@ -287,22 +287,19 @@ public static class MlTestExtension implements MachineLearningExtension { private final boolean isAnomalyDetectionEnabled; private final boolean isDataFrameAnalyticsEnabled; private final boolean isNlpEnabled; - private final boolean isLearningToRankEnabled; MlTestExtension( boolean useIlm, boolean includeNodeInfo, boolean isAnomalyDetectionEnabled, boolean isDataFrameAnalyticsEnabled, - boolean isNlpEnabled, - boolean isLearningToRankEnabled + boolean isNlpEnabled ) { this.useIlm = useIlm; this.includeNodeInfo = includeNodeInfo; this.isAnomalyDetectionEnabled = isAnomalyDetectionEnabled; this.isDataFrameAnalyticsEnabled = isDataFrameAnalyticsEnabled; this.isNlpEnabled = isNlpEnabled; - this.isLearningToRankEnabled = isLearningToRankEnabled; } @Override @@ -330,11 +327,6 @@ public boolean isNlpEnabled() { return isNlpEnabled; } - @Override - public boolean isLearningToRankEnabled() { - return isLearningToRankEnabled; - } - @Override public String[] getAnalyticsDestIndexAllowedSettings() { return ANALYTICS_DEST_INDEX_ALLOWED_SETTINGS; From 592858281400cfa608080aca5dac8331d3ea1f5c Mon Sep 17 00:00:00 2001 From: Fang Xing <155562079+fang-xing-esql@users.noreply.github.com> Date: Thu, 29 Aug 2024 12:03:03 -0400 Subject: [PATCH 053/144] [ES|QL] Combine 3 commonTypes into one (#112220) Combine 3 commonTypes into one. 
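The three duplicate implementations (DataTypeConverter.commonType,
EsqlDataTypeRegistry.commonType and EsqlDataTypeConverter.commonType) now route
through the single EsqlDataTypeConverter.commonType. A sketch of the promotion
rules the surviving method is expected to preserve, read off the removed
DataTypeConverter version below (the assertions are illustrative, not part of
the patch):

    // NULL yields the other operand's type
    assert commonType(NULL, LONG) == LONG;
    // among strings, TEXT wins over KEYWORD
    assert commonType(KEYWORD, TEXT) == TEXT;
    // whole numbers promote to the widest, with UNSIGNED_LONG taking precedence
    assert commonType(INTEGER, LONG) == LONG;
    assert commonType(LONG, UNSIGNED_LONG) == UNSIGNED_LONG;
    // a rational operand beats any whole number
    assert commonType(LONG, DOUBLE) == DOUBLE;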
--- .../esql/core/type/DataTypeConverter.java | 80 --------- .../predicate/operator/arithmetic/Add.java | 1 - .../arithmetic/ArithmeticOperation.java | 7 +- .../BinaryComparisonInversible.java | 2 +- .../predicate/operator/arithmetic/Div.java | 1 - .../arithmetic/EsqlArithmeticOperation.java | 5 +- .../predicate/operator/arithmetic/Mul.java | 1 - .../predicate/operator/arithmetic/Sub.java | 1 - .../comparison/EsqlBinaryComparison.java | 4 +- .../predicate/operator/comparison/In.java | 4 +- .../rules/SimplifyComparisonsArithmetics.java | 4 +- .../esql/type/EsqlDataTypeConverter.java | 77 +++++++-- .../xpack/esql/type/EsqlDataTypeRegistry.java | 24 --- .../esql/type/DataTypeConversionTests.java | 20 --- .../esql/type/EsqlDataTypeConverterTests.java | 158 ++++++++++++++++++ 15 files changed, 234 insertions(+), 155 deletions(-) rename x-pack/plugin/{esql-core/src/main/java/org/elasticsearch/xpack/esql/core => esql/src/main/java/org/elasticsearch/xpack/esql}/expression/predicate/operator/arithmetic/ArithmeticOperation.java (80%) rename x-pack/plugin/{esql-core/src/main/java/org/elasticsearch/xpack/esql/core => esql/src/main/java/org/elasticsearch/xpack/esql}/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java (91%) diff --git a/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/type/DataTypeConverter.java b/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/type/DataTypeConverter.java index 1e68d63ef7bb1..78b395503e700 100644 --- a/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/type/DataTypeConverter.java +++ b/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/type/DataTypeConverter.java @@ -38,7 +38,6 @@ import static org.elasticsearch.xpack.esql.core.type.DataType.UNSIGNED_LONG; import static org.elasticsearch.xpack.esql.core.type.DataType.VERSION; import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTime; -import static org.elasticsearch.xpack.esql.core.type.DataType.isPrimitiveAndSupported; import static org.elasticsearch.xpack.esql.core.type.DataType.isString; import static org.elasticsearch.xpack.esql.core.util.NumericUtils.UNSIGNED_LONG_MAX; import static org.elasticsearch.xpack.esql.core.util.NumericUtils.inUnsignedLongRange; @@ -51,85 +50,6 @@ public final class DataTypeConverter { private DataTypeConverter() {} - /** - * Returns the type compatible with both left and right types - *
    - * If one of the types is null - returns another type - * If both types are numeric - returns type with the highest precision int < long < float < double - * If one of the types is string and another numeric - returns numeric - */ - public static DataType commonType(DataType left, DataType right) { - if (left == right) { - return left; - } - if (left == NULL) { - return right; - } - if (right == NULL) { - return left; - } - if (isString(left) && isString(right)) { - if (left == TEXT || right == TEXT) { - return TEXT; - } - if (left == KEYWORD) { - return KEYWORD; - } - return right; - } - if (left.isNumeric() && right.isNumeric()) { - int lsize = left.estimatedSize().orElseThrow(); - int rsize = right.estimatedSize().orElseThrow(); - // if one is int - if (left.isWholeNumber()) { - // promote the highest int - if (right.isWholeNumber()) { - if (left == UNSIGNED_LONG || right == UNSIGNED_LONG) { - return UNSIGNED_LONG; - } - return lsize > rsize ? left : right; - } - // promote the rational - return right; - } - // try the other side - if (right.isWholeNumber()) { - return left; - } - // promote the highest rational - return lsize > rsize ? left : right; - } - if (isString(left)) { - if (right.isNumeric()) { - return right; - } - } - if (isString(right)) { - if (left.isNumeric()) { - return left; - } - } - - if (isDateTime(left) && isDateTime(right)) { - return DATETIME; - } - - // none found - return null; - } - - /** - * Returns true if the from type can be converted to the to type, false - otherwise - */ - public static boolean canConvert(DataType from, DataType to) { - // Special handling for nulls and if conversion is not requires - if (from == to || from == NULL) { - return true; - } - // only primitives are supported so far - return isPrimitiveAndSupported(from) && isPrimitiveAndSupported(to) && converterFor(from, to) != null; - } - /** * Get the conversion from one type to another. 
*/ diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Add.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Add.java index b6ec9b6fd0e23..8f8d885ee379b 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Add.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Add.java @@ -12,7 +12,6 @@ import org.elasticsearch.compute.ann.Evaluator; import org.elasticsearch.compute.ann.Fixed; import org.elasticsearch.xpack.esql.core.expression.Expression; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryComparisonInversible; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.util.NumericUtils; diff --git a/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/expression/predicate/operator/arithmetic/ArithmeticOperation.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/ArithmeticOperation.java similarity index 80% rename from x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/expression/predicate/operator/arithmetic/ArithmeticOperation.java rename to x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/ArithmeticOperation.java index 8dc0f58083179..cb7e7c4643fb9 100644 --- a/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/expression/predicate/operator/arithmetic/ArithmeticOperation.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/ArithmeticOperation.java @@ -4,16 +4,17 @@ * 2.0; you may not use this file except in compliance with the Elastic License * 2.0. 
*/ -package org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic; +package org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic; import org.elasticsearch.xpack.esql.core.expression.Expression; import org.elasticsearch.xpack.esql.core.expression.TypeResolutions.ParamOrdinal; import org.elasticsearch.xpack.esql.core.expression.predicate.BinaryOperator; +import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryArithmeticOperation; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.DataType; -import org.elasticsearch.xpack.esql.core.type.DataTypeConverter; import static org.elasticsearch.xpack.esql.core.expression.TypeResolutions.isNumeric; +import static org.elasticsearch.xpack.esql.type.EsqlDataTypeConverter.commonType; public abstract class ArithmeticOperation extends BinaryOperator { @@ -36,7 +37,7 @@ public ArithmeticOperation swapLeftAndRight() { @Override public DataType dataType() { if (dataType == null) { - dataType = DataTypeConverter.commonType(left().dataType(), right().dataType()); + dataType = commonType(left().dataType(), right().dataType()); } return dataType; } diff --git a/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java similarity index 91% rename from x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java rename to x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java index 358ad59ec6356..b0ab4c48d970e 100644 --- a/x-pack/plugin/esql-core/src/main/java/org/elasticsearch/xpack/esql/core/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/BinaryComparisonInversible.java @@ -5,7 +5,7 @@ * 2.0. 
*/ -package org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic; +package org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic; import org.elasticsearch.xpack.esql.core.expression.Expression; import org.elasticsearch.xpack.esql.core.tree.Source; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Div.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Div.java index 0e4c506a90d85..f1e197cf350b6 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Div.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Div.java @@ -11,7 +11,6 @@ import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.compute.ann.Evaluator; import org.elasticsearch.xpack.esql.core.expression.Expression; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryComparisonInversible; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.DataType; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/EsqlArithmeticOperation.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/EsqlArithmeticOperation.java index 647071c44cfd3..400e70b641111 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/EsqlArithmeticOperation.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/EsqlArithmeticOperation.java @@ -13,14 +13,12 @@ import org.elasticsearch.compute.operator.EvalOperator.ExpressionEvaluator; import org.elasticsearch.xpack.esql.EsqlIllegalArgumentException; import org.elasticsearch.xpack.esql.core.expression.Expression; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.ArithmeticOperation; import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryArithmeticOperation; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.DataType; import org.elasticsearch.xpack.esql.evaluator.mapper.EvaluatorMapper; import org.elasticsearch.xpack.esql.expression.function.scalar.math.Cast; import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; -import org.elasticsearch.xpack.esql.type.EsqlDataTypeRegistry; import java.io.IOException; import java.util.List; @@ -31,6 +29,7 @@ import static org.elasticsearch.xpack.esql.core.type.DataType.INTEGER; import static org.elasticsearch.xpack.esql.core.type.DataType.LONG; import static org.elasticsearch.xpack.esql.core.type.DataType.UNSIGNED_LONG; +import static org.elasticsearch.xpack.esql.type.EsqlDataTypeConverter.commonType; public abstract class EsqlArithmeticOperation extends ArithmeticOperation implements EvaluatorMapper { public static List getNamedWriteables() { @@ -133,7 +132,7 @@ public Object fold() { public DataType dataType() { if (dataType == null) { - dataType = EsqlDataTypeRegistry.INSTANCE.commonType(left().dataType(), right().dataType()); + dataType = commonType(left().dataType(), right().dataType()); } return dataType; } diff --git 
a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Mul.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Mul.java index a73562ff153b2..03981a821f52d 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Mul.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Mul.java @@ -11,7 +11,6 @@ import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.compute.ann.Evaluator; import org.elasticsearch.xpack.esql.core.expression.Expression; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryComparisonInversible; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.util.NumericUtils; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Sub.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Sub.java index ee2ccc3b7107a..27f5579129cc9 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Sub.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/arithmetic/Sub.java @@ -12,7 +12,6 @@ import org.elasticsearch.compute.ann.Evaluator; import org.elasticsearch.compute.ann.Fixed; import org.elasticsearch.xpack.esql.core.expression.Expression; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryComparisonInversible; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.DataType; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/EsqlBinaryComparison.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/EsqlBinaryComparison.java index 52d4c111b2eae..b50d70e69819d 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/EsqlBinaryComparison.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/EsqlBinaryComparison.java @@ -22,7 +22,6 @@ import org.elasticsearch.xpack.esql.expression.function.scalar.math.Cast; import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.EsqlArithmeticOperation; import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; -import org.elasticsearch.xpack.esql.type.EsqlDataTypeRegistry; import java.io.IOException; import java.time.ZoneId; @@ -32,6 +31,7 @@ import static org.elasticsearch.common.logging.LoggerMessageFormat.format; import static org.elasticsearch.xpack.esql.core.type.DataType.UNSIGNED_LONG; +import static org.elasticsearch.xpack.esql.type.EsqlDataTypeConverter.commonType; public abstract class EsqlBinaryComparison extends BinaryComparison implements EvaluatorMapper { public static List getNamedWriteables() { @@ -172,7 +172,7 @@ public EvalOperator.ExpressionEvaluator.Factory toEvaluator( Function toEvaluator ) { // Our type is always boolean, so figure out the evaluator type from the inputs - DataType commonType = 
EsqlDataTypeRegistry.INSTANCE.commonType(left().dataType(), right().dataType()); + DataType commonType = commonType(left().dataType(), right().dataType()); EvalOperator.ExpressionEvaluator.Factory lhs; EvalOperator.ExpressionEvaluator.Factory rhs; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/In.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/In.java index 636b31fcc691b..333f32e82c579 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/In.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/expression/predicate/operator/comparison/In.java @@ -27,7 +27,7 @@ import org.elasticsearch.xpack.esql.expression.function.scalar.EsqlScalarFunction; import org.elasticsearch.xpack.esql.expression.function.scalar.math.Cast; import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; -import org.elasticsearch.xpack.esql.type.EsqlDataTypeRegistry; +import org.elasticsearch.xpack.esql.type.EsqlDataTypeConverter; import java.io.IOException; import java.util.BitSet; @@ -269,7 +269,7 @@ private DataType commonType() { break; } } - commonType = EsqlDataTypeRegistry.INSTANCE.commonType(commonType, e.dataType()); + commonType = EsqlDataTypeConverter.commonType(commonType, e.dataType()); } return commonType; } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/optimizer/rules/SimplifyComparisonsArithmetics.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/optimizer/rules/SimplifyComparisonsArithmetics.java index 4ef069ea16d04..fe83aeb647bf9 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/optimizer/rules/SimplifyComparisonsArithmetics.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/optimizer/rules/SimplifyComparisonsArithmetics.java @@ -9,10 +9,10 @@ import org.elasticsearch.xpack.esql.core.expression.Expression; import org.elasticsearch.xpack.esql.core.expression.Literal; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.ArithmeticOperation; -import org.elasticsearch.xpack.esql.core.expression.predicate.operator.arithmetic.BinaryComparisonInversible; import org.elasticsearch.xpack.esql.core.expression.predicate.operator.comparison.BinaryComparison; import org.elasticsearch.xpack.esql.core.type.DataType; +import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.ArithmeticOperation; +import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.BinaryComparisonInversible; import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Neg; import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Sub; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverter.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverter.java index 1572f8950e0ac..b090708a64ad3 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverter.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverter.java @@ -58,6 +58,7 @@ import static org.elasticsearch.xpack.esql.core.type.DataType.CARTESIAN_POINT; import static org.elasticsearch.xpack.esql.core.type.DataType.CARTESIAN_SHAPE; import static org.elasticsearch.xpack.esql.core.type.DataType.DATETIME; +import static 
org.elasticsearch.xpack.esql.core.type.DataType.DATE_PERIOD; import static org.elasticsearch.xpack.esql.core.type.DataType.DOUBLE; import static org.elasticsearch.xpack.esql.core.type.DataType.GEO_POINT; import static org.elasticsearch.xpack.esql.core.type.DataType.GEO_SHAPE; @@ -67,9 +68,14 @@ import static org.elasticsearch.xpack.esql.core.type.DataType.LONG; import static org.elasticsearch.xpack.esql.core.type.DataType.NULL; import static org.elasticsearch.xpack.esql.core.type.DataType.TEXT; +import static org.elasticsearch.xpack.esql.core.type.DataType.TIME_DURATION; import static org.elasticsearch.xpack.esql.core.type.DataType.UNSIGNED_LONG; import static org.elasticsearch.xpack.esql.core.type.DataType.VERSION; -import static org.elasticsearch.xpack.esql.core.type.DataType.isPrimitiveAndSupported; +import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTime; +import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTimeOrTemporal; +import static org.elasticsearch.xpack.esql.core.type.DataType.isNullOrDatePeriod; +import static org.elasticsearch.xpack.esql.core.type.DataType.isNullOrTemporalAmount; +import static org.elasticsearch.xpack.esql.core.type.DataType.isNullOrTimeDuration; import static org.elasticsearch.xpack.esql.core.type.DataType.isString; import static org.elasticsearch.xpack.esql.core.type.DataTypeConverter.safeDoubleToLong; import static org.elasticsearch.xpack.esql.core.type.DataTypeConverter.safeToInt; @@ -107,18 +113,6 @@ public class EsqlDataTypeConverter { entry(VERSION, ToVersion::new) ); - /** - * Returns true if the from type can be converted to the to type, false - otherwise - */ - public static boolean canConvert(DataType from, DataType to) { - // Special handling for nulls and if conversion is not requires - if (from == to || from == NULL) { - return true; - } - // only primitives are supported so far - return isPrimitiveAndSupported(from) && isPrimitiveAndSupported(to) && converterFor(from, to) != null; - } - public static Converter converterFor(DataType from, DataType to) { // TODO move EXPRESSION_TO_LONG here if there is no regression if (isString(from)) { @@ -230,8 +224,63 @@ public static Object convert(Object value, DataType dataType) { return converter.convert(value); } + /** + * Returns the type compatible with both left and right types + *
<p>
    + * If one of the types is null - returns the other type + * If both types are numeric - returns the type with the highest precision: int < long < float < double + */ public static DataType commonType(DataType left, DataType right) { - return DataTypeConverter.commonType(left, right); + if (left == right) { + return left; + } + if (left == NULL) { + return right; + } + if (right == NULL) { + return left; + } + if (isDateTimeOrTemporal(left) || isDateTimeOrTemporal(right)) { + if ((isDateTime(left) && isNullOrTemporalAmount(right)) || (isNullOrTemporalAmount(left) && isDateTime(right))) { + return DATETIME; + } + if (isNullOrTimeDuration(left) && isNullOrTimeDuration(right)) { + return TIME_DURATION; + } + if (isNullOrDatePeriod(left) && isNullOrDatePeriod(right)) { + return DATE_PERIOD; + } + } + if (isString(left) && isString(right)) { + if (left == TEXT || right == TEXT) { + return TEXT; + } + return right; + } + if (left.isNumeric() && right.isNumeric()) { + int lsize = left.estimatedSize().orElseThrow(); + int rsize = right.estimatedSize().orElseThrow(); + // if one is int + if (left.isWholeNumber()) { + // promote the highest int + if (right.isWholeNumber()) { + if (left == UNSIGNED_LONG || right == UNSIGNED_LONG) { + return UNSIGNED_LONG; + } + return lsize > rsize ? left : right; + } + // promote the rational + return right; + } + // try the other side + if (right.isWholeNumber()) { + return left; + } + // promote the highest rational + return lsize > rsize ? left : right; + } + // none found + return null; } // generally supporting abbreviations from https://en.wikipedia.org/wiki/Unit_of_time diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistry.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistry.java index 96e206b82cf0c..f8e8cd37dc8b2 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistry.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistry.java @@ -10,15 +10,6 @@ import org.elasticsearch.index.mapper.TimeSeriesParams; import org.elasticsearch.xpack.esql.core.type.DataType; -import static org.elasticsearch.xpack.esql.core.type.DataType.DATETIME; -import static org.elasticsearch.xpack.esql.core.type.DataType.DATE_PERIOD; -import static org.elasticsearch.xpack.esql.core.type.DataType.TIME_DURATION; -import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTime; -import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTimeOrTemporal; -import static org.elasticsearch.xpack.esql.core.type.DataType.isNullOrDatePeriod; -import static org.elasticsearch.xpack.esql.core.type.DataType.isNullOrTemporalAmount; -import static org.elasticsearch.xpack.esql.core.type.DataType.isNullOrTimeDuration; - public class EsqlDataTypeRegistry { public static final EsqlDataTypeRegistry INSTANCE = new EsqlDataTypeRegistry(); @@ -35,19 +26,4 @@ public DataType fromEs(String typeName, TimeSeriesParams.MetricType metricType) */ return metricType == TimeSeriesParams.MetricType.COUNTER ?
type.widenSmallNumeric().counter() : type; } - - public DataType commonType(DataType left, DataType right) { - if (isDateTimeOrTemporal(left) || isDateTimeOrTemporal(right)) { - if ((isDateTime(left) && isNullOrTemporalAmount(right)) || (isNullOrTemporalAmount(left) && isDateTime(right))) { - return DATETIME; - } - if (isNullOrTimeDuration(left) && isNullOrTimeDuration(right)) { - return TIME_DURATION; - } - if (isNullOrDatePeriod(left) && isNullOrDatePeriod(right)) { - return DATE_PERIOD; - } - } - return EsqlDataTypeConverter.commonType(left, right); - } } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/DataTypeConversionTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/DataTypeConversionTests.java index 9f8c8f91b7037..871bf632adcc6 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/DataTypeConversionTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/DataTypeConversionTests.java @@ -35,7 +35,6 @@ import static org.elasticsearch.xpack.esql.core.type.DataType.UNSIGNED_LONG; import static org.elasticsearch.xpack.esql.core.type.DataType.UNSUPPORTED; import static org.elasticsearch.xpack.esql.core.type.DataType.VERSION; -import static org.elasticsearch.xpack.esql.core.type.DataTypeConverter.commonType; import static org.elasticsearch.xpack.esql.core.type.DataTypeConverter.converterFor; import static org.elasticsearch.xpack.esql.core.util.DateUtils.asDateTime; @@ -522,25 +521,6 @@ public void testConversionToIdentity() { assertEquals(10, conversion.convert(10)); } - public void testCommonType() { - assertEquals(BOOLEAN, commonType(BOOLEAN, NULL)); - assertEquals(BOOLEAN, commonType(NULL, BOOLEAN)); - assertEquals(BOOLEAN, commonType(BOOLEAN, BOOLEAN)); - assertEquals(NULL, commonType(NULL, NULL)); - assertEquals(INTEGER, commonType(INTEGER, KEYWORD)); - assertEquals(LONG, commonType(TEXT, LONG)); - assertEquals(SHORT, commonType(SHORT, BYTE)); - assertEquals(FLOAT, commonType(BYTE, FLOAT)); - assertEquals(FLOAT, commonType(FLOAT, INTEGER)); - assertEquals(UNSIGNED_LONG, commonType(UNSIGNED_LONG, LONG)); - assertEquals(DOUBLE, commonType(DOUBLE, FLOAT)); - assertEquals(FLOAT, commonType(FLOAT, UNSIGNED_LONG)); - - // strings - assertEquals(TEXT, commonType(TEXT, KEYWORD)); - assertEquals(TEXT, commonType(KEYWORD, TEXT)); - } - public void testEsDataTypes() { for (DataType type : DataType.types()) { assertEquals(type, DataType.fromTypeName(type.typeName())); diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverterTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverterTests.java index 0997c88aac2b0..8ad083683f696 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverterTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeConverterTests.java @@ -8,6 +8,44 @@ package org.elasticsearch.xpack.esql.type; import org.elasticsearch.test.ESTestCase; +import org.elasticsearch.xpack.esql.core.type.DataType; + +import java.util.Arrays; +import java.util.List; + +import static org.elasticsearch.xpack.esql.core.type.DataType.BOOLEAN; +import static org.elasticsearch.xpack.esql.core.type.DataType.BYTE; +import static org.elasticsearch.xpack.esql.core.type.DataType.CARTESIAN_POINT; +import static org.elasticsearch.xpack.esql.core.type.DataType.CARTESIAN_SHAPE; +import static 
org.elasticsearch.xpack.esql.core.type.DataType.COUNTER_DOUBLE; +import static org.elasticsearch.xpack.esql.core.type.DataType.COUNTER_INTEGER; +import static org.elasticsearch.xpack.esql.core.type.DataType.COUNTER_LONG; +import static org.elasticsearch.xpack.esql.core.type.DataType.DATETIME; +import static org.elasticsearch.xpack.esql.core.type.DataType.DATE_NANOS; +import static org.elasticsearch.xpack.esql.core.type.DataType.DOC_DATA_TYPE; +import static org.elasticsearch.xpack.esql.core.type.DataType.DOUBLE; +import static org.elasticsearch.xpack.esql.core.type.DataType.FLOAT; +import static org.elasticsearch.xpack.esql.core.type.DataType.GEO_POINT; +import static org.elasticsearch.xpack.esql.core.type.DataType.GEO_SHAPE; +import static org.elasticsearch.xpack.esql.core.type.DataType.HALF_FLOAT; +import static org.elasticsearch.xpack.esql.core.type.DataType.INTEGER; +import static org.elasticsearch.xpack.esql.core.type.DataType.IP; +import static org.elasticsearch.xpack.esql.core.type.DataType.LONG; +import static org.elasticsearch.xpack.esql.core.type.DataType.NULL; +import static org.elasticsearch.xpack.esql.core.type.DataType.OBJECT; +import static org.elasticsearch.xpack.esql.core.type.DataType.PARTIAL_AGG; +import static org.elasticsearch.xpack.esql.core.type.DataType.SCALED_FLOAT; +import static org.elasticsearch.xpack.esql.core.type.DataType.SHORT; +import static org.elasticsearch.xpack.esql.core.type.DataType.SOURCE; +import static org.elasticsearch.xpack.esql.core.type.DataType.TEXT; +import static org.elasticsearch.xpack.esql.core.type.DataType.TSID_DATA_TYPE; +import static org.elasticsearch.xpack.esql.core.type.DataType.UNSIGNED_LONG; +import static org.elasticsearch.xpack.esql.core.type.DataType.UNSUPPORTED; +import static org.elasticsearch.xpack.esql.core.type.DataType.VERSION; +import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTime; +import static org.elasticsearch.xpack.esql.core.type.DataType.isDateTimeOrTemporal; +import static org.elasticsearch.xpack.esql.core.type.DataType.isString; +import static org.elasticsearch.xpack.esql.type.EsqlDataTypeConverter.commonType; public class EsqlDataTypeConverterTests extends ESTestCase { @@ -16,4 +54,124 @@ public void testNanoTimeToString() { long actual = EsqlDataTypeConverter.dateNanosToLong(EsqlDataTypeConverter.nanoTimeToString(expected)); assertEquals(expected, actual); } + + public void testCommonTypeNull() { + for (DataType dataType : DataType.values()) { + assertEqualsCommonType(dataType, NULL, dataType); + } + } + + public void testCommonTypeStrings() { + List STRINGS = Arrays.stream(DataType.values()).filter(DataType::isString).toList(); + for (DataType dataType1 : STRINGS) { + for (DataType dataType2 : DataType.values()) { + if (dataType2 == NULL) { + assertEqualsCommonType(dataType1, NULL, dataType1); + } else if ((isString(dataType1) && isString(dataType2))) { + if (dataType1 == dataType2) { + assertEqualsCommonType(dataType1, dataType2, dataType1); + } else { + assertEqualsCommonType(dataType1, dataType2, TEXT); + } + } else { + assertNullCommonType(dataType1, dataType2); + } + } + } + } + + public void testCommonTypeDateTimeIntervals() { + List DATE_TIME_INTERVALS = Arrays.stream(DataType.values()).filter(DataType::isDateTimeOrTemporal).toList(); + for (DataType dataType1 : DATE_TIME_INTERVALS) { + for (DataType dataType2 : DataType.values()) { + if (dataType2 == NULL) { + assertEqualsCommonType(dataType1, NULL, dataType1); + } else if (isDateTimeOrTemporal(dataType2)) { + if 
(isDateTime(dataType1) || isDateTime(dataType2)) { + assertEqualsCommonType(dataType1, dataType2, DATETIME); + } else if (dataType1 == dataType2) { + assertEqualsCommonType(dataType1, dataType2, dataType1); + } else { + assertNullCommonType(dataType1, dataType2); + } + } else { + assertNullCommonType(dataType1, dataType2); + } + } + } + } + + public void testCommonTypeNumeric() { + // whole numbers + commonNumericType(BYTE, List.of(NULL, BYTE)); + commonNumericType(SHORT, List.of(NULL, BYTE, SHORT)); + commonNumericType(INTEGER, List.of(NULL, BYTE, SHORT, INTEGER)); + commonNumericType(LONG, List.of(NULL, BYTE, SHORT, INTEGER, LONG)); + commonNumericType(UNSIGNED_LONG, List.of(NULL, BYTE, SHORT, INTEGER, LONG, UNSIGNED_LONG)); + // floats + commonNumericType(HALF_FLOAT, List.of(NULL, BYTE, SHORT, INTEGER, LONG, UNSIGNED_LONG, HALF_FLOAT, FLOAT)); + commonNumericType(FLOAT, List.of(NULL, BYTE, SHORT, INTEGER, LONG, UNSIGNED_LONG, FLOAT, HALF_FLOAT)); + commonNumericType(DOUBLE, List.of(NULL, BYTE, SHORT, INTEGER, LONG, UNSIGNED_LONG, HALF_FLOAT, FLOAT, DOUBLE, SCALED_FLOAT)); + commonNumericType(SCALED_FLOAT, List.of(NULL, BYTE, SHORT, INTEGER, LONG, UNSIGNED_LONG, HALF_FLOAT, FLOAT, SCALED_FLOAT, DOUBLE)); + } + + /** + * The first argument and the second argument(s) have the first argument as a common type. + */ + private static void commonNumericType(DataType numericType, List lowerTypes) { + List NUMERICS = Arrays.stream(DataType.values()).filter(DataType::isNumeric).toList(); + List DOUBLES = Arrays.stream(DataType.values()).filter(DataType::isRationalNumber).toList(); + for (DataType dataType : DataType.values()) { + if (DOUBLES.containsAll(List.of(numericType, dataType)) && (dataType.estimatedSize().equals(numericType.estimatedSize()))) { + assertEquals(numericType, commonType(dataType, numericType)); + } else if (lowerTypes.contains(dataType)) { + assertEqualsCommonType(numericType, dataType, numericType); + } else if (NUMERICS.contains(dataType)) { + assertEqualsCommonType(numericType, dataType, dataType); + } else { + assertNullCommonType(numericType, dataType); + } + } + } + + public void testCommonTypeMiscellaneous() { + List MISCELLANEOUS = List.of( + COUNTER_INTEGER, + COUNTER_LONG, + COUNTER_DOUBLE, + UNSUPPORTED, + OBJECT, + SOURCE, + DATE_NANOS, + DOC_DATA_TYPE, + TSID_DATA_TYPE, + PARTIAL_AGG, + IP, + VERSION, + GEO_POINT, + GEO_SHAPE, + CARTESIAN_POINT, + CARTESIAN_SHAPE, + BOOLEAN + ); + for (DataType dataType1 : MISCELLANEOUS) { + for (DataType dataType2 : DataType.values()) { + if (dataType2 == NULL || dataType1 == dataType2) { + assertEqualsCommonType(dataType1, dataType2, dataType1); + } else { + assertNullCommonType(dataType1, dataType2); + } + } + } + } + + private static void assertEqualsCommonType(DataType dataType1, DataType dataType2, DataType commonType) { + assertEquals(commonType, commonType(dataType1, dataType2)); + assertEquals(commonType, commonType(dataType2, dataType1)); + } + + private static void assertNullCommonType(DataType dataType1, DataType dataType2) { + assertNull(commonType(dataType1, dataType2)); + assertNull(commonType(dataType2, dataType1)); + } } From e3e562ffbfb981014bdd71bf663bb6f972f5e352 Mon Sep 17 00:00:00 2001 From: David Kyle Date: Thu, 29 Aug 2024 17:18:54 +0100 Subject: [PATCH 054/144] [ML] Support sparse embedding models in the elasticsearch inference service (#112270) For a sparse embedding model created with the ml trained models APIs --- docs/changelog/112270.yaml | 5 + .../inference/service-elasticsearch.asciidoc | 3 +- 
.../xpack/inference/CustomElandModelIT.java | 134 +++++++++ .../xpack/inference/RerankingIT.java | 8 +- .../BaseElasticsearchInternalService.java | 6 +- .../ElasticsearchInternalService.java | 151 +++------- .../services/elser/ElserInternalService.java | 28 -- .../ElasticsearchInternalServiceTests.java | 278 +++++++++++------- 8 files changed, 363 insertions(+), 250 deletions(-) create mode 100644 docs/changelog/112270.yaml create mode 100644 x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/CustomElandModelIT.java diff --git a/docs/changelog/112270.yaml b/docs/changelog/112270.yaml new file mode 100644 index 0000000000000..1e6b9c7fc9290 --- /dev/null +++ b/docs/changelog/112270.yaml @@ -0,0 +1,5 @@ +pr: 112270 +summary: Support sparse embedding models in the elasticsearch inference service +area: Machine Learning +type: enhancement +issues: [] diff --git a/docs/reference/inference/service-elasticsearch.asciidoc b/docs/reference/inference/service-elasticsearch.asciidoc index 99fd41ee2db65..572cad591fba6 100644 --- a/docs/reference/inference/service-elasticsearch.asciidoc +++ b/docs/reference/inference/service-elasticsearch.asciidoc @@ -31,6 +31,7 @@ include::inference-shared.asciidoc[tag=task-type] Available task types: * `rerank`, +* `sparse_embedding`, * `text_embedding`. -- @@ -182,4 +183,4 @@ PUT _inference/text_embedding/my-e5-model } } ------------------------------------------------------------ -// TEST[skip:TBD] \ No newline at end of file +// TEST[skip:TBD] diff --git a/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/CustomElandModelIT.java b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/CustomElandModelIT.java new file mode 100644 index 0000000000000..65b7a138e7e1e --- /dev/null +++ b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/CustomElandModelIT.java @@ -0,0 +1,134 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */ + +package org.elasticsearch.xpack.inference; + +import org.elasticsearch.client.Request; +import org.elasticsearch.core.Strings; +import org.elasticsearch.inference.TaskType; + +import java.io.IOException; +import java.util.ArrayList; +import java.util.Base64; +import java.util.List; +import java.util.stream.Collectors; + +public class CustomElandModelIT extends InferenceBaseRestTest { + + // The model definition is taken from org.elasticsearch.xpack.ml.integration.TextExpansionQueryIT + + static final String BASE_64_ENCODED_MODEL = "UEsDBAAACAgAAAAAAAAAAAAAAAAAA" + + "AAAAAAUAA4Ac2ltcGxlbW9kZWwvZGF0YS5wa2xGQgoAWlpaWlpaWlpaWoACY19fdG9yY2hfXwpUaW55VG" + + "V4dEV4cGFuc2lvbgpxACmBfShYCAAAAHRyYWluaW5ncQGJWBYAAABfaXNfZnVsbF9iYWNrd2FyZF9ob29" + + "rcQJOdWJxAy5QSwcIITmbsFgAAABYAAAAUEsDBBQACAgIAAAAAAAAAAAAAAAAAAAAAAAdAB0Ac2ltcGxl" + + "bW9kZWwvY29kZS9fX3RvcmNoX18ucHlGQhkAWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWoWRT4+cMAzF7" + + "/spfASJomF3e0Ga3nrrn8vcELIyxAzRhAQlpjvbT19DWDrdquqBA/bvPT87nVUxwsm41xPd+PNtUi4a77" + + "KvXs+W8voBAHFSQY3EFCIiHKFp1+p57vs/ShyUccZdoIaz93aBTMR+thbPqru+qKBx8P4q/e8TyxRlmwVc" + + "tJp66H1YmCyS7WsZwD50A2L5V7pCBADGTTOj0bGGE7noQyqzv5JDfp0o9fZRCWqP37yjhE4+mqX5X3AdF" + + "ZHGM/2TzOHDpy1IvQWR+OWo3KwsRiKdpcqg4pBFDtm+QJ7nqwIPckrlnGfFJG0uNhOl38Sjut3pCqg26Qu" + + "Zy8BR9In7ScHHrKkKMW0TIucFrGQXCMpdaDO05O6DpOiy8e4kr0Ed/2YKOIhplW8gPr4ntygrd9ixpx3j9" + + "UZZVRagl2c6+imWUzBjuf5m+Ch7afphuvvW+r/0dsfn+2N9MZGb9+/SFtCYdhd83CMYp+mGy0LiKNs8y/e" + + "UuEA8B/d2z4dfUEsHCFSE3IaCAQAAIAMAAFBLAwQUAAgICAAAAAAAAAAAAAAAAAAAAAAAJwApAHNpbXBsZ" + + "W1vZGVsL2NvZGUvX190b3JjaF9fLnB5LmRlYnVnX3BrbEZCJQBaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlp" + + "aWlpaWlpaWlpaWlpahZHLbtNAFIZtp03rSVIuLRKXjdk5ojitKJsiFq24lem0KKSqpRIZt55gE9/GM+lNL" + + "Fgx4i1Ys2aHhIBXgAVICNggHgNm6rqJN2BZGv36/v/MOWeea/Z5RVHurLfRUsfZXOnccx522itrd53O0vL" + + "qbaKYtsAKUe1pcege7hm9JNtzM8+kOOzNApIX0A3xBXE6YE7g0UWjg2OaZAJXbKvALOnj2GEHKc496ykLkt" + + "gNt3Jz17hprCUxFqExe7YIpQkNpO1/kfHhPUdtUAdH2/gfmeYiIFW7IkM6IBP2wrDNbMe3Mjf2ksiK3Hjg" + + "hg7F2DN9l/omZZl5Mmez2QRk0q4WUUB0+1oh9nDwxGdUXJdXPMRZQs352eGaRPV9s2lcMeZFGWBfKJJiw0Y" + + "gbCMLBaRmXyy4flx6a667Fch55q05QOq2Jg2ANOyZwplhNsjiohVApo7aa21QnNGW5+4GXv8gxK1beBeHSR" + + "rhmLXWVh+0aBhErZ7bx1ejxMOhlR6QU4ycNqGyk8/yNGCWkwY7/RCD7UEQek4QszCgDJAzZtfErA0VqHBy9" + + "ugQP9pUfUmgCjVYgWNwHFbhBJyEOgSwBuuwARWZmoI6J9PwLfzEocpRpPrT8DP8wqHG0b4UX+E3DiscvRgl" + + "XIoi81KKPwioHI5x9EooNKWiy0KOc/T6WF4SssrRuzJ9L2VNRXUhJzj6UKYfS4W/q/5wuh/l4M9R9qsU+y2" + + "dpoo2hJzkaEET8r6KRONicnRdK9EbUi6raFVIwNGjsrlbpk6ZPi7TbS3fv3LyNjPiEKzG0aG0tvNb6xw90/" + + "whe6ONjnJcUxobHDUqQ8bIOW79BVBLBwhfSmPKdAIAAE4EAABQSwMEAAAICAAAAAAAAAAAAAAAAAAAAAAAA" + + "BkABQBzaW1wbGVtb2RlbC9jb25zdGFudHMucGtsRkIBAFqAAikuUEsHCG0vCVcEAAAABAAAAFBLAwQAAAgI" + + "AAAAAAAAAAAAAAAAAAAAAAAAEwA7AHNpbXBsZW1vZGVsL3ZlcnNpb25GQjcAWlpaWlpaWlpaWlpaWlpaWlp" + + "aWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWlpaWjMKUEsHCNGeZ1UCAAAAAgAAAFBLAQIAAA" + + "AACAgAAAAAAAAhOZuwWAAAAFgAAAAUAAAAAAAAAAAAAAAAAAAAAABzaW1wbGVtb2RlbC9kYXRhLnBrbFBLA" + + "QIAABQACAgIAAAAAABUhNyGggEAACADAAAdAAAAAAAAAAAAAAAAAKgAAABzaW1wbGVtb2RlbC9jb2RlL19f" + + "dG9yY2hfXy5weVBLAQIAABQACAgIAAAAAABfSmPKdAIAAE4EAAAnAAAAAAAAAAAAAAAAAJICAABzaW1wbGVt" + + "b2RlbC9jb2RlL19fdG9yY2hfXy5weS5kZWJ1Z19wa2xQSwECAAAAAAgIAAAAAAAAbS8JVwQAAAAEAAAAGQAA" + + "AAAAAAAAAAAAAACEBQAAc2ltcGxlbW9kZWwvY29uc3RhbnRzLnBrbFBLAQIAAAAACAgAAAAAAADRnmdVAgAA" + + "AAIAAAATAAAAAAAAAAAAAAAAANQFAABzaW1wbGVtb2RlbC92ZXJzaW9uUEsGBiwAAAAAAAAAHgMtAAAAAAAA" + + "AAAABQAAAAAAAAAFAAAAAAAAAGoBAAAAAAAAUgYAAAAAAABQSwYHAAAAALwHAAAAAAAAAQAAAFBLBQYAAAAABQAFAGoBAABSBgAAAAA="; + 
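+    // The static block below decodes the blob once so RAW_MODEL_SIZE holds the raw
+    // (decoded) definition length; putModelDefinition later reports this value as
+    // total_definition_length, which must match the un-encoded model size rather than
+    // the length of the base64 string.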
+ static final long RAW_MODEL_SIZE; // size of the model before base64 encoding + static { + RAW_MODEL_SIZE = Base64.getDecoder().decode(BASE_64_ENCODED_MODEL).length; + } + + // Test a sparse embedding model deployed with the ml trained models APIs + public void testSparse() throws IOException { + String modelId = "custom-text-expansion-model"; + + createTextExpansionModel(modelId); + putModelDefinition(modelId, BASE_64_ENCODED_MODEL, RAW_MODEL_SIZE); + putVocabulary( + List.of("these", "are", "my", "words", "the", "washing", "machine", "is", "leaking", "octopus", "comforter", "smells"), + modelId + ); + + var inferenceConfig = """ + { + "service": "elasticsearch", + "service_settings": { + "model_id": "custom-text-expansion-model", + "num_allocations": 1, + "num_threads": 1 + } + } + """; + + var inferenceId = "sparse-inf"; + putModel(inferenceId, inferenceConfig, TaskType.SPARSE_EMBEDDING); + var results = inferOnMockService(inferenceId, List.of("washing", "machine")); + deleteModel(inferenceId); + assertNotNull(results.get("sparse_embedding")); + } + + protected void createTextExpansionModel(String modelId) throws IOException { + // with_special_tokens: false for this test with limited vocab + Request request = new Request("PUT", "/_ml/trained_models/" + modelId); + request.setJsonEntity(""" + { + "description": "a text expansion model", + "model_type": "pytorch", + "inference_config": { + "text_expansion": { + "tokenization": { + "bert": { + "with_special_tokens": false + } + } + } + } + }"""); + client().performRequest(request); + } + + protected void putVocabulary(List vocabulary, String modelId) throws IOException { + List vocabularyWithPad = new ArrayList<>(); + vocabularyWithPad.add("[PAD]"); + vocabularyWithPad.add("[UNK]"); + vocabularyWithPad.addAll(vocabulary); + String quotedWords = vocabularyWithPad.stream().map(s -> "\"" + s + "\"").collect(Collectors.joining(",")); + + Request request = new Request("PUT", "_ml/trained_models/" + modelId + "/vocabulary"); + request.setJsonEntity(Strings.format(""" + { "vocabulary": [%s] } + """, quotedWords)); + client().performRequest(request); + } + + protected void putModelDefinition(String modelId, String base64EncodedModel, long unencodedModelSize) throws IOException { + Request request = new Request("PUT", "_ml/trained_models/" + modelId + "/definition/0"); + String body = Strings.format(""" + {"total_definition_length":%s,"definition": "%s","total_parts": 1}""", unencodedModelSize, base64EncodedModel); + request.setJsonEntity(body); + client().performRequest(request); + } +} diff --git a/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/RerankingIT.java b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/RerankingIT.java index 77251ada4c488..893d3fb3e9b80 100644 --- a/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/RerankingIT.java +++ b/x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/RerankingIT.java @@ -35,7 +35,7 @@ private String putCohereRerankEndpoint() throws IOException { "api_key": "" } } - """);// TODO remove key + """); return endpointID; } @@ -61,7 +61,7 @@ private String putCohereRerankEndpointWithDocuments() throws IOException { "return_documents": true } } - """);// TODO remove key + """); return endpointID; } @@ -81,13 +81,13 @@ private String putCohereRerankEndpointWithTop2() throws 
IOException { "service": "cohere", "service_settings": { "model_id": "rerank-english-v2.0", - "api_key": "8TNPBvpBO7oN97009HQHzQbBhNrxmREbcJrZCwkK" + "api_key": "" }, "task_settings": { "top_n": 2 } } - """);// TODO remove key + """); return endpointID; } diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/BaseElasticsearchInternalService.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/BaseElasticsearchInternalService.java index 574ca77d4587e..457416370e559 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/BaseElasticsearchInternalService.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/BaseElasticsearchInternalService.java @@ -154,10 +154,10 @@ public void isModelDownloaded(Model model, ActionListener listener) { executeAsyncWithOrigin(client, INFERENCE_ORIGIN, GetTrainedModelsAction.INSTANCE, getRequest, getModelsResponseListener); } else { listener.onFailure( - new IllegalArgumentException( - "Unable to determine supported model for [" + new IllegalStateException( + "Can not check the download status of the model used by [" + model.getConfigurations().getInferenceEntityId() - + "] please verify the request and submit a bug report if necessary." + + "] as the model_id cannot be found." ) ); } diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalService.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalService.java index c3a0111562319..cca8ae63e974c 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalService.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalService.java @@ -7,8 +7,6 @@ package org.elasticsearch.xpack.inference.services.elasticsearch; -import org.apache.logging.log4j.LogManager; -import org.apache.logging.log4j.Logger; import org.elasticsearch.ElasticsearchStatusException; import org.elasticsearch.TransportVersion; import org.elasticsearch.TransportVersions; @@ -27,19 +25,18 @@ import org.elasticsearch.inference.TaskType; import org.elasticsearch.rest.RestStatus; import org.elasticsearch.xpack.core.inference.results.ErrorChunkedInferenceResults; +import org.elasticsearch.xpack.core.inference.results.InferenceChunkedSparseEmbeddingResults; import org.elasticsearch.xpack.core.inference.results.InferenceChunkedTextEmbeddingFloatResults; import org.elasticsearch.xpack.core.inference.results.InferenceTextEmbeddingFloatResults; import org.elasticsearch.xpack.core.inference.results.RankedDocsResults; +import org.elasticsearch.xpack.core.inference.results.SparseEmbeddingResults; import org.elasticsearch.xpack.core.ml.action.GetTrainedModelsAction; import org.elasticsearch.xpack.core.ml.action.InferModelAction; -import org.elasticsearch.xpack.core.ml.action.PutTrainedModelAction; -import org.elasticsearch.xpack.core.ml.action.StartTrainedModelDeploymentAction; -import org.elasticsearch.xpack.core.ml.action.StopTrainedModelDeploymentAction; -import org.elasticsearch.xpack.core.ml.inference.TrainedModelConfig; -import org.elasticsearch.xpack.core.ml.inference.TrainedModelInput; import org.elasticsearch.xpack.core.ml.inference.results.ErrorInferenceResults; import 
org.elasticsearch.xpack.core.ml.inference.results.MlChunkedTextEmbeddingFloatResults; +import org.elasticsearch.xpack.core.ml.inference.results.MlChunkedTextExpansionResults; import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextEmbeddingConfigUpdate; +import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextExpansionConfigUpdate; import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextSimilarityConfigUpdate; import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TokenizationConfigUpdate; import org.elasticsearch.xpack.inference.services.ConfigurationParseContext; @@ -53,8 +50,6 @@ import java.util.Set; import java.util.function.Function; -import static org.elasticsearch.xpack.core.ClientHelper.INFERENCE_ORIGIN; -import static org.elasticsearch.xpack.core.ClientHelper.executeAsyncWithOrigin; import static org.elasticsearch.xpack.core.inference.results.ResultUtils.createInvalidChunkedResultException; import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeFromMap; import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeFromMapOrThrowIfNull; @@ -71,15 +66,13 @@ public class ElasticsearchInternalService extends BaseElasticsearchInternalServi MULTILINGUAL_E5_SMALL_MODEL_ID_LINUX_X86 ); - private static final Logger logger = LogManager.getLogger(ElasticsearchInternalService.class); - public ElasticsearchInternalService(InferenceServiceExtension.InferenceServiceFactoryContext context) { super(context); } @Override protected EnumSet supportedTaskTypes() { - return EnumSet.of(TaskType.RERANK, TaskType.TEXT_EMBEDDING); + return EnumSet.of(TaskType.RERANK, TaskType.TEXT_EMBEDDING, TaskType.SPARSE_EMBEDDING); } @Override @@ -161,6 +154,12 @@ private static CustomElandModel createCustomElandModel( NAME, CustomElandInternalTextEmbeddingServiceSettings.fromMap(serviceSettings, context) ); + case SPARSE_EMBEDDING -> new CustomElandModel( + inferenceEntityId, + taskType, + NAME, + elandServiceSettings(serviceSettings, context) + ); case RERANK -> new CustomElandRerankModel( inferenceEntityId, taskType, @@ -334,6 +333,8 @@ public void infer( inferTextEmbedding(model, input, inputType, timeout, listener); } else if (TaskType.RERANK.equals(taskType)) { inferRerank(model, query, input, inputType, timeout, taskSettings, listener); + } else if (TaskType.SPARSE_EMBEDDING.equals(taskType)) { + inferSparseEmbedding(model, input, inputType, timeout, listener); } else { throw new ElasticsearchStatusException(TaskType.unsupportedTaskTypeErrorMsg(taskType, NAME), RestStatus.BAD_REQUEST); } @@ -364,6 +365,31 @@ public void inferTextEmbedding( ); } + public void inferSparseEmbedding( + Model model, + List inputs, + InputType inputType, + TimeValue timeout, + ActionListener listener + ) { + var request = buildInferenceRequest( + model.getConfigurations().getInferenceEntityId(), + TextExpansionConfigUpdate.EMPTY_UPDATE, + inputs, + inputType, + timeout, + false + ); + + client.execute( + InferModelAction.INSTANCE, + request, + listener.delegateFailureAndWrap( + (l, inferenceResult) -> l.onResponse(SparseEmbeddingResults.of(inferenceResult.getInferenceResults())) + ) + ); + } + public void inferRerank( Model model, String query, @@ -422,7 +448,7 @@ public void chunkedInfer( TimeValue timeout, ActionListener> listener ) { - if (TaskType.TEXT_EMBEDDING.isAnyOrSame(model.getTaskType()) == false) { + if ((TaskType.TEXT_EMBEDDING.equals(model.getTaskType()) || TaskType.SPARSE_EMBEDDING.equals(model.getTaskType())) == false) { listener.onFailure( new 
ElasticsearchStatusException(TaskType.unsupportedTaskTypeErrorMsg(model.getTaskType(), NAME), RestStatus.BAD_REQUEST) ); @@ -464,6 +490,8 @@ private static List translateToChunkedResults(Li private static ChunkedInferenceServiceResults translateToChunkedResult(InferenceResults inferenceResult) { if (inferenceResult instanceof MlChunkedTextEmbeddingFloatResults mlChunkedResult) { return InferenceChunkedTextEmbeddingFloatResults.ofMlResults(mlChunkedResult); + } else if (inferenceResult instanceof MlChunkedTextExpansionResults mlChunkedResult) { + return InferenceChunkedSparseEmbeddingResults.ofMlResult(mlChunkedResult); } else if (inferenceResult instanceof ErrorInferenceResults error) { return new ErrorChunkedInferenceResults(error.getException()); } else { @@ -471,103 +499,6 @@ private static ChunkedInferenceServiceResults translateToChunkedResult(Inference } } - @Override - public void start(Model model, ActionListener listener) { - if (model instanceof ElasticsearchInternalModel == false) { - listener.onFailure(notElasticsearchModelException(model)); - return; - } - - if (model.getTaskType() != TaskType.TEXT_EMBEDDING && model.getTaskType() != TaskType.RERANK) { - listener.onFailure( - new IllegalStateException(TaskType.unsupportedTaskTypeErrorMsg(model.getConfigurations().getTaskType(), NAME)) - ); - return; - } - - var startRequest = ((ElasticsearchInternalModel) model).getStartTrainedModelDeploymentActionRequest(); - var responseListener = ((ElasticsearchInternalModel) model).getCreateTrainedModelAssignmentActionListener(model, listener); - - client.execute(StartTrainedModelDeploymentAction.INSTANCE, startRequest, responseListener); - } - - @Override - public void stop(String inferenceEntityId, ActionListener listener) { - var request = new StopTrainedModelDeploymentAction.Request(inferenceEntityId); - request.setForce(true); - client.execute( - StopTrainedModelDeploymentAction.INSTANCE, - request, - listener.delegateFailureAndWrap((delegatedResponseListener, response) -> delegatedResponseListener.onResponse(Boolean.TRUE)) - ); - } - - @Override - public void putModel(Model model, ActionListener listener) { - if (model instanceof ElasticsearchInternalModel == false) { - listener.onFailure(notElasticsearchModelException(model)); - return; - } else if (model instanceof MultilingualE5SmallModel e5Model) { - String modelId = e5Model.getServiceSettings().modelId(); - var input = new TrainedModelInput(List.of("text_field")); // by convention text_field is used - var config = TrainedModelConfig.builder().setInput(input).setModelId(modelId).validate(true).build(); - PutTrainedModelAction.Request putRequest = new PutTrainedModelAction.Request(config, false, true); - executeAsyncWithOrigin( - client, - INFERENCE_ORIGIN, - PutTrainedModelAction.INSTANCE, - putRequest, - ActionListener.wrap(response -> listener.onResponse(Boolean.TRUE), e -> { - if (e instanceof ElasticsearchStatusException esException - && esException.getMessage().contains(PutTrainedModelAction.MODEL_ALREADY_EXISTS_ERROR_MESSAGE_FRAGMENT)) { - listener.onResponse(Boolean.TRUE); - } else { - listener.onFailure(e); - } - }) - ); - } else if (model instanceof CustomElandModel) { - logger.info("Custom eland model detected, model must have been already loaded into the cluster with eland."); - listener.onResponse(Boolean.TRUE); - } else { - listener.onFailure( - new IllegalArgumentException( - "Can not download model automatically for [" - + model.getConfigurations().getInferenceEntityId() - + "] you may need to download it through 
the trained models API or with eland." - ) - ); - return; - } - } - - @Override - public void isModelDownloaded(Model model, ActionListener listener) { - ActionListener getModelsResponseListener = listener.delegateFailure((delegate, response) -> { - if (response.getResources().count() < 1) { - delegate.onResponse(Boolean.FALSE); - } else { - delegate.onResponse(Boolean.TRUE); - } - }); - - if (model.getServiceSettings() instanceof ElasticsearchInternalServiceSettings internalServiceSettings) { - String modelId = internalServiceSettings.modelId(); - GetTrainedModelsAction.Request getRequest = new GetTrainedModelsAction.Request(modelId); - executeAsyncWithOrigin(client, INFERENCE_ORIGIN, GetTrainedModelsAction.INSTANCE, getRequest, getModelsResponseListener); - } else if (model instanceof ElasticsearchInternalModel == false) { - listener.onFailure(notElasticsearchModelException(model)); - } else { - listener.onFailure( - new IllegalArgumentException( - "Unable to determine supported model for [" - + model.getConfigurations().getInferenceEntityId() - + "] please verify the request and submit a bug report if necessary." - ) - ); - } - } - @Override public TransportVersion getMinimalSupportedVersion() { return TransportVersions.V_8_14_0; diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elser/ElserInternalService.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elser/ElserInternalService.java index 775ddca160463..948117954a63f 100644 --- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elser/ElserInternalService.java +++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elser/ElserInternalService.java @@ -28,7 +28,6 @@ import org.elasticsearch.xpack.core.inference.results.ErrorChunkedInferenceResults; import org.elasticsearch.xpack.core.inference.results.InferenceChunkedSparseEmbeddingResults; import org.elasticsearch.xpack.core.inference.results.SparseEmbeddingResults; -import org.elasticsearch.xpack.core.ml.action.GetTrainedModelsAction; import org.elasticsearch.xpack.core.ml.action.InferModelAction; import org.elasticsearch.xpack.core.ml.inference.results.ErrorInferenceResults; import org.elasticsearch.xpack.core.ml.inference.results.MlChunkedTextExpansionResults; @@ -43,8 +42,6 @@ import java.util.Map; import java.util.Set; -import static org.elasticsearch.xpack.core.ClientHelper.INFERENCE_ORIGIN; -import static org.elasticsearch.xpack.core.ClientHelper.executeAsyncWithOrigin; import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeFromMapOrThrowIfNull; import static org.elasticsearch.xpack.inference.services.ServiceUtils.throwIfNotEmptyMap; import static org.elasticsearch.xpack.inference.services.elser.ElserModels.ELSER_V2_MODEL; @@ -242,31 +239,6 @@ private void checkCompatibleTaskType(TaskType taskType) { } } - @Override - public void isModelDownloaded(Model model, ActionListener listener) { - ActionListener getModelsResponseListener = listener.delegateFailure((delegate, response) -> { - if (response.getResources().count() < 1) { - delegate.onResponse(Boolean.FALSE); - } else { - delegate.onResponse(Boolean.TRUE); - } - }); - - if (model instanceof ElserInternalModel elserModel) { - String modelId = elserModel.getServiceSettings().modelId(); - GetTrainedModelsAction.Request getRequest = new GetTrainedModelsAction.Request(modelId); - executeAsyncWithOrigin(client, INFERENCE_ORIGIN, GetTrainedModelsAction.INSTANCE, 
getRequest, getModelsResponseListener); - } else { - listener.onFailure( - new IllegalArgumentException( - "Can not download model automatically for [" - + model.getConfigurations().getInferenceEntityId() - + "] you may need to download it through the trained models API or with eland." - ) - ); - } - } - private static ElserMlNodeTaskSettings taskSettingsFromMap(TaskType taskType, Map config) { if (taskType != TaskType.SPARSE_EMBEDDING) { throw new ElasticsearchStatusException(TaskType.unsupportedTaskTypeErrorMsg(taskType, NAME), RestStatus.BAD_REQUEST); diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalServiceTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalServiceTests.java index e6fd725a50198..257616033f080 100644 --- a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalServiceTests.java +++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/elasticsearch/ElasticsearchInternalServiceTests.java @@ -17,6 +17,7 @@ import org.elasticsearch.index.mapper.vectors.DenseVectorFieldMapper; import org.elasticsearch.inference.ChunkedInferenceServiceResults; import org.elasticsearch.inference.ChunkingOptions; +import org.elasticsearch.inference.EmptyTaskSettings; import org.elasticsearch.inference.InferenceResults; import org.elasticsearch.inference.InferenceServiceExtension; import org.elasticsearch.inference.InputType; @@ -31,6 +32,7 @@ import org.elasticsearch.xpack.core.action.util.QueryPage; import org.elasticsearch.xpack.core.inference.action.InferenceAction; import org.elasticsearch.xpack.core.inference.results.ErrorChunkedInferenceResults; +import org.elasticsearch.xpack.core.inference.results.InferenceChunkedSparseEmbeddingResults; import org.elasticsearch.xpack.core.inference.results.InferenceChunkedTextEmbeddingFloatResults; import org.elasticsearch.xpack.core.ml.action.GetTrainedModelsAction; import org.elasticsearch.xpack.core.ml.action.InferModelAction; @@ -39,8 +41,10 @@ import org.elasticsearch.xpack.core.ml.inference.TrainedModelConfig; import org.elasticsearch.xpack.core.ml.inference.TrainedModelPrefixStrings; import org.elasticsearch.xpack.core.ml.inference.results.ErrorInferenceResults; +import org.elasticsearch.xpack.core.ml.inference.results.InferenceChunkedTextExpansionResultsTests; import org.elasticsearch.xpack.core.ml.inference.results.MlChunkedTextEmbeddingFloatResults; import org.elasticsearch.xpack.core.ml.inference.results.MlChunkedTextEmbeddingFloatResultsTests; +import org.elasticsearch.xpack.core.ml.inference.results.MlChunkedTextExpansionResults; import org.elasticsearch.xpack.core.ml.inference.results.MlTextEmbeddingResults; import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TextEmbeddingConfigUpdate; import org.elasticsearch.xpack.core.ml.inference.trainedmodel.TokenizationConfigUpdate; @@ -52,12 +56,10 @@ import org.mockito.Mockito; import java.util.ArrayList; -import java.util.Arrays; import java.util.EnumSet; import java.util.HashMap; import java.util.List; import java.util.Map; -import java.util.Random; import java.util.Set; import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicInteger; @@ -76,7 +78,6 @@ public class ElasticsearchInternalServiceTests extends ESTestCase { - TaskType taskType = TaskType.TEXT_EMBEDDING; String randomInferenceEntityId = 
randomAlphaOfLength(10); private static ThreadPool threadPool; @@ -92,7 +93,25 @@ public void shutdownThreadPool() { } public void testParseRequestConfig() { + var service = createService(mock(Client.class)); + var settings = new HashMap(); + settings.put( + ModelConfigurations.SERVICE_SETTINGS, + new HashMap<>( + Map.of(ElasticsearchInternalServiceSettings.NUM_ALLOCATIONS, 1, ElasticsearchInternalServiceSettings.NUM_THREADS, 4) + ) + ); + ActionListener modelListener = ActionListener.wrap( + model -> fail("Model parsing should have failed"), + e -> assertThat(e, instanceOf(IllegalArgumentException.class)) + ); + + var taskType = randomFrom(TaskType.TEXT_EMBEDDING, TaskType.RERANK, TaskType.SPARSE_EMBEDDING); + service.parseRequestConfig(randomInferenceEntityId, taskType, settings, Set.of(), modelListener); + } + + public void testParseRequestConfig_Misconfigured() { // Null model variant { var service = createService(mock(Client.class)); @@ -109,43 +128,10 @@ public void testParseRequestConfig() { e -> assertThat(e, instanceOf(IllegalArgumentException.class)) ); + var taskType = randomFrom(TaskType.TEXT_EMBEDDING, TaskType.RERANK, TaskType.SPARSE_EMBEDDING); service.parseRequestConfig(randomInferenceEntityId, taskType, settings, Set.of(), modelListener); } - // Valid model variant - { - var service = createService(mock(Client.class)); - var settings = new HashMap(); - settings.put( - ModelConfigurations.SERVICE_SETTINGS, - new HashMap<>( - Map.of( - ElasticsearchInternalServiceSettings.NUM_ALLOCATIONS, - 1, - ElasticsearchInternalServiceSettings.NUM_THREADS, - 4, - ElasticsearchInternalServiceSettings.MODEL_ID, - ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID - ) - ) - ); - - var e5ServiceSettings = new MultilingualE5SmallInternalServiceSettings( - 1, - 4, - ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID, - null - ); - - service.parseRequestConfig( - randomInferenceEntityId, - taskType, - settings, - Set.of(), - getModelVerificationActionListener(e5ServiceSettings) - ); - } - // Invalid config map { var service = createService(mock(Client.class)); @@ -163,10 +149,12 @@ public void testParseRequestConfig() { e -> assertThat(e, instanceOf(ElasticsearchStatusException.class)) ); + var taskType = randomFrom(TaskType.TEXT_EMBEDDING, TaskType.RERANK, TaskType.SPARSE_EMBEDDING); service.parseRequestConfig(randomInferenceEntityId, taskType, settings, Set.of(), modelListener); } + } - // Invalid service settings + public void testParseRequestConfig_E5() { { var service = createService(mock(Client.class)); var settings = new HashMap(); @@ -179,52 +167,28 @@ public void testParseRequestConfig() { ElasticsearchInternalServiceSettings.NUM_THREADS, 4, ElasticsearchInternalServiceSettings.MODEL_ID, - ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID, // we can't directly test the eland case until we mock - // the threadpool within the client - "not_a_valid_service_setting", - randomAlphaOfLength(10) + ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID ) ) ); - ActionListener modelListener = ActionListener.wrap( - model -> fail("Model parsing should have failed"), - e -> assertThat(e, instanceOf(ElasticsearchStatusException.class)) - ); - - service.parseRequestConfig(randomInferenceEntityId, taskType, settings, Set.of(), modelListener); - } - - // Extra service settings - { - var service = createService(mock(Client.class)); - var settings = new HashMap(); - settings.put( - ModelConfigurations.SERVICE_SETTINGS, - new HashMap<>( - Map.of( - 
ElasticsearchInternalServiceSettings.NUM_ALLOCATIONS, - 1, - ElasticsearchInternalServiceSettings.NUM_THREADS, - 4, - ElasticsearchInternalServiceSettings.MODEL_ID, - ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID, // we can't directly test the eland case until we mock - // the threadpool within the client - "extra_setting_that_should_not_be_here", - randomAlphaOfLength(10) - ) - ) + var e5ServiceSettings = new MultilingualE5SmallInternalServiceSettings( + 1, + 4, + ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID, + null ); - ActionListener modelListener = ActionListener.wrap( - model -> fail("Model parsing should have failed"), - e -> assertThat(e, instanceOf(ElasticsearchStatusException.class)) + service.parseRequestConfig( + randomInferenceEntityId, + TaskType.TEXT_EMBEDDING, + settings, + Set.of(), + getModelVerificationActionListener(e5ServiceSettings) ); - - service.parseRequestConfig(randomInferenceEntityId, taskType, settings, Set.of(), modelListener); } - // Extra settings + // Invalid service settings { var service = createService(mock(Client.class)); var settings = new HashMap(); @@ -237,19 +201,19 @@ public void testParseRequestConfig() { ElasticsearchInternalServiceSettings.NUM_THREADS, 4, ElasticsearchInternalServiceSettings.MODEL_ID, - ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID // we can't directly test the eland case until we mock - // the threadpool within the client + ElasticsearchInternalService.MULTILINGUAL_E5_SMALL_MODEL_ID, + "not_a_valid_service_setting", + randomAlphaOfLength(10) ) ) ); - settings.put("extra_setting_that_should_not_be_here", randomAlphaOfLength(10)); ActionListener modelListener = ActionListener.wrap( model -> fail("Model parsing should have failed"), e -> assertThat(e, instanceOf(ElasticsearchStatusException.class)) ); - service.parseRequestConfig(randomInferenceEntityId, taskType, settings, Set.of(), modelListener); + service.parseRequestConfig(randomInferenceEntityId, TaskType.TEXT_EMBEDDING, settings, Set.of(), modelListener); } } @@ -342,10 +306,53 @@ public void testParseRequestConfig_Rerank_DefaultTaskSettings() { } } + @SuppressWarnings("unchecked") + public void testParseRequestConfig_SparseEmbedding() { + var client = mock(Client.class); + doAnswer(invocation -> { + var listener = (ActionListener) invocation.getArguments()[2]; + listener.onResponse( + new GetTrainedModelsAction.Response(new QueryPage<>(List.of(mock(TrainedModelConfig.class)), 1, mock(ParseField.class))) + ); + return null; + }).when(client).execute(Mockito.same(GetTrainedModelsAction.INSTANCE), any(), any()); + + when(client.threadPool()).thenReturn(threadPool); + + var service = createService(client); + var settings = new HashMap(); + settings.put( + ModelConfigurations.SERVICE_SETTINGS, + new HashMap<>( + Map.of( + ElasticsearchInternalServiceSettings.NUM_ALLOCATIONS, + 1, + ElasticsearchInternalServiceSettings.NUM_THREADS, + 4, + ElasticsearchInternalServiceSettings.MODEL_ID, + "foo" + ) + ) + ); + + ActionListener modelListener = ActionListener.wrap(model -> { + assertThat(model, instanceOf(CustomElandModel.class)); + assertThat(model.getTaskSettings(), instanceOf(EmptyTaskSettings.class)); + assertThat(model.getServiceSettings(), instanceOf(CustomElandInternalServiceSettings.class)); + }, e -> { fail("Model parsing failed " + e.getMessage()); }); + + service.parseRequestConfig(randomInferenceEntityId, TaskType.SPARSE_EMBEDDING, settings, Set.of(), modelListener); + } + private ActionListener 
getModelVerificationActionListener(MultilingualE5SmallInternalServiceSettings e5ServiceSettings) { return ActionListener.wrap(model -> { assertEquals( - new MultilingualE5SmallModel(randomInferenceEntityId, taskType, ElasticsearchInternalService.NAME, e5ServiceSettings), + new MultilingualE5SmallModel( + randomInferenceEntityId, + TaskType.TEXT_EMBEDDING, + ElasticsearchInternalService.NAME, + e5ServiceSettings + ), model ); }, e -> { fail("Model parsing failed " + e.getMessage()); }); @@ -371,7 +378,10 @@ public void testParsePersistedConfig() { ) ); - expectThrows(IllegalArgumentException.class, () -> service.parsePersistedConfig(randomInferenceEntityId, taskType, settings)); + expectThrows( + IllegalArgumentException.class, + () -> service.parsePersistedConfig(randomInferenceEntityId, TaskType.TEXT_EMBEDDING, settings) + ); } @@ -397,12 +407,17 @@ public void testParsePersistedConfig() { CustomElandEmbeddingModel parsedModel = (CustomElandEmbeddingModel) service.parsePersistedConfig( randomInferenceEntityId, - taskType, + TaskType.TEXT_EMBEDDING, settings ); var elandServiceSettings = new CustomElandInternalTextEmbeddingServiceSettings(1, 4, "invalid", null); assertEquals( - new CustomElandEmbeddingModel(randomInferenceEntityId, taskType, ElasticsearchInternalService.NAME, elandServiceSettings), + new CustomElandEmbeddingModel( + randomInferenceEntityId, + TaskType.TEXT_EMBEDDING, + ElasticsearchInternalService.NAME, + elandServiceSettings + ), parsedModel ); } @@ -436,11 +451,16 @@ public void testParsePersistedConfig() { MultilingualE5SmallModel parsedModel = (MultilingualE5SmallModel) service.parsePersistedConfig( randomInferenceEntityId, - taskType, + TaskType.TEXT_EMBEDDING, settings ); assertEquals( - new MultilingualE5SmallModel(randomInferenceEntityId, taskType, ElasticsearchInternalService.NAME, e5ServiceSettings), + new MultilingualE5SmallModel( + randomInferenceEntityId, + TaskType.TEXT_EMBEDDING, + ElasticsearchInternalService.NAME, + e5ServiceSettings + ), parsedModel ); } @@ -456,6 +476,8 @@ public void testParsePersistedConfig() { ) ); settings.put("not_a_valid_config_setting", randomAlphaOfLength(10)); + + var taskType = randomFrom(TaskType.TEXT_EMBEDDING, TaskType.RERANK, TaskType.SPARSE_EMBEDDING); expectThrows(IllegalArgumentException.class, () -> service.parsePersistedConfig(randomInferenceEntityId, taskType, settings)); } @@ -476,12 +498,13 @@ public void testParsePersistedConfig() { ) ) ); + var taskType = randomFrom(TaskType.TEXT_EMBEDDING, TaskType.RERANK, TaskType.SPARSE_EMBEDDING); expectThrows(IllegalArgumentException.class, () -> service.parsePersistedConfig(randomInferenceEntityId, taskType, settings)); } } @SuppressWarnings("unchecked") - public void testChunkInfer() { + public void testChunkInfer_e5() { var mlTrainedModelResults = new ArrayList(); mlTrainedModelResults.add(MlChunkedTextEmbeddingFloatResultsTests.createRandomResults()); mlTrainedModelResults.add(MlChunkedTextEmbeddingFloatResultsTests.createRandomResults()); @@ -568,6 +591,63 @@ public void testChunkInfer() { assertTrue("Listener not called", gotResults.get()); } + @SuppressWarnings("unchecked") + public void testChunkInfer_Sparse() { + var mlTrainedModelResults = new ArrayList(); + mlTrainedModelResults.add(InferenceChunkedTextExpansionResultsTests.createRandomResults()); + mlTrainedModelResults.add(InferenceChunkedTextExpansionResultsTests.createRandomResults()); + mlTrainedModelResults.add(new ErrorInferenceResults(new RuntimeException("boom"))); + var response = new 
InferModelAction.Response(mlTrainedModelResults, "foo", true); + + ThreadPool threadpool = new TestThreadPool("test"); + Client client = mock(Client.class); + when(client.threadPool()).thenReturn(threadpool); + doAnswer(invocationOnMock -> { + var listener = (ActionListener) invocationOnMock.getArguments()[2]; + listener.onResponse(response); + return null; + }).when(client).execute(same(InferModelAction.INSTANCE), any(InferModelAction.Request.class), any(ActionListener.class)); + + var model = new CustomElandModel( + "foo", + TaskType.SPARSE_EMBEDDING, + "elasticsearch", + new ElasticsearchInternalServiceSettings(1, 1, "model-id", null) + ); + var service = createService(client); + + var gotResults = new AtomicBoolean(); + var resultsListener = ActionListener.>wrap(chunkedResponse -> { + assertThat(chunkedResponse, hasSize(3)); + assertThat(chunkedResponse.get(0), instanceOf(InferenceChunkedSparseEmbeddingResults.class)); + var result1 = (InferenceChunkedSparseEmbeddingResults) chunkedResponse.get(0); + assertEquals(((MlChunkedTextExpansionResults) mlTrainedModelResults.get(0)).getChunks(), result1.getChunkedResults()); + assertThat(chunkedResponse.get(1), instanceOf(InferenceChunkedSparseEmbeddingResults.class)); + var result2 = (InferenceChunkedSparseEmbeddingResults) chunkedResponse.get(1); + assertEquals(((MlChunkedTextExpansionResults) mlTrainedModelResults.get(1)).getChunks(), result2.getChunkedResults()); + var result3 = (ErrorChunkedInferenceResults) chunkedResponse.get(2); + assertThat(result3.getException(), instanceOf(RuntimeException.class)); + assertThat(result3.getException().getMessage(), containsString("boom")); + gotResults.set(true); + }, ESTestCase::fail); + + service.chunkedInfer( + model, + null, + List.of("foo", "bar"), + Map.of(), + InputType.SEARCH, + new ChunkingOptions(null, null), + InferenceAction.Request.DEFAULT_TIMEOUT, + ActionListener.runAfter(resultsListener, () -> terminate(threadpool)) + ); + + if (gotResults.get() == false) { + terminate(threadpool); + } + assertTrue("Listener not called", gotResults.get()); + } + @SuppressWarnings("unchecked") public void testChunkInferSetsTokenization() { var expectedSpan = new AtomicInteger(); @@ -711,7 +791,7 @@ public void testParseRequestConfigEland_PreservesTaskType() { ) ); - var taskType = randomFrom(EnumSet.of(TaskType.RERANK, TaskType.TEXT_EMBEDDING)); + var taskType = randomFrom(EnumSet.of(TaskType.RERANK, TaskType.TEXT_EMBEDDING, TaskType.SPARSE_EMBEDDING)); CustomElandModel expectedModel = getCustomElandModel(taskType); PlainActionFuture listener = new PlainActionFuture<>(); @@ -739,6 +819,13 @@ private CustomElandModel getCustomElandModel(TaskType taskType) { ElasticsearchInternalService.NAME, serviceSettings ); + } else if (taskType == TaskType.SPARSE_EMBEDDING) { + expectedModel = new CustomElandModel( + randomInferenceEntityId, + taskType, + ElasticsearchInternalService.NAME, + new CustomElandInternalServiceSettings(1, 4, "custom-model", null) + ); } return expectedModel; } @@ -867,21 +954,4 @@ private ElasticsearchInternalService createService(Client client) { var context = new InferenceServiceExtension.InferenceServiceFactoryContext(client); return new ElasticsearchInternalService(context); } - - public static Model randomModelConfig(String inferenceEntityId) { - List givenList = Arrays.asList("MultilingualE5SmallModel"); - Random rand = org.elasticsearch.common.Randomness.get(); - String model = givenList.get(rand.nextInt(givenList.size())); - - return switch (model) { - case 
"MultilingualE5SmallModel" -> new MultilingualE5SmallModel( - inferenceEntityId, - TaskType.TEXT_EMBEDDING, - ElasticsearchInternalService.NAME, - MultilingualE5SmallInternalServiceSettingsTests.createRandom() - ); - default -> throw new IllegalArgumentException("model " + model + " is not supported for testing"); - }; - } - } From 70261214641bfacada301bc5dd9392e0bc2a4594 Mon Sep 17 00:00:00 2001 From: Nik Everett Date: Thu, 29 Aug 2024 12:51:24 -0400 Subject: [PATCH 055/144] ESQL: Move Exchange stuff to NamedWriteable (#112236) This moves all of our `Exchange` style `PhysicalPlan`s to `NamedWriteable` to line up with the rest of Elasticsearch. --- .../xpack/esql/io/stream/PlanNamedTypes.java | 52 +----------- .../esql/plan/physical/ExchangeExec.java | 50 ++++++++++- .../esql/plan/physical/ExchangeSinkExec.java | 33 +++++++ .../plan/physical/ExchangeSourceExec.java | 26 ++++++ .../esql/plan/physical/PhysicalPlan.java | 11 ++- .../xpack/esql/planner/PlannerUtils.java | 4 +- .../LocalPhysicalPlanOptimizerTests.java | 2 +- .../optimizer/PhysicalPlanOptimizerTests.java | 2 +- .../plan/AbstractNodeSerializationTests.java | 7 ++ ...AbstractLogicalPlanSerializationTests.java | 5 -- ...bstractPhysicalPlanSerializationTests.java | 15 +++- .../ExchangeExecSerializationTests.java | 47 ++++++++++ .../ExchangeSinkExecSerializationTests.java | 85 +++++++------------ .../ExchangeSourceExecSerializationTests.java | 40 +++++++++ 14 files changed, 260 insertions(+), 119 deletions(-) create mode 100644 x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExecSerializationTests.java create mode 100644 x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExecSerializationTests.java diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java index af82ceb4bf809..56eab73cd042b 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/io/stream/PlanNamedTypes.java @@ -92,14 +92,9 @@ public static List namedTypeEntries() { of(PhysicalPlan.class, EsSourceExec.ENTRY), of(PhysicalPlan.class, EvalExec.ENTRY), of(PhysicalPlan.class, EnrichExec.class, PlanNamedTypes::writeEnrichExec, PlanNamedTypes::readEnrichExec), - of(PhysicalPlan.class, ExchangeExec.class, PlanNamedTypes::writeExchangeExec, PlanNamedTypes::readExchangeExec), - of(PhysicalPlan.class, ExchangeSinkExec.class, PlanNamedTypes::writeExchangeSinkExec, PlanNamedTypes::readExchangeSinkExec), - of( - PhysicalPlan.class, - ExchangeSourceExec.class, - PlanNamedTypes::writeExchangeSourceExec, - PlanNamedTypes::readExchangeSourceExec - ), + of(PhysicalPlan.class, ExchangeExec.ENTRY), + of(PhysicalPlan.class, ExchangeSinkExec.ENTRY), + of(PhysicalPlan.class, ExchangeSourceExec.ENTRY), of(PhysicalPlan.class, FieldExtractExec.class, PlanNamedTypes::writeFieldExtractExec, PlanNamedTypes::readFieldExtractExec), of(PhysicalPlan.class, FilterExec.class, PlanNamedTypes::writeFilterExec, PlanNamedTypes::readFilterExec), of(PhysicalPlan.class, FragmentExec.class, PlanNamedTypes::writeFragmentExec, PlanNamedTypes::readFragmentExec), @@ -174,47 +169,6 @@ static void writeEnrichExec(PlanStreamOutput out, EnrichExec enrich) throws IOEx out.writeNamedWriteableCollection(enrich.enrichFields()); } - static ExchangeExec readExchangeExec(PlanStreamInput in) throws 
IOException { - return new ExchangeExec( - Source.readFrom(in), - in.readNamedWriteableCollectionAsList(Attribute.class), - in.readBoolean(), - in.readPhysicalPlanNode() - ); - } - - static void writeExchangeExec(PlanStreamOutput out, ExchangeExec exchangeExec) throws IOException { - Source.EMPTY.writeTo(out); - out.writeNamedWriteableCollection(exchangeExec.output()); - out.writeBoolean(exchangeExec.isInBetweenAggs()); - out.writePhysicalPlanNode(exchangeExec.child()); - } - - static ExchangeSinkExec readExchangeSinkExec(PlanStreamInput in) throws IOException { - return new ExchangeSinkExec( - Source.readFrom(in), - in.readNamedWriteableCollectionAsList(Attribute.class), - in.readBoolean(), - in.readPhysicalPlanNode() - ); - } - - static void writeExchangeSinkExec(PlanStreamOutput out, ExchangeSinkExec exchangeSinkExec) throws IOException { - Source.EMPTY.writeTo(out); - out.writeNamedWriteableCollection(exchangeSinkExec.output()); - out.writeBoolean(exchangeSinkExec.isIntermediateAgg()); - out.writePhysicalPlanNode(exchangeSinkExec.child()); - } - - static ExchangeSourceExec readExchangeSourceExec(PlanStreamInput in) throws IOException { - return new ExchangeSourceExec(Source.readFrom(in), in.readNamedWriteableCollectionAsList(Attribute.class), in.readBoolean()); - } - - static void writeExchangeSourceExec(PlanStreamOutput out, ExchangeSourceExec exchangeSourceExec) throws IOException { - out.writeNamedWriteableCollection(exchangeSourceExec.output()); - out.writeBoolean(exchangeSourceExec.isIntermediateAgg()); - } - static FieldExtractExec readFieldExtractExec(PlanStreamInput in) throws IOException { return new FieldExtractExec(Source.readFrom(in), in.readPhysicalPlanNode(), in.readNamedWriteableCollectionAsList(Attribute.class)); } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExec.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExec.java index 61c65c484059e..f20b218f28efb 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExec.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExec.java @@ -7,15 +7,27 @@ package org.elasticsearch.xpack.esql.plan.physical; +import org.elasticsearch.common.io.stream.NamedWriteableRegistry; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.xpack.esql.core.expression.Attribute; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamOutput; +import java.io.IOException; import java.util.List; +import java.util.Objects; import static java.util.Collections.emptyList; public class ExchangeExec extends UnaryExec { + public static final NamedWriteableRegistry.Entry ENTRY = new NamedWriteableRegistry.Entry( + PhysicalPlan.class, + "ExchangeExec", + ExchangeExec::new + ); private final List output; private final boolean inBetweenAggs; @@ -30,12 +42,34 @@ public ExchangeExec(Source source, List output, boolean inBetweenAggs this.inBetweenAggs = inBetweenAggs; } + private ExchangeExec(StreamInput in) throws IOException { + this( + Source.readFrom((PlanStreamInput) in), + in.readNamedWriteableCollectionAsList(Attribute.class), + in.readBoolean(), + ((PlanStreamInput) in).readPhysicalPlanNode() + ); + } + + @Override + public 
void writeTo(StreamOutput out) throws IOException { + Source.EMPTY.writeTo(out); + out.writeNamedWriteableCollection(output); + out.writeBoolean(inBetweenAggs()); + ((PlanStreamOutput) out).writePhysicalPlanNode(child()); + } + + @Override + public String getWriteableName() { + return ENTRY.name; + } + @Override public List output() { return output.isEmpty() ? super.output() : output; } - public boolean isInBetweenAggs() { + public boolean inBetweenAggs() { return inBetweenAggs; } @@ -48,4 +82,18 @@ public UnaryExec replaceChild(PhysicalPlan newChild) { protected NodeInfo info() { return NodeInfo.create(this, ExchangeExec::new, output, inBetweenAggs, child()); } + + @Override + public boolean equals(Object obj) { + if (super.equals(obj) == false) { + return false; + } + ExchangeExec other = (ExchangeExec) obj; + return output.equals(other.output) && inBetweenAggs == other.inBetweenAggs; + } + + @Override + public int hashCode() { + return Objects.hash(super.hashCode(), output, inBetweenAggs); + } } diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExec.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExec.java index 2f7c4a93eec71..2992619da75ef 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExec.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExec.java @@ -7,14 +7,25 @@ package org.elasticsearch.xpack.esql.plan.physical; +import org.elasticsearch.common.io.stream.NamedWriteableRegistry; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.xpack.esql.core.expression.Attribute; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamOutput; +import java.io.IOException; import java.util.List; import java.util.Objects; public class ExchangeSinkExec extends UnaryExec { + public static final NamedWriteableRegistry.Entry ENTRY = new NamedWriteableRegistry.Entry( + PhysicalPlan.class, + "ExchangeSinkExec", + ExchangeSinkExec::new + ); private final List output; private final boolean intermediateAgg; @@ -25,6 +36,28 @@ public ExchangeSinkExec(Source source, List output, boolean intermedi this.intermediateAgg = intermediateAgg; } + private ExchangeSinkExec(StreamInput in) throws IOException { + this( + Source.readFrom((PlanStreamInput) in), + in.readNamedWriteableCollectionAsList(Attribute.class), + in.readBoolean(), + ((PlanStreamInput) in).readPhysicalPlanNode() + ); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + Source.EMPTY.writeTo(out); + out.writeNamedWriteableCollection(output()); + out.writeBoolean(isIntermediateAgg()); + ((PlanStreamOutput) out).writePhysicalPlanNode(child()); + } + + @Override + public String getWriteableName() { + return ENTRY.name; + } + @Override public List output() { return output; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExec.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExec.java index 44c9b38feee48..e679a9b131d1d 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExec.java +++ 
b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExec.java @@ -7,14 +7,24 @@ package org.elasticsearch.xpack.esql.plan.physical; +import org.elasticsearch.common.io.stream.NamedWriteableRegistry; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.xpack.esql.core.expression.Attribute; import org.elasticsearch.xpack.esql.core.tree.NodeInfo; import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; +import java.io.IOException; import java.util.List; import java.util.Objects; public class ExchangeSourceExec extends LeafExec { + public static final NamedWriteableRegistry.Entry ENTRY = new NamedWriteableRegistry.Entry( + PhysicalPlan.class, + "ExchangeSourceExec", + ExchangeSourceExec::new + ); private final List output; private final boolean intermediateAgg; @@ -25,6 +35,22 @@ public ExchangeSourceExec(Source source, List output, boolean interme this.intermediateAgg = intermediateAgg; } + private ExchangeSourceExec(StreamInput in) throws IOException { + this(Source.readFrom((PlanStreamInput) in), in.readNamedWriteableCollectionAsList(Attribute.class), in.readBoolean()); + } + + @Override + public void writeTo(StreamOutput out) throws IOException { + source().writeTo(out); + out.writeNamedWriteableCollection(output()); + out.writeBoolean(isIntermediateAgg()); + } + + @Override + public String getWriteableName() { + return ENTRY.name; + } + @Override public List output() { return output; diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java index 60e44a5140dfa..6fcdf573564ff 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/PhysicalPlan.java @@ -23,7 +23,16 @@ */ public abstract class PhysicalPlan extends QueryPlan { public static List getNamedWriteables() { - return List.of(AggregateExec.ENTRY, DissectExec.ENTRY, EsQueryExec.ENTRY, EsSourceExec.ENTRY, EvalExec.ENTRY); + return List.of( + AggregateExec.ENTRY, + DissectExec.ENTRY, + EsQueryExec.ENTRY, + EsSourceExec.ENTRY, + EvalExec.ENTRY, + ExchangeExec.ENTRY, + ExchangeSinkExec.ENTRY, + ExchangeSourceExec.ENTRY + ); } public PhysicalPlan(Source source, List children) { diff --git a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/PlannerUtils.java b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/PlannerUtils.java index 7187de4676fe7..29be49e60ad37 100644 --- a/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/PlannerUtils.java +++ b/x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/planner/PlannerUtils.java @@ -73,9 +73,9 @@ public static Tuple breakPlanBetweenCoordinatorAndDa PhysicalPlan coordinatorPlan = plan.transformUp(ExchangeExec.class, e -> { // remember the datanode subplan and wire it to a sink var subplan = e.child(); - dataNodePlan.set(new ExchangeSinkExec(e.source(), e.output(), e.isInBetweenAggs(), subplan)); + dataNodePlan.set(new ExchangeSinkExec(e.source(), e.output(), e.inBetweenAggs(), subplan)); - return new ExchangeSourceExec(e.source(), e.output(), e.isInBetweenAggs()); + return new ExchangeSourceExec(e.source(), e.output(), e.inBetweenAggs()); }); return new 
Tuple<>(coordinatorPlan, dataNodePlan.get()); } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/LocalPhysicalPlanOptimizerTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/LocalPhysicalPlanOptimizerTests.java index 5fba11c13561c..ee66e3043b62f 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/LocalPhysicalPlanOptimizerTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/LocalPhysicalPlanOptimizerTests.java @@ -504,7 +504,7 @@ public boolean exists(String field) { assertThat(agg.getMode(), is(FINAL)); assertThat(Expressions.names(agg.aggregates()), contains("c")); var exchange = as(agg.child(), ExchangeExec.class); - assertThat(exchange.isInBetweenAggs(), is(true)); + assertThat(exchange.inBetweenAggs(), is(true)); var localSource = as(exchange.child(), LocalSourceExec.class); assertThat(Expressions.names(localSource.output()), contains("count", "seen")); } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/PhysicalPlanOptimizerTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/PhysicalPlanOptimizerTests.java index 7dfa36011bf1f..5b8a465b05f1c 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/PhysicalPlanOptimizerTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/optimizer/PhysicalPlanOptimizerTests.java @@ -4603,7 +4603,7 @@ static PhysicalPlan localRelationshipAlignment(PhysicalPlan l) { // handle local reduction alignment return l.transformUp(ExchangeExec.class, exg -> { PhysicalPlan pl = exg; - if (exg.isInBetweenAggs() && exg.child() instanceof LocalSourceExec lse) { + if (exg.inBetweenAggs() && exg.child() instanceof LocalSourceExec lse) { var output = exg.output(); if (lse.output().equals(output) == false) { pl = exg.replaceChild(new LocalSourceExec(lse.source(), output, lse.supplier())); diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/AbstractNodeSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/AbstractNodeSerializationTests.java index 40dc05dd64cc0..e6f5d6e4fac70 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/AbstractNodeSerializationTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/AbstractNodeSerializationTests.java @@ -9,8 +9,10 @@ import org.elasticsearch.TransportVersion; import org.elasticsearch.test.AbstractWireTestCase; +import org.elasticsearch.xpack.esql.core.expression.Attribute; import org.elasticsearch.xpack.esql.core.tree.Node; import org.elasticsearch.xpack.esql.core.tree.Source; +import org.elasticsearch.xpack.esql.expression.function.FieldAttributeTests; import org.elasticsearch.xpack.esql.io.stream.PlanNameRegistry; import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput; import org.elasticsearch.xpack.esql.io.stream.PlanStreamOutput; @@ -18,6 +20,7 @@ import org.junit.Before; import java.io.IOException; +import java.util.List; import java.util.Map; import static org.elasticsearch.xpack.esql.ConfigurationTestUtils.randomConfiguration; @@ -44,6 +47,10 @@ public static Source randomSource() { return new Source(lineNumber + 1, offset, text); } + public static List randomFieldAttributes(int min, int max, boolean onlyRepresentable) { + return randomList(min, max, () -> FieldAttributeTests.createFieldAttribute(0, onlyRepresentable)); + } + @Override 
protected final T copyInstance(T instance, TransportVersion version) throws IOException { return copyInstance( diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/logical/AbstractLogicalPlanSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/logical/AbstractLogicalPlanSerializationTests.java index 1b9df46a1c842..6936c96a143d4 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/logical/AbstractLogicalPlanSerializationTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/logical/AbstractLogicalPlanSerializationTests.java @@ -13,7 +13,6 @@ import org.elasticsearch.xpack.esql.core.expression.Expression; import org.elasticsearch.xpack.esql.core.expression.NamedExpression; import org.elasticsearch.xpack.esql.core.tree.Node; -import org.elasticsearch.xpack.esql.expression.function.FieldAttributeTests; import org.elasticsearch.xpack.esql.expression.function.aggregate.AggregateFunction; import org.elasticsearch.xpack.esql.plan.AbstractNodeSerializationTests; import org.elasticsearch.xpack.esql.plan.logical.local.LocalRelationSerializationTests; @@ -30,10 +29,6 @@ public static LogicalPlan randomChild(int depth) { return randomBoolean() ? EsRelationSerializationTests.randomEsRelation() : LocalRelationSerializationTests.randomLocalRelation(); } - public static List randomFieldAttributes(int min, int max, boolean onlyRepresentable) { - return randomList(min, max, () -> FieldAttributeTests.createFieldAttribute(0, onlyRepresentable)); - } - @Override protected final NamedWriteableRegistry getNamedWriteableRegistry() { List entries = new ArrayList<>(); diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java index 2a05c472328e5..4b74114a0e01c 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/AbstractPhysicalPlanSerializationTests.java @@ -18,6 +18,7 @@ import org.elasticsearch.xpack.esql.expression.function.aggregate.AggregateFunction; import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Add; import org.elasticsearch.xpack.esql.plan.AbstractNodeSerializationTests; +import org.elasticsearch.xpack.esql.plan.logical.LogicalPlan; import java.util.ArrayList; import java.util.List; @@ -25,14 +26,21 @@ import static org.elasticsearch.xpack.esql.plan.physical.AggregateExecSerializationTests.randomAggregateExec; import static org.elasticsearch.xpack.esql.plan.physical.DissectExecSerializationTests.randomDissectExec; import static org.elasticsearch.xpack.esql.plan.physical.EsSourceExecSerializationTests.randomEsSourceExec; +import static org.elasticsearch.xpack.esql.plan.physical.ExchangeExecSerializationTests.randomExchangeExec; +import static org.elasticsearch.xpack.esql.plan.physical.ExchangeSinkExecSerializationTests.randomExchangeSinkExec; +import static org.elasticsearch.xpack.esql.plan.physical.ExchangeSourceExecSerializationTests.randomExchangeSourceExec; public abstract class AbstractPhysicalPlanSerializationTests extends AbstractNodeSerializationTests { public static PhysicalPlan randomChild(int depth) { if (randomBoolean() && depth < 4) { - // TODO more random options - return randomBoolean() ? 
randomDissectExec(depth + 1) : randomAggregateExec(depth + 1);
+            return switch (between(0, 3)) {
+                case 0 -> randomDissectExec(depth + 1);
+                case 1 -> randomExchangeExec(depth + 1);
+                case 2 -> randomExchangeSinkExec(depth + 1);
+                default -> randomAggregateExec(depth + 1);
+            };
         }
-        return randomEsSourceExec();
+        return randomBoolean() ? randomExchangeSourceExec() : randomEsSourceExec();
     }
 
     public static Integer randomEstimatedRowSize() {
@@ -43,6 +51,7 @@ public static Integer randomEstimatedRowSize() {
     protected final NamedWriteableRegistry getNamedWriteableRegistry() {
         List<NamedWriteableRegistry.Entry> entries = new ArrayList<>();
         entries.addAll(PhysicalPlan.getNamedWriteables());
+        entries.addAll(LogicalPlan.getNamedWriteables());
         entries.addAll(AggregateFunction.getNamedWriteables());
         entries.addAll(Expression.getNamedWriteables());
         entries.addAll(Attribute.getNamedWriteables());
diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExecSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExecSerializationTests.java
new file mode 100644
index 0000000000000..572eac0ff409c
--- /dev/null
+++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeExecSerializationTests.java
@@ -0,0 +1,47 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.esql.plan.physical;
+
+import org.elasticsearch.xpack.esql.core.expression.Attribute;
+import org.elasticsearch.xpack.esql.core.tree.Source;
+
+import java.io.IOException;
+import java.util.List;
+
+public class ExchangeExecSerializationTests extends AbstractPhysicalPlanSerializationTests<ExchangeExec> {
+    static ExchangeExec randomExchangeExec(int depth) {
+        Source source = randomSource();
+        List<Attribute> output = randomFieldAttributes(1, 5, false);
+        boolean inBetweenAggs = randomBoolean();
+        PhysicalPlan child = randomChild(depth);
+        return new ExchangeExec(source, output, inBetweenAggs, child);
+    }
+
+    @Override
+    protected ExchangeExec createTestInstance() {
+        return randomExchangeExec(0);
+    }
+
+    @Override
+    protected ExchangeExec mutateInstance(ExchangeExec instance) throws IOException {
+        List<Attribute> output = instance.output();
+        boolean inBetweenAggs = instance.inBetweenAggs();
+        PhysicalPlan child = instance.child();
+        switch (between(0, 2)) {
+            case 0 -> output = randomValueOtherThan(output, () -> randomFieldAttributes(1, 5, false));
+            case 1 -> inBetweenAggs = false == inBetweenAggs;
+            case 2 -> child = randomValueOtherThan(child, () -> randomChild(0));
+        }
+        return new ExchangeExec(instance.source(), output, inBetweenAggs, child);
+    }
+
+    @Override
+    protected boolean alwaysEmptySource() {
+        return true;
+    }
+}
diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExecSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExecSerializationTests.java
index ae58c49eade17..be30ac20df64e 100644
--- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExecSerializationTests.java
+++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSinkExecSerializationTests.java
@@ -8,21 +8,13 @@
 package org.elasticsearch.xpack.esql.plan.physical;
 
 import 
org.elasticsearch.common.io.stream.BytesStreamOutput; -import org.elasticsearch.common.io.stream.NamedWriteableRegistry; -import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.unit.ByteSizeValue; -import org.elasticsearch.compute.data.Block; import org.elasticsearch.index.IndexMode; -import org.elasticsearch.search.SearchModule; -import org.elasticsearch.test.ESTestCase; import org.elasticsearch.xpack.esql.analysis.Analyzer; import org.elasticsearch.xpack.esql.core.expression.Attribute; -import org.elasticsearch.xpack.esql.core.expression.Expression; import org.elasticsearch.xpack.esql.core.expression.Literal; -import org.elasticsearch.xpack.esql.core.expression.NamedExpression; import org.elasticsearch.xpack.esql.core.tree.Source; import org.elasticsearch.xpack.esql.core.type.DataType; -import org.elasticsearch.xpack.esql.expression.function.aggregate.AggregateFunction; import org.elasticsearch.xpack.esql.index.EsIndex; import org.elasticsearch.xpack.esql.index.EsIndexSerializationTests; import org.elasticsearch.xpack.esql.io.stream.PlanNameRegistry; @@ -30,31 +22,44 @@ import org.elasticsearch.xpack.esql.io.stream.PlanStreamOutput; import org.elasticsearch.xpack.esql.plan.logical.EsRelation; import org.elasticsearch.xpack.esql.plan.logical.Limit; -import org.elasticsearch.xpack.esql.plan.logical.LogicalPlan; import org.elasticsearch.xpack.esql.plan.logical.Project; -import org.elasticsearch.xpack.esql.session.Configuration; -import org.junit.Before; import java.io.IOException; -import java.util.ArrayList; import java.util.List; -import java.util.Map; import static org.elasticsearch.test.ByteSizeEqualsMatcher.byteSizeEquals; -import static org.elasticsearch.xpack.esql.ConfigurationTestUtils.randomConfiguration; import static org.hamcrest.Matchers.equalTo; -public class ExchangeSinkExecSerializationTests extends ESTestCase { - // TODO port this to AbstractPhysicalPlanSerializationTests when implementing NamedWriteable - private Configuration config; +public class ExchangeSinkExecSerializationTests extends AbstractPhysicalPlanSerializationTests { + static ExchangeSinkExec randomExchangeSinkExec(int depth) { + Source source = randomSource(); + List output = randomFieldAttributes(1, 5, false); + boolean intermediateAgg = randomBoolean(); + PhysicalPlan child = randomChild(depth); + return new ExchangeSinkExec(source, output, intermediateAgg, child); + } + + @Override + protected ExchangeSinkExec createTestInstance() { + return randomExchangeSinkExec(0); + } - public static Source randomSource() { - int lineNumber = between(0, EXAMPLE_QUERY.length - 1); - String line = EXAMPLE_QUERY[lineNumber]; - int offset = between(0, line.length() - 2); - int length = between(1, line.length() - offset - 1); - String text = line.substring(offset, offset + length); - return new Source(lineNumber + 1, offset, text); + @Override + protected ExchangeSinkExec mutateInstance(ExchangeSinkExec instance) throws IOException { + List output = instance.output(); + boolean intermediateAgg = instance.isIntermediateAgg(); + PhysicalPlan child = instance.child(); + switch (between(0, 2)) { + case 0 -> output = randomValueOtherThan(output, () -> randomFieldAttributes(1, 5, false)); + case 1 -> intermediateAgg = false == intermediateAgg; + case 2 -> child = randomValueOtherThan(child, () -> randomChild(0)); + } + return new ExchangeSinkExec(instance.source(), output, intermediateAgg, child); + } + + @Override + protected boolean alwaysEmptySource() { + return true; } /** @@ -128,36 +133,4 @@ 
private void testManyTypeConflicts(boolean withParent, ByteSizeValue expected) t } } } - - private NamedWriteableRegistry getNamedWriteableRegistry() { - List entries = new ArrayList<>(); - entries.addAll(PhysicalPlan.getNamedWriteables()); - entries.addAll(LogicalPlan.getNamedWriteables()); - entries.addAll(AggregateFunction.getNamedWriteables()); - entries.addAll(Expression.getNamedWriteables()); - entries.addAll(Attribute.getNamedWriteables()); - entries.addAll(Block.getNamedWriteables()); - entries.addAll(NamedExpression.getNamedWriteables()); - entries.addAll(new SearchModule(Settings.EMPTY, List.of()).getNamedWriteables()); - return new NamedWriteableRegistry(entries); - } - - private Configuration configuration() { - return config; - } - - private static final String[] EXAMPLE_QUERY = new String[] { - "I am the very model of a modern Major-Gineral,", - "I've information vegetable, animal, and mineral,", - "I know the kings of England, and I quote the fights historical", - "From Marathon to Waterloo, in order categorical;", - "I'm very well acquainted, too, with matters mathematical,", - "I understand equations, both the simple and quadratical,", - "About binomial theorem I'm teeming with a lot o' news,", - "With many cheerful facts about the square of the hypotenuse." }; - - @Before - public void initConfig() { - config = randomConfiguration(String.join("\n", EXAMPLE_QUERY), Map.of()); - } } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExecSerializationTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExecSerializationTests.java new file mode 100644 index 0000000000000..a1a890f3addd6 --- /dev/null +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/plan/physical/ExchangeSourceExecSerializationTests.java @@ -0,0 +1,40 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0; you may not use this file except in compliance with the Elastic License + * 2.0. 
+ */
+
+package org.elasticsearch.xpack.esql.plan.physical;
+
+import org.elasticsearch.xpack.esql.core.expression.Attribute;
+import org.elasticsearch.xpack.esql.core.tree.Source;
+
+import java.io.IOException;
+import java.util.List;
+
+public class ExchangeSourceExecSerializationTests extends AbstractPhysicalPlanSerializationTests<ExchangeSourceExec> {
+    static ExchangeSourceExec randomExchangeSourceExec() {
+        Source source = randomSource();
+        List<Attribute> output = randomFieldAttributes(1, 5, false);
+        boolean intermediateAgg = randomBoolean();
+        return new ExchangeSourceExec(source, output, intermediateAgg);
+    }
+
+    @Override
+    protected ExchangeSourceExec createTestInstance() {
+        return randomExchangeSourceExec();
+    }
+
+    @Override
+    protected ExchangeSourceExec mutateInstance(ExchangeSourceExec instance) throws IOException {
+        List<Attribute> output = instance.output();
+        boolean intermediateAgg = instance.isIntermediateAgg();
+        if (randomBoolean()) {
+            output = randomValueOtherThan(output, () -> randomFieldAttributes(1, 5, false));
+        } else {
+            intermediateAgg = false == intermediateAgg;
+        }
+        return new ExchangeSourceExec(instance.source(), output, intermediateAgg);
+    }
+}

From 84bd31eb8eba90d568cf213cdef475d8d03c2bdd Mon Sep 17 00:00:00 2001
From: Ryan Ernst
Date: Thu, 29 Aug 2024 10:20:43 -0700
Subject: [PATCH 056/144] Fix shutdown race condition in server start (#112300)

When the server CLI is preparing to start Elasticsearch, it may receive
a SIGTERM. That signal causes the close method of the CLI to be
invoked, which checks for a non-null server process, and stops it if it
exists. Since shutdown occurs in a different thread, it is possible
close is invoked, sees the server process is null, so skips stopping
it, but then before close finishes the server process is started.

Normally the above case is ok; the close method will cause Java to
exit, and the child process will be sent a SIGTERM. However, in the
case of serverless, close is wrapped so that the CLI can wait on
uploading possible heapdumps. This presents the possibility that close
thinks the child process has been stopped, but it hasn't, so the
wrapped close waits indefinitely on the child process that was started
up during the race.

This commit guards against the startup race by locking the critical
sections that create the child process and stop it. Either the child
process is created first, and will then be stopped immediately, or
close is invoked first, marking that the CLI is shutting down, and
creating the child process will be skipped.
---
 .../elasticsearch/server/cli/ServerCli.java  | 19 ++++-
 .../server/cli/ServerCliTests.java           | 78 +++++++++++++++----
 2 files changed, 81 insertions(+), 16 deletions(-)

diff --git a/distribution/tools/server-cli/src/main/java/org/elasticsearch/server/cli/ServerCli.java b/distribution/tools/server-cli/src/main/java/org/elasticsearch/server/cli/ServerCli.java
index 7b904d4cb5a89..bea7fbb7f63e8 100644
--- a/distribution/tools/server-cli/src/main/java/org/elasticsearch/server/cli/ServerCli.java
+++ b/distribution/tools/server-cli/src/main/java/org/elasticsearch/server/cli/ServerCli.java
@@ -32,6 +32,7 @@
 import java.nio.file.Path;
 import java.util.Arrays;
 import java.util.Locale;
+import java.util.concurrent.atomic.AtomicBoolean;
 
 /**
  * The main CLI for running Elasticsearch.
@@ -44,6 +45,8 @@ class ServerCli extends EnvironmentAwareCommand {
     private final OptionSpecBuilder quietOption;
     private final OptionSpec<String> enrollmentTokenOption;
 
+    // flag for indicating shutdown has begun. 
we use an AtomicBoolean to double as a synchronization object + private final AtomicBoolean shuttingDown = new AtomicBoolean(false); private volatile ServerProcess server; // visible for testing @@ -98,7 +101,14 @@ public void execute(Terminal terminal, OptionSet options, Environment env, Proce syncPlugins(terminal, env, processInfo); ServerArgs args = createArgs(options, env, secrets, processInfo); - this.server = startServer(terminal, processInfo, args); + synchronized (shuttingDown) { + // if we are shutting down there is no reason to start the server + if (shuttingDown.get()) { + terminal.println("CLI is shutting down, skipping starting server process"); + return; + } + this.server = startServer(terminal, processInfo, args); + } } if (options.has(daemonizeOption)) { @@ -233,8 +243,11 @@ private ServerArgs createArgs(OptionSet options, Environment env, SecureSettings @Override public void close() throws IOException { - if (server != null) { - server.stop(); + synchronized (shuttingDown) { + shuttingDown.set(true); + if (server != null) { + server.stop(); + } } } diff --git a/distribution/tools/server-cli/src/test/java/org/elasticsearch/server/cli/ServerCliTests.java b/distribution/tools/server-cli/src/test/java/org/elasticsearch/server/cli/ServerCliTests.java index 38a64a778fc27..e603790051c0c 100644 --- a/distribution/tools/server-cli/src/test/java/org/elasticsearch/server/cli/ServerCliTests.java +++ b/distribution/tools/server-cli/src/test/java/org/elasticsearch/server/cli/ServerCliTests.java @@ -36,6 +36,8 @@ import java.util.List; import java.util.Locale; import java.util.Optional; +import java.util.concurrent.BrokenBarrierException; +import java.util.concurrent.CyclicBarrier; import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicReference; import java.util.function.Consumer; @@ -50,6 +52,7 @@ import static org.hamcrest.Matchers.is; import static org.hamcrest.Matchers.matchesRegex; import static org.hamcrest.Matchers.not; +import static org.hamcrest.Matchers.sameInstance; public class ServerCliTests extends CommandTestCase { @@ -383,6 +386,52 @@ public void testSecureSettingsLoaderWithNullPassword() throws Exception { assertEquals("", loader.password); } + public void testProcessCreationRace() throws Exception { + for (int i = 0; i < 10; ++i) { + CyclicBarrier raceStart = new CyclicBarrier(2); + TestServerCli cli = new TestServerCli() { + @Override + void syncPlugins(Terminal terminal, Environment env, ProcessInfo processInfo) throws Exception { + super.syncPlugins(terminal, env, processInfo); + raceStart.await(); + } + + @Override + public void close() throws IOException { + try { + raceStart.await(); + } catch (InterruptedException ie) { + Thread.currentThread().interrupt(); + throw new AssertionError(ie); + } catch (BrokenBarrierException e) { + throw new AssertionError(e); + } + super.close(); + } + }; + Thread closeThread = new Thread(() -> { + try { + cli.close(); + } catch (IOException e) { + throw new AssertionError(e); + } + }); + closeThread.start(); + cli.main(new String[] {}, terminal, new ProcessInfo(sysprops, envVars, esHomeDir)); + closeThread.join(); + + if (cli.getServer() == null) { + // close won the race, so server should never have been started + assertThat(cli.startServerCalled, is(false)); + } else { + // creation won the race, so check we correctly waited on it and stopped + assertThat(cli.getServer(), sameInstance(mockServer)); + assertThat(mockServer.waitForCalled, is(true)); + assertThat(mockServer.stopCalled, 
is(true)); + } + } + } + private MockSecureSettingsLoader loadWithMockSecureSettingsLoader() throws Exception { var loader = new MockSecureSettingsLoader(); this.mockSecureSettingsLoader = loader; @@ -465,9 +514,9 @@ public void execute(Terminal terminal, OptionSet options, Environment env, Proce } private class MockServerProcess extends ServerProcess { - boolean detachCalled = false; - boolean waitForCalled = false; - boolean stopCalled = false; + volatile boolean detachCalled = false; + volatile boolean waitForCalled = false; + volatile boolean stopCalled = false; MockServerProcess() { super(null, null); @@ -505,6 +554,8 @@ void reset() { } private class TestServerCli extends ServerCli { + boolean startServerCalled = false; + @Override protected Command loadTool(String toolname, String libs) { if (toolname.equals("auto-configure-node")) { @@ -551,20 +602,21 @@ protected SecureSettingsLoader secureSettingsLoader(Environment env) { return new KeystoreSecureSettingsLoader(); } + + @Override + protected ServerProcess startServer(Terminal terminal, ProcessInfo processInfo, ServerArgs args) throws Exception { + startServerCalled = true; + if (argsValidator != null) { + argsValidator.accept(args); + } + mockServer.reset(); + return mockServer; + } } @Override protected Command newCommand() { - return new TestServerCli() { - @Override - protected ServerProcess startServer(Terminal terminal, ProcessInfo processInfo, ServerArgs args) { - if (argsValidator != null) { - argsValidator.accept(args); - } - mockServer.reset(); - return mockServer; - } - }; + return new TestServerCli(); } static class MockSecureSettingsLoader implements SecureSettingsLoader { From bc1706f47906ec52fb7cf08a53d5ee002f8c94eb Mon Sep 17 00:00:00 2001 From: Nhat Nguyen Date: Thu, 29 Aug 2024 11:29:24 -0700 Subject: [PATCH 057/144] Add index mode to internal field-caps response (#112368) We need the index mode from resolved indices for the METRICS command and future LOGS command in ES|QL. This change adds the index mode to the internal field-caps index response, which is not user-facing. ES|QL will use this output, and the overhead should be minimal, as we serialize one index_mode per mapping_hash group. 
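Roughly, the grouped encoding looks like the following sketch (simplified,
not the literal implementation; `groups` stands in for the per-mapping-hash
grouping, and the authoritative logic is in FieldCapabilitiesIndexResponse
and IndexMode in this change):

    // sketch: responses sharing a mapping hash form one compressed group,
    // so the index mode costs one byte per group rather than one per index
    for (List<FieldCapabilitiesIndexResponse> group : groups) {
        out.writeCollection(group, (o, r) -> o.writeString(r.getIndexName()));
        IndexMode.writeTo(group.get(0).getIndexMode(), out); // single shared byte
        out.writeString(group.get(0).getIndexMappingHash());
        // field caps of the first response are written once for the whole group
    }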
--- .../search/fieldcaps/FieldCapabilitiesIT.java | 58 +++++++++++++++++++ .../org/elasticsearch/TransportVersions.java | 2 + .../fieldcaps/FieldCapabilitiesFetcher.java | 10 ++-- .../FieldCapabilitiesIndexResponse.java | 31 ++++++++-- .../TransportFieldCapabilitiesAction.java | 24 +++++++- .../org/elasticsearch/index/IndexMode.java | 21 +++++++ .../FieldCapabilitiesIndexResponseTests.java | 7 ++- .../FieldCapabilitiesNodeResponseTests.java | 36 +++++++++--- .../FieldCapabilitiesResponseTests.java | 12 ++-- .../fieldcaps/RequestDispatcherTests.java | 9 ++- .../xpack/esql/analysis/AnalyzerTests.java | 4 +- .../enrich/EnrichPolicyResolverTests.java | 3 +- .../esql/stats/PlanExecutorMetricsTests.java | 4 +- .../esql/type/EsqlDataTypeRegistryTests.java | 4 +- 14 files changed, 194 insertions(+), 31 deletions(-) diff --git a/server/src/internalClusterTest/java/org/elasticsearch/search/fieldcaps/FieldCapabilitiesIT.java b/server/src/internalClusterTest/java/org/elasticsearch/search/fieldcaps/FieldCapabilitiesIT.java index 0bce9ecb178d0..cc272042d5384 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/search/fieldcaps/FieldCapabilitiesIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/search/fieldcaps/FieldCapabilitiesIT.java @@ -89,6 +89,7 @@ import static org.hamcrest.Matchers.array; import static org.hamcrest.Matchers.arrayContainingInAnyOrder; import static org.hamcrest.Matchers.containsInAnyOrder; +import static org.hamcrest.Matchers.empty; import static org.hamcrest.Matchers.equalTo; import static org.hamcrest.Matchers.greaterThanOrEqualTo; import static org.hamcrest.Matchers.hasKey; @@ -711,6 +712,63 @@ public void testCancel() throws Exception { } } + public void testIndexMode() throws Exception { + Map indexModes = new HashMap<>(); + // metrics + { + final String metricsMapping = """ + { + "properties": { + "@timestamp": { "type": "date" }, + "hostname": { "type": "keyword", "time_series_dimension": true }, + "request_count" : { "type" : "long", "time_series_metric" : "counter" }, + "cluster": {"type": "keyword"} + } + } + """; + Settings settings = Settings.builder().put("mode", "time_series").putList("routing_path", List.of("hostname")).build(); + int numIndices = between(1, 5); + for (int i = 0; i < numIndices; i++) { + assertAcked(indicesAdmin().prepareCreate("test_metrics_" + i).setSettings(settings).setMapping(metricsMapping).get()); + indexModes.put("test_metrics_" + i, IndexMode.TIME_SERIES); + assertAcked(indicesAdmin().prepareCreate("test_old_metrics_" + i).setMapping(metricsMapping).get()); + indexModes.put("test_old_metrics_" + i, IndexMode.STANDARD); + } + } + // logsdb + { + final String logsMapping = """ + { + "properties": { + "@timestamp": { "type": "date" }, + "hostname": { "type": "keyword"}, + "request_count" : { "type" : "long"}, + "cluster": {"type": "keyword"} + } + } + """; + Settings settings = Settings.builder().put("mode", "logsdb").build(); + int numIndices = between(1, 5); + for (int i = 0; i < numIndices; i++) { + assertAcked(indicesAdmin().prepareCreate("test_logs_" + i).setSettings(settings).setMapping(logsMapping).get()); + indexModes.put("test_logs_" + i, IndexMode.LOGSDB); + assertAcked(indicesAdmin().prepareCreate("test_old_logs_" + i).setMapping(logsMapping).get()); + indexModes.put("test_old_logs_" + i, IndexMode.STANDARD); + } + } + FieldCapabilitiesRequest request = new FieldCapabilitiesRequest(); + request.setMergeResults(false); + request.indices("test_*"); + request.fields(randomFrom("*", "@timestamp", "host*")); 
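+        // merging is disabled above, so the response keeps one entry per backing
+        // index, letting the test assert the index mode each index was created with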
+ var resp = client().fieldCaps(request).get(); + assertThat(resp.getFailures(), empty()); + Map actualIndexModes = new HashMap<>(); + for (var indexResp : resp.getIndexResponses()) { + actualIndexModes.put(indexResp.getIndexName(), indexResp.getIndexMode()); + } + assertThat(actualIndexModes, equalTo(indexModes)); + } + private void assertIndices(FieldCapabilitiesResponse response, String... indices) { assertNotNull(response.getIndices()); Arrays.sort(indices); diff --git a/server/src/main/java/org/elasticsearch/TransportVersions.java b/server/src/main/java/org/elasticsearch/TransportVersions.java index 5963e3c8058de..7581ee7649696 100644 --- a/server/src/main/java/org/elasticsearch/TransportVersions.java +++ b/server/src/main/java/org/elasticsearch/TransportVersions.java @@ -202,6 +202,8 @@ static TransportVersion def(int id) { public static final TransportVersion REPOSITORIES_TELEMETRY = def(8_732_00_0); public static final TransportVersion ML_INFERENCE_ALIBABACLOUD_SEARCH_ADDED = def(8_733_00_0); + public static final TransportVersion FIELD_CAPS_RESPONSE_INDEX_MODE = def(8_734_00_0); + /* * STOP! READ THIS FIRST! No, really, * ____ _____ ___ ____ _ ____ _____ _ ____ _____ _ _ ___ ____ _____ ___ ____ ____ _____ _ diff --git a/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesFetcher.java b/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesFetcher.java index 51cb05f981177..e435655668882 100644 --- a/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesFetcher.java +++ b/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesFetcher.java @@ -108,15 +108,15 @@ private FieldCapabilitiesIndexResponse doFetch( null, runtimeFields ); - + var indexMode = searchExecutionContext.getIndexSettings().getMode(); if (searcher != null && canMatchShard(shardId, indexFilter, nowInMillis, searchExecutionContext) == false) { - return new FieldCapabilitiesIndexResponse(shardId.getIndexName(), null, Collections.emptyMap(), false); + return new FieldCapabilitiesIndexResponse(shardId.getIndexName(), null, Collections.emptyMap(), false, indexMode); } final MappingMetadata mapping = indexService.getMetadata().mapping(); String indexMappingHash; if (includeEmptyFields || enableFieldHasValue == false) { - indexMappingHash = mapping != null ? mapping.getSha256() : null; + indexMappingHash = mapping != null ? 
mapping.getSha256() + indexMode : null; } else { // even if the mapping is the same if we return only fields with values we need // to make sure that we consider all the shard-mappings pair, that is why we @@ -129,7 +129,7 @@ private FieldCapabilitiesIndexResponse doFetch( indexMappingHash = fieldPredicate.modifyHash(indexMappingHash); final Map existing = indexMappingHashToResponses.get(indexMappingHash); if (existing != null) { - return new FieldCapabilitiesIndexResponse(shardId.getIndexName(), indexMappingHash, existing, true); + return new FieldCapabilitiesIndexResponse(shardId.getIndexName(), indexMappingHash, existing, true, indexMode); } } task.ensureNotCancelled(); @@ -145,7 +145,7 @@ private FieldCapabilitiesIndexResponse doFetch( if (indexMappingHash != null) { indexMappingHashToResponses.put(indexMappingHash, responseMap); } - return new FieldCapabilitiesIndexResponse(shardId.getIndexName(), indexMappingHash, responseMap, true); + return new FieldCapabilitiesIndexResponse(shardId.getIndexName(), indexMappingHash, responseMap, true, indexMode); } static Map retrieveFieldCaps( diff --git a/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponse.java b/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponse.java index cc72dd80dceac..5a50ed4c9f573 100644 --- a/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponse.java +++ b/server/src/main/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponse.java @@ -15,6 +15,7 @@ import org.elasticsearch.common.io.stream.Writeable; import org.elasticsearch.common.util.Maps; import org.elasticsearch.core.Nullable; +import org.elasticsearch.index.IndexMode; import java.io.IOException; import java.util.ArrayList; @@ -33,18 +34,21 @@ public final class FieldCapabilitiesIndexResponse implements Writeable { private final Map responseMap; private final boolean canMatch; private final transient TransportVersion originVersion; + private final IndexMode indexMode; public FieldCapabilitiesIndexResponse( String indexName, @Nullable String indexMappingHash, Map responseMap, - boolean canMatch + boolean canMatch, + IndexMode indexMode ) { this.indexName = indexName; this.indexMappingHash = indexMappingHash; this.responseMap = responseMap; this.canMatch = canMatch; this.originVersion = TransportVersion.current(); + this.indexMode = indexMode; } FieldCapabilitiesIndexResponse(StreamInput in) throws IOException { @@ -57,6 +61,11 @@ public FieldCapabilitiesIndexResponse( } else { this.indexMappingHash = null; } + if (in.getTransportVersion().onOrAfter(TransportVersions.FIELD_CAPS_RESPONSE_INDEX_MODE)) { + this.indexMode = IndexMode.readFrom(in); + } else { + this.indexMode = IndexMode.STANDARD; + } } @Override @@ -67,9 +76,12 @@ public void writeTo(StreamOutput out) throws IOException { if (out.getTransportVersion().onOrAfter(MAPPING_HASH_VERSION)) { out.writeOptionalString(indexMappingHash); } + if (out.getTransportVersion().onOrAfter(TransportVersions.FIELD_CAPS_RESPONSE_INDEX_MODE)) { + IndexMode.writeTo(indexMode, out); + } } - private record CompressedGroup(String[] indices, String mappingHash, int[] fields) {} + private record CompressedGroup(String[] indices, IndexMode indexMode, String mappingHash, int[] fields) {} static List readList(StreamInput input) throws IOException { if (input.getTransportVersion().before(MAPPING_HASH_VERSION)) { @@ -92,10 +104,12 @@ static List readList(StreamInput input) throws I private static void 
collectCompressedResponses(StreamInput input, int groups, ArrayList responses) throws IOException { final CompressedGroup[] compressedGroups = new CompressedGroup[groups]; + final boolean readIndexMode = input.getTransportVersion().onOrAfter(TransportVersions.FIELD_CAPS_RESPONSE_INDEX_MODE); for (int i = 0; i < groups; i++) { final String[] indices = input.readStringArray(); + final IndexMode indexMode = readIndexMode ? IndexMode.readFrom(input) : IndexMode.STANDARD; final String mappingHash = input.readString(); - compressedGroups[i] = new CompressedGroup(indices, mappingHash, input.readIntArray()); + compressedGroups[i] = new CompressedGroup(indices, indexMode, mappingHash, input.readIntArray()); } final IndexFieldCapabilities[] ifcLookup = input.readArray(IndexFieldCapabilities::readFrom, IndexFieldCapabilities[]::new); for (CompressedGroup compressedGroup : compressedGroups) { @@ -105,7 +119,7 @@ private static void collectCompressedResponses(StreamInput input, int groups, Ar ifc.put(val.name(), val); } for (String index : compressedGroup.indices) { - responses.add(new FieldCapabilitiesIndexResponse(index, compressedGroup.mappingHash, ifc, true)); + responses.add(new FieldCapabilitiesIndexResponse(index, compressedGroup.mappingHash, ifc, true, compressedGroup.indexMode)); } } } @@ -117,7 +131,7 @@ private static void collectResponsesLegacyFormat(StreamInput input, int groups, final String mappingHash = input.readString(); final Map ifc = input.readMap(IndexFieldCapabilities::readFrom); for (String index : indices) { - responses.add(new FieldCapabilitiesIndexResponse(index, mappingHash, ifc, true)); + responses.add(new FieldCapabilitiesIndexResponse(index, mappingHash, ifc, true, IndexMode.STANDARD)); } } } @@ -164,6 +178,9 @@ private static void writeCompressedResponses(StreamOutput output, Map { o.writeCollection(fieldCapabilitiesIndexResponses, (oo, r) -> oo.writeString(r.indexName)); var first = fieldCapabilitiesIndexResponses.get(0); + if (output.getTransportVersion().onOrAfter(TransportVersions.FIELD_CAPS_RESPONSE_INDEX_MODE)) { + IndexMode.writeTo(first.indexMode, o); + } o.writeString(first.indexMappingHash); o.writeVInt(first.responseMap.size()); for (IndexFieldCapabilities ifc : first.responseMap.values()) { @@ -192,6 +209,10 @@ public String getIndexMappingHash() { return indexMappingHash; } + public IndexMode getIndexMode() { + return indexMode; + } + public boolean canMatch() { return canMatch; } diff --git a/server/src/main/java/org/elasticsearch/action/fieldcaps/TransportFieldCapabilitiesAction.java b/server/src/main/java/org/elasticsearch/action/fieldcaps/TransportFieldCapabilitiesAction.java index b9bf3bb37c7b4..bb97b0dc48c42 100644 --- a/server/src/main/java/org/elasticsearch/action/fieldcaps/TransportFieldCapabilitiesAction.java +++ b/server/src/main/java/org/elasticsearch/action/fieldcaps/TransportFieldCapabilitiesAction.java @@ -174,7 +174,13 @@ private void doExecuteForked( if (resp.canMatch() && resp.getIndexMappingHash() != null) { FieldCapabilitiesIndexResponse curr = indexMappingHashToResponses.putIfAbsent(resp.getIndexMappingHash(), resp); if (curr != null) { - resp = new FieldCapabilitiesIndexResponse(resp.getIndexName(), curr.getIndexMappingHash(), curr.get(), true); + resp = new FieldCapabilitiesIndexResponse( + resp.getIndexName(), + curr.getIndexMappingHash(), + curr.get(), + true, + curr.getIndexMode() + ); } } if (request.includeEmptyFields()) { @@ -186,7 +192,13 @@ private void doExecuteForked( } Map mergedCaps = new HashMap<>(a.get()); 
mergedCaps.putAll(b.get()); - return new FieldCapabilitiesIndexResponse(a.getIndexName(), a.getIndexMappingHash(), mergedCaps, true); + return new FieldCapabilitiesIndexResponse( + a.getIndexName(), + a.getIndexMappingHash(), + mergedCaps, + true, + a.getIndexMode() + ); }); } if (fieldCapTask.isCancelled()) { @@ -249,7 +261,13 @@ private void doExecuteForked( for (FieldCapabilitiesIndexResponse resp : response.getIndexResponses()) { String indexName = RemoteClusterAware.buildRemoteIndexName(clusterAlias, resp.getIndexName()); handleIndexResponse.accept( - new FieldCapabilitiesIndexResponse(indexName, resp.getIndexMappingHash(), resp.get(), resp.canMatch()) + new FieldCapabilitiesIndexResponse( + indexName, + resp.getIndexMappingHash(), + resp.get(), + resp.canMatch(), + resp.getIndexMode() + ) ); } for (FieldCapabilitiesFailure failure : response.getFailures()) { diff --git a/server/src/main/java/org/elasticsearch/index/IndexMode.java b/server/src/main/java/org/elasticsearch/index/IndexMode.java index b137cfe27a514..96598ba38a3fe 100644 --- a/server/src/main/java/org/elasticsearch/index/IndexMode.java +++ b/server/src/main/java/org/elasticsearch/index/IndexMode.java @@ -12,6 +12,8 @@ import org.elasticsearch.cluster.metadata.MetadataCreateDataStreamService; import org.elasticsearch.cluster.routing.IndexRouting; import org.elasticsearch.common.compress.CompressedXContent; +import org.elasticsearch.common.io.stream.StreamInput; +import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.settings.Setting; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.core.Nullable; @@ -494,6 +496,25 @@ public static IndexMode fromString(String value) { }; } + public static IndexMode readFrom(StreamInput in) throws IOException { + int mode = in.readByte(); + return switch (mode) { + case 0 -> STANDARD; + case 1 -> TIME_SERIES; + case 2 -> LOGSDB; + default -> throw new IllegalStateException("unexpected index mode [" + mode + "]"); + }; + } + + public static void writeTo(IndexMode indexMode, StreamOutput out) throws IOException { + final int code = switch (indexMode) { + case STANDARD -> 0; + case TIME_SERIES -> 1; + case LOGSDB -> 2; + }; + out.writeByte((byte) code); + } + @Override public String toString() { return getName(); diff --git a/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponseTests.java b/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponseTests.java index 0f5ba959c5ed8..d487f584a20bb 100644 --- a/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponseTests.java +++ b/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesIndexResponseTests.java @@ -8,6 +8,7 @@ package org.elasticsearch.action.fieldcaps; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.mapper.TimeSeriesParams; import org.elasticsearch.test.ESTestCase; @@ -60,9 +61,10 @@ static List randomIndexResponsesWithMappingHash( final List responses = new ArrayList<>(); for (Map.Entry> e : mappingHashToIndices.entrySet()) { Map fieldCaps = randomFieldCaps(); + var indexMode = randomFrom(IndexMode.values()); String mappingHash = e.getKey(); for (String index : e.getValue()) { - responses.add(new FieldCapabilitiesIndexResponse(index, mappingHash, fieldCaps, true)); + responses.add(new FieldCapabilitiesIndexResponse(index, mappingHash, fieldCaps, true, indexMode)); } } return responses; @@ -73,7 +75,8 @@ static List 
randomIndexResponsesWithoutMappingHa int numIndices = between(0, 10); for (int i = 0; i < numIndices; i++) { String index = "index_without_mapping_hash_" + i; - responses.add(new FieldCapabilitiesIndexResponse(index, null, randomFieldCaps(), randomBoolean())); + var indexMode = randomFrom(IndexMode.values()); + responses.add(new FieldCapabilitiesIndexResponse(index, null, randomFieldCaps(), randomBoolean(), indexMode)); } return responses; } diff --git a/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesNodeResponseTests.java b/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesNodeResponseTests.java index 0802e498c43a7..c39cc6ebfd665 100644 --- a/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesNodeResponseTests.java +++ b/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesNodeResponseTests.java @@ -16,6 +16,7 @@ import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.common.io.stream.Writeable; import org.elasticsearch.common.util.CollectionUtils; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.shard.ShardId; import org.elasticsearch.test.AbstractWireSerializingTestCase; import org.elasticsearch.test.TransportVersionUtils; @@ -49,7 +50,9 @@ protected FieldCapabilitiesNodeResponse createTestInstance() { List responses = new ArrayList<>(); int numResponse = randomIntBetween(0, 10); for (int i = 0; i < numResponse; i++) { - responses.add(new FieldCapabilitiesIndexResponse("index_" + i, null, randomFieldCaps(), randomBoolean())); + responses.add( + new FieldCapabilitiesIndexResponse("index_" + i, null, randomFieldCaps(), randomBoolean(), randomFrom(IndexMode.values())) + ); } int numUnmatched = randomIntBetween(0, 3); Set shardIds = new HashSet<>(); @@ -69,21 +72,38 @@ protected FieldCapabilitiesNodeResponse mutateInstance(FieldCapabilitiesNodeResp List newResponses = new ArrayList<>(response.getIndexResponses()); int mutation = response.getIndexResponses().isEmpty() ? 
0 : randomIntBetween(0, 3); switch (mutation) { - case 0 -> newResponses.add(new FieldCapabilitiesIndexResponse("extra_index", null, randomFieldCaps(), randomBoolean())); + case 0 -> newResponses.add( + new FieldCapabilitiesIndexResponse("extra_index", null, randomFieldCaps(), randomBoolean(), randomFrom(IndexMode.values())) + ); case 1 -> { int toRemove = randomInt(newResponses.size() - 1); newResponses.remove(toRemove); } case 2 -> { int toReplace = randomInt(newResponses.size() - 1); - newResponses.set(toReplace, new FieldCapabilitiesIndexResponse("new_index", null, randomFieldCaps(), randomBoolean())); + newResponses.set( + toReplace, + new FieldCapabilitiesIndexResponse( + "new_index", + null, + randomFieldCaps(), + randomBoolean(), + randomFrom(IndexMode.values()) + ) + ); } case 3 -> { int toReplace = randomInt(newResponses.size() - 1); FieldCapabilitiesIndexResponse resp = newResponses.get(toReplace); newResponses.set( toReplace, - new FieldCapabilitiesIndexResponse(resp.getIndexName(), UUIDs.randomBase64UUID(), resp.get(), true) + new FieldCapabilitiesIndexResponse( + resp.getIndexName(), + UUIDs.randomBase64UUID(), + resp.get(), + true, + randomFrom(IndexMode.values()) + ) ); } } @@ -194,9 +214,10 @@ public void testReadNodeResponseFromPre82() throws Exception { "blue_field", new IndexFieldCapabilities("blue_field", "long", false, true, true, false, null, Map.of()) ), - true + true, + IndexMode.STANDARD ), - new FieldCapabilitiesIndexResponse("index_02", null, Map.of(), false), + new FieldCapabilitiesIndexResponse("index_02", null, Map.of(), false, IndexMode.STANDARD), new FieldCapabilitiesIndexResponse( "index_03", null, @@ -206,7 +227,8 @@ public void testReadNodeResponseFromPre82() throws Exception { "_seq_no", new IndexFieldCapabilities("_seq_no", "long", true, true, true, false, null, Map.of()) ), - true + true, + IndexMode.STANDARD ) ) ); diff --git a/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesResponseTests.java b/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesResponseTests.java index 461000fc22b02..cc4d4de1e0f39 100644 --- a/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesResponseTests.java +++ b/server/src/test/java/org/elasticsearch/action/fieldcaps/FieldCapabilitiesResponseTests.java @@ -18,6 +18,7 @@ import org.elasticsearch.common.io.stream.Writeable; import org.elasticsearch.common.util.CollectionUtils; import org.elasticsearch.common.xcontent.ChunkedToXContent; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.test.AbstractWireSerializingTestCase; import org.elasticsearch.test.TransportVersionUtils; import org.elasticsearch.xcontent.ToXContent; @@ -54,7 +55,8 @@ protected FieldCapabilitiesResponse createTestInstance() { int numResponse = randomIntBetween(0, 10); for (int i = 0; i < numResponse; i++) { Map fieldCaps = FieldCapabilitiesIndexResponseTests.randomFieldCaps(); - responses.add(new FieldCapabilitiesIndexResponse("index_" + i, null, fieldCaps, randomBoolean())); + var indexMode = randomFrom(IndexMode.values()); + responses.add(new FieldCapabilitiesIndexResponse("index_" + i, null, fieldCaps, randomBoolean(), indexMode)); } randomResponse = new FieldCapabilitiesResponse(responses, Collections.emptyList()); return randomResponse; @@ -267,9 +269,10 @@ public void testReadCCSResponseFromPre82() throws Exception { "blue_field", new IndexFieldCapabilities("blue_field", "long", false, true, true, false, null, Map.of()) ), - true + true, + IndexMode.STANDARD ), - new 
FieldCapabilitiesIndexResponse("index_02", null, Map.of(), false), + new FieldCapabilitiesIndexResponse("index_02", null, Map.of(), false, IndexMode.STANDARD), new FieldCapabilitiesIndexResponse( "index_03", null, @@ -279,7 +282,8 @@ public void testReadCCSResponseFromPre82() throws Exception { "_seq_no", new IndexFieldCapabilities("_seq_no", "long", true, true, true, false, null, Map.of()) ), - true + true, + IndexMode.STANDARD ) ) ); diff --git a/server/src/test/java/org/elasticsearch/action/fieldcaps/RequestDispatcherTests.java b/server/src/test/java/org/elasticsearch/action/fieldcaps/RequestDispatcherTests.java index f5f35c52044d7..96e615afb498f 100644 --- a/server/src/test/java/org/elasticsearch/action/fieldcaps/RequestDispatcherTests.java +++ b/server/src/test/java/org/elasticsearch/action/fieldcaps/RequestDispatcherTests.java @@ -42,6 +42,7 @@ import org.elasticsearch.common.util.concurrent.AbstractRunnable; import org.elasticsearch.common.util.concurrent.ConcurrentCollections; import org.elasticsearch.common.util.set.Sets; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.IndexVersions; import org.elasticsearch.index.query.QueryBuilder; import org.elasticsearch.index.query.RangeQueryBuilder; @@ -890,7 +891,13 @@ static FieldCapabilitiesNodeResponse randomNodeResponse( indicesWithMappingHash.computeIfAbsent(index, k -> new ArrayList<>()).add(index); } else { indexResponses.add( - new FieldCapabilitiesIndexResponse(index, null, FieldCapabilitiesIndexResponseTests.randomFieldCaps(), true) + new FieldCapabilitiesIndexResponse( + index, + null, + FieldCapabilitiesIndexResponseTests.randomFieldCaps(), + true, + randomFrom(IndexMode.values()) + ) ); } } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/analysis/AnalyzerTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/analysis/AnalyzerTests.java index 72a905f4b37a4..e4872b24558bc 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/analysis/AnalyzerTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/analysis/AnalyzerTests.java @@ -2122,7 +2122,9 @@ protected List filteredWarnings() { } private static LogicalPlan analyzeWithEmptyFieldCapsResponse(String query) throws IOException { - List idxResponses = List.of(new FieldCapabilitiesIndexResponse("idx", "idx", Map.of(), true)); + List idxResponses = List.of( + new FieldCapabilitiesIndexResponse("idx", "idx", Map.of(), true, IndexMode.STANDARD) + ); FieldCapabilitiesResponse caps = new FieldCapabilitiesResponse(idxResponses, List.of()); IndexResolution resolution = new IndexResolver(null).mergedMappings("test*", caps); var analyzer = analyzer(resolution, TEST_VERIFIER, configuration(query)); diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/enrich/EnrichPolicyResolverTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/enrich/EnrichPolicyResolverTests.java index 45623a39da936..ebad8e6e13b8c 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/enrich/EnrichPolicyResolverTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/enrich/EnrichPolicyResolverTests.java @@ -26,6 +26,7 @@ import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.concurrent.EsExecutors; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.test.ESTestCase; import org.elasticsearch.test.client.NoOpClient; 
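
For reference, every construction site in these tests now has to pass the mode explicitly; a minimal example of the updated five-argument constructor, compiling only against this patch (the wrapper class and method names are illustrative):

    import java.util.Map;

    import org.elasticsearch.action.fieldcaps.FieldCapabilitiesIndexResponse;
    import org.elasticsearch.index.IndexMode;

    class ConstructionSketch {
        static FieldCapabilitiesIndexResponse minimalResponse() {
            // index name, mapping hash (null = not shared), field caps, canMatch, index mode
            return new FieldCapabilitiesIndexResponse("index_01", null, Map.of(), true, IndexMode.STANDARD);
        }
    }
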
import org.elasticsearch.test.transport.MockTransportService; @@ -491,7 +492,7 @@ protected void var f = new IndexFieldCapabilities(e.getKey(), e.getValue(), false, false, false, false, null, Map.of()); fieldCaps.put(e.getKey(), f); } - var indexResponse = new FieldCapabilitiesIndexResponse(alias, null, fieldCaps, true); + var indexResponse = new FieldCapabilitiesIndexResponse(alias, null, fieldCaps, true, IndexMode.STANDARD); response = new FieldCapabilitiesResponse(List.of(indexResponse), List.of()); } else { response = new FieldCapabilitiesResponse(List.of(), List.of()); diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/stats/PlanExecutorMetricsTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/stats/PlanExecutorMetricsTests.java index 66fd95c4f7726..d3795c9e9d953 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/stats/PlanExecutorMetricsTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/stats/PlanExecutorMetricsTests.java @@ -13,6 +13,7 @@ import org.elasticsearch.action.fieldcaps.FieldCapabilitiesResponse; import org.elasticsearch.action.fieldcaps.IndexFieldCapabilities; import org.elasticsearch.client.internal.Client; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.test.ESTestCase; import org.elasticsearch.threadpool.TestThreadPool; import org.elasticsearch.threadpool.ThreadPool; @@ -151,7 +152,8 @@ private List indexFieldCapabilities(String[] ind Map.entry("foo", new IndexFieldCapabilities("foo", "integer", false, true, true, false, null, Map.of())), Map.entry("bar", new IndexFieldCapabilities("bar", "long", false, true, true, false, null, Map.of())) ), - true + true, + IndexMode.STANDARD ) ); } diff --git a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistryTests.java b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistryTests.java index 27be2fe941393..e4e10a5c6af19 100644 --- a/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistryTests.java +++ b/x-pack/plugin/esql/src/test/java/org/elasticsearch/xpack/esql/type/EsqlDataTypeRegistryTests.java @@ -9,6 +9,7 @@ import org.elasticsearch.action.fieldcaps.FieldCapabilitiesIndexResponse; import org.elasticsearch.action.fieldcaps.FieldCapabilitiesResponse; import org.elasticsearch.action.fieldcaps.IndexFieldCapabilities; +import org.elasticsearch.index.IndexMode; import org.elasticsearch.index.mapper.TimeSeriesParams; import org.elasticsearch.test.ESTestCase; import org.elasticsearch.xpack.esql.core.type.DataType; @@ -46,7 +47,8 @@ private void resolve(String esTypeName, TimeSeriesParams.MetricType metricType, idx, idx, Map.of(field, new IndexFieldCapabilities(field, esTypeName, false, true, true, false, metricType, Map.of())), - true + true, + IndexMode.TIME_SERIES ) ); From 2dae0533a7bdddd25707624190aa71774221462d Mon Sep 17 00:00:00 2001 From: Oleksandr Kolomiiets Date: Thu, 29 Aug 2024 12:22:29 -0700 Subject: [PATCH 058/144] LogsDB QA tests - add dynamic mapping support (#112321) --- .../logsdb/qa/AbstractChallengeRestTest.java | 4 +- ...ardVersusLogsIndexModeChallengeRestIT.java | 52 +++++------ ...ogsIndexModeRandomDataChallengeRestIT.java | 87 +++++++++---------- .../logsdb/qa/matchers/ListEqualMatcher.java | 2 +- .../matchers/source/DynamicFieldMatcher.java | 87 +++++++++++++++++++ .../matchers/source/FieldSpecificMatcher.java | 2 +- .../qa/matchers/source/MappingTransforms.java | 44 ++++++++-- 
.../qa/matchers/source/SourceMatcher.java | 69 ++++++++------- .../qa/matchers/source/SourceTransforms.java | 13 ++- .../logsdb/datageneration/DataGenerator.java | 6 +- .../DataGeneratorSpecification.java | 10 +++ .../logsdb/datageneration/FieldType.java | 29 ++++++- .../datasource/DataSourceRequest.java | 3 +- .../datasource/DataSourceResponse.java | 6 +- .../DefaultMappingParametersHandler.java | 24 ++--- .../DefaultObjectGenerationHandler.java | 37 ++++++-- .../DefaultPrimitiveTypesHandler.java | 3 +- .../logsdb/datageneration/fields/Context.java | 66 ++++++++++---- .../datageneration/fields/DynamicMapping.java | 15 ++++ .../GenericSubObjectFieldDataGenerator.java | 53 ++++------- .../fields/NestedFieldDataGenerator.java | 3 +- .../fields/ObjectFieldDataGenerator.java | 3 +- .../fields/PredefinedField.java | 32 ++++++- .../TopLevelObjectFieldDataGenerator.java | 39 +++++++-- .../DataGeneratorSnapshotTests.java | 11 ++- .../datageneration/DataGeneratorTests.java | 40 ++++++++- 26 files changed, 532 insertions(+), 208 deletions(-) create mode 100644 modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/DynamicFieldMatcher.java create mode 100644 test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/DynamicMapping.java diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/AbstractChallengeRestTest.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/AbstractChallengeRestTest.java index 6292b06d44c9a..1d36a04657e9c 100644 --- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/AbstractChallengeRestTest.java +++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/AbstractChallengeRestTest.java @@ -233,9 +233,11 @@ private Response indexDocuments( final CheckedSupplier, IOException> documentsSupplier ) throws IOException { final StringBuilder sb = new StringBuilder(); + int id = 0; for (var document : documentsSupplier.get()) { - sb.append("{ \"create\": {} }").append("\n"); + sb.append(Strings.format("{ \"create\": { \"_id\" : \"%d\" } }", id)).append("\n"); sb.append(Strings.toString(document)).append("\n"); + id++; } var request = new Request("POST", "/" + dataStreamName + "/_bulk"); request.setJsonEntity(sb.toString()); diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeChallengeRestIT.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeChallengeRestIT.java index 5824f8fa764f4..9bf1c394f9105 100644 --- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeChallengeRestIT.java +++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeChallengeRestIT.java @@ -34,8 +34,11 @@ import java.io.IOException; import java.time.Instant; +import java.time.ZoneId; +import java.time.ZonedDateTime; import java.time.temporal.ChronoUnit; import java.util.ArrayList; +import java.util.Comparator; import java.util.List; import java.util.Map; @@ -178,11 +181,8 @@ protected static void waitForLogs(RestClient client) throws Exception { } public void testMatchAllQuery() throws IOException { - final List documents = new ArrayList<>(); int numberOfDocuments = ESTestCase.randomIntBetween(100, 200); - for (int i = 0; i < numberOfDocuments; i++) { - 
documents.add(generateDocument(Instant.now().plus(i, ChronoUnit.SECONDS))); - } + final List documents = generateDocuments(numberOfDocuments); assertDocumentIndexing(documents); @@ -199,11 +199,8 @@ public void testMatchAllQuery() throws IOException { } public void testTermsQuery() throws IOException { - final List documents = new ArrayList<>(); - int numberOfDocuments = randomIntBetween(100, 200); - for (int i = 0; i < numberOfDocuments; i++) { - documents.add(generateDocument(Instant.now().plus(i, ChronoUnit.SECONDS))); - } + int numberOfDocuments = ESTestCase.randomIntBetween(100, 200); + final List documents = generateDocuments(numberOfDocuments); assertDocumentIndexing(documents); @@ -220,11 +217,8 @@ public void testTermsQuery() throws IOException { } public void testHistogramAggregation() throws IOException { - final List documents = new ArrayList<>(); - int numberOfDocuments = randomIntBetween(100, 200); - for (int i = 0; i < numberOfDocuments; i++) { - documents.add(generateDocument(Instant.now().plus(i, ChronoUnit.SECONDS))); - } + int numberOfDocuments = ESTestCase.randomIntBetween(100, 200); + final List documents = generateDocuments(numberOfDocuments); assertDocumentIndexing(documents); @@ -241,11 +235,8 @@ public void testHistogramAggregation() throws IOException { } public void testTermsAggregation() throws IOException { - final List documents = new ArrayList<>(); - int numberOfDocuments = randomIntBetween(100, 200); - for (int i = 0; i < numberOfDocuments; i++) { - documents.add(generateDocument(Instant.now().plus(i, ChronoUnit.SECONDS))); - } + int numberOfDocuments = ESTestCase.randomIntBetween(100, 200); + final List documents = generateDocuments(numberOfDocuments); assertDocumentIndexing(documents); @@ -262,11 +253,8 @@ public void testTermsAggregation() throws IOException { } public void testDateHistogramAggregation() throws IOException { - final List documents = new ArrayList<>(); - int numberOfDocuments = randomIntBetween(100, 200); - for (int i = 0; i < numberOfDocuments; i++) { - documents.add(generateDocument(Instant.now().plus(i, ChronoUnit.SECONDS))); - } + int numberOfDocuments = ESTestCase.randomIntBetween(100, 200); + final List documents = generateDocuments(numberOfDocuments); assertDocumentIndexing(documents); @@ -282,6 +270,17 @@ public void testDateHistogramAggregation() throws IOException { assertTrue(matchResult.getMessage(), matchResult.isMatch()); } + private List generateDocuments(int numberOfDocuments) throws IOException { + final List documents = new ArrayList<>(); + // This is static in order to be able to identify documents between test runs. 
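
Pinning the first timestamp instead of calling Instant.now() is what keeps a document's @timestamp and _id stable across the baseline and contender runs. A standalone sketch of the same idea (plain JDK, class name illustrative):

    import java.time.Instant;
    import java.time.ZoneId;
    import java.time.ZonedDateTime;
    import java.time.temporal.ChronoUnit;

    class ReproducibleTimestampsSketch {
        // Document i always receives the same timestamp: a fixed epoch plus i seconds.
        static Instant timestampFor(int documentIndex) {
            Instant start = ZonedDateTime.of(2024, 1, 1, 10, 0, 0, 0, ZoneId.of("UTC")).toInstant();
            return start.plus(documentIndex, ChronoUnit.SECONDS);
        }
    }
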
+ var startingPoint = ZonedDateTime.of(2024, 1, 1, 10, 0, 0, 0, ZoneId.of("UTC")).toInstant(); + for (int i = 0; i < numberOfDocuments; i++) { + documents.add(generateDocument(startingPoint.plus(i, ChronoUnit.SECONDS))); + } + + return documents; + } + protected XContentBuilder generateDocument(final Instant timestamp) throws IOException { return XContentFactory.jsonBuilder() .startObject() @@ -301,7 +300,10 @@ private static List> getQueryHits(final Response response) t final List> hitsList = (List>) hitsMap.get("hits"); assertThat(hitsList.size(), greaterThan(0)); - return hitsList.stream().map(hit -> (Map) hit.get("_source")).toList(); + return hitsList.stream() + .sorted(Comparator.comparingInt((Map hit) -> Integer.parseInt((String) hit.get("_id")))) + .map(hit -> (Map) hit.get("_source")) + .toList(); } @SuppressWarnings("unchecked") diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeRandomDataChallengeRestIT.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeRandomDataChallengeRestIT.java index f53fdcb6e8600..8bd62480f333d 100644 --- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeRandomDataChallengeRestIT.java +++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/StandardVersusLogsIndexModeRandomDataChallengeRestIT.java @@ -10,9 +10,11 @@ import org.elasticsearch.common.time.DateFormatter; import org.elasticsearch.common.time.FormatNames; +import org.elasticsearch.core.CheckedConsumer; import org.elasticsearch.index.mapper.ObjectMapper; import org.elasticsearch.logsdb.datageneration.DataGenerator; import org.elasticsearch.logsdb.datageneration.DataGeneratorSpecification; +import org.elasticsearch.logsdb.datageneration.FieldDataGenerator; import org.elasticsearch.logsdb.datageneration.FieldType; import org.elasticsearch.logsdb.datageneration.datasource.DataSourceHandler; import org.elasticsearch.logsdb.datageneration.datasource.DataSourceRequest; @@ -26,40 +28,27 @@ import java.time.Instant; import java.util.HashMap; import java.util.List; +import java.util.Map; /** * Challenge test (see {@link StandardVersusLogsIndexModeChallengeRestIT}) that uses randomly generated * mapping and documents in order to cover more code paths and permutations. */ public class StandardVersusLogsIndexModeRandomDataChallengeRestIT extends StandardVersusLogsIndexModeChallengeRestIT { - private final boolean fullyDynamicMapping; private final ObjectMapper.Subobjects subobjects; private final DataGenerator dataGenerator; public StandardVersusLogsIndexModeRandomDataChallengeRestIT() { super(); - this.fullyDynamicMapping = randomBoolean(); this.subobjects = randomFrom(ObjectMapper.Subobjects.values()); - var specificationBuilder = DataGeneratorSpecification.builder(); + var specificationBuilder = DataGeneratorSpecification.builder().withFullyDynamicMapping(randomBoolean()); if (subobjects != ObjectMapper.Subobjects.ENABLED) { specificationBuilder = specificationBuilder.withNestedFieldsLimit(0); } this.dataGenerator = new DataGenerator(specificationBuilder.withDataSourceHandlers(List.of(new DataSourceHandler() { @Override - public DataSourceResponse.FieldTypeGenerator handle(DataSourceRequest.FieldTypeGenerator request) { - // Unsigned long is not used with dynamic mapping - // since it can initially look like long - // but later fail to parse once big values arrive. 
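
The removed comment above names a real hazard: dynamic mapping infers long for integer JSON, so an unsigned long beyond Long.MAX_VALUE later fails to parse. A quick plain-JDK illustration of why the type had to be excluded:

    import java.math.BigInteger;

    class UnsignedLongOverflowSketch {
        public static void main(String[] args) {
            // Largest unsigned 64-bit value: 2^64 - 1 = 18446744073709551615
            BigInteger unsignedMax = BigInteger.TWO.pow(64).subtract(BigInteger.ONE);
            try {
                Long.parseLong(unsignedMax.toString()); // out of range for a signed long
            } catch (NumberFormatException e) {
                System.out.println("rejected once the field was dynamically mapped as long: " + e.getMessage());
            }
        }
    }
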
- // Double is not used since it maps to float with dynamic mapping - // resulting in precision loss compared to original source. - var excluded = fullyDynamicMapping ? List.of(FieldType.DOUBLE, FieldType.SCALED_FLOAT, FieldType.UNSIGNED_LONG) : List.of(); - return new DataSourceResponse.FieldTypeGenerator( - () -> randomValueOtherThanMany(excluded::contains, () -> randomFrom(FieldType.values())) - ); - } - public DataSourceResponse.ObjectMappingParametersGenerator handle(DataSourceRequest.ObjectMappingParametersGenerator request) { if (subobjects == ObjectMapper.Subobjects.ENABLED) { // Use default behavior @@ -82,42 +71,52 @@ public DataSourceResponse.ObjectMappingParametersGenerator handle(DataSourceRequ return parameters; }); } - })).withPredefinedFields(List.of(new PredefinedField("host.name", FieldType.KEYWORD))).build()); + })) + .withPredefinedFields( + List.of( + new PredefinedField.WithType("host.name", FieldType.KEYWORD), + // Needed for terms query + new PredefinedField.WithGenerator("method", new FieldDataGenerator() { + @Override + public CheckedConsumer mappingWriter() { + return b -> b.startObject().field("type", "keyword").endObject(); + } + + @Override + public CheckedConsumer fieldValueGenerator() { + return b -> b.value(randomFrom("put", "post", "get")); + } + }), + + // Needed for histogram aggregation + new PredefinedField.WithGenerator("memory_usage_bytes", new FieldDataGenerator() { + @Override + public CheckedConsumer mappingWriter() { + return b -> b.startObject().field("type", "long").endObject(); + } + + @Override + public CheckedConsumer fieldValueGenerator() { + // We can generate this using standard long field but we would get "too many buckets" + return b -> b.value(randomLongBetween(1000, 2000)); + } + }) + ) + ) + .build()); } @Override public void baselineMappings(XContentBuilder builder) throws IOException { - if (fullyDynamicMapping == false) { - dataGenerator.writeMapping(builder); - } else { - // We want dynamic mapping, but we need host.name to be a keyword instead of text to support aggregations. 
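
Likewise, the double-to-float caveat in the removed comment is now handled by a matcher (DynamicFieldMatcher, below) rather than by excluding the type. The precision loss it refers to, in plain JDK terms:

    class DoubleToFloatSketch {
        public static void main(String[] args) {
            double original = 0.1234567890123456;
            // A dynamically mapped floating point field is typed float, so a value
            // round-trips with only about 7 significant decimal digits preserved.
            double roundTripped = (float) original;
            System.out.println(original == roundTripped); // false: precision was lost
        }
    }
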
- builder.startObject() - .startObject("properties") - - .startObject("host.name") - .field("type", "keyword") - .field("ignore_above", randomIntBetween(1000, 1200)) - .endObject() - - .endObject() - .endObject(); - } + dataGenerator.writeMapping(builder); } @Override public void contenderMappings(XContentBuilder builder) throws IOException { - if (fullyDynamicMapping == false) { - if (subobjects != ObjectMapper.Subobjects.ENABLED) { - dataGenerator.writeMapping(builder, b -> builder.field("subobjects", subobjects.toString())); - } else { - dataGenerator.writeMapping(builder); - } + if (subobjects != ObjectMapper.Subobjects.ENABLED) { + dataGenerator.writeMapping(builder, Map.of("subobjects", subobjects.toString())); } else { - builder.startObject(); - if (subobjects != ObjectMapper.Subobjects.ENABLED) { - builder.field("subobjects", subobjects.toString()); - } - builder.endObject(); + dataGenerator.writeMapping(builder); } } @@ -126,10 +125,6 @@ protected XContentBuilder generateDocument(final Instant timestamp) throws IOExc var document = XContentFactory.jsonBuilder(); dataGenerator.generateDocument(document, doc -> { doc.field("@timestamp", DateFormatter.forPattern(FormatNames.STRICT_DATE_OPTIONAL_TIME.getName()).format(timestamp)); - // Needed for terms query - doc.field("method", randomFrom("put", "post", "get")); - // We can generate this but we would get "too many buckets" - doc.field("memory_usage_bytes", randomLongBetween(1000, 2000)); }); return document; diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/ListEqualMatcher.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/ListEqualMatcher.java index bb5751b8873f2..ae18129a77111 100644 --- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/ListEqualMatcher.java +++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/ListEqualMatcher.java @@ -43,7 +43,7 @@ private MatchResult matchListEquals(final List actualList, final List match(List actual, List expected) { + if (expected == null) { + return Optional.empty(); + } + + // Floating point values are always mapped as float with dynamic mapping. + var isDouble = expected.stream().filter(Objects::nonNull).findFirst().map(o -> o instanceof Double).orElse(false); + if (isDouble) { + assert expected.stream().allMatch(o -> o == null || o instanceof Double); + + var normalizedActual = normalizeDoubles(actual); + var normalizedExpected = normalizeDoubles(expected); + + var matchResult = normalizedActual.equals(normalizedExpected) + ? MatchResult.match() + : MatchResult.noMatch( + formatErrorMessage( + actualMappings, + actualSettings, + expectedMappings, + expectedSettings, + "Values of dynamically mapped field containing double values don't match after normalization, normalized " + + prettyPrintCollections(normalizedActual, normalizedExpected) + ) + ); + return Optional.of(matchResult); + } + + return Optional.empty(); + } + + private static Set normalizeDoubles(List values) { + if (values == null) { + return Set.of(); + } + + Function toFloat = (o) -> o instanceof Number n ? 
n.floatValue() : Float.parseFloat((String) o);
+        return values.stream().filter(Objects::nonNull).map(toFloat).collect(Collectors.toSet());
+    }
+}
diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/FieldSpecificMatcher.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/FieldSpecificMatcher.java
index 10b1922e1e217..253fb4b0e9688 100644
--- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/FieldSpecificMatcher.java
+++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/FieldSpecificMatcher.java
@@ -198,7 +198,7 @@ public MatchResult match(
                         actualSettings,
                         expectedMappings,
                         expectedSettings,
-                        "Values of type [scaled_float] don't match after normalization, normalized "
+                        "Values of type [unsigned_long] don't match after normalization, normalized "
                             + prettyPrintCollections(actualNormalized, expectedNormalized)
                     )
                 );
diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/MappingTransforms.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/MappingTransforms.java
index 4ca3142310b44..eade6f10e48fe 100644
--- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/MappingTransforms.java
+++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/MappingTransforms.java
@@ -8,10 +8,21 @@
 
 package org.elasticsearch.datastreams.logsdb.qa.matchers.source;
 
+import java.util.ArrayList;
 import java.util.HashMap;
+import java.util.List;
 import java.util.Map;
 
 class MappingTransforms {
+    /**
+     * Container for mapping of a field. Contains field mapping parameters and mapping parameters of parent fields (if present)
+     * in order of increasing distance (direct parent first).
+     * This is needed because some parent mapping parameters influence how source of the field is stored (e.g. `enabled: false`).
+     * @param mappingParameters mapping parameters of the field itself
+     * @param parentMappingParameters mapping parameters of parent fields, ordered from the direct parent upwards
+     */
+    record FieldMapping(Map<String, Object> mappingParameters, List<Map<String, Object>> parentMappingParameters) {}
+
     /**
      * Normalize mapping to have the same structure as normalized source and enable field mapping lookup.
      * Similar to {@link SourceTransforms#normalize(Map)} but needs to get rid of intermediate nodes
@@ -20,8 +31,8 @@ class MappingTransforms {
      * @param map raw mapping document converted to map
      * @return map from normalized field name (like a.b.c) to a map of mapping parameters (like type)
      */
-    public static Map<String, Map<String, Object>> normalizeMapping(Map<String, Object> map) {
-        var flattened = new HashMap<String, Map<String, Object>>();
+    public static Map<String, FieldMapping> normalizeMapping(Map<String, Object> map) {
+        var flattened = new HashMap<String, FieldMapping>();
 
         descend(null, map, flattened);
@@ -29,21 +40,36 @@ public static Map<String, Map<String, Object>> normalizeMapping(Map<String, Object> map) {
-    private static void descend(String pathFromRoot, Map<String, Object> currentLevel, Map<String, Map<String, Object>> flattened) {
+    private static void descend(String pathFromRoot, Map<String, Object> currentLevel, Map<String, FieldMapping> flattened) {
         for (var entry : currentLevel.entrySet()) {
             if (entry.getKey().equals("_doc") || entry.getKey().equals("properties")) {
                 descend(pathFromRoot, (Map<String, Object>) entry.getValue(), flattened);
             } else {
                 if (entry.getValue() instanceof Map map) {
                     var pathToField = pathFromRoot == null ? entry.getKey() : pathFromRoot + "."
+ entry.getKey(); - descend(pathToField, (Map) map, flattened); - } else { - if (pathFromRoot == null) { - // Ignore top level mapping parameters for now - continue; + + // Descending to subobject, we need to remember parent mapping + if (pathFromRoot != null) { + var parentMapping = flattened.computeIfAbsent( + pathFromRoot, + k -> new FieldMapping(new HashMap<>(), new ArrayList<>()) + ); + var childMapping = flattened.computeIfAbsent( + pathToField, + k -> new FieldMapping(new HashMap<>(), new ArrayList<>()) + ); + childMapping.parentMappingParameters.add(parentMapping.mappingParameters); + childMapping.parentMappingParameters.addAll(parentMapping.parentMappingParameters); } - flattened.computeIfAbsent(pathFromRoot, k -> new HashMap<>()).put(entry.getKey(), entry.getValue()); + descend(pathToField, (Map) map, flattened); + } else { + var pathToField = pathFromRoot == null ? "_doc" : pathFromRoot; + // We are either at the lowest level of mapping or it's a leaf field of top level object + flattened.computeIfAbsent(pathToField, k -> new FieldMapping(new HashMap<>(), new ArrayList<>())).mappingParameters.put( + entry.getKey(), + entry.getValue() + ); } } } diff --git a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/SourceMatcher.java b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/SourceMatcher.java index f0e188a17631f..5eb93cee67d74 100644 --- a/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/SourceMatcher.java +++ b/modules/data-streams/src/javaRestTest/java/org/elasticsearch/datastreams/logsdb/qa/matchers/source/SourceMatcher.java @@ -10,15 +10,12 @@ import org.elasticsearch.common.bytes.BytesReference; import org.elasticsearch.common.settings.Settings; -import org.elasticsearch.common.time.DateFormatter; -import org.elasticsearch.common.time.FormatNames; import org.elasticsearch.common.xcontent.XContentHelper; import org.elasticsearch.datastreams.logsdb.qa.matchers.GenericEqualsMatcher; import org.elasticsearch.datastreams.logsdb.qa.matchers.ListEqualMatcher; import org.elasticsearch.datastreams.logsdb.qa.matchers.MatchResult; import org.elasticsearch.xcontent.XContentBuilder; -import java.util.Comparator; import java.util.List; import java.util.Map; import java.util.Objects; @@ -28,10 +25,11 @@ import static org.elasticsearch.datastreams.logsdb.qa.matchers.Messages.prettyPrintCollections; public class SourceMatcher extends GenericEqualsMatcher>> { - private final Map> actualNormalizedMapping; - private final Map> expectedNormalizedMapping; + private final Map actualNormalizedMapping; + private final Map expectedNormalizedMapping; private final Map fieldSpecificMatchers; + private final DynamicFieldMatcher dynamicFieldMatcher; public SourceMatcher( final XContentBuilder actualMappings, @@ -60,6 +58,7 @@ public SourceMatcher( "unsigned_long", new FieldSpecificMatcher.UnsignedLongMatcher(actualMappings, actualSettings, expectedMappings, expectedSettings) ); + this.dynamicFieldMatcher = new DynamicFieldMatcher(actualMappings, actualSettings, expectedMappings, expectedSettings); } @Override @@ -76,14 +75,8 @@ public MatchResult match() { ); } - var sortedAndFlattenedActual = actual.stream() - .sorted(Comparator.comparing((Map m) -> parseTimestampToEpochMillis(m.get("@timestamp")))) - .map(SourceTransforms::normalize) - .toList(); - var sortedAndFlattenedExpected = expected.stream() - .sorted(Comparator.comparing((Map m) -> 
parseTimestampToEpochMillis(m.get("@timestamp")))) - .map(SourceTransforms::normalize) - .toList(); + var sortedAndFlattenedActual = actual.stream().map(SourceTransforms::normalize).toList(); + var sortedAndFlattenedExpected = expected.stream().map(SourceTransforms::normalize).toList(); for (int i = 0; i < sortedAndFlattenedActual.size(); i++) { var actual = sortedAndFlattenedActual.get(i); @@ -91,7 +84,8 @@ public MatchResult match() { var result = compareSource(actual, expected); if (result.isMatch() == false) { - return result; + var message = "Source matching failed at document id [" + i + "]. " + result.getMessage(); + return MatchResult.noMatch(message); } } @@ -105,12 +99,20 @@ private MatchResult compareSource(Map> actual, Map matchWithGenericMatcher(actualValues, expectedValues) - ); + // There are cases when field values are stored in ignored source + // so we try to match them as is first and then apply field specific matcher. + // This is temporary, we should be able to tell when source is exact using mappings. + // See #111916. + var genericMatchResult = matchWithGenericMatcher(actualValues, expectedValues); + if (genericMatchResult.isMatch()) { + return genericMatchResult; + } - if (fieldMatch.isMatch() == false) { - var message = "Source documents don't match for field [" + name + "]: " + fieldMatch.getMessage(); + var matchIncludingFieldSpecificMatchers = matchWithFieldSpecificMatcher(name, actualValues, expectedValues).orElse( + genericMatchResult + ); + if (matchIncludingFieldSpecificMatchers.isMatch() == false) { + var message = "Source documents don't match for field [" + name + "]: " + matchIncludingFieldSpecificMatchers.getMessage(); return MatchResult.noMatch(message); } } @@ -130,11 +132,11 @@ private Optional matchWithFieldSpecificMatcher(String fieldName, Li ); } - // Dynamic mapping, nothing to do - return Optional.empty(); + // Field is dynamically mapped + return dynamicFieldMatcher.match(actualValues, expectedValues); } - var actualFieldType = (String) actualFieldMapping.get("type"); + var actualFieldType = (String) actualFieldMapping.mappingParameters().get("type"); if (actualFieldType == null) { throw new IllegalStateException("Field type is missing from leaf field Leaf field [" + fieldName + "] mapping parameters"); } @@ -143,7 +145,7 @@ private Optional matchWithFieldSpecificMatcher(String fieldName, Li if (expectedFieldMapping == null) { throw new IllegalStateException("Leaf field [" + fieldName + "] is present in actual mapping but absent in expected mapping"); } else { - var expectedFieldType = expectedFieldMapping.get("type"); + var expectedFieldType = expectedFieldMapping.mappingParameters().get("type"); if (Objects.equals(actualFieldType, expectedFieldType) == false) { throw new IllegalStateException( "Leaf field [" @@ -157,15 +159,29 @@ private Optional matchWithFieldSpecificMatcher(String fieldName, Li } } + if (sourceMatchesExactly(expectedFieldMapping, expectedValues)) { + return Optional.empty(); + } + var fieldSpecificMatcher = fieldSpecificMatchers.get(actualFieldType); if (fieldSpecificMatcher == null) { return Optional.empty(); } - MatchResult matched = fieldSpecificMatcher.match(actualValues, expectedValues, expectedFieldMapping, actualFieldMapping); + MatchResult matched = fieldSpecificMatcher.match( + actualValues, + expectedValues, + actualFieldMapping.mappingParameters(), + expectedFieldMapping.mappingParameters() + ); return Optional.of(matched); } + // Checks for scenarios when source is stored exactly and therefore can be compared 
without special logic. + private boolean sourceMatchesExactly(MappingTransforms.FieldMapping mapping, List expectedValues) { + return mapping.parentMappingParameters().stream().anyMatch(m -> m.getOrDefault("enabled", "true").equals("false")); + } + private MatchResult matchWithGenericMatcher(List actualValues, List expectedValues) { var genericListMatcher = new ListEqualMatcher( actualMappings, @@ -179,9 +195,4 @@ private MatchResult matchWithGenericMatcher(List actualValues, List List normalizeValues(List values) { return Collections.emptyList(); } + return normalizeValues(values, Function.identity()); + } + + public static List normalizeValues(List values, Function transform) { + if (values == null) { + return Collections.emptyList(); + } + // Synthetic source modifications: // * null values are not present // * duplicates are removed - return new ArrayList<>(values.stream().filter(v -> v != null && Objects.equals(v, "null") == false).collect(Collectors.toSet())); + return new ArrayList<>( + values.stream().filter(v -> v != null && Objects.equals(v, "null") == false).map(transform).collect(Collectors.toSet()) + ); } private static void descend(String pathFromRoot, Map currentLevel, Map> flattened) { diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGenerator.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGenerator.java index e6cfba2138882..ed2d968a78818 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGenerator.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGenerator.java @@ -13,6 +13,7 @@ import org.elasticsearch.xcontent.XContentBuilder; import java.io.IOException; +import java.util.Map; /** * Entry point of data generation logic. @@ -33,7 +34,7 @@ public DataGenerator(DataGeneratorSpecification specification) { */ public void writeMapping(XContentBuilder mapping) throws IOException { mapping.startObject().field("_doc"); - topLevelGenerator.mappingWriter(b -> {}).accept(mapping); + topLevelGenerator.mappingWriter(Map.of()).accept(mapping); mapping.endObject(); } @@ -44,8 +45,7 @@ public void writeMapping(XContentBuilder mapping) throws IOException { * @param customMappingParameters writer of custom mapping parameters of top level object mapping * @throws IOException */ - public void writeMapping(XContentBuilder mapping, CheckedConsumer customMappingParameters) - throws IOException { + public void writeMapping(XContentBuilder mapping, Map customMappingParameters) throws IOException { mapping.startObject().field("_doc"); topLevelGenerator.mappingWriter(customMappingParameters).accept(mapping); mapping.endObject(); diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSpecification.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSpecification.java index 57bf9f12ccef1..04c30ae484f44 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSpecification.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSpecification.java @@ -23,6 +23,7 @@ * Applies to subobjects. 
* @param maxObjectDepth maximum depth of nested objects * @param nestedFieldsLimit how many total nested fields can be present in a produced mapping + * @param fullyDynamicMapping if the mapping is fully dynamic, meaning none of the fields are mapped (essentially mapping is empty) * @param predefinedFields predefined fields that must be present in mapping and documents. Only top level fields are supported. */ public record DataGeneratorSpecification( @@ -30,6 +31,7 @@ public record DataGeneratorSpecification( int maxFieldCountPerLevel, int maxObjectDepth, int nestedFieldsLimit, + boolean fullyDynamicMapping, List predefinedFields ) { @@ -46,6 +48,7 @@ public static class Builder { private int maxFieldCountPerLevel; private int maxObjectDepth; private int nestedFieldsLimit; + private boolean fullyDynamicMapping; private List predefinedFields; public Builder() { @@ -55,6 +58,7 @@ public Builder() { this.maxObjectDepth = 2; // Default value of index.mapping.nested_fields.limit this.nestedFieldsLimit = 50; + fullyDynamicMapping = false; this.predefinedFields = new ArrayList<>(); } @@ -78,6 +82,11 @@ public Builder withNestedFieldsLimit(int nestedFieldsLimit) { return this; } + public Builder withFullyDynamicMapping(boolean fullyDynamicMapping) { + this.fullyDynamicMapping = fullyDynamicMapping; + return this; + } + public Builder withPredefinedFields(List predefinedFields) { this.predefinedFields = predefinedFields; return this; @@ -89,6 +98,7 @@ public DataGeneratorSpecification build() { maxFieldCountPerLevel, maxObjectDepth, nestedFieldsLimit, + fullyDynamicMapping, predefinedFields ); } diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/FieldType.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/FieldType.java index c8821c087d084..4ed36ea685238 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/FieldType.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/FieldType.java @@ -8,6 +8,18 @@ package org.elasticsearch.logsdb.datageneration; +import org.elasticsearch.logsdb.datageneration.datasource.DataSource; +import org.elasticsearch.logsdb.datageneration.fields.leaf.ByteFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.DoubleFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.FloatFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.HalfFloatFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.IntegerFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.KeywordFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.LongFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.ScaledFloatFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.ShortFieldDataGenerator; +import org.elasticsearch.logsdb.datageneration.fields.leaf.UnsignedLongFieldDataGenerator; + /** * Lists all leaf field types that are supported for data generation. 
*/ @@ -21,5 +33,20 @@ public enum FieldType { DOUBLE, FLOAT, HALF_FLOAT, - SCALED_FLOAT + SCALED_FLOAT; + + public FieldDataGenerator generator(String fieldName, DataSource dataSource) { + return switch (this) { + case KEYWORD -> new KeywordFieldDataGenerator(fieldName, dataSource); + case LONG -> new LongFieldDataGenerator(fieldName, dataSource); + case UNSIGNED_LONG -> new UnsignedLongFieldDataGenerator(fieldName, dataSource); + case INTEGER -> new IntegerFieldDataGenerator(fieldName, dataSource); + case SHORT -> new ShortFieldDataGenerator(fieldName, dataSource); + case BYTE -> new ByteFieldDataGenerator(fieldName, dataSource); + case DOUBLE -> new DoubleFieldDataGenerator(fieldName, dataSource); + case FLOAT -> new FloatFieldDataGenerator(fieldName, dataSource); + case HALF_FLOAT -> new HalfFloatFieldDataGenerator(fieldName, dataSource); + case SCALED_FLOAT -> new ScaledFloatFieldDataGenerator(fieldName, dataSource); + }; + } } diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceRequest.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceRequest.java index df3adc458829e..fadf51ee3ea10 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceRequest.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceRequest.java @@ -10,6 +10,7 @@ import org.elasticsearch.logsdb.datageneration.DataGeneratorSpecification; import org.elasticsearch.logsdb.datageneration.FieldType; +import org.elasticsearch.logsdb.datageneration.fields.DynamicMapping; public interface DataSourceRequest { TResponse accept(DataSourceHandler handler); @@ -88,7 +89,7 @@ public DataSourceResponse.ChildFieldGenerator accept(DataSourceHandler handler) } } - record FieldTypeGenerator() implements DataSourceRequest { + record FieldTypeGenerator(DynamicMapping dynamicMapping) implements DataSourceRequest { public DataSourceResponse.FieldTypeGenerator accept(DataSourceHandler handler) { return handler.handle(this); } diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceResponse.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceResponse.java index 2386c4c32ab6c..9093799ade41d 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceResponse.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DataSourceResponse.java @@ -41,6 +41,8 @@ record ArrayWrapper(Function, Supplier> wrapper) implem interface ChildFieldGenerator extends DataSourceResponse { int generateChildFieldCount(); + boolean generateDynamicSubObject(); + boolean generateNestedSubObject(); boolean generateRegularSubObject(); @@ -48,7 +50,9 @@ interface ChildFieldGenerator extends DataSourceResponse { String generateFieldName(); } - record FieldTypeGenerator(Supplier generator) implements DataSourceResponse {} + record FieldTypeGenerator(Supplier generator) implements DataSourceResponse { + public record FieldTypeInfo(FieldType fieldType, boolean dynamic) {} + } record ObjectArrayGenerator(Supplier> lengthGenerator) implements DataSourceResponse {} diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultMappingParametersHandler.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultMappingParametersHandler.java index 
9eea4e6ae932f..e57257f69da20 100644
--- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultMappingParametersHandler.java
+++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultMappingParametersHandler.java
@@ -56,29 +56,23 @@ private Supplier<Map<String, Object>> scaledFloatMapping() {
 
     @Override
     public DataSourceResponse.ObjectMappingParametersGenerator handle(DataSourceRequest.ObjectMappingParametersGenerator request) {
         if (request.isNested()) {
-            return new DataSourceResponse.ObjectMappingParametersGenerator(
-                // TODO enable "false" and "strict"
-                // It is disabled because it hits a bug in synthetic source.
-                () -> {
-                    var parameters = new HashMap<String, Object>();
-                    if (ESTestCase.randomBoolean()) {
-                        parameters.put("dynamic", "true");
-                    }
-
-                    return parameters;
+            return new DataSourceResponse.ObjectMappingParametersGenerator(() -> {
+                var parameters = new HashMap<String, Object>();
+                if (ESTestCase.randomBoolean()) {
+                    parameters.put("dynamic", ESTestCase.randomFrom("true", "false", "strict"));
                 }
-            );
+
+                return parameters;
+            });
         }
 
-        // TODO enable "enabled: false" and "dynamic: false/runtime"
-        // It is disabled because it hits a bug in synthetic source.
         return new DataSourceResponse.ObjectMappingParametersGenerator(() -> {
             var parameters = new HashMap<String, Object>();
             if (ESTestCase.randomBoolean()) {
-                parameters.put("dynamic", ESTestCase.randomFrom("true", "strict"));
+                parameters.put("dynamic", ESTestCase.randomFrom("true", "false", "strict", "runtime"));
             }
             if (ESTestCase.randomBoolean()) {
-                parameters.put("enabled", "true");
+                parameters.put("enabled", ESTestCase.randomFrom("true", "false"));
             }
 
             return parameters;
diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultObjectGenerationHandler.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultObjectGenerationHandler.java
index 45e4b0b6d6624..4ad9ac61a9158 100644
--- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultObjectGenerationHandler.java
+++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultObjectGenerationHandler.java
@@ -12,10 +12,11 @@
 import org.elasticsearch.test.ESTestCase;
 
 import java.util.Optional;
+import java.util.Set;
+import java.util.function.Supplier;
 
 import static org.elasticsearch.test.ESTestCase.randomAlphaOfLengthBetween;
 import static org.elasticsearch.test.ESTestCase.randomDouble;
-import static org.elasticsearch.test.ESTestCase.randomFrom;
 import static org.elasticsearch.test.ESTestCase.randomIntBetween;
 
 public class DefaultObjectGenerationHandler implements DataSourceHandler {
@@ -27,16 +28,22 @@ public int generateChildFieldCount() {
         return ESTestCase.randomIntBetween(0, request.specification().maxFieldCountPerLevel());
     }
 
+    @Override
+    public boolean generateDynamicSubObject() {
+        // Using a static 5% chance, this is just a chosen value that can be tweaked.
+        return randomDouble() <= 0.05;
+    }
+
     @Override
     public boolean generateNestedSubObject() {
-        // Using a static 10% change, this is just a chosen value that can be tweaked.
-        return randomDouble() <= 0.1;
+        // Using a static 5% chance, this is just a chosen value that can be tweaked.
+        return randomDouble() <= 0.05;
     }
 
     @Override
     public boolean generateRegularSubObject() {
-        // Using a static 10% change, this is just a chosen value that can be tweaked.
-        return randomDouble() <= 0.1;
+        // Using a static 5% chance, this is just a chosen value that can be tweaked.
+ return randomDouble() <= 0.05; } @Override @@ -46,9 +53,27 @@ public String generateFieldName() { }; } + // UNSIGNED_LONG is excluded because it is mapped as long + // and values larger than long fail to parse. + private static final Set EXCLUDED_FROM_DYNAMIC_MAPPING = Set.of(FieldType.UNSIGNED_LONG); + @Override public DataSourceResponse.FieldTypeGenerator handle(DataSourceRequest.FieldTypeGenerator request) { - return new DataSourceResponse.FieldTypeGenerator(() -> randomFrom(FieldType.values())); + Supplier generator = switch (request.dynamicMapping()) { + case FORBIDDEN -> () -> generateFieldTypeInfo(false); + case FORCED -> () -> generateFieldTypeInfo(true); + case SUPPORTED -> () -> generateFieldTypeInfo(ESTestCase.randomBoolean()); + }; + + return new DataSourceResponse.FieldTypeGenerator(generator); + } + + private static DataSourceResponse.FieldTypeGenerator.FieldTypeInfo generateFieldTypeInfo(boolean isDynamic) { + var excluded = isDynamic ? EXCLUDED_FROM_DYNAMIC_MAPPING : Set.of(); + + var fieldType = ESTestCase.randomValueOtherThanMany(excluded::contains, () -> ESTestCase.randomFrom(FieldType.values())); + + return new DataSourceResponse.FieldTypeGenerator.FieldTypeInfo(fieldType, isDynamic); } @Override diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultPrimitiveTypesHandler.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultPrimitiveTypesHandler.java index 68bb628cc8b27..2514cbd51e21c 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultPrimitiveTypesHandler.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/datasource/DefaultPrimitiveTypesHandler.java @@ -20,8 +20,7 @@ public DataSourceResponse.LongGenerator handle(DataSourceRequest.LongGenerator r @Override public DataSourceResponse.UnsignedLongGenerator handle(DataSourceRequest.UnsignedLongGenerator request) { - // TODO there is currently an issue with handling BigInteger in some synthetic source scenarios - return new DataSourceResponse.UnsignedLongGenerator(() -> new BigInteger(64, ESTestCase.random()).toString()); + return new DataSourceResponse.UnsignedLongGenerator(() -> new BigInteger(64, ESTestCase.random())); } @Override diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/Context.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/Context.java index 62130967508f6..ef83ced13f0dc 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/Context.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/Context.java @@ -12,6 +12,7 @@ import org.elasticsearch.logsdb.datageneration.datasource.DataSourceRequest; import org.elasticsearch.logsdb.datageneration.datasource.DataSourceResponse; +import java.util.Map; import java.util.Optional; import java.util.concurrent.atomic.AtomicInteger; @@ -19,23 +20,28 @@ class Context { private final DataGeneratorSpecification specification; private final DataSourceResponse.ChildFieldGenerator childFieldGenerator; - private final DataSourceResponse.FieldTypeGenerator fieldTypeGenerator; private final DataSourceResponse.ObjectArrayGenerator objectArrayGenerator; private final int objectDepth; // We don't need atomicity, but we need to pass counter by reference to accumulate total value from sub-objects. 
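
The comment above is worth unpacking: AtomicInteger serves purely as a mutable box that every Context of one generation run shares, so the nested-field budget is enforced globally rather than per branch. A small plain-JDK sketch of that sharing (names illustrative):

    import java.util.concurrent.atomic.AtomicInteger;

    class NestedBudgetSketch {
        private final AtomicInteger nestedFieldsCount; // shared across all contexts of one run
        private final int limit;

        NestedBudgetSketch(AtomicInteger sharedCounter, int limit) {
            this.nestedFieldsCount = sharedCounter;
            this.limit = limit;
        }

        // Consumes one unit of the global budget if any is left.
        boolean tryAddNestedField() {
            if (nestedFieldsCount.get() >= limit) {
                return false;
            }
            nestedFieldsCount.incrementAndGet();
            return true;
        }
    }
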
private final AtomicInteger nestedFieldsCount; + private final DynamicMapping parentDynamicMapping; - Context(DataGeneratorSpecification specification) { - this(specification, 0, new AtomicInteger(0)); + Context(DataGeneratorSpecification specification, DynamicMapping parentDynamicMapping) { + this(specification, 0, new AtomicInteger(0), parentDynamicMapping); } - private Context(DataGeneratorSpecification specification, int objectDepth, AtomicInteger nestedFieldsCount) { + private Context( + DataGeneratorSpecification specification, + int objectDepth, + AtomicInteger nestedFieldsCount, + DynamicMapping parentDynamicMapping + ) { this.specification = specification; this.childFieldGenerator = specification.dataSource().get(new DataSourceRequest.ChildFieldGenerator(specification)); - this.fieldTypeGenerator = specification.dataSource().get(new DataSourceRequest.FieldTypeGenerator()); this.objectArrayGenerator = specification.dataSource().get(new DataSourceRequest.ObjectArrayGenerator()); this.objectDepth = objectDepth; this.nestedFieldsCount = nestedFieldsCount; + this.parentDynamicMapping = parentDynamicMapping; } public DataGeneratorSpecification specification() { @@ -46,27 +52,43 @@ public DataSourceResponse.ChildFieldGenerator childFieldGenerator() { return childFieldGenerator; } - public DataSourceResponse.FieldTypeGenerator fieldTypeGenerator() { - return fieldTypeGenerator; + public DataSourceResponse.FieldTypeGenerator fieldTypeGenerator(DynamicMapping dynamicMapping) { + return specification.dataSource().get(new DataSourceRequest.FieldTypeGenerator(dynamicMapping)); } - public Context subObject() { - return new Context(specification, objectDepth + 1, nestedFieldsCount); + public Context subObject(DynamicMapping dynamicMapping) { + return new Context(specification, objectDepth + 1, nestedFieldsCount, dynamicMapping); } - public Context nestedObject() { + public Context nestedObject(DynamicMapping dynamicMapping) { nestedFieldsCount.incrementAndGet(); - return new Context(specification, objectDepth + 1, nestedFieldsCount); + return new Context(specification, objectDepth + 1, nestedFieldsCount, dynamicMapping); + } + + public boolean shouldAddDynamicObjectField(DynamicMapping dynamicMapping) { + if (objectDepth >= specification.maxObjectDepth() || dynamicMapping == DynamicMapping.FORBIDDEN) { + return false; + } + + return childFieldGenerator.generateDynamicSubObject(); } public boolean shouldAddObjectField() { - return childFieldGenerator.generateRegularSubObject() && objectDepth < specification.maxObjectDepth(); + if (objectDepth >= specification.maxObjectDepth() || parentDynamicMapping == DynamicMapping.FORCED) { + return false; + } + + return childFieldGenerator.generateRegularSubObject(); } public boolean shouldAddNestedField() { - return childFieldGenerator.generateNestedSubObject() - && objectDepth < specification.maxObjectDepth() - && nestedFieldsCount.get() < specification.nestedFieldsLimit(); + if (objectDepth >= specification.maxObjectDepth() + || nestedFieldsCount.get() >= specification.nestedFieldsLimit() + || parentDynamicMapping == DynamicMapping.FORCED) { + return false; + } + + return childFieldGenerator.generateNestedSubObject(); } public Optional generateObjectArray() { @@ -76,4 +98,18 @@ public Optional generateObjectArray() { return objectArrayGenerator.lengthGenerator().get(); } + + public DynamicMapping determineDynamicMapping(Map mappingParameters) { + if (parentDynamicMapping == DynamicMapping.FORCED) { + return DynamicMapping.FORCED; + } + + var 
dynamicParameter = mappingParameters.get("dynamic"); + // Inherited from parent + if (dynamicParameter == null) { + return parentDynamicMapping; + } + + return dynamicParameter.equals("strict") ? DynamicMapping.FORBIDDEN : DynamicMapping.SUPPORTED; + } } diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/DynamicMapping.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/DynamicMapping.java new file mode 100644 index 0000000000000..ea74080c03610 --- /dev/null +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/DynamicMapping.java @@ -0,0 +1,15 @@ +/* + * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one + * or more contributor license agreements. Licensed under the Elastic License + * 2.0 and the Server Side Public License, v 1; you may not use this file except + * in compliance with, at your election, the Elastic License 2.0 or the Server + * Side Public License, v 1. + */ + +package org.elasticsearch.logsdb.datageneration.fields; + +public enum DynamicMapping { + SUPPORTED, + FORBIDDEN, + FORCED +} diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/GenericSubObjectFieldDataGenerator.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/GenericSubObjectFieldDataGenerator.java index 8a6a8939c7ddb..e8f9724fee269 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/GenericSubObjectFieldDataGenerator.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/GenericSubObjectFieldDataGenerator.java @@ -10,17 +10,6 @@ import org.elasticsearch.core.CheckedConsumer; import org.elasticsearch.logsdb.datageneration.FieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.FieldType; -import org.elasticsearch.logsdb.datageneration.fields.leaf.ByteFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.DoubleFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.FloatFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.HalfFloatFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.IntegerFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.KeywordFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.LongFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.ScaledFloatFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.ShortFieldDataGenerator; -import org.elasticsearch.logsdb.datageneration.fields.leaf.UnsignedLongFieldDataGenerator; import org.elasticsearch.xcontent.XContentBuilder; import java.io.IOException; @@ -39,7 +28,7 @@ public class GenericSubObjectFieldDataGenerator { this.context = context; } - List generateChildFields() { + List generateChildFields(DynamicMapping dynamicMapping) { var existingFieldNames = new HashSet(); // no child fields is legal var childFieldsCount = context.childFieldGenerator().generateChildFieldCount(); @@ -48,13 +37,16 @@ List generateChildFields() { for (int i = 0; i < childFieldsCount; i++) { var fieldName = generateFieldName(existingFieldNames); - if (context.shouldAddObjectField()) { - result.add(new ChildField(fieldName, new ObjectFieldDataGenerator(context.subObject()), false)); + if (context.shouldAddDynamicObjectField(dynamicMapping)) { + result.add(new ChildField(fieldName, new 
ObjectFieldDataGenerator(context.subObject(DynamicMapping.FORCED)), true)); + } else if (context.shouldAddObjectField()) { + result.add(new ChildField(fieldName, new ObjectFieldDataGenerator(context.subObject(dynamicMapping)), false)); } else if (context.shouldAddNestedField()) { - result.add(new ChildField(fieldName, new NestedFieldDataGenerator(context.nestedObject()), false)); + result.add(new ChildField(fieldName, new NestedFieldDataGenerator(context.nestedObject(dynamicMapping)), false)); } else { - var fieldType = context.fieldTypeGenerator().generator().get(); - result.add(leafField(fieldType, fieldName)); + var fieldTypeInfo = context.fieldTypeGenerator(dynamicMapping).generator().get(); + var generator = fieldTypeInfo.fieldType().generator(fieldName, context.specification().dataSource()); + result.add(new ChildField(fieldName, generator, fieldTypeInfo.dynamic())); } } @@ -62,13 +54,17 @@ List generateChildFields() { } List generateChildFields(List predefinedFields) { - return predefinedFields.stream().map(pf -> leafField(pf.fieldType(), pf.fieldName())).toList(); + return predefinedFields.stream() + .map(pf -> new ChildField(pf.name(), pf.generator(context.specification().dataSource()), false)) + .toList(); } static void writeChildFieldsMapping(XContentBuilder mapping, List childFields) throws IOException { for (var childField : childFields) { - mapping.field(childField.fieldName); - childField.generator.mappingWriter().accept(mapping); + if (childField.dynamic() == false) { + mapping.field(childField.fieldName); + childField.generator.mappingWriter().accept(mapping); + } } } @@ -101,23 +97,6 @@ static void writeChildFieldsData(XContentBuilder document, Iterable } } - private ChildField leafField(FieldType type, String fieldName) { - var generator = switch (type) { - case KEYWORD -> new KeywordFieldDataGenerator(fieldName, context.specification().dataSource()); - case LONG -> new LongFieldDataGenerator(fieldName, context.specification().dataSource()); - case UNSIGNED_LONG -> new UnsignedLongFieldDataGenerator(fieldName, context.specification().dataSource()); - case INTEGER -> new IntegerFieldDataGenerator(fieldName, context.specification().dataSource()); - case SHORT -> new ShortFieldDataGenerator(fieldName, context.specification().dataSource()); - case BYTE -> new ByteFieldDataGenerator(fieldName, context.specification().dataSource()); - case DOUBLE -> new DoubleFieldDataGenerator(fieldName, context.specification().dataSource()); - case FLOAT -> new FloatFieldDataGenerator(fieldName, context.specification().dataSource()); - case HALF_FLOAT -> new HalfFloatFieldDataGenerator(fieldName, context.specification().dataSource()); - case SCALED_FLOAT -> new ScaledFloatFieldDataGenerator(fieldName, context.specification().dataSource()); - }; - - return new ChildField(fieldName, generator, false); - } - private String generateFieldName(Set existingFields) { var fieldName = context.childFieldGenerator().generateFieldName(); while (existingFields.contains(fieldName)) { diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/NestedFieldDataGenerator.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/NestedFieldDataGenerator.java index 3ba220a64d4fd..5b9891ab15920 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/NestedFieldDataGenerator.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/NestedFieldDataGenerator.java @@ -30,9 +30,10 @@ public class 
NestedFieldDataGenerator implements FieldDataGenerator { .get(new DataSourceRequest.ObjectMappingParametersGenerator(true)) .mappingGenerator() .get(); + var dynamicMapping = context.determineDynamicMapping(mappingParameters); var genericGenerator = new GenericSubObjectFieldDataGenerator(context); - this.childFields = genericGenerator.generateChildFields(); + this.childFields = genericGenerator.generateChildFields(dynamicMapping); } @Override diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/ObjectFieldDataGenerator.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/ObjectFieldDataGenerator.java index 00f2977c8af33..51732b71b73d0 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/ObjectFieldDataGenerator.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/ObjectFieldDataGenerator.java @@ -30,9 +30,10 @@ public class ObjectFieldDataGenerator implements FieldDataGenerator { .get(new DataSourceRequest.ObjectMappingParametersGenerator(false)) .mappingGenerator() .get(); + var dynamicMapping = context.determineDynamicMapping(mappingParameters); var genericGenerator = new GenericSubObjectFieldDataGenerator(context); - this.childFields = genericGenerator.generateChildFields(); + this.childFields = genericGenerator.generateChildFields(dynamicMapping); } @Override diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/PredefinedField.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/PredefinedField.java index 6adae35dc909c..81b73e4407bd7 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/PredefinedField.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/PredefinedField.java @@ -8,6 +8,36 @@ package org.elasticsearch.logsdb.datageneration.fields; +import org.elasticsearch.logsdb.datageneration.FieldDataGenerator; import org.elasticsearch.logsdb.datageneration.FieldType; +import org.elasticsearch.logsdb.datageneration.datasource.DataSource; -public record PredefinedField(String fieldName, FieldType fieldType) {} +public interface PredefinedField { + String name(); + + FieldDataGenerator generator(DataSource dataSource); + + record WithType(String fieldName, FieldType fieldType) implements PredefinedField { + @Override + public String name() { + return fieldName; + } + + @Override + public FieldDataGenerator generator(DataSource dataSource) { + return fieldType().generator(fieldName, dataSource); + } + } + + record WithGenerator(String fieldName, FieldDataGenerator generator) implements PredefinedField { + @Override + public String name() { + return fieldName; + } + + @Override + public FieldDataGenerator generator(DataSource dataSource) { + return generator; + } + } +} diff --git a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/TopLevelObjectFieldDataGenerator.java b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/TopLevelObjectFieldDataGenerator.java index 645b7ca16e291..f2c209fb73862 100644 --- a/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/TopLevelObjectFieldDataGenerator.java +++ b/test/framework/src/main/java/org/elasticsearch/logsdb/datageneration/fields/TopLevelObjectFieldDataGenerator.java @@ -10,32 +10,59 @@ import org.elasticsearch.core.CheckedConsumer; import 
org.elasticsearch.logsdb.datageneration.DataGeneratorSpecification; +import org.elasticsearch.logsdb.datageneration.datasource.DataSourceRequest; import org.elasticsearch.xcontent.XContentBuilder; import java.io.IOException; +import java.util.HashMap; import java.util.List; +import java.util.Map; +import java.util.stream.Collectors; +import java.util.stream.Stream; public class TopLevelObjectFieldDataGenerator { private final Context context; + private final Map mappingParameters; + // Child fields of top level object that were explicitly requested, they have predefined name and type. private final List predefinedFields; // Child fields of top level object that are generated and merged with predefined fields. private final List generatedChildFields; public TopLevelObjectFieldDataGenerator(DataGeneratorSpecification specification) { - this.context = new Context(specification); + DynamicMapping dynamicMapping; + if (specification.fullyDynamicMapping()) { + dynamicMapping = DynamicMapping.FORCED; + this.mappingParameters = Map.of(); + } else { + this.mappingParameters = new HashMap<>( + specification.dataSource().get(new DataSourceRequest.ObjectMappingParametersGenerator(false)).mappingGenerator().get() + ); + // Top-level object can't be disabled because @timestamp is a required field in data streams. + this.mappingParameters.remove("enabled"); + + dynamicMapping = mappingParameters.getOrDefault("dynamic", "true").equals("strict") + ? DynamicMapping.FORBIDDEN + : DynamicMapping.SUPPORTED; + } + this.context = new Context(specification, dynamicMapping); var genericGenerator = new GenericSubObjectFieldDataGenerator(context); + this.predefinedFields = genericGenerator.generateChildFields(specification.predefinedFields()); - this.generatedChildFields = genericGenerator.generateChildFields(); + this.generatedChildFields = genericGenerator.generateChildFields(dynamicMapping); } - public CheckedConsumer mappingWriter( - CheckedConsumer customMappingParameters - ) { + public CheckedConsumer mappingWriter(Map customMappingParameters) { return b -> { b.startObject(); - customMappingParameters.accept(b); + var mergedParameters = Stream.of(this.mappingParameters, customMappingParameters) + .flatMap(map -> map.entrySet().stream()) + .collect(Collectors.toMap(Map.Entry::getKey, Map.Entry::getValue, (l, r) -> r)); + + for (var entry : mergedParameters.entrySet()) { + b.field(entry.getKey(), entry.getValue()); + } b.startObject("properties"); GenericSubObjectFieldDataGenerator.writeChildFieldsMapping(b, predefinedFields); diff --git a/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSnapshotTests.java b/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSnapshotTests.java index 8ff5998a31d45..81d6028182d21 100644 --- a/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSnapshotTests.java +++ b/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorSnapshotTests.java @@ -39,6 +39,7 @@ public void testSnapshot() throws Exception { var expectedMapping = """ { "_doc" : { + "dynamic" : "false", "properties" : { "f1" : { "dynamic" : "false", @@ -184,7 +185,6 @@ public DataSourceResponse.ArrayWrapper handle(DataSourceRequest.ArrayWrapper req @Override public DataSourceResponse.ChildFieldGenerator handle(DataSourceRequest.ChildFieldGenerator request) { - return childFieldGenerator; } @@ -205,11 +205,11 @@ public DataSourceResponse.FieldTypeGenerator handle(DataSourceRequest.FieldTypeG return new 
DataSourceResponse.FieldTypeGenerator(() -> { if (fieldType == FieldType.KEYWORD) { fieldType = FieldType.LONG; - return FieldType.KEYWORD; + return new DataSourceResponse.FieldTypeGenerator.FieldTypeInfo(FieldType.KEYWORD, false); } fieldType = FieldType.KEYWORD; - return FieldType.LONG; + return new DataSourceResponse.FieldTypeGenerator.FieldTypeInfo(FieldType.LONG, false); }); } @@ -240,6 +240,11 @@ public int generateChildFieldCount() { return 2; } + @Override + public boolean generateDynamicSubObject() { + return false; + } + @Override public boolean generateNestedSubObject() { return generatedFields > 6 && generatedFields < 12; diff --git a/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java b/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java index 4a4ffca0f37aa..e8535263d387c 100644 --- a/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java +++ b/test/framework/src/test/java/org/elasticsearch/logsdb/datageneration/DataGeneratorTests.java @@ -15,6 +15,7 @@ import org.elasticsearch.logsdb.datageneration.datasource.DataSourceHandler; import org.elasticsearch.logsdb.datageneration.datasource.DataSourceRequest; import org.elasticsearch.logsdb.datageneration.datasource.DataSourceResponse; +import org.elasticsearch.logsdb.datageneration.fields.DynamicMapping; import org.elasticsearch.plugins.Plugin; import org.elasticsearch.test.ESTestCase; import org.elasticsearch.xcontent.XContentBuilder; @@ -42,6 +43,7 @@ public void testDataGeneratorSanity() throws IOException { public void testDataGeneratorProducesValidMappingAndDocument() throws IOException { // Make sure objects, nested objects and all field types are covered. var testChildFieldGenerator = new DataSourceResponse.ChildFieldGenerator() { + private boolean dynamicSubObjectCovered = false; private boolean subObjectCovered = false; private boolean nestedCovered = false; private int generatedFields = 0; @@ -52,6 +54,16 @@ public int generateChildFieldCount() { return 20; } + @Override + public boolean generateDynamicSubObject() { + if (dynamicSubObjectCovered == false) { + dynamicSubObjectCovered = true; + return true; + } + + return false; + } + @Override public boolean generateNestedSubObject() { if (nestedCovered == false) { @@ -88,7 +100,24 @@ public DataSourceResponse.ChildFieldGenerator handle(DataSourceRequest.ChildFiel @Override public DataSourceResponse.FieldTypeGenerator handle(DataSourceRequest.FieldTypeGenerator request) { - return new DataSourceResponse.FieldTypeGenerator(() -> FieldType.values()[generatedFields++ % FieldType.values().length]); + if (request.dynamicMapping() == DynamicMapping.FORBIDDEN || request.dynamicMapping() == DynamicMapping.SUPPORTED) { + return new DataSourceResponse.FieldTypeGenerator( + () -> new DataSourceResponse.FieldTypeGenerator.FieldTypeInfo( + FieldType.values()[generatedFields++ % FieldType.values().length], + false + ) + ); + } + + return new DataSourceResponse.FieldTypeGenerator(() -> { + var fieldType = FieldType.values()[generatedFields++ % FieldType.values().length]; + // Does not really work with dynamic mapping. 
+ if (fieldType == FieldType.UNSIGNED_LONG) { + fieldType = FieldType.values()[generatedFields++ % FieldType.values().length]; + } + + return new DataSourceResponse.FieldTypeGenerator.FieldTypeInfo(fieldType, true); + }); } }; @@ -122,6 +151,11 @@ public int generateChildFieldCount() { return 50; } + @Override + public boolean generateDynamicSubObject() { + return false; + } + @Override public boolean generateNestedSubObject() { return false; @@ -151,7 +185,9 @@ public DataSourceResponse.ObjectArrayGenerator handle(DataSourceRequest.ObjectAr @Override public DataSourceResponse.FieldTypeGenerator handle(DataSourceRequest.FieldTypeGenerator request) { - return new DataSourceResponse.FieldTypeGenerator(() -> FieldType.LONG); + return new DataSourceResponse.FieldTypeGenerator( + () -> new DataSourceResponse.FieldTypeGenerator.FieldTypeInfo(FieldType.LONG, false) + ); } }; From 55a185b933ee508812a20ecd94d394974dad6ac1 Mon Sep 17 00:00:00 2001 From: Joe Gallo Date: Thu, 29 Aug 2024 16:07:31 -0400 Subject: [PATCH 059/144] Bump spotless version to 6.25.0 (#112366) --- gradle/build.versions.toml | 2 +- gradle/verification-metadata.xml | 295 ++++++------------ .../health/node/DiskHealthInfo.java | 1 + .../xpack/ml/inference/nlp/NerProcessor.java | 1 + 4 files changed, 107 insertions(+), 192 deletions(-) diff --git a/gradle/build.versions.toml b/gradle/build.versions.toml index 792330fd3613b..12f7776add17b 100644 --- a/gradle/build.versions.toml +++ b/gradle/build.versions.toml @@ -44,6 +44,6 @@ snakeyaml = { group = "org.yaml", name = "snakeyaml", version = { strictly = "2. spock-core = { group = "org.spockframework", name="spock-core", version.ref="spock" } spock-junit4 = { group = "org.spockframework", name="spock-junit4", version.ref="spock" } spock-platform = { group = "org.spockframework", name="spock-bom", version.ref="spock" } -spotless-plugin = "com.diffplug.spotless:spotless-plugin-gradle:6.22.0" +spotless-plugin = "com.diffplug.spotless:spotless-plugin-gradle:6.25.0" wiremock = "com.github.tomakehurst:wiremock-jre8-standalone:2.23.2" xmlunit-core = "org.xmlunit:xmlunit-core:2.8.2" diff --git a/gradle/verification-metadata.xml b/gradle/verification-metadata.xml index a27e2083a0849..3a4f5ef9d240c 100644 --- a/gradle/verification-metadata.xml +++ b/gradle/verification-metadata.xml [295 lines of dependency-checksum hunks unrecoverable: the XML entries were stripped to bare +/- markers, leaving only the diffstat above; they update checksum metadata for the spotless 6.25.0 upgrade] diff --git a/server/src/main/java/org/elasticsearch/health/node/DiskHealthInfo.java b/server/src/main/java/org/elasticsearch/health/node/DiskHealthInfo.java index f1e085482b72a..244ed03bf098c 100644 --- 
a/server/src/main/java/org/elasticsearch/health/node/DiskHealthInfo.java +++ b/server/src/main/java/org/elasticsearch/health/node/DiskHealthInfo.java @@ -20,6 +20,7 @@ * The health status of the disk space of this node along with the cause. */ public record DiskHealthInfo(HealthStatus healthStatus, @Nullable Cause cause) implements Writeable { + public DiskHealthInfo(HealthStatus healthStatus) { this(healthStatus, null); } diff --git a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessor.java b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessor.java index 3dbf941c8120d..05b97422bfb97 100644 --- a/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessor.java +++ b/x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/nlp/NerProcessor.java @@ -172,6 +172,7 @@ static String buildAnnotatedText(String seq, List entiti } record NerResultProcessor(IobTag[] iobMap, String resultsField, boolean ignoreCase) implements NlpTask.ResultProcessor { + NerResultProcessor(IobTag[] iobMap, String resultsField, boolean ignoreCase) { this.iobMap = iobMap; this.resultsField = Optional.ofNullable(resultsField).orElse(DEFAULT_RESULTS_FIELD); From f1ef280c19ce3203532015368f2dbbe5112721b5 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Fri, 30 Aug 2024 06:10:43 +1000 Subject: [PATCH 060/144] Mute org.elasticsearch.datastreams.logsdb.qa.StandardVersusLogsIndexModeRandomDataChallengeRestIT testMatchAllQuery #112374 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index e80a39040a4ef..94ff4b5d509cd 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -162,6 +162,9 @@ tests: issue: https://github.com/elastic/elasticsearch/issues/112254 - class: org.elasticsearch.search.ccs.CCSUsageTelemetryIT issue: https://github.com/elastic/elasticsearch/issues/112324 +- class: org.elasticsearch.datastreams.logsdb.qa.StandardVersusLogsIndexModeRandomDataChallengeRestIT + method: testMatchAllQuery + issue: https://github.com/elastic/elasticsearch/issues/112374 # Examples: # From 09615aa49c9f21741adb56c957bae20b4d0f56e4 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Fri, 30 Aug 2024 06:51:01 +1000 Subject: [PATCH 061/144] Mute org.elasticsearch.smoketest.DocsClientYamlTestSuiteIT test {yaml=reference/rest-api/watcher/put-watch/line_120} #99517 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 94ff4b5d509cd..c50234a8eaa9d 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -165,6 +165,9 @@ tests: - class: org.elasticsearch.datastreams.logsdb.qa.StandardVersusLogsIndexModeRandomDataChallengeRestIT method: testMatchAllQuery issue: https://github.com/elastic/elasticsearch/issues/112374 +- class: org.elasticsearch.smoketest.DocsClientYamlTestSuiteIT + method: test {yaml=reference/rest-api/watcher/put-watch/line_120} + issue: https://github.com/elastic/elasticsearch/issues/99517 # Examples: # From 5fb3c1dfbec669c6c6192de81cbb0af64791e810 Mon Sep 17 00:00:00 2001 From: Volodymyr Krasnikov <129072588+volodk85@users.noreply.github.com> Date: Thu, 29 Aug 2024 14:20:34 -0700 Subject: [PATCH 062/144] Write multiple cache gaps for warming service in one go (#112071) * Write multiple cache gaps for warming service in one go --- .../shared/SharedBlobCacheService.java | 51 
++++++++++++++++--- .../shared/SharedBlobCacheServiceTests.java | 28 ++++++---- 2 files changed, 60 insertions(+), 19 deletions(-) diff --git a/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java b/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java index 3dfece0a9b20e..09fcd1cbeba92 100644 --- a/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java +++ b/x-pack/plugin/blob-cache/src/main/java/org/elasticsearch/blobcache/shared/SharedBlobCacheService.java @@ -967,12 +967,48 @@ void populate( listener.onResponse(false); return; } - try (var gapsListener = new RefCountingListener(listener.map(unused -> true))) { - assert writer.sharedInputStreamFactory(gaps) == null; - for (SparseFileTracker.Gap gap : gaps) { - executor.execute( - fillGapRunnable(gap, writer, null, ActionListener.releaseAfter(gapsListener.acquire(), refs.acquire())) - ); + final SourceInputStreamFactory streamFactory = writer.sharedInputStreamFactory(gaps); + logger.trace( + () -> Strings.format( + "fill gaps %s %s shared input stream factory", + gaps, + streamFactory == null ? "without" : "with" + ) + ); + if (streamFactory == null) { + try (var parallelGapsListener = new RefCountingListener(listener.map(unused -> true))) { + for (SparseFileTracker.Gap gap : gaps) { + executor.execute( + fillGapRunnable( + gap, + writer, + null, + ActionListener.releaseAfter(parallelGapsListener.acquire(), refs.acquire()) + ) + ); + } + } + } else { + try ( + var sequentialGapsListener = new RefCountingListener( + ActionListener.runBefore(listener.map(unused -> true), streamFactory::close) + ) + ) { + final List gapFillingTasks = gaps.stream() + .map( + gap -> fillGapRunnable( + gap, + writer, + streamFactory, + ActionListener.releaseAfter(sequentialGapsListener.acquire(), refs.acquire()) + ) + ) + .toList(); + executor.execute(() -> { + // Fill the gaps in order. If a gap fails to fill for whatever reason, the task for filling the next + // gap will still be executed. + gapFillingTasks.forEach(Runnable::run); + }); } } } @@ -1019,8 +1055,7 @@ void populateAndRead( () -> Strings.format( "fill gaps %s %s shared input stream factory", gaps, - (streamFactory == null ? "without" : "with"), - (streamFactory == null ? "" : " " + streamFactory) + streamFactory == null ? 
"without" : "with" ) ); if (streamFactory == null) { diff --git a/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java b/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java index 0f3804baef42b..e405ed578b5a5 100644 --- a/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java +++ b/x-pack/plugin/blob-cache/src/test/java/org/elasticsearch/blobcache/shared/SharedBlobCacheServiceTests.java @@ -1422,7 +1422,7 @@ protected int computeCacheFileRegionSize(long fileLength, int region) { } } - public void testSharedSourceInputStreamFactory() throws Exception { + public void testUsageSharedSourceInputStreamFactoryInCachePopulation() throws Exception { final long regionSizeInBytes = size(100); final Settings settings = Settings.builder() .put(NODE_NAME_SETTING.getKey(), "node") @@ -1519,16 +1519,22 @@ public void fillCacheRange( }; final var range = ByteRange.of(0, regionSizeInBytes); - final PlainActionFuture future = new PlainActionFuture<>(); - region.populateAndRead( - range, - range, - (channel, channelPos, relativePos, length) -> length, - rangeMissingHandler, - threadPool.generic(), - future - ); - safeGet(future); + if (randomBoolean()) { + final PlainActionFuture future = new PlainActionFuture<>(); + region.populateAndRead( + range, + range, + (channel, channelPos, relativePos, length) -> length, + rangeMissingHandler, + threadPool.generic(), + future + ); + assertThat(safeGet(future).longValue(), equalTo(regionSizeInBytes)); + } else { + final PlainActionFuture future = new PlainActionFuture<>(); + region.populate(range, rangeMissingHandler, threadPool.generic(), future); + assertThat(safeGet(future), equalTo(true)); + } assertThat(invocationCounter.get(), equalTo(numberGaps)); assertThat(region.tracker.checkAvailable(regionSizeInBytes), is(true)); assertBusy(() -> assertThat(factoryClosed.get(), is(true))); From cb4d7ff28131650e84ae9aa7b94f1ce86758d3cc Mon Sep 17 00:00:00 2001 From: Stanislav Malyshev Date: Thu, 29 Aug 2024 15:54:08 -0600 Subject: [PATCH 063/144] Skip CCS Usage telemetry ITs if feature flags is not enabled. 
(#112365) --- .../elasticsearch/search/ccs/CCSUsageTelemetryIT.java | 10 +++++++++- .../xpack/search/CCSUsageTelemetryAsyncSearchIT.java | 8 ++++++++ 2 files changed, 17 insertions(+), 1 deletion(-) diff --git a/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java b/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java index 40d98b2b5ea71..bb18b8f1b702d 100644 --- a/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java +++ b/server/src/internalClusterTest/java/org/elasticsearch/search/ccs/CCSUsageTelemetryIT.java @@ -24,6 +24,7 @@ import org.elasticsearch.common.bytes.BytesReference; import org.elasticsearch.common.settings.Settings; import org.elasticsearch.common.util.CollectionUtils; +import org.elasticsearch.common.util.FeatureFlag; import org.elasticsearch.core.TimeValue; import org.elasticsearch.index.query.MatchAllQueryBuilder; import org.elasticsearch.plugins.Plugin; @@ -36,6 +37,7 @@ import org.elasticsearch.test.InternalTestCluster; import org.elasticsearch.usage.UsageService; import org.junit.Assert; +import org.junit.BeforeClass; import org.junit.Rule; import org.junit.rules.TestRule; import org.junit.runner.Description; @@ -66,6 +68,7 @@ public class CCSUsageTelemetryIT extends AbstractMultiClustersTestCase { private static final Logger LOGGER = LogManager.getLogger(CCSUsageTelemetryIT.class); private static final String REMOTE1 = "cluster-a"; private static final String REMOTE2 = "cluster-b"; + private static final FeatureFlag CCS_TELEMETRY_FEATURE_FLAG = new FeatureFlag("ccs_telemetry"); @Override protected boolean reuseClusters() { @@ -80,6 +83,11 @@ protected Collection remoteClusterAlias() { @Rule public SkipUnavailableRule skipOverride = new SkipUnavailableRule(REMOTE1, REMOTE2); + @BeforeClass + protected static void skipIfTelemetryDisabled() { + assumeTrue("Skipping test as CCS_TELEMETRY_FEATURE_FLAG is disabled", CCS_TELEMETRY_FEATURE_FLAG.isEnabled()); + } + @Override protected Map skipUnavailableForRemoteClusters() { var map = skipOverride.getMap(); @@ -443,7 +451,7 @@ public void testRemoteTimesOut() throws Exception { // partial failure, and we disable partial results.. 
searchRequest.setCcsMinimizeRoundtrips(true); - TimeValue searchTimeout = new TimeValue(200, TimeUnit.MILLISECONDS); + TimeValue searchTimeout = new TimeValue(500, TimeUnit.MILLISECONDS); // query builder that will sleep for the specified amount of time in the query phase SlowRunningQueryBuilder slowRunningQueryBuilder = new SlowRunningQueryBuilder(searchTimeout.millis() * 5, remoteIndex); SearchSourceBuilder sourceBuilder = new SearchSourceBuilder().query(slowRunningQueryBuilder).timeout(searchTimeout); diff --git a/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java b/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java index ac0b26cb4f4cd..4f8fa122047e1 100644 --- a/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java +++ b/x-pack/plugin/async-search/src/internalClusterTest/java/org/elasticsearch/xpack/search/CCSUsageTelemetryAsyncSearchIT.java @@ -14,6 +14,7 @@ import org.elasticsearch.action.search.TransportSearchAction; import org.elasticsearch.client.internal.Client; import org.elasticsearch.common.settings.Settings; +import org.elasticsearch.common.util.FeatureFlag; import org.elasticsearch.core.TimeValue; import org.elasticsearch.index.query.MatchAllQueryBuilder; import org.elasticsearch.plugins.Plugin; @@ -33,6 +34,7 @@ import org.elasticsearch.xpack.core.search.action.SubmitAsyncSearchRequest; import org.hamcrest.Matchers; import org.junit.Before; +import org.junit.BeforeClass; import java.util.Arrays; import java.util.Collection; @@ -53,6 +55,12 @@ public class CCSUsageTelemetryAsyncSearchIT extends AbstractMultiClustersTestCase { private static final String REMOTE1 = "cluster-a"; private static final String REMOTE2 = "cluster-b"; + private static final FeatureFlag CCS_TELEMETRY_FEATURE_FLAG = new FeatureFlag("ccs_telemetry"); + + @BeforeClass + protected static void skipIfTelemetryDisabled() { + assumeTrue("Skipping test as CCS_TELEMETRY_FEATURE_FLAG is disabled", CCS_TELEMETRY_FEATURE_FLAG.isEnabled()); + } @Override protected boolean reuseClusters() { From ad0292cc836ebcafbaf9c11c1a1192ae2a33b7ad Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Fri, 30 Aug 2024 09:09:19 +1000 Subject: [PATCH 064/144] Mute org.elasticsearch.xpack.ml.integration.MlJobIT testMultiIndexDelete #112381 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index c50234a8eaa9d..356f48e8eb252 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -168,6 +168,9 @@ tests: - class: org.elasticsearch.smoketest.DocsClientYamlTestSuiteIT method: test {yaml=reference/rest-api/watcher/put-watch/line_120} issue: https://github.com/elastic/elasticsearch/issues/99517 +- class: org.elasticsearch.xpack.ml.integration.MlJobIT + method: testMultiIndexDelete + issue: https://github.com/elastic/elasticsearch/issues/112381 # Examples: # From b5da668ad9400a92073869f09cf8fd89eadc6882 Mon Sep 17 00:00:00 2001 From: Athena Brown Date: Thu, 29 Aug 2024 18:05:40 -0600 Subject: [PATCH 065/144] Add tier preference to security index settings allowlist and update default tier preference (#111818) This commit allows tier preference for the security system indices to be set using the Security Settings API, and adds validation to prevent using the `data_frozen` tier for security system indices. 
Also updates the default tier preference to `data_hot,data_content`. --- docs/changelog/111818.yaml | 5 + .../UpdateSecuritySettingsAction.java | 68 ++++++++++---- .../UpdateSecuritySettingsActionTests.java | 92 ++++++++++++++++--- .../xpack/security/SecuritySettingsIT.java | 51 +++++++++- .../security/profile/ProfileIntegTests.java | 2 +- .../TransportGetSecuritySettingsAction.java | 2 +- .../support/SecuritySystemIndices.java | 4 + 7 files changed, 192 insertions(+), 32 deletions(-) create mode 100644 docs/changelog/111818.yaml diff --git a/docs/changelog/111818.yaml b/docs/changelog/111818.yaml new file mode 100644 index 0000000000000..c3a632861aae6 --- /dev/null +++ b/docs/changelog/111818.yaml @@ -0,0 +1,5 @@ +pr: 111818 +summary: Add tier preference to security index settings allowlist +area: Security +type: enhancement +issues: [] diff --git a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsAction.java b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsAction.java index 2d59911ec7ecb..c2bf1466fd41f 100644 --- a/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsAction.java +++ b/x-pack/plugin/core/src/main/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsAction.java @@ -14,9 +14,9 @@ import org.elasticsearch.action.support.master.AcknowledgedRequest; import org.elasticsearch.action.support.master.AcknowledgedResponse; import org.elasticsearch.cluster.metadata.IndexMetadata; +import org.elasticsearch.cluster.routing.allocation.DataTier; import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.common.io.stream.StreamOutput; -import org.elasticsearch.common.util.set.Sets; import org.elasticsearch.core.TimeValue; import org.elasticsearch.core.UpdateForV9; import org.elasticsearch.xcontent.ConstructingObjectParser; @@ -28,6 +28,8 @@ import java.util.Map; import java.util.Objects; import java.util.Set; +import java.util.function.BiFunction; +import java.util.stream.Collectors; import static org.elasticsearch.xcontent.ConstructingObjectParser.optionalConstructorArg; @@ -42,10 +44,35 @@ public class UpdateSecuritySettingsAction { public static final String TOKENS_INDEX_NAME = "security-tokens"; public static final String PROFILES_INDEX_NAME = "security-profile"; - public static final Set ALLOWED_SETTING_KEYS = Set.of( - IndexMetadata.SETTING_NUMBER_OF_REPLICAS, - IndexMetadata.SETTING_AUTO_EXPAND_REPLICAS - ); + /** + * A map of allowed settings to validators for those settings. Values should take the value which is being assigned to the setting + * and an existing {@link ActionRequestValidationException}, to which they should add if the value is disallowed. 
+ */ + public static final Map< + String, + BiFunction> ALLOWED_SETTING_VALIDATORS = Map.of( + IndexMetadata.SETTING_NUMBER_OF_REPLICAS, + (it, ex) -> ex, // no additional validation + IndexMetadata.SETTING_AUTO_EXPAND_REPLICAS, + (it, ex) -> ex, // no additional validation + DataTier.TIER_PREFERENCE, + (it, ex) -> { + Set allowedTiers = Set.of(DataTier.DATA_CONTENT, DataTier.DATA_HOT, DataTier.DATA_WARM, DataTier.DATA_COLD); + if (it instanceof String preference) { + String disallowedTiers = DataTier.parseTierList(preference) + .stream() + .filter(tier -> allowedTiers.contains(tier) == false) + .collect(Collectors.joining(",")); + if (disallowedTiers.isEmpty() == false) { + return ValidateActions.addValidationError( + "disallowed data tiers [" + disallowedTiers + "] found, allowed tiers are [" + String.join(",", allowedTiers), + ex + ); + } + } + return ex; + } + ); private UpdateSecuritySettingsAction() {/* no instances */} @@ -154,19 +181,26 @@ private static ActionRequestValidationException validateIndexSettings( String indexName, ActionRequestValidationException existingExceptions ) { - Set forbiddenSettings = Sets.difference(indexSettings.keySet(), ALLOWED_SETTING_KEYS); - if (forbiddenSettings.size() > 0) { - return ValidateActions.addValidationError( - "illegal settings for index [" - + indexName - + "]: " - + forbiddenSettings - + ", these settings may not be configured. Only the following settings may be configured for that index: " - + ALLOWED_SETTING_KEYS, - existingExceptions - ); + ActionRequestValidationException errors = existingExceptions; + + for (Map.Entry entry : indexSettings.entrySet()) { + String setting = entry.getKey(); + if (ALLOWED_SETTING_VALIDATORS.containsKey(setting)) { + errors = ALLOWED_SETTING_VALIDATORS.get(setting).apply(entry.getValue(), errors); + } else { + errors = ValidateActions.addValidationError( + "illegal setting for index [" + + indexName + + "]: [" + + setting + + "], this setting may not be configured. 
Only the following settings may be configured for that index: " + + ALLOWED_SETTING_VALIDATORS.keySet(), + existingExceptions + ); + } } - return existingExceptions; + + return errors; } } } diff --git a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsActionTests.java b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsActionTests.java index 893f7474c3e6e..50ab034a34ef3 100644 --- a/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsActionTests.java +++ b/x-pack/plugin/core/src/test/java/org/elasticsearch/xpack/core/security/action/settings/UpdateSecuritySettingsActionTests.java @@ -7,15 +7,19 @@ package org.elasticsearch.xpack.core.security.action.settings; +import org.elasticsearch.action.ActionRequestValidationException; +import org.elasticsearch.cluster.metadata.IndexMetadata; +import org.elasticsearch.cluster.routing.allocation.DataTier; import org.elasticsearch.test.ESTestCase; import java.util.Collections; import java.util.HashMap; import java.util.List; import java.util.Map; +import java.util.function.Supplier; import java.util.regex.Pattern; -import static org.elasticsearch.xpack.core.security.action.settings.UpdateSecuritySettingsAction.ALLOWED_SETTING_KEYS; +import static org.elasticsearch.xpack.core.security.action.settings.UpdateSecuritySettingsAction.ALLOWED_SETTING_VALIDATORS; import static org.elasticsearch.xpack.core.security.action.settings.UpdateSecuritySettingsAction.MAIN_INDEX_NAME; import static org.elasticsearch.xpack.core.security.action.settings.UpdateSecuritySettingsAction.PROFILES_INDEX_NAME; import static org.elasticsearch.xpack.core.security.action.settings.UpdateSecuritySettingsAction.TOKENS_INDEX_NAME; @@ -27,6 +31,15 @@ public class UpdateSecuritySettingsActionTests extends ESTestCase { + static final Map> ALLOWED_SETTING_GENERATORS = Map.of( + IndexMetadata.SETTING_NUMBER_OF_REPLICAS, + () -> randomAlphaOfLength(5), // no additional validation + IndexMetadata.SETTING_AUTO_EXPAND_REPLICAS, + () -> randomAlphaOfLength(5), // no additional validation + DataTier.TIER_PREFERENCE, + () -> randomFrom(DataTier.DATA_CONTENT, DataTier.DATA_HOT, DataTier.DATA_WARM, DataTier.DATA_COLD) + ); + public void testValidateSettingsEmpty() { var req = new UpdateSecuritySettingsAction.Request( TEST_REQUEST_TIMEOUT, @@ -43,9 +56,10 @@ public void testValidateSettingsEmpty() { public void testAllowedSettingsOk() { Map allAllowedSettingsMap = new HashMap<>(); - for (String allowedSetting : ALLOWED_SETTING_KEYS) { - Map allowedSettingMap = Map.of(allowedSetting, randomAlphaOfLength(5)); - allAllowedSettingsMap.put(allowedSetting, randomAlphaOfLength(5)); + for (String allowedSetting : ALLOWED_SETTING_VALIDATORS.keySet()) { + String settingValue = ALLOWED_SETTING_GENERATORS.get(allowedSetting).get(); + Map allowedSettingMap = Map.of(allowedSetting, settingValue); + allAllowedSettingsMap.put(allowedSetting, settingValue); var req = new UpdateSecuritySettingsAction.Request( TEST_REQUEST_TIMEOUT, TEST_REQUEST_TIMEOUT, @@ -86,11 +100,12 @@ public void testAllowedSettingsOk() { public void testDisallowedSettingsFailsValidation() { String disallowedSetting = "index." - + randomValueOtherThanMany((value) -> ALLOWED_SETTING_KEYS.contains("index." + value), () -> randomAlphaOfLength(5)); + + randomValueOtherThanMany((value) -> ALLOWED_SETTING_VALIDATORS.containsKey("index." 
+ value), () -> randomAlphaOfLength(5)); Map disallowedSettingMap = Map.of(disallowedSetting, randomAlphaOfLength(5)); + String validSetting = randomFrom(ALLOWED_SETTING_VALIDATORS.keySet()); Map validOrEmptySettingMap = randomFrom( Collections.emptyMap(), - Map.of(randomFrom(ALLOWED_SETTING_KEYS), randomAlphaOfLength(5)) + Map.of(validSetting, ALLOWED_SETTING_GENERATORS.get(validSetting).get()) ); { var req = new UpdateSecuritySettingsAction.Request( @@ -106,11 +121,11 @@ public void testDisallowedSettingsFailsValidation() { assertThat( errorMsg, matchesRegex( - "illegal settings for index \\[" + "illegal setting for index \\[" + Pattern.quote(TOKENS_INDEX_NAME) + "\\]: \\[" + disallowedSetting - + "\\], these settings may not be configured. Only the following settings may be configured for that index.*" + + "\\], this setting may not be configured. Only the following settings may be configured for that index.*" ) ); } @@ -130,13 +145,13 @@ public void testDisallowedSettingsFailsValidation() { assertThat( errorMsg, matchesRegex( - "illegal settings for index \\[(" + "illegal setting for index \\[(" + Pattern.quote(MAIN_INDEX_NAME) + "|" + Pattern.quote(PROFILES_INDEX_NAME) + ")\\]: \\[" + disallowedSetting - + "\\], these settings may not be configured. Only the following settings may be configured for that index.*" + + "\\], this setting may not be configured. Only the following settings may be configured for that index.*" ) ); } @@ -156,7 +171,7 @@ public void testDisallowedSettingsFailsValidation() { assertThat( errorMsg, matchesRegex( - "illegal settings for index \\[(" + "illegal setting for index \\[(" + Pattern.quote(MAIN_INDEX_NAME) + "|" + Pattern.quote(TOKENS_INDEX_NAME) @@ -164,11 +179,64 @@ public void testDisallowedSettingsFailsValidation() { + Pattern.quote(PROFILES_INDEX_NAME) + ")\\]: \\[" + disallowedSetting - + "\\], these settings may not be configured. Only the following settings may be configured for that index.*" + + "\\], this setting may not be configured. 
Only the following settings may be configured for that index.*" ) ); } } } + public void testSettingValuesAreValidated() { + Map forbiddenSettingsMap = Map.of(DataTier.TIER_PREFERENCE, DataTier.DATA_FROZEN); + String badTier = randomAlphaOfLength(5); + Map badSettingsMap = Map.of(DataTier.TIER_PREFERENCE, badTier); + Map allowedSettingMap = Map.of( + DataTier.TIER_PREFERENCE, + randomFrom(DataTier.DATA_HOT, DataTier.DATA_WARM, DataTier.DATA_CONTENT, DataTier.DATA_COLD) + ); + { + var req = new UpdateSecuritySettingsAction.Request( + TEST_REQUEST_TIMEOUT, + TEST_REQUEST_TIMEOUT, + allowedSettingMap, + Collections.emptyMap(), + Collections.emptyMap() + ); + assertThat(req.validate(), nullValue()); + } + + { + var req = new UpdateSecuritySettingsAction.Request( + TEST_REQUEST_TIMEOUT, + TEST_REQUEST_TIMEOUT, + forbiddenSettingsMap, + Collections.emptyMap(), + Collections.emptyMap() + ); + ActionRequestValidationException exception = req.validate(); + assertThat(exception, notNullValue()); + assertThat(exception.validationErrors(), hasSize(1)); + assertThat( + exception.validationErrors().get(0), + containsString("disallowed data tiers [" + DataTier.DATA_FROZEN + "] found, allowed tiers are ") + ); + } + + { + var req = new UpdateSecuritySettingsAction.Request( + TEST_REQUEST_TIMEOUT, + TEST_REQUEST_TIMEOUT, + badSettingsMap, + Collections.emptyMap(), + Collections.emptyMap() + ); + var exception = req.validate(); + assertThat(exception, notNullValue()); + assertThat(exception.validationErrors(), hasSize(1)); + assertThat( + exception.validationErrors().get(0), + containsString("disallowed data tiers [" + badTier + "] found, allowed tiers are ") + ); + } + } } diff --git a/x-pack/plugin/security/qa/security-basic/src/javaRestTest/java/org/elasticsearch/xpack/security/SecuritySettingsIT.java b/x-pack/plugin/security/qa/security-basic/src/javaRestTest/java/org/elasticsearch/xpack/security/SecuritySettingsIT.java index 5651538b2757c..f776c4834cc5f 100644 --- a/x-pack/plugin/security/qa/security-basic/src/javaRestTest/java/org/elasticsearch/xpack/security/SecuritySettingsIT.java +++ b/x-pack/plugin/security/qa/security-basic/src/javaRestTest/java/org/elasticsearch/xpack/security/SecuritySettingsIT.java @@ -19,6 +19,7 @@ import static org.elasticsearch.test.XContentTestUtils.createJsonMapView; import static org.hamcrest.Matchers.containsString; import static org.hamcrest.Matchers.equalTo; +import static org.hamcrest.Matchers.nullValue; public class SecuritySettingsIT extends SecurityInBasicRestTestCase { @@ -70,6 +71,54 @@ public void testBasicWorkflow() throws IOException { assertOK(getResp); final XContentTestUtils.JsonMapView mapView = createJsonMapView(getResp.getEntity().getContent()); assertThat(mapView.get("security.index.auto_expand_replicas"), equalTo("0-all")); + assertThat(mapView.get("security-profile.index.auto_expand_replicas"), equalTo("0-all")); + } + + public void testTierPreference() throws IOException { + { + Request req = new Request("PUT", "/_security/settings"); + req.setJsonEntity(""" + { + "security": { + "index.routing.allocation.include._tier_preference": "data_hot" + }, + "security-profile": { + "index.routing.allocation.include._tier_preference": "data_hot" + } + } + """); + Response resp = adminClient().performRequest(req); + assertOK(resp); + Request getRequest = new Request("GET", "/_security/settings"); + Response getResp = adminClient().performRequest(getRequest); + assertOK(getResp); + final XContentTestUtils.JsonMapView mapView = 
createJsonMapView(getResp.getEntity().getContent()); + assertThat(mapView.get("security.index.routing.allocation.include._tier_preference"), equalTo("data_hot")); + assertThat(mapView.get("security-profile.index.routing.allocation.include._tier_preference"), equalTo("data_hot")); + } + + { + Request req = new Request("PUT", "/_security/settings"); + req.setJsonEntity(""" + { + "security": { + "index.routing.allocation.include._tier_preference": null + }, + "security-profile": { + "index.routing.allocation.include._tier_preference": null + } + } + """); + Response resp = adminClient().performRequest(req); + assertOK(resp); + Request getRequest = new Request("GET", "/_security/settings"); + Response getResp = adminClient().performRequest(getRequest); + assertOK(getResp); + final XContentTestUtils.JsonMapView mapView = createJsonMapView(getResp.getEntity().getContent()); + assertThat(mapView.get("security.index.routing.allocation.include._tier_preference"), nullValue()); + assertThat(mapView.get("security-profile.index.routing.allocation.include._tier_preference"), nullValue()); + } + } public void testNoUpdatesThrowsException() throws IOException { @@ -85,7 +134,7 @@ public void testDisallowedSettingThrowsException() throws IOException { ResponseException ex = expectThrows(ResponseException.class, () -> adminClient().performRequest(req)); assertThat( EntityUtils.toString(ex.getResponse().getEntity()), - containsString("illegal settings for index [security]: " + "[index.max_ngram_diff], these settings may not be configured.") + containsString("illegal setting for index [security]: " + "[index.max_ngram_diff], this setting may not be configured.") ); } diff --git a/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/xpack/security/profile/ProfileIntegTests.java b/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/xpack/security/profile/ProfileIntegTests.java index d057b7ce0be20..4b8fbfd41acdf 100644 --- a/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/xpack/security/profile/ProfileIntegTests.java +++ b/x-pack/plugin/security/src/internalClusterTest/java/org/elasticsearch/xpack/security/profile/ProfileIntegTests.java @@ -133,7 +133,7 @@ public void testProfileIndexAutoCreation() { final Settings settings = getIndexResponse.getSettings().get(INTERNAL_SECURITY_PROFILE_INDEX_8); assertThat(settings.get("index.number_of_shards"), equalTo("1")); assertThat(settings.get("index.auto_expand_replicas"), equalTo("0-1")); - assertThat(settings.get("index.routing.allocation.include._tier_preference"), equalTo("data_content")); + assertThat(settings.get("index.routing.allocation.include._tier_preference"), equalTo("data_hot,data_content")); final Map mappings = getIndexResponse.getMappings().get(INTERNAL_SECURITY_PROFILE_INDEX_8).getSourceAsMap(); diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportGetSecuritySettingsAction.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportGetSecuritySettingsAction.java index 25a677517825f..96363d5a099da 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportGetSecuritySettingsAction.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/action/settings/TransportGetSecuritySettingsAction.java @@ -85,7 +85,7 @@ private static Settings getFilteredSettingsForIndex(String indexName, ClusterSta .map(IndexMetadata::getSettings) 
.map(settings -> { Settings.Builder builder = Settings.builder(); - for (String settingName : UpdateSecuritySettingsAction.ALLOWED_SETTING_KEYS) { + for (String settingName : UpdateSecuritySettingsAction.ALLOWED_SETTING_VALIDATORS.keySet()) { if (settings.hasValue(settingName)) { builder.put(settingName, settings.get(settingName)); } diff --git a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/support/SecuritySystemIndices.java b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/support/SecuritySystemIndices.java index 9541dd9dc470d..36ea14c6e101b 100644 --- a/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/support/SecuritySystemIndices.java +++ b/x-pack/plugin/security/src/main/java/org/elasticsearch/xpack/security/support/SecuritySystemIndices.java @@ -13,6 +13,7 @@ import org.elasticsearch.client.internal.Client; import org.elasticsearch.cluster.metadata.IndexMetadata; import org.elasticsearch.cluster.node.DiscoveryNode; +import org.elasticsearch.cluster.routing.allocation.DataTier; import org.elasticsearch.cluster.service.ClusterService; import org.elasticsearch.common.VersionId; import org.elasticsearch.common.settings.Settings; @@ -154,6 +155,7 @@ private static Settings getMainIndexSettings() { return Settings.builder() .put(IndexMetadata.SETTING_NUMBER_OF_SHARDS, 1) .put(IndexMetadata.SETTING_AUTO_EXPAND_REPLICAS, "0-1") + .put(DataTier.TIER_PREFERENCE, "data_hot,data_content") .put(IndexMetadata.SETTING_PRIORITY, 1000) .put(IndexMetadata.INDEX_FORMAT_SETTING.getKey(), INTERNAL_MAIN_INDEX_FORMAT) .put("analysis.filter.email.type", "pattern_capture") @@ -702,6 +704,7 @@ private static Settings getTokenIndexSettings() { return Settings.builder() .put(IndexMetadata.SETTING_NUMBER_OF_SHARDS, 1) .put(IndexMetadata.SETTING_AUTO_EXPAND_REPLICAS, "0-1") + .put(DataTier.TIER_PREFERENCE, "data_hot,data_content") .put(IndexMetadata.SETTING_PRIORITY, 1000) .put(IndexMetadata.INDEX_FORMAT_SETTING.getKey(), INTERNAL_TOKENS_INDEX_FORMAT) .build(); @@ -902,6 +905,7 @@ private static Settings getProfileIndexSettings(Settings settings) { final Settings.Builder settingsBuilder = Settings.builder() .put(IndexMetadata.SETTING_NUMBER_OF_SHARDS, 1) .put(IndexMetadata.SETTING_AUTO_EXPAND_REPLICAS, "0-1") + .put(DataTier.TIER_PREFERENCE, "data_hot,data_content") .put(IndexMetadata.SETTING_PRIORITY, 1000) .put(IndexMetadata.INDEX_FORMAT_SETTING.getKey(), INTERNAL_PROFILE_INDEX_FORMAT) .put("analysis.filter.email.type", "pattern_capture") From e379c4fcc10041b1cae5a4bb4b231a5c9938ad99 Mon Sep 17 00:00:00 2001 From: elasticsearchmachine <58790826+elasticsearchmachine@users.noreply.github.com> Date: Fri, 30 Aug 2024 15:21:50 +1000 Subject: [PATCH 066/144] Mute org.elasticsearch.xpack.searchablesnapshots.cache.shared.NodesCachesStatsIntegTests testNodesCachesStats #112384 --- muted-tests.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/muted-tests.yml b/muted-tests.yml index 356f48e8eb252..57cc7abb899e7 100644 --- a/muted-tests.yml +++ b/muted-tests.yml @@ -171,6 +171,9 @@ tests: - class: org.elasticsearch.xpack.ml.integration.MlJobIT method: testMultiIndexDelete issue: https://github.com/elastic/elasticsearch/issues/112381 +- class: org.elasticsearch.xpack.searchablesnapshots.cache.shared.NodesCachesStatsIntegTests + method: testNodesCachesStats + issue: https://github.com/elastic/elasticsearch/issues/112384 # Examples: # From bfc7355ed7bd241e6c828e3de5282413bea60e33 Mon Sep 17 00:00:00 2001 From: Simon Cooper Date: Fri, 30 Aug 2024 
Subject: [PATCH 067/144] Some fixes for toReleaseVersion change #112242 from
 the backport #112280 (#112284)

---
 server/src/main/java/org/elasticsearch/ReleaseVersions.java    | 2 +-
 .../src/test/java/org/elasticsearch/TransportVersionTests.java | 3 ++-
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/server/src/main/java/org/elasticsearch/ReleaseVersions.java b/server/src/main/java/org/elasticsearch/ReleaseVersions.java
index cacdca1c5b528..bb90bc79a528a 100644
--- a/server/src/main/java/org/elasticsearch/ReleaseVersions.java
+++ b/server/src/main/java/org/elasticsearch/ReleaseVersions.java
@@ -53,7 +53,7 @@ public static IntFunction<String> generateVersionsLookup(Class<?> versionContain
         NavigableMap<Integer, List<Version>> versions = new TreeMap<>();
 
         // add the current version id, which won't be in the csv
-        versions.put(current, List.of(Version.CURRENT));
+        versions.computeIfAbsent(current, k -> new ArrayList<>()).add(Version.CURRENT);
 
         try (BufferedReader reader = new BufferedReader(new InputStreamReader(versionsFile, StandardCharsets.UTF_8))) {
             String line;
diff --git a/server/src/test/java/org/elasticsearch/TransportVersionTests.java b/server/src/test/java/org/elasticsearch/TransportVersionTests.java
index a3728f20a23d4..8cc0875fb9f38 100644
--- a/server/src/test/java/org/elasticsearch/TransportVersionTests.java
+++ b/server/src/test/java/org/elasticsearch/TransportVersionTests.java
@@ -19,6 +19,7 @@
 import java.util.regex.Pattern;
 
 import static org.hamcrest.Matchers.containsString;
+import static org.hamcrest.Matchers.endsWith;
 import static org.hamcrest.Matchers.equalTo;
 import static org.hamcrest.Matchers.greaterThan;
 import static org.hamcrest.Matchers.is;
@@ -187,7 +188,7 @@ public void testCURRENTIsLatest() {
     }
 
     public void testToReleaseVersion() {
-        assertThat(TransportVersion.current().toReleaseVersion(), equalTo(Version.CURRENT.toString()));
+        assertThat(TransportVersion.current().toReleaseVersion(), endsWith(Version.CURRENT.toString()));
     }
 
     public void testToString() {

From b8359dbc13bcd588af9badcc2f47ca850fbfde1e Mon Sep 17 00:00:00 2001
From: Moritz Mack
Date: Fri, 30 Aug 2024 11:14:08 +0200
Subject: [PATCH 068/144] Cleanup / move some serverless code to ES (#112360)

---
 .../common/collect/Iterators.java       | 53 +++++++++++++++++++
 .../common/collect/IteratorsTests.java  | 23 ++++++++
 2 files changed, 76 insertions(+)

diff --git a/server/src/main/java/org/elasticsearch/common/collect/Iterators.java b/server/src/main/java/org/elasticsearch/common/collect/Iterators.java
index d029f8e3becc0..358b5675cc8e1 100644
--- a/server/src/main/java/org/elasticsearch/common/collect/Iterators.java
+++ b/server/src/main/java/org/elasticsearch/common/collect/Iterators.java
@@ -10,9 +10,11 @@
 
 import org.elasticsearch.core.Nullable;
 
+import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.Collections;
 import java.util.Iterator;
+import java.util.List;
 import java.util.NoSuchElementException;
 import java.util.Objects;
 import java.util.function.BiFunction;
@@ -233,6 +235,57 @@ public T next() {
         }
     }
 
+    /**
+     * Returns an iterator that yields at most the first {@code n} elements of the provided {@code input} iterator.
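+     * A non-positive {@code n} yields an empty iterator (negative values are additionally rejected by an assertion).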
+     */
+    public static <T> Iterator<T> limit(Iterator<T> input, int n) {
+        assert n >= 0 : "negative limit";
+        if (n > 0 && input.hasNext()) {
+            return new LimitIterator<>(input, n);
+        } else {
+            return Collections.emptyIterator();
+        }
+    }
+
+    private static final class LimitIterator<T> implements Iterator<T> {
+        private final Iterator<T> input;
+        private final int limit;
+        private int current;
+
+        LimitIterator(Iterator<T> input, int limit) {
+            this.input = input;
+            this.limit = limit;
+        }
+
+        @Override
+        public boolean hasNext() {
+            return current < limit && input.hasNext();
+        }
+
+        @Override
+        public T next() {
+            if (current >= limit) {
+                throw new NoSuchElementException();
+            }
+            ++current;
+            return input.next();
+        }
+    }
+
+    /**
+     * Returns a list containing the elements of the provided {@code iterator}.
+     */
+    public static <T> List<T> toList(Iterator<T> iterator) {
+        if (iterator.hasNext()) {
+            var list = new ArrayList<T>();
+            while (iterator.hasNext()) {
+                list.add(iterator.next());
+            }
+            return Collections.unmodifiableList(list);
+        }
+        return Collections.emptyList();
+    }
+
     public static <T, U> Iterator<U> flatMap(Iterator<? extends T> input, Function<T, Iterator<? extends U>> fn) {
         while (input.hasNext()) {
             final var value = fn.apply(input.next());
diff --git a/server/src/test/java/org/elasticsearch/common/collect/IteratorsTests.java b/server/src/test/java/org/elasticsearch/common/collect/IteratorsTests.java
index a3573d081397a..63cafa7e08d26 100644
--- a/server/src/test/java/org/elasticsearch/common/collect/IteratorsTests.java
+++ b/server/src/test/java/org/elasticsearch/common/collect/IteratorsTests.java
@@ -28,6 +28,10 @@
 import java.util.function.ToIntFunction;
 import java.util.stream.IntStream;
 
+import static org.hamcrest.Matchers.contains;
+import static org.hamcrest.Matchers.empty;
+import static org.hamcrest.Matchers.is;
+
 public class IteratorsTests extends ESTestCase {
     public void testConcatentation() {
         List<Integer> threeTwoOne = Arrays.asList(3, 2, 1);
@@ -242,6 +246,25 @@ public void testFilter() {
     }
 
+    public void testLimit() {
+        var result = Iterators.limit(Collections.<Integer>emptyIterator(), 10);
+        assertThat(result.hasNext(), is(false));
+        assertThat(Iterators.toList(result), is(empty()));
+
+        var values = List.of(1, 2, 3);
+        result = Iterators.limit(values.iterator(), 10);
+        assertThat(result.hasNext(), is(true));
+        assertThat(Iterators.toList(result), contains(1, 2, 3));
+
+        result = Iterators.limit(values.iterator(), 2);
+        assertThat(result.hasNext(), is(true));
+        assertThat(Iterators.toList(result), contains(1, 2));
+
+        result = Iterators.limit(values.iterator(), 0);
+        assertThat(result.hasNext(), is(false));
+        assertThat(Iterators.toList(result), is(empty()));
+    }
+
     public void testFailFast() {
         final var array = randomIntegerArray();
         assertEmptyIterator(Iterators.failFast(Iterators.forArray(array), () -> true));

From f444ce6971f5aff00f5ebd48e9156cc88a038030 Mon Sep 17 00:00:00 2001
From: Pooya Salehi
Date: Fri, 30 Aug 2024 11:14:11 +0200
Subject: [PATCH 069/144] Make write thread pools EWMA configurable (#112283)

Relates https://github.com/elastic/elasticsearch/pull/112206.
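Each completed task updates the pool's moving average as new = alpha * sample + (1 - alpha) * old,
so alpha controls how hard a single sample can pull the average. A minimal standalone
sketch of that arithmetic (illustrative only: EwmaSketch and next are hypothetical names,
not the production ExponentiallyWeightedMovingAverage class):

public class EwmaSketch {
    // One EWMA step: alpha weights the newest sample against the running average.
    static double next(double alpha, double average, double sample) {
        return alpha * sample + (1.0 - alpha) * average;
    }

    public static void main(String[] args) {
        // With the default alpha of 0.02, one 20s task moves a 100ms average to
        // 0.02 * 20_000 + 0.98 * 100 = 498ms, the "~500ms" described in ThreadPool's comment.
        System.out.println(next(0.02, 100.0, 20_000.0)); // prints 498.0
        // A larger alpha, set via the new thread_pool.write.ewma_alpha setting,
        // reacts far more aggressively to the same single task:
        System.out.println(next(0.5, 100.0, 20_000.0)); // prints 10050.0
    }
}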
---
 .../threadpool/SimpleThreadPoolIT.java        | 20 +++++++++++++++++++
 .../ExponentiallyWeightedMovingAverage.java   |  5 +++++
 .../common/settings/ClusterSettings.java      |  1 +
 ...utionTimeTrackingEsThreadPoolExecutor.java |  5 +++++
 .../DefaultBuiltInExecutorBuilders.java       |  3 ++-
 .../elasticsearch/threadpool/ThreadPool.java  | 11 +++++++++-
 6 files changed, 43 insertions(+), 2 deletions(-)

diff --git a/server/src/internalClusterTest/java/org/elasticsearch/threadpool/SimpleThreadPoolIT.java b/server/src/internalClusterTest/java/org/elasticsearch/threadpool/SimpleThreadPoolIT.java
index 44b6ef1d51ce0..d98b1e7d4e526 100644
--- a/server/src/internalClusterTest/java/org/elasticsearch/threadpool/SimpleThreadPoolIT.java
+++ b/server/src/internalClusterTest/java/org/elasticsearch/threadpool/SimpleThreadPoolIT.java
@@ -10,6 +10,7 @@
 
 import org.elasticsearch.action.index.IndexRequestBuilder;
 import org.elasticsearch.common.settings.Settings;
+import org.elasticsearch.common.util.concurrent.TaskExecutionTimeTrackingEsThreadPoolExecutor;
 import org.elasticsearch.index.query.QueryBuilders;
 import org.elasticsearch.plugins.Plugin;
 import org.elasticsearch.plugins.PluginsService;
@@ -19,6 +20,7 @@
 import org.elasticsearch.test.ESIntegTestCase;
 import org.elasticsearch.test.ESIntegTestCase.ClusterScope;
 import org.elasticsearch.test.ESIntegTestCase.Scope;
+import org.hamcrest.CoreMatchers;
 
 import java.lang.management.ManagementFactory;
 import java.lang.management.ThreadInfo;
@@ -36,12 +38,15 @@
 import static java.util.function.Function.identity;
 import static org.elasticsearch.common.util.Maps.toUnmodifiableSortedMap;
 import static org.elasticsearch.test.hamcrest.ElasticsearchAssertions.assertNoFailures;
+import static org.elasticsearch.threadpool.ThreadPool.DEFAULT_INDEX_AUTOSCALING_EWMA_ALPHA;
+import static org.elasticsearch.threadpool.ThreadPool.WRITE_THREAD_POOLS_EWMA_ALPHA_SETTING;
 import static org.elasticsearch.xcontent.XContentFactory.jsonBuilder;
 import static org.hamcrest.Matchers.contains;
 import static org.hamcrest.Matchers.equalTo;
 import static org.hamcrest.Matchers.greaterThanOrEqualTo;
 import static org.hamcrest.Matchers.hasEntry;
 import static org.hamcrest.Matchers.in;
+import static org.hamcrest.Matchers.instanceOf;
 import static org.hamcrest.Matchers.matchesRegex;
 
 @ClusterScope(scope = Scope.TEST, numDataNodes = 0, numClientNodes = 0)
@@ -190,4 +195,19 @@ public void testThreadPoolMetrics() throws Exception {
         });
     }
 
+    public void testWriteThreadpoolEwmaAlphaSetting() {
+        Settings settings = Settings.EMPTY;
+        var ewmaAlpha = DEFAULT_INDEX_AUTOSCALING_EWMA_ALPHA;
+        if (randomBoolean()) {
+            ewmaAlpha = randomDoubleBetween(0.0, 1.0, true);
+            settings = Settings.builder().put(WRITE_THREAD_POOLS_EWMA_ALPHA_SETTING.getKey(), ewmaAlpha).build();
+        }
+        var nodeName = internalCluster().startNode(settings);
+        var threadPool = internalCluster().getInstance(ThreadPool.class, nodeName);
+        for (var name : List.of(ThreadPool.Names.WRITE, ThreadPool.Names.SYSTEM_WRITE, ThreadPool.Names.SYSTEM_CRITICAL_WRITE)) {
+            assertThat(threadPool.executor(name), instanceOf(TaskExecutionTimeTrackingEsThreadPoolExecutor.class));
+            final var executor = (TaskExecutionTimeTrackingEsThreadPoolExecutor) threadPool.executor(name);
+            assertThat(Double.compare(executor.getEwmaAlpha(), ewmaAlpha), CoreMatchers.equalTo(0));
+        }
+    }
 }
diff --git a/server/src/main/java/org/elasticsearch/common/ExponentiallyWeightedMovingAverage.java b/server/src/main/java/org/elasticsearch/common/ExponentiallyWeightedMovingAverage.java
index 8b969cdcf9801..ce4328530ef41 100644
--- a/server/src/main/java/org/elasticsearch/common/ExponentiallyWeightedMovingAverage.java
+++ b/server/src/main/java/org/elasticsearch/common/ExponentiallyWeightedMovingAverage.java
@@ -46,4 +46,9 @@ public void addValue(double newValue) {
             successful = averageBits.compareAndSet(currentBits, newBits);
         } while (successful == false);
     }
+
+    // Used for testing
+    public double getAlpha() {
+        return alpha;
+    }
 }
diff --git a/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java b/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java
index 3c60d63f78991..fb219f9093a96 100644
--- a/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java
+++ b/server/src/main/java/org/elasticsearch/common/settings/ClusterSettings.java
@@ -522,6 +522,7 @@ public void apply(Settings value, Settings current, Settings previous) {
             ThreadPool.ESTIMATED_TIME_INTERVAL_SETTING,
             ThreadPool.LATE_TIME_INTERVAL_WARN_THRESHOLD_SETTING,
             ThreadPool.SLOW_SCHEDULER_TASK_WARN_THRESHOLD_SETTING,
+            ThreadPool.WRITE_THREAD_POOLS_EWMA_ALPHA_SETTING,
             FastVectorHighlighter.SETTING_TV_HIGHLIGHT_MULTI_VALUE,
             Node.BREAKER_TYPE_KEY,
             OperationRouting.USE_ADAPTIVE_REPLICA_SELECTION_SETTING,
diff --git a/server/src/main/java/org/elasticsearch/common/util/concurrent/TaskExecutionTimeTrackingEsThreadPoolExecutor.java b/server/src/main/java/org/elasticsearch/common/util/concurrent/TaskExecutionTimeTrackingEsThreadPoolExecutor.java
index 92e1626b0d0bb..141f4571ca02e 100644
--- a/server/src/main/java/org/elasticsearch/common/util/concurrent/TaskExecutionTimeTrackingEsThreadPoolExecutor.java
+++ b/server/src/main/java/org/elasticsearch/common/util/concurrent/TaskExecutionTimeTrackingEsThreadPoolExecutor.java
@@ -146,4 +146,9 @@ protected void appendThreadPoolExecutorDetails(StringBuilder sb) {
     public Map<Runnable, Long> getOngoingTasks() {
         return trackOngoingTasks ?
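            // When tracking is enabled, Map.copyOf returns an immutable snapshot,
            // so callers never observe the live map mutating: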
            Map.copyOf(ongoingTasks) : Map.of();
    }
+
+    // Used for testing
+    public double getEwmaAlpha() {
+        return executionEWMA.getAlpha();
+    }
 }
diff --git a/server/src/main/java/org/elasticsearch/threadpool/DefaultBuiltInExecutorBuilders.java b/server/src/main/java/org/elasticsearch/threadpool/DefaultBuiltInExecutorBuilders.java
index a4046f2f1594c..f8f623ff89643 100644
--- a/server/src/main/java/org/elasticsearch/threadpool/DefaultBuiltInExecutorBuilders.java
+++ b/server/src/main/java/org/elasticsearch/threadpool/DefaultBuiltInExecutorBuilders.java
@@ -18,7 +18,7 @@
 import java.util.Map;
 
 import static java.util.Collections.unmodifiableMap;
-import static org.elasticsearch.threadpool.ThreadPool.indexAutoscalingEWMA;
+import static org.elasticsearch.threadpool.ThreadPool.WRITE_THREAD_POOLS_EWMA_ALPHA_SETTING;
 import static org.elasticsearch.threadpool.ThreadPool.searchAutoscalingEWMA;
 
 public class DefaultBuiltInExecutorBuilders implements BuiltInExecutorBuilders {
@@ -29,6 +29,7 @@ public Map<String, ExecutorBuilder> getBuilders(Settings settings, int allocated
         final int halfProcMaxAt5 = ThreadPool.halfAllocatedProcessorsMaxFive(allocatedProcessors);
         final int halfProcMaxAt10 = ThreadPool.halfAllocatedProcessorsMaxTen(allocatedProcessors);
         final int genericThreadPoolMax = ThreadPool.boundedBy(4 * allocatedProcessors, 128, 512);
+        final double indexAutoscalingEWMA = WRITE_THREAD_POOLS_EWMA_ALPHA_SETTING.get(settings);
 
         Map<String, ExecutorBuilder> result = new HashMap<>();
         result.put(
diff --git a/server/src/main/java/org/elasticsearch/threadpool/ThreadPool.java b/server/src/main/java/org/elasticsearch/threadpool/ThreadPool.java
index 10b92f8c6dace..290352132ab00 100644
--- a/server/src/main/java/org/elasticsearch/threadpool/ThreadPool.java
+++ b/server/src/main/java/org/elasticsearch/threadpool/ThreadPool.java
@@ -183,7 +183,7 @@ public static ThreadPoolType fromType(String type) {
     // EWMA value is at least within 90% of the new increased task duration. This value also determines the impact of a single
     // long-running task on the moving average and limits it roughly to 2% of the (long) task duration, e.g. if the current
     // moving average is 100ms, and we get one task which takes 20s the new EWMA will be ~500ms.
-    public static final double indexAutoscalingEWMA = 0.02;
+    public static final double DEFAULT_INDEX_AUTOSCALING_EWMA_ALPHA = 0.02;
 
     private final Map<String, ExecutorHolder> executors;
 
@@ -230,6 +230,15 @@ public Collection<ExecutorBuilder> builders() {
         Setting.Property.NodeScope
     );
 
+    // A setting to change the alpha parameter of the EWMA used in WRITE, SYSTEM_WRITE and SYSTEM_CRITICAL_WRITE thread pools
+    public static final Setting<Double> WRITE_THREAD_POOLS_EWMA_ALPHA_SETTING = Setting.doubleSetting(
+        "thread_pool.write.ewma_alpha",
+        DEFAULT_INDEX_AUTOSCALING_EWMA_ALPHA,
+        0.0,
+        1.0,
+        Setting.Property.NodeScope
+    );
+
     /**
      * Defines and builds the many thread pools delineated in {@link Names}.
     *

From adb23531f9396259a607b33d1bf7587347ad95f2 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Istv=C3=A1n=20Zolt=C3=A1n=20Szab=C3=B3?=
Date: Fri, 30 Aug 2024 13:17:59 +0200
Subject: [PATCH 070/144] [DOCS] Adds Google Vertex AI tutorial (#112339)

Co-authored-by: Liam Thompson <32779855+leemthompo@users.noreply.github.com>
---
 .../semantic-search-inference.asciidoc        | 23 ++++---
 .../infer-api-ingest-pipeline-widget.asciidoc | 17 +++++
 .../infer-api-ingest-pipeline.asciidoc        | 26 ++++++++
 .../infer-api-mapping-widget.asciidoc         | 17 +++++
 .../inference-api/infer-api-mapping.asciidoc  | 33 ++++++++++
 .../infer-api-reindex-widget.asciidoc         | 17 +++++
 .../inference-api/infer-api-reindex.asciidoc  | 22 +++++++
 .../infer-api-requirements-widget.asciidoc    | 19 +++++-
 .../infer-api-requirements.asciidoc           |  9 +++
 .../infer-api-search-widget.asciidoc          | 17 +++++
 .../inference-api/infer-api-search.asciidoc   | 65 +++++++++++++++++++
 .../infer-api-task-widget.asciidoc            | 17 +++++
 .../inference-api/infer-api-task.asciidoc     | 24 +++++++
 13 files changed, 296 insertions(+), 10 deletions(-)

diff --git a/docs/reference/search/search-your-data/semantic-search-inference.asciidoc b/docs/reference/search/search-your-data/semantic-search-inference.asciidoc
index 719aeb070fc7c..dee91a6aa4ec4 100644
--- a/docs/reference/search/search-your-data/semantic-search-inference.asciidoc
+++ b/docs/reference/search/search-your-data/semantic-search-inference.asciidoc
@@ -9,16 +9,20 @@ The instructions in this tutorial shows you how to use the {infer} API workflow
 
 IMPORTANT: For the easiest way to perform semantic search in the {stack}, refer to the <> end-to-end tutorial.
 
-The following examples use Cohere's `embed-english-v3.0` model, the `all-mpnet-base-v2` model from HuggingFace, and OpenAI's `text-embedding-ada-002` second generation embedding model.
+The following examples use the:
+
+* `embed-english-v3.0` model for https://docs.cohere.com/docs/cohere-embed[Cohere]
+* `all-mpnet-base-v2` model from https://huggingface.co/sentence-transformers/all-mpnet-base-v2[HuggingFace]
+* `text-embedding-ada-002` second generation embedding model for OpenAI
+* models available through https://ai.azure.com/explore/models?selectedTask=embeddings[Azure AI Studio] or https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models[Azure OpenAI]
+* `text-embedding-004` model for https://cloud.google.com/vertex-ai/generative-ai/docs/model-reference/text-embeddings-api[Google Vertex AI]
+* `mistral-embed` model for https://docs.mistral.ai/getting-started/models/[Mistral]
+* `amazon.titan-embed-text-v1` model for https://docs.aws.amazon.com/bedrock/latest/userguide/model-ids.html[Amazon Bedrock]
+* `ops-text-embedding-zh-001` model for https://help.aliyun.com/zh/open-search/search-platform/developer-reference/text-embedding-api-details[AlibabaCloud AI]
+
 You can use any Cohere and OpenAI models, they are all supported by the {infer} API.
 For a list of recommended models available on HuggingFace, refer to <>.
 
-Azure based examples use models available through https://ai.azure.com/explore/models?selectedTask=embeddings[Azure AI Studio]
-or https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models[Azure OpenAI].
-Mistral examples use the `mistral-embed` model from https://docs.mistral.ai/getting-started/models/[the Mistral API].
-Amazon Bedrock examples use the `amazon.titan-embed-text-v1` model from https://docs.aws.amazon.com/bedrock/latest/userguide/model-ids.html[the Amazon Bedrock base models].
-AlibabaCloud AI Search examples use the `ops-text-embedding-zh-001` model from https://help.aliyun.com/zh/open-search/search-platform/developer-reference/text-embedding-api-details[the AlibabaCloud AI Search base models].
-
 Click the name of the service you want to use on any of the widgets below to review the corresponding instructions.
 
 [discrete]
@@ -74,8 +78,8 @@ Once the upload is complete, you can see an index named `test-data` with 182469
 [[reindexing-data-infer]]
 ==== Ingest the data through the {infer} ingest pipeline
 
-Create the embeddings from the text by reindexing the data through the {infer}
-pipeline that uses the chosen model as the inference model.
+Create embeddings from the text by reindexing the data through the {infer} pipeline that uses your chosen model.
+This step uses the {ref}/docs-reindex.html[reindex API] to simulate data ingestion through a pipeline.
 
 include::{es-ref-dir}/tab-widgets/inference-api/infer-api-reindex-widget.asciidoc[]
 
@@ -114,5 +118,6 @@ include::{es-ref-dir}/tab-widgets/inference-api/infer-api-search-widget.asciidoc
 
 You can also find tutorials in an interactive Colab notebook format using the {es} Python client:
+
 * https://colab.research.google.com/github/elastic/elasticsearch-labs/blob/main/notebooks/integrations/cohere/inference-cohere.ipynb[Cohere {infer} tutorial notebook]
 * https://colab.research.google.com/github/elastic/elasticsearch-labs/blob/main/notebooks/search/07-inference.ipynb[OpenAI {infer} tutorial notebook]
diff --git a/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc b/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc
index 3a686e27cf580..d8d1cfaa2a2c7 100644
--- a/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc
+++ b/docs/reference/tab-widgets/inference-api/infer-api-ingest-pipeline-widget.asciidoc
@@ -37,6 +37,12 @@
             id="infer-api-ingest-azure-ai-studio">
             Azure AI Studio
+
+
+
+
+
+
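The reindex step above amounts to a single `_reindex` call that reads the uploaded
`test-data` index and writes through the {infer} pipeline. A rough sketch in the style
of the REST tests earlier in this series (illustrative only: the `my-embeddings`
destination index and `my-inference-pipeline` pipeline names are placeholders, and the
tutorial's exact request bodies vary per service):

// Rough sketch of the reindex-through-pipeline step using the low-level REST client;
// assumes a test context where client() returns a configured RestClient.
Request req = new Request("POST", "/_reindex");
req.setJsonEntity("""
    {
        "source": {
            "index": "test-data"
        },
        "dest": {
            "index": "my-embeddings",
            "pipeline": "my-inference-pipeline"
        }
    }
    """);
Response resp = client().performRequest(req);
assertOK(resp);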